{ "cells": [ { "cell_type": "markdown", "metadata": { "id": "4K4FCNvH8dtm" }, "source": [ "# JAX-CFD demo\n", "\n", "This initial demonstration shows how to use JAX-CFD to simulate decaying turbulence in 2D." ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "executionInfo": { "elapsed": 6549, "status": "ok", "timestamp": 1635284279593, "user": { "displayName": "", "photoUrl": "", "userId": "" }, "user_tz": 420 }, "id": "n2J40uBCo9By" }, "outputs": [], "source": [ "import jax\n", "import jax.numpy as jnp\n", "import jax_cfd.base as cfd\n", "import numpy as np\n", "import seaborn\n", "import xarray" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "executionInfo": { "elapsed": 6551, "status": "ok", "timestamp": 1635284297511, "user": { "displayName": "", "photoUrl": "", "userId": "" }, "user_tz": 420 }, "id": "KcJcpDavpAoi", "outputId": "e07e7188-7fce-464e-9189-52b35748fd76" }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "2024-05-21 11:48:31.142056: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_convert_element_type:\n", "2024-05-21 11:48:31.142087: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:31.142095: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:31.142099: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:31.142104: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:31.142108: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:31.142112: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:31.142116: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:31.142120: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:31.142124: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:31.142128: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:31.142132: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:31.142136: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:31.142139: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:31.142143: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:31.142147: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:31.142151: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:31.142155: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:31.142158: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:31.142162: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:31.142166: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:31.142169: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:31.142173: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:31.142177: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:31.142180: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:31.142184: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:31.142188: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:31.142192: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:31.142195: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:31.142199: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:31.142203: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:31.142207: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:31.142210: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:31.142214: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:31.142217: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:31.142221: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:31.142227: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:31.142231: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:31.142234: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:31.142238: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:31.142242: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:31.142245: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:31.142249: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:31.142253: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:31.142256: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:31.142260: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:31.142263: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:31.142267: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:31.142271: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:31.142274: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:31.142278: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:31.142282: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:31.142285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:31.142289: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:31.142293: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:31.142296: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:31.142300: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:31.142303: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:31.142307: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:31.142311: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:31.142314: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:31.142318: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:31.142321: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:31.142329: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:31.142333: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:34.452399: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__threefry_seed:\n", "2024-05-21 11:48:34.452440: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:34.452466: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:34.452471: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:34.452475: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:34.452479: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:34.452483: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:34.452487: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:34.452491: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:34.452495: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:34.452499: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:34.452503: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:34.452507: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:34.452511: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:34.452514: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:34.452518: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:34.452522: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:34.452525: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:34.452529: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:34.452532: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.452536: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:34.452539: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:34.452543: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:34.452547: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:34.452552: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:34.452556: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:34.452559: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:34.452563: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:34.452567: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:34.452570: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:34.452574: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:34.452577: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:34.452581: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:34.452584: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:34.452588: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:34.452594: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:34.452601: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:34.452605: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:34.452609: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:34.452612: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:34.452616: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:34.452619: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:34.452623: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.452627: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.452630: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:34.452634: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:34.452637: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:34.452641: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:34.452645: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:34.452648: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:34.452652: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:34.452657: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:34.452661: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:34.452664: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:34.452668: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:34.452672: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:34.452675: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:34.452679: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_detailed_logging: true\n", "2024-05-21 11:48:34.452682: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:34.452686: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:34.452689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:34.452693: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:34.452698: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:34.452702: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:34.452706: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:34.452710: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:34.603707: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__threefry_split:\n", "2024-05-21 11:48:34.603744: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:34.603749: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:34.603755: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:34.603760: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:34.603764: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:34.603768: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:34.603771: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:34.603775: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:34.603779: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:34.603782: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:34.603786: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:34.603790: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:34.603793: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:34.603797: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:34.603801: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:34.603804: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:34.603809: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:34.603813: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:34.603816: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.603820: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:34.603824: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:34.603827: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:34.603831: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:34.603835: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:34.603838: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:34.603842: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:34.603845: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:34.603849: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:34.603853: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:34.603857: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:34.603861: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:34.603865: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:34.603869: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:34.603873: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:34.603876: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:34.603883: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:34.603886: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:34.603890: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:34.603894: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:34.603897: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:34.603902: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:34.603906: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.603909: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.603913: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:34.603918: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:34.603922: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:34.603925: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:34.603929: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:34.603933: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:34.603936: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:34.603940: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:34.603944: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:34.603947: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:34.603951: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:34.603955: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:34.603958: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:34.603962: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_detailed_logging: true\n", "2024-05-21 11:48:34.603966: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:34.603969: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:34.603974: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:34.603978: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:34.603982: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:34.603986: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:34.603990: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:34.603993: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:34.751112: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__unstack:\n", "2024-05-21 11:48:34.751148: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:34.751153: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:34.751158: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:34.751162: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:34.751166: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:34.751171: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:34.751175: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:34.751179: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:34.751182: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:34.751186: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:34.751190: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:34.751194: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:34.751197: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:34.751201: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:34.751205: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:34.751208: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:34.751212: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:34.751216: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:34.751220: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.751224: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:34.751229: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:34.751232: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:34.751236: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:34.751239: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:34.751243: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:34.751247: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:34.751250: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:34.751254: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:34.751258: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:34.751262: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:34.751265: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:34.751269: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:34.751273: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:34.751277: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:34.751282: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:34.751289: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:34.751292: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:34.751296: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:34.751300: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:34.751303: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:34.751307: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:34.751311: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.751314: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.751318: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:34.751325: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:34.751331: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:34.751336: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:34.751341: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:34.751347: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:34.751352: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:34.751358: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:34.751363: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:34.751369: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:34.751373: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:34.751379: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:34.751385: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:34.751391: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:34.751396: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:34.751401: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:34.751404: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:34.751408: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:34.751412: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:34.751415: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:34.751419: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:34.930321: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__normal:\n", "2024-05-21 11:48:34.930357: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:34.930363: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:34.930368: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:34.930372: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:34.930376: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:34.930380: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:34.930384: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:34.930388: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:34.930392: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:34.930395: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:34.930399: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:34.930403: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:34.930407: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:34.930411: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:34.930416: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:34.930419: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:34.930423: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:34.930427: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:34.930430: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.930434: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:34.930438: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:34.930441: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:34.930445: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:34.930449: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:34.930464: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:34.930468: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:34.930472: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:34.930475: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:34.930481: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:34.930486: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:34.930493: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:34.930498: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:34.930502: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:34.930508: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:34.930514: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:34.930523: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:34.930529: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:34.930535: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:34.930541: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:34.930547: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:34.930552: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:34.930555: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.930559: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:34.930565: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:34.930571: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:34.930577: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:34.930581: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:34.930585: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:34.930590: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:34.930596: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:34.930601: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:34.930605: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:34.930609: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:34.930613: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:34.930617: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:34.930622: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:34.930629: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_detailed_logging: true\n", "2024-05-21 11:48:34.930634: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:34.930639: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:34.930642: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:34.930648: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:34.930655: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:34.930662: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:34.930667: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:34.930673: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.163186: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_convert_element_type:\n", "2024-05-21 11:48:35.163224: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.163230: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.163235: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.163239: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.163243: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.163246: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.163250: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.163255: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.163259: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.163263: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.163266: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.163270: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.163274: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.163277: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.163281: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.163285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.163288: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.163292: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.163296: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.163299: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.163303: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.163308: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.163312: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.163315: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.163319: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.163323: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.163326: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.163330: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.163334: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.163337: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.163341: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.163345: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.163348: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.163352: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.163356: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.163364: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.163368: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.163372: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.163375: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.163379: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.163383: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.163386: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.163391: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.163397: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.163403: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.163409: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.163414: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.163420: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.163425: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.163431: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.163437: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.163443: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.163447: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.163459: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.163463: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.163467: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.163471: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.163474: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.163478: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.163481: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.163485: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.163489: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.163492: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.163496: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.287518: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_broadcast_in_dim:\n", "2024-05-21 11:48:35.287561: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.287567: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.287571: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.287575: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.287580: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.287584: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.287589: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.287592: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.287596: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.287600: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.287603: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.287607: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.287611: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.287614: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.287618: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.287622: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.287625: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.287629: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.287633: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.287638: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.287642: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.287646: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.287651: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.287656: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.287660: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.287666: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.287671: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.287676: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.287683: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.287689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.287695: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.287700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.287704: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.287709: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.287715: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.287725: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.287733: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.287741: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.287747: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.287752: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.287758: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.287764: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.287769: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.287774: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.287778: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.287782: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.287788: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.287793: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.287800: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.287805: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.287811: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.287816: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.287822: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.287827: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.287833: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.287838: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.287842: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.287846: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.287850: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.287855: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.287858: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.287862: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.287866: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.287871: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.423036: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_iota:\n", "2024-05-21 11:48:35.423078: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.423083: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.423087: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.423091: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.423095: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.423099: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.423103: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.423107: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.423111: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.423115: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.423119: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.423122: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.423126: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.423130: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.423134: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.423137: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.423141: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.423145: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.423148: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.423152: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.423155: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.423159: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.423164: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.423168: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.423172: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.423175: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.423179: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.423183: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.423186: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.423190: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.423194: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.423197: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.423201: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.423205: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.423208: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.423216: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.423220: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.423224: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.423227: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.423231: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.423235: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.423238: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.423246: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.423251: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.423256: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.423261: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.423267: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.423274: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.423280: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.423285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.423290: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.423295: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.423302: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.423308: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.423314: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.423320: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.423327: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.423331: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.423335: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.423338: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.423342: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.423346: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.423349: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.423353: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.548499: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_broadcast_in_dim:\n", "2024-05-21 11:48:35.548542: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.548548: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.548554: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.548558: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.548561: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.548565: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.548569: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.548573: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.548576: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.548580: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.548584: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.548587: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.548591: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.548595: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.548599: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.548603: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.548607: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.548611: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.548615: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.548618: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.548622: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.548627: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.548632: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.548638: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.548643: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.548648: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.548654: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.548660: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.548666: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.548672: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.548678: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.548683: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.548688: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.548694: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.548700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.548712: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.548717: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.548723: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.548727: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.548730: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.548734: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.548738: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.548741: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.548745: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.548751: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.548758: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.548764: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.548769: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.548773: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.548777: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.548783: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.548789: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.548793: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.548797: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.548800: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.548807: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.548814: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.548820: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.548826: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.548831: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.548835: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.548838: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.548842: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.548846: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.674595: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__squeeze:\n", "2024-05-21 11:48:35.674640: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.674647: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.674654: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.674661: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.674666: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.674672: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.674677: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.674683: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.674689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.674695: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.674700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.674706: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.674713: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.674719: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.674725: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.674730: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.674737: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.674742: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.674747: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.674752: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.674757: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.674763: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.674769: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.674774: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.674779: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.674785: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.674790: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.674795: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.674800: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.674806: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.674813: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.674817: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.674821: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.674825: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.674829: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.674837: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.674841: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.674845: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.674848: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.674852: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.674856: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.674859: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.674863: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.674867: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.674871: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.674875: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.674880: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.674886: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.674891: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.674895: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.674899: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.674903: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.674906: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.674910: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.674914: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.674917: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.674921: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.674925: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.674930: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.674933: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.674937: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.674941: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.674944: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.674948: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.796615: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_scatter:\n", "2024-05-21 11:48:35.796660: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.796668: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.796675: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.796681: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.796686: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.796692: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.796697: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.796703: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.796709: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.796715: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.796721: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.796728: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.796733: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.796738: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.796745: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.796750: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.796756: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.796761: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.796766: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.796772: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.796778: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.796785: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.796791: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.796796: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.796801: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.796807: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.796813: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.796818: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.796824: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.796830: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.796837: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.796843: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.796848: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.796854: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.796860: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.796869: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.796875: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.796881: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.796887: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.796893: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.796899: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.796906: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.796912: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.796917: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.796923: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.796930: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.796935: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.796942: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.796948: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.796954: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.796960: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.796966: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.796972: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.796977: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.796983: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.796989: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.796995: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.797001: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.797007: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.797012: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.797019: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.797025: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.797031: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.797036: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.938508: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_convert_element_type:\n", "2024-05-21 11:48:35.938553: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.938561: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.938568: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.938574: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.938579: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.938585: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.938591: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.938596: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.938602: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.938608: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.938615: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.938620: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.938626: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.938632: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.938638: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.938644: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.938650: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.938655: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.938660: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.938666: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.938671: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.938677: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.938683: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.938688: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.938694: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.938700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.938705: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.938711: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.938718: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.938723: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.938727: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.938730: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.938734: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.938738: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.938741: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.938749: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.938753: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.938756: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.938760: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.938764: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.938769: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.938773: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.938776: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.938780: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.938783: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.938789: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.938794: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.938799: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.938803: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.938807: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.938810: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.938814: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.938818: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.938822: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.938826: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.938830: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.938834: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.938837: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.938841: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.938844: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.938848: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.938852: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.938855: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.938859: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:35.970714: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_true_divide:\n", "2024-05-21 11:48:35.970755: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:35.970763: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:35.970768: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:35.970774: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:35.970780: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:35.970787: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:35.970792: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:35.970798: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:35.970803: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:35.970809: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:35.970815: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:35.970820: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:35.970829: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:35.970835: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:35.970841: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:35.970847: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:35.970852: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:35.970858: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:35.970863: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.970869: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:35.970874: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:35.970880: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:35.970886: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:35.970893: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:35.970899: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:35.970904: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:35.970910: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:35.970915: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:35.970920: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:35.970926: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:35.970931: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:35.970937: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:35.970943: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:35.970949: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:35.970956: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:35.970965: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:35.970971: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:35.970977: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:35.970983: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:35.970989: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:35.970995: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:35.971001: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.971008: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:35.971014: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:35.971019: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:35.971025: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:35.971031: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:35.971037: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:35.971042: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:35.971048: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:35.971054: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:35.971059: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:35.971065: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:35.971072: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:35.971077: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:35.971083: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:35.971088: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:35.971094: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:35.971101: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:35.971107: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:35.971113: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:35.971119: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:35.971125: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:35.971132: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:36.101378: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fn:\n", "2024-05-21 11:48:36.101424: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:36.101432: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:36.101438: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:36.101443: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:36.101459: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:36.101466: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:36.101473: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:36.101480: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:36.101486: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:36.101492: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:36.101497: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:36.101503: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:36.101508: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:36.101514: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:36.101519: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:36.101526: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:36.101532: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:36.101538: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:36.101543: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.101552: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:36.101557: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:36.101563: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:36.101568: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:36.101574: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:36.101581: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:36.101588: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:36.101593: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:36.101598: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:36.101605: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:36.101610: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:36.101616: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:36.101622: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:36.101628: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:36.101633: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:36.101640: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:36.101651: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:36.101656: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:36.101662: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:36.101667: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:36.101672: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:36.101678: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:36.101684: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.101689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.101695: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:36.101702: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:36.101708: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:36.101714: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:36.101719: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:36.101724: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:36.101730: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:36.101736: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:36.101742: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:36.101748: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:36.101754: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:36.101761: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:36.101767: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:36.101773: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:36.101778: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:36.101784: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:36.101790: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:36.101796: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:36.101802: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:36.101807: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:36.101812: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:36.236763: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_broadcast_in_dim:\n", "2024-05-21 11:48:36.236812: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:36.236819: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:36.236825: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:36.236831: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:36.236837: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:36.236843: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:36.236848: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:36.236855: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:36.236861: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:36.236868: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:36.236873: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:36.236878: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:36.236887: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:36.236893: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:36.236898: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:36.236904: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:36.236910: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:36.236916: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:36.236923: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.236929: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:36.236935: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:36.236940: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:36.236944: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:36.236950: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:36.236955: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:36.236960: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:36.236967: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:36.236974: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:36.236979: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:36.236984: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:36.236989: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:36.236995: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:36.237001: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:36.237007: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:36.237011: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:36.237018: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:36.237023: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:36.237026: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:36.237030: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:36.237034: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:36.237037: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:36.237041: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.237045: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.237048: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:36.237052: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:36.237055: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:36.237059: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:36.237063: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:36.237066: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:36.237070: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:36.237075: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:36.237079: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:36.237083: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:36.237088: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:36.237093: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:36.237099: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:36.237102: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:36.237106: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:36.237110: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:36.237113: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:36.237117: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:36.237121: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:36.237124: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:36.237128: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:36.364287: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_broadcast_in_dim:\n", "2024-05-21 11:48:36.364330: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:36.364337: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:36.364343: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:36.364349: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:36.364354: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:36.364360: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:36.364366: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:36.364372: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:36.364378: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:36.364385: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:36.364391: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:36.364396: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:36.364402: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:36.364408: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:36.364414: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:36.364419: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:36.364424: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:36.364430: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:36.364437: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.364443: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:36.364448: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:36.364466: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:36.364472: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:36.364477: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:36.364483: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:36.364490: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:36.364497: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:36.364503: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:36.364509: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:36.364514: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:36.364520: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:36.364525: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:36.364530: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:36.364536: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:36.364542: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:36.364553: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:36.364560: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:36.364565: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:36.364570: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:36.364576: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:36.364582: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:36.364587: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.364593: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.364599: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:36.364606: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:36.364613: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:36.364619: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:36.364625: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:36.364631: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:36.364636: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:36.364642: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:36.364648: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:36.364654: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:36.364660: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:36.364667: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:36.364674: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:36.364680: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:36.364686: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:36.364692: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:36.364697: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:36.364703: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:36.364708: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:36.364714: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:36.364720: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:36.492697: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_broadcast_in_dim:\n", "2024-05-21 11:48:36.492742: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:36.492749: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:36.492755: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:36.492761: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:36.492767: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:36.492773: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:36.492779: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:36.492785: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:36.492791: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:36.492796: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:36.492802: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:36.492807: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:36.492813: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:36.492819: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:36.492825: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:36.492831: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:36.492837: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:36.492842: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:36.492848: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.492853: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:36.492858: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:36.492862: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:36.492871: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:36.492876: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:36.492883: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:36.492889: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:36.492895: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:36.492900: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:36.492906: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:36.492910: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:36.492916: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:36.492923: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:36.492928: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:36.492935: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:36.492940: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:36.492946: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:36.492950: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:36.492954: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:36.492957: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:36.492961: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:36.492965: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:36.492968: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.492973: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.492977: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:36.492981: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:36.492984: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:36.492988: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:36.492992: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:36.492995: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:36.492999: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:36.493003: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:36.493006: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:36.493010: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:36.493014: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:36.493019: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:36.493025: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:36.493031: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:36.493035: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:36.493039: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:36.493043: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:36.493046: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:36.493050: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:36.493053: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:36.493057: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:36.621079: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_concatenate:\n", "2024-05-21 11:48:36.621127: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:36.621132: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:36.621137: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:36.621141: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:36.621145: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:36.621149: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:36.621152: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:36.621156: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:36.621160: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:36.621163: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:36.621167: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:36.621172: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:36.621176: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:36.621180: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:36.621183: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:36.621187: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:36.621191: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:36.621194: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:36.621198: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.621202: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:36.621205: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:36.621209: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:36.621213: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:36.621216: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:36.621220: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:36.621225: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:36.621229: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:36.621232: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:36.621236: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:36.621240: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:36.621243: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:36.621249: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:36.621254: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:36.621259: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:36.621264: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:36.621277: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:36.621282: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:36.621287: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:36.621291: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:36.621294: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:36.621298: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:36.621303: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.621309: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.621315: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:36.621320: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:36.621324: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:36.621329: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:36.621335: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:36.621340: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:36.621345: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:36.621351: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:36.621356: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:36.621359: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:36.621365: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:36.621370: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:36.621375: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:36.621379: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:36.621384: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:36.621388: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:36.621392: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:36.621398: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:36.621403: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:36.621408: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:36.621412: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:36.908858: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_norm:\n", "2024-05-21 11:48:36.908900: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:36.908906: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:36.908910: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:36.908914: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:36.908918: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:36.908922: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:36.908925: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:36.908929: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:36.908933: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:36.908936: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:36.908940: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:36.908945: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:36.908949: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:36.908952: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:36.908956: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:36.908960: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:36.908963: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:36.908967: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:36.908971: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.908974: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:36.908978: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:36.908982: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:36.908985: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:36.908989: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:36.908993: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:36.908997: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:36.909001: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:36.909005: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:36.909008: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:36.909012: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:36.909016: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:36.909019: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:36.909023: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:36.909026: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:36.909030: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:36.909038: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:36.909042: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:36.909046: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:36.909050: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:36.909054: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:36.909058: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:36.909061: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.909065: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:36.909069: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:36.909072: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:36.909076: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:36.909080: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:36.909083: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:36.909087: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:36.909091: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:36.909094: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:36.909098: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:36.909102: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:36.909107: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:36.909111: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:36.909114: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:36.909118: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:36.909122: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:36.909125: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:36.909129: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:36.909133: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:36.909136: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:36.909140: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:36.909143: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:37.096035: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fn:\n", "2024-05-21 11:48:37.096079: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:37.096084: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:37.096089: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:37.096093: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:37.096098: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:37.096102: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:37.096106: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:37.096109: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:37.096113: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:37.096117: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:37.096120: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:37.096124: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:37.096127: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:37.096131: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:37.096135: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:37.096138: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:37.096142: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:37.096146: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:37.096150: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.096155: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:37.096159: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:37.096163: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:37.096166: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:37.096170: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:37.096173: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:37.096177: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:37.096181: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:37.096184: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:37.096188: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:37.096192: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:37.096196: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:37.096199: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:37.096204: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:37.096208: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:37.096211: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:37.096220: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:37.096224: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:37.096228: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:37.096231: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:37.096235: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:37.096239: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:37.096242: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.096246: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.096250: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:37.096254: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:37.096258: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:37.096262: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:37.096266: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:37.096270: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:37.096273: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:37.096277: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:37.096281: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:37.096285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:37.096288: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:37.096292: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:37.096296: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:37.096299: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:37.096303: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:37.096307: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:37.096311: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:37.096315: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:37.096319: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:37.096323: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:37.096326: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:37.229803: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__lambda_:\n", "2024-05-21 11:48:37.229845: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:37.229852: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:37.229859: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:37.229864: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:37.229868: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:37.229872: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:37.229875: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:37.229879: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:37.229883: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:37.229886: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:37.229890: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:37.229893: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:37.229897: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:37.229901: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:37.229904: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:37.229908: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:37.229911: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:37.229915: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:37.229920: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.229925: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:37.229931: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:37.229936: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:37.229940: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:37.229943: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:37.229947: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:37.229950: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:37.229954: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:37.229958: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:37.229961: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:37.229965: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:37.229968: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:37.229973: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:37.229977: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:37.229981: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:37.229984: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:37.229993: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:37.229997: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:37.230001: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:37.230007: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:37.230012: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:37.230016: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:37.230020: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.230023: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.230028: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:37.230032: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:37.230035: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:37.230039: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:37.230043: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:37.230046: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:37.230050: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:37.230054: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:37.230057: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:37.230061: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:37.230064: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:37.230068: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:37.230072: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:37.230075: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:37.230081: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:37.230087: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:37.230092: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:37.230096: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:37.230100: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:37.230103: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:37.230107: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:37.405424: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fn:\n", "2024-05-21 11:48:37.405470: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:37.405476: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:37.405480: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:37.405484: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:37.405488: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:37.405492: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:37.405495: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:37.405499: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:37.405503: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:37.405506: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:37.405510: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:37.405514: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:37.405518: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:37.405523: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:37.405526: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:37.405530: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:37.405533: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:37.405537: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:37.405541: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.405544: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:37.405548: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:37.405551: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:37.405555: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:37.405559: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:37.405562: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:37.405566: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:37.405570: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:37.405575: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:37.405579: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:37.405582: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:37.405586: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:37.405589: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:37.405593: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:37.405596: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:37.405600: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:37.405608: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:37.405612: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:37.405616: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:37.405619: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:37.405623: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:37.405628: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:37.405631: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.405635: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.405639: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:37.405642: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:37.405646: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:37.405650: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:37.405653: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:37.405657: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:37.405661: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:37.405664: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:37.405668: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:37.405672: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:37.405676: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:37.405680: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:37.405684: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:37.405688: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:37.405691: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:37.405695: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:37.405699: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:37.405702: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:37.405706: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:37.405709: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:37.405713: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:37.536125: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__lambda_:\n", "2024-05-21 11:48:37.536173: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:37.536180: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:37.536187: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:37.536193: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:37.536199: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:37.536204: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:37.536210: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:37.536216: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:37.536221: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:37.536227: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:37.536233: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:37.536240: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:37.536245: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:37.536251: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:37.536257: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:37.536263: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:37.536269: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:37.536275: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:37.536280: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.536285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:37.536291: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:37.536296: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:37.536302: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:37.536308: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:37.536313: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:37.536319: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:37.536326: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:37.536331: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:37.536337: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:37.536344: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:37.536349: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:37.536353: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:37.536356: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:37.536360: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:37.536364: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:37.536373: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:37.536377: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:37.536381: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:37.536384: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:37.536388: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:37.536392: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:37.536396: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.536400: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.536405: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:37.536408: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:37.536412: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:37.536415: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:37.536419: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:37.536424: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:37.536430: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:37.536435: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:37.536439: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:37.536442: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:37.536446: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:37.536458: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:37.536462: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:37.536466: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:37.536469: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:37.536473: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:37.536477: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:37.536480: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:37.536484: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:37.536487: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:37.536491: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:37.719279: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__lambda_:\n", "2024-05-21 11:48:37.719325: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:37.719331: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:37.719337: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:37.719343: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:37.719349: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:37.719356: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:37.719362: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:37.719367: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:37.719373: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:37.719379: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:37.719385: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:37.719390: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:37.719395: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:37.719401: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:37.719407: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:37.719413: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:37.719419: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:37.719424: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:37.719429: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.719435: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:37.719441: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:37.719446: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:37.719463: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:37.719468: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:37.719474: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:37.719480: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:37.719485: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:37.719490: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:37.719496: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:37.719502: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:37.719508: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:37.719514: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:37.719521: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:37.719526: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:37.719531: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:37.719544: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:37.719550: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:37.719556: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:37.719562: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:37.719569: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:37.719575: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:37.719581: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.719587: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.719593: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:37.719599: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:37.719604: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:37.719610: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:37.719616: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:37.719622: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:37.719628: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:37.719634: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:37.719640: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:37.719645: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:37.719650: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:37.719656: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:37.719662: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:37.719668: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:37.719674: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:37.719679: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:37.719685: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:37.719691: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:37.719696: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:37.719702: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:37.719708: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:37.855097: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_integer_pow:\n", "2024-05-21 11:48:37.855143: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:37.855150: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:37.855158: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:37.855164: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:37.855170: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:37.855175: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:37.855182: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:37.855187: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:37.855193: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:37.855198: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:37.855203: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:37.855210: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:37.855216: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:37.855222: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:37.855228: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:37.855233: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:37.855241: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:37.855246: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:37.855251: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.855256: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:37.855262: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:37.855268: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:37.855273: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:37.855279: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:37.855285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:37.855290: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:37.855296: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:37.855301: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:37.855307: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:37.855311: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:37.855316: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:37.855319: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:37.855323: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:37.855327: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:37.855330: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:37.855339: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:37.855343: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:37.855347: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:37.855350: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:37.855354: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:37.855358: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:37.855361: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.855366: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.855370: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:37.855373: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:37.855377: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:37.855381: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:37.855384: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:37.855388: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:37.855391: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:37.855396: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:37.855402: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:37.855406: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:37.855410: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:37.855414: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:37.855418: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:37.855422: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:37.855426: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:37.855429: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:37.855433: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:37.855437: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:37.855440: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:37.855444: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:37.855447: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:37.988850: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__lambda_:\n", "2024-05-21 11:48:37.988897: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:37.988904: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:37.988911: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:37.988917: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:37.988922: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:37.988928: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:37.988934: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:37.988939: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:37.988945: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:37.988950: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:37.988956: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:37.988963: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:37.988969: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:37.988974: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:37.988981: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:37.988986: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:37.988992: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:37.988998: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:37.989003: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.989008: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:37.989014: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:37.989021: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:37.989027: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:37.989033: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:37.989039: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:37.989044: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:37.989050: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:37.989056: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:37.989061: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:37.989067: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:37.989073: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:37.989080: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:37.989086: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:37.989092: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:37.989097: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:37.989108: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:37.989114: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:37.989119: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:37.989125: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:37.989131: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:37.989138: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:37.989144: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.989150: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:37.989156: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:37.989161: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:37.989166: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:37.989171: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:37.989178: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:37.989183: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:37.989189: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:37.989196: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:37.989202: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:37.989207: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:37.989213: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:37.989219: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:37.989225: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:37.989230: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:37.989236: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:37.989242: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:37.989248: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:37.989254: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:37.989260: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:37.989266: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:37.989271: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:38.117556: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_true_divide:\n", "2024-05-21 11:48:38.117599: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:38.117604: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:38.117609: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:38.117613: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:38.117617: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:38.117621: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:38.117625: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:38.117629: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:38.117633: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:38.117636: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:38.117640: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:38.117644: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:38.117647: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:38.117651: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:38.117655: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:38.117658: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:38.117662: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:38.117666: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:38.117669: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.117673: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:38.117677: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:38.117681: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:38.117685: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:38.117689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:38.117692: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:38.117696: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:38.117700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:38.117703: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:38.117707: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:38.117711: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:38.117714: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:38.117718: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:38.117722: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:38.117726: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:38.117730: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:38.117739: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:38.117743: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:38.117747: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:38.117750: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:38.117754: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:38.117758: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:38.117761: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.117765: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.117769: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:38.117773: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:38.117776: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:38.117780: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:38.117785: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:38.117789: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:38.117793: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:38.117796: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:38.117800: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:38.117804: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:38.117808: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:38.117811: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:38.117815: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:38.117819: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:38.117823: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:38.117826: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:38.117830: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:38.117834: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:38.117839: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:38.117843: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:38.117847: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:38.252896: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_true_divide:\n", "2024-05-21 11:48:38.252939: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:38.252944: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:38.252949: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:38.252953: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:38.252956: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:38.252960: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:38.252964: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:38.252968: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:38.252971: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:38.252975: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:38.252980: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:38.252984: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:38.252987: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:38.252991: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:38.252995: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:38.252999: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:38.253002: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:38.253006: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:38.253010: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.253013: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:38.253017: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:38.253021: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:38.253024: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:38.253028: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:38.253033: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:38.253037: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:38.253041: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:38.253044: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:38.253048: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:38.253051: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:38.253055: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:38.253059: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:38.253062: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:38.253066: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:38.253070: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:38.253079: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:38.253084: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:38.253088: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:38.253092: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:38.253096: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:38.253100: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:38.253103: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.253107: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.253111: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:38.253115: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:38.253119: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:38.253122: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:38.253126: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:38.253130: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:38.253134: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:38.253139: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:38.253143: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:38.253147: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:38.253151: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:38.253155: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:38.253159: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:38.253162: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:38.253166: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:38.253170: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:38.253174: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:38.253177: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:38.253181: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:38.253185: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:38.253189: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:38.387748: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__lambda_:\n", "2024-05-21 11:48:38.387791: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:38.387796: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:38.387801: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:38.387805: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:38.387809: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:38.387812: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:38.387816: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:38.387821: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:38.387825: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:38.387828: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:38.387832: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:38.387836: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:38.387840: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:38.387843: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:38.387847: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:38.387850: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:38.387854: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:38.387858: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:38.387861: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.387865: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:38.387869: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:38.387873: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:38.387877: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:38.387881: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:38.387885: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:38.387888: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:38.387892: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:38.387896: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:38.387899: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:38.387903: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:38.387906: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:38.387910: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:38.387914: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:38.387917: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:38.387921: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:38.387930: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:38.387933: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:38.387937: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:38.387941: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:38.387944: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:38.387948: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:38.387952: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.387955: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.387959: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:38.387962: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:38.387966: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:38.387970: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:38.387973: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:38.387978: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:38.387982: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:38.387986: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:38.387990: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:38.387993: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:38.387997: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:38.388001: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:38.388004: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:38.388008: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:38.388011: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:38.388015: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:38.388019: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:38.388022: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:38.388026: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:38.388030: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:38.388034: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:38.516028: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__lambda_:\n", "2024-05-21 11:48:38.516073: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:38.516078: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:38.516083: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:38.516087: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:38.516091: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:38.516094: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:38.516098: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:38.516102: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:38.516106: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:38.516111: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:38.516114: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:38.516118: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:38.516122: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:38.516126: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:38.516129: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:38.516133: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:38.516137: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:38.516140: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:38.516144: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.516147: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:38.516151: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:38.516155: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:38.516159: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:38.516164: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:38.516168: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:38.516171: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:38.516175: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:38.516179: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:38.516183: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:38.516186: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:38.516190: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:38.516193: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:38.516197: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:38.516201: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:38.516205: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:38.516213: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:38.516218: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:38.516223: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:38.516227: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:38.516230: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:38.516234: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:38.516238: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.516245: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.516249: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:38.516253: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:38.516257: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:38.516260: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:38.516264: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:38.516268: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:38.516273: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:38.516277: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:38.516281: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:38.516284: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:38.516288: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:38.516292: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:38.516296: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:38.516300: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:38.516303: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:38.516308: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:38.516311: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:38.516315: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:38.516319: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:38.516322: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:38.516326: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:38.691491: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_integer_pow:\n", "2024-05-21 11:48:38.691535: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:38.691540: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:38.691545: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:38.691550: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:38.691555: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:38.691559: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:38.691562: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:38.691566: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:38.691570: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:38.691573: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:38.691577: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:38.691581: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:38.691585: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:38.691588: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:38.691592: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:38.691596: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:38.691600: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:38.691604: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:38.691608: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.691612: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:38.691616: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:38.691619: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:38.691623: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:38.691627: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:38.691630: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:38.691634: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:38.691638: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:38.691642: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:38.691645: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:38.691649: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:38.691653: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:38.691657: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:38.691661: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:38.691665: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:38.691669: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:38.691678: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:38.691681: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:38.691685: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:38.691689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:38.691692: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:38.691696: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:38.691700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.691703: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.691707: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:38.691712: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:38.691716: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:38.691719: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:38.691723: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:38.691727: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:38.691730: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:38.691734: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:38.691738: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:38.691741: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:38.691745: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:38.691749: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:38.691752: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:38.691756: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:38.691760: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:38.691764: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:38.691768: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:38.691772: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:38.691776: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:38.691779: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:38.691783: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:38.815247: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_true_divide:\n", "2024-05-21 11:48:38.815290: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:38.815295: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:38.815300: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:38.815304: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:38.815309: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:38.815313: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:38.815317: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:38.815321: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:38.815324: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:38.815328: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:38.815332: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:38.815335: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:38.815339: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:38.815343: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:38.815346: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:38.815350: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:38.815354: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:38.815358: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:38.815362: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.815366: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:38.815370: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:38.815374: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:38.815378: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:38.815381: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:38.815385: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:38.815389: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:38.815392: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:38.815396: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:38.815400: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:38.815403: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:38.815407: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:38.815411: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:38.815415: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:38.815420: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:38.815424: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:38.815432: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:38.815436: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:38.815440: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:38.815443: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:38.815447: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:38.815459: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:38.815463: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.815467: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.815472: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:38.815475: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:38.815479: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:38.815483: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:38.815487: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:38.815490: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:38.815494: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:38.815498: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:38.815501: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:38.815505: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:38.815509: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:38.815512: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:38.815516: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:38.815520: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:38.815525: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:38.815528: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:38.815532: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:38.815536: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:38.815539: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:38.815543: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:38.815547: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:38.956485: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit__where:\n", "2024-05-21 11:48:38.956529: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:38.956534: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:38.956538: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:38.956542: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:38.956546: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:38.956550: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:38.956554: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:38.956557: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:38.956561: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:38.956565: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:38.956569: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:38.956573: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:38.956577: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:38.956581: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:38.956584: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:38.956588: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:38.956592: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:38.956595: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:38.956599: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.956603: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:38.956606: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:38.956610: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:38.956613: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:38.956617: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:38.956621: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:38.956626: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:38.956629: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:38.956633: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:38.956637: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:38.956640: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:38.956644: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:38.956647: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:38.956651: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:38.956655: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:38.956658: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:38.956667: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:38.956672: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:38.956676: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:38.956680: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:38.956683: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:38.956687: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:38.956691: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.956694: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:38.956698: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:38.956702: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:38.956705: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:38.956709: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:38.956712: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:38.956716: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:38.956720: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:38.956724: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:38.956728: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:38.956732: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:38.956736: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:38.956739: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:38.956743: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:38.956747: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:38.956750: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:38.956754: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:38.956758: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:38.956761: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:38.956765: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:38.956768: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:38.956772: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:39.094147: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fft:\n", "2024-05-21 11:48:39.094192: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:39.094197: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:39.094201: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:39.094205: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:39.094209: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:39.094213: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:39.094217: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:39.094220: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:39.094224: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:39.094228: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:39.094231: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:39.094235: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:39.094240: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:39.094244: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:39.094248: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:39.094252: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:39.094255: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:39.094259: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:39.094263: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.094266: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:39.094270: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:39.094274: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:39.094277: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:39.094281: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:39.094285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:39.094289: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:39.094293: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:39.094297: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:39.094302: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:39.094305: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:39.094309: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:39.094313: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:39.094317: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:39.094320: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:39.094324: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:39.094333: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:39.094337: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:39.094341: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:39.094345: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:39.094348: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:39.094352: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:39.094356: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.094362: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.094365: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:39.094369: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:39.094373: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:39.094377: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:39.094380: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:39.094385: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:39.094388: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:39.094392: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:39.094396: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:39.094400: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:39.094403: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:39.094407: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:39.094411: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:39.094416: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:39.094420: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:39.094423: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:39.094427: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:39.094431: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:39.094435: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:39.094438: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:39.094442: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:39.323122: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fn:\n", "2024-05-21 11:48:39.323166: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:39.323171: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:39.323176: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:39.323180: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:39.323184: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:39.323187: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:39.323191: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:39.323195: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:39.323198: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:39.323202: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:39.323207: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:39.323211: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:39.323215: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:39.323219: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:39.323222: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:39.323226: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:39.323230: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:39.323233: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:39.323237: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.323241: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:39.323244: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:39.323248: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:39.323251: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:39.323255: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:39.323260: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:39.323264: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:39.323268: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:39.323271: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:39.323275: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:39.323279: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:39.323282: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:39.323286: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:39.323290: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:39.323293: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:39.323297: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:39.323306: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:39.323310: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:39.323315: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:39.323318: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:39.323322: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:39.323326: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:39.323330: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.323333: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.323337: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:39.323341: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:39.323344: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:39.323348: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:39.323352: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:39.323356: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:39.323359: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:39.323364: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:39.323368: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:39.323372: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:39.323376: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:39.323380: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:39.323383: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:39.323387: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:39.323390: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:39.323394: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:39.323398: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:39.323401: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:39.323405: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:39.323409: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:39.323413: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:39.453499: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fft:\n", "2024-05-21 11:48:39.453540: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:39.453545: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:39.453549: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:39.453554: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:39.453558: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:39.453562: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:39.453566: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:39.453569: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:39.453573: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:39.453577: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:39.453580: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:39.453584: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:39.453588: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:39.453591: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:39.453595: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:39.453598: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:39.453602: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:39.453607: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:39.453611: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.453614: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:39.453618: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:39.453622: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:39.453625: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:39.453629: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:39.453633: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:39.453636: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:39.453640: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:39.453643: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:39.453647: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:39.453651: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:39.453654: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:39.453658: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:39.453663: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:39.453666: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:39.453671: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:39.453682: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:39.453686: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:39.453689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:39.453693: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:39.453697: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:39.453700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:39.453704: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.453707: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.453711: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:39.453716: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:39.453720: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:39.453724: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:39.453727: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:39.453731: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:39.453735: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:39.453738: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:39.453742: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:39.453746: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:39.453749: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:39.453753: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:39.453757: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:39.453760: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:39.453764: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:39.453768: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:39.453772: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:39.453777: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:39.453780: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:39.453784: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:39.453788: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:39.587306: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_real:\n", "2024-05-21 11:48:39.587350: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:39.587355: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:39.587360: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:39.587364: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:39.587368: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:39.587371: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:39.587375: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:39.587379: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:39.587383: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:39.587386: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:39.587390: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:39.587395: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:39.587399: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:39.587403: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:39.587406: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:39.587410: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:39.587414: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:39.587417: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:39.587421: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.587425: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:39.587428: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:39.587432: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:39.587436: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:39.587439: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:39.587443: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:39.587447: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:39.587459: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:39.587463: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:39.587466: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:39.587470: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:39.587474: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:39.587477: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:39.587481: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:39.587484: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:39.587488: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:39.587497: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:39.587502: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:39.587506: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:39.587510: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:39.587513: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:39.587517: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:39.587520: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.587524: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.587528: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:39.587531: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:39.587535: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:39.587539: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:39.587542: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:39.587546: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:39.587550: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:39.587554: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:39.587558: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:39.587562: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:39.587566: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:39.587570: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:39.587573: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:39.587577: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:39.587581: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:39.587584: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:39.587588: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:39.587591: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:39.587595: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:39.587599: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:39.587602: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:39.845887: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_scan:\n", "2024-05-21 11:48:39.845930: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:39.845935: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:39.845940: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:39.845944: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:39.845948: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:39.845952: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:39.845956: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:39.845959: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:39.845963: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:39.845967: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:39.845972: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:39.845976: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:39.845980: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:39.845983: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:39.845987: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:39.845991: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:39.845995: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:39.845998: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:39.846002: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.846006: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:39.846009: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:39.846013: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:39.846017: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:39.846021: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:39.846025: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:39.846029: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:39.846033: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:39.846037: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:39.846040: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:39.846044: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:39.846048: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:39.846052: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:39.846055: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:39.846059: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:39.846063: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:39.846070: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:39.846073: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:39.846077: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:39.846081: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:39.846085: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:39.846089: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:39.846093: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.846097: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:39.846100: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:39.846104: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:39.846108: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:39.846111: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:39.846115: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:39.846119: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:39.846123: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:39.846126: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:39.846130: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:39.846134: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:39.846138: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:39.846142: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:39.846147: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:39.846150: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_detailed_logging: true\n", "2024-05-21 11:48:39.846154: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:39.846158: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:39.846161: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:39.846165: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:39.846169: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:39.846172: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:39.846176: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:39.846180: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:48:41.136495: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_multistep:\n", "2024-05-21 11:48:41.136542: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:48:41.136547: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:48:41.136551: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:48:41.136555: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:48:41.136559: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:48:41.136563: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:48:41.136567: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:48:41.136571: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:48:41.136575: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:48:41.136579: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:48:41.136583: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:48:41.136586: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:48:41.136590: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:48:41.136594: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:48:41.136597: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:48:41.136601: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:48:41.136605: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:48:41.136608: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:48:41.136612: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:41.136615: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:48:41.136619: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:48:41.136623: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:48:41.136628: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:48:41.136631: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:48:41.136635: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:48:41.136638: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:48:41.136642: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:48:41.136646: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:48:41.136649: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:48:41.136653: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:48:41.136657: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:48:41.136660: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:48:41.136664: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:48:41.136668: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:48:41.136672: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:48:41.136678: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:48:41.136682: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:48:41.136685: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:48:41.136689: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:48:41.136693: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:48:41.136696: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:48:41.136700: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:41.136703: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:48:41.136707: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:48:41.136711: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:48:41.136714: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:48:41.136718: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:48:41.136722: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:48:41.136726: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:48:41.136731: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:48:41.136734: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:48:41.136738: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:48:41.136741: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:48:41.136745: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:48:41.136749: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:48:41.136752: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:48:41.136756: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_detailed_logging: true\n", "2024-05-21 11:48:41.136760: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:48:41.136763: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:48:41.136767: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:48:41.136771: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:48:41.136774: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:48:41.136778: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:48:41.136783: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:48:41.136787: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "CPU times: user 1.92 s, sys: 292 ms, total: 2.21 s\n", "Wall time: 2.11 s\n" ] } ], "source": [ "size = 256\n", "density = 1.\n", "viscosity = 1e-3\n", "seed = 0\n", "inner_steps = 25\n", "outer_steps = 200\n", "\n", "max_velocity = 2.0\n", "cfl_safety_factor = 0.5\n", "\n", "# Define the physical dimensions of the simulation.\n", "grid = cfd.grids.Grid((size, size), domain=((0, 2 * jnp.pi), (0, 2 * jnp.pi)))\n", "\n", "# Construct a random initial velocity. The `filtered_velocity_field` function\n", "# ensures that the initial velocity is divergence free and it filters out\n", "# high frequency fluctuations.\n", "v0 = cfd.initial_conditions.filtered_velocity_field(\n", " jax.random.PRNGKey(seed), grid, max_velocity)\n", "\n", "# Choose a time step.\n", "dt = cfd.equations.stable_time_step(\n", " max_velocity, cfl_safety_factor, viscosity, grid)\n", "\n", "# Define a step function and use it to compute a trajectory.\n", "step_fn = cfd.funcutils.repeated(\n", " cfd.equations.semi_implicit_navier_stokes(\n", " density=density, viscosity=viscosity, dt=dt, grid=grid),\n", " steps=inner_steps)\n", "rollout_fn = jax.jit(cfd.funcutils.trajectory(step_fn, outer_steps))\n", "%time _, trajectory = jax.device_get(rollout_fn(v0))" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "executionInfo": { "elapsed": 54, "status": "ok", "timestamp": 1635284856908, "user": { "displayName": "", "photoUrl": "", "userId": "" }, "user_tz": 420 }, "id": "m_q3OSfxjjfY", "outputId": "e9bbb584-c53e-4148-d744-37c08140c28f" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Component 0: GridVariable(array=GridArray(data=array([[[-0.8935042 , ..., -0.8515548 ],\n", " ...,\n", " [-0.9017288 , ..., -0.8609535 ]],\n", "\n", " ...,\n", "\n", " [[-0.06768889, ..., -0.08864684],\n", " ...,\n", " [-0.06688285, ..., -0.08821402]]], dtype=float32), offset=(1.0, 0.5), grid=Grid(shape=(256, 256), step=(0.02454369260617026, 0.02454369260617026), domain=((0.0, 6.283185307179586), (0.0, 6.283185307179586)))), bc=HomogeneousBoundaryConditions(types=(('periodic', 'periodic'), ('periodic', 'periodic')), bc_values=((0.0, 0.0), (0.0, 0.0))))\n", "Component 1: GridVariable(array=GridArray(data=array([[[0.142946 , ..., 0.15117063],\n", " ...,\n", " [0.1722027 , ..., 0.18040818]],\n", "\n", " ...,\n", "\n", " [[0.2864643 , ..., 0.2856583 ],\n", " ...,\n", " [0.2748214 , ..., 0.27287936]]], dtype=float32), offset=(0.5, 1.0), grid=Grid(shape=(256, 256), step=(0.02454369260617026, 0.02454369260617026), domain=((0.0, 6.283185307179586), (0.0, 6.283185307179586)))), bc=HomogeneousBoundaryConditions(types=(('periodic', 'periodic'), ('periodic', 'periodic')), bc_values=((0.0, 0.0), (0.0, 0.0))))\n" ] } ], "source": [ "# JAX-CFD uses GridVariable objects for input/output. These objects contain:\n", "# - array data\n", "# - an \"offset\" that documents the position on the unit-cell where the data\n", "# values are located\n", "# - grid properties\n", "# - boundary conditions on the variable\n", "with np.printoptions(edgeitems=1):\n", " for i, u in enumerate(trajectory):\n", " print(f'Component {i}: {u}')" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "executionInfo": { "elapsed": 57, "status": "ok", "timestamp": 1635284965458, "user": { "displayName": "", "photoUrl": "", "userId": "" }, "user_tz": 420 }, "id": "OpBLRIXZD4ny" }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "2024-05-21 11:50:08.659935: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_iota:\n", "2024-05-21 11:50:08.659980: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:50:08.659985: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:50:08.659990: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:50:08.659994: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:50:08.659998: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:50:08.660001: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:50:08.660005: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:50:08.660009: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:50:08.660014: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:50:08.660017: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:50:08.660021: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:50:08.660024: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:50:08.660028: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:50:08.660032: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:50:08.660036: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:50:08.660039: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:50:08.660043: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:50:08.660046: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:50:08.660050: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.660054: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:50:08.660057: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:50:08.660062: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:50:08.660066: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:50:08.660070: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:50:08.660073: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:50:08.660077: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:50:08.660081: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:50:08.660084: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:50:08.660088: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:50:08.660091: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:50:08.660095: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:50:08.660099: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:50:08.660102: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:50:08.660106: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:50:08.660110: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:50:08.660119: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:50:08.660123: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:50:08.660127: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:50:08.660130: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:50:08.660134: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:50:08.660138: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:50:08.660141: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.660145: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.660149: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:50:08.660152: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:50:08.660156: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:50:08.660160: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:50:08.660164: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:50:08.660168: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:50:08.660172: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:50:08.660176: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:50:08.660180: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:50:08.660183: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:50:08.660187: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:50:08.660191: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:50:08.660194: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:50:08.660198: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:50:08.660202: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:50:08.660205: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:50:08.660209: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:50:08.660212: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:50:08.660216: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:50:08.660220: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:50:08.660224: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:50:08.789864: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fn:\n", "2024-05-21 11:50:08.789909: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:50:08.789914: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:50:08.789918: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:50:08.789923: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:50:08.789926: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:50:08.789930: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:50:08.789934: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:50:08.789938: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:50:08.789941: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:50:08.789945: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:50:08.789949: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:50:08.789952: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:50:08.789957: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:50:08.789961: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:50:08.789965: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:50:08.789969: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:50:08.789972: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:50:08.789976: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:50:08.789980: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.789983: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:50:08.789987: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:50:08.789991: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:50:08.789994: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:50:08.789998: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:50:08.790002: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:50:08.790005: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:50:08.790010: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:50:08.790014: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:50:08.790017: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:50:08.790021: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:50:08.790025: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:50:08.790028: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:50:08.790032: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:50:08.790036: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:50:08.790039: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:50:08.790052: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:50:08.790057: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:50:08.790062: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:50:08.790066: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:50:08.790070: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:50:08.790074: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:50:08.790077: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.790081: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.790085: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:50:08.790088: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:50:08.790092: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:50:08.790096: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:50:08.790099: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:50:08.790103: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:50:08.790107: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:50:08.790110: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:50:08.790114: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:50:08.790118: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:50:08.790123: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:50:08.790127: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:50:08.790130: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:50:08.790134: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:50:08.790138: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:50:08.790141: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:50:08.790145: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:50:08.790149: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:50:08.790152: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:50:08.790156: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:50:08.790160: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:50:08.930173: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fn:\n", "2024-05-21 11:50:08.930218: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:50:08.930223: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:50:08.930227: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:50:08.930232: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:50:08.930235: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:50:08.930239: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:50:08.930243: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:50:08.930247: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:50:08.930250: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:50:08.930254: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:50:08.930258: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:50:08.930263: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:50:08.930266: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:50:08.930270: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:50:08.930274: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:50:08.930277: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:50:08.930281: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:50:08.930285: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:50:08.930288: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.930292: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:50:08.930295: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:50:08.930299: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:50:08.930303: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:50:08.930306: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:50:08.930310: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:50:08.930315: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:50:08.930319: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:50:08.930322: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:50:08.930326: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:50:08.930329: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:50:08.930333: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:50:08.930337: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:50:08.930340: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:50:08.930344: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:50:08.930348: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:50:08.930357: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:50:08.930361: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:50:08.930366: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:50:08.930370: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:50:08.930374: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:50:08.930377: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:50:08.930381: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.930385: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:08.930388: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:50:08.930392: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:50:08.930396: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:50:08.930399: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:50:08.930403: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:50:08.930407: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:50:08.930410: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:50:08.930414: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:50:08.930418: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:50:08.930423: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:50:08.930427: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:50:08.930431: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:50:08.930434: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:50:08.930438: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:50:08.930442: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:50:08.930445: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:50:08.930449: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:50:08.930461: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:50:08.930465: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:50:08.930468: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:50:08.930472: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n", "2024-05-21 11:50:09.060811: W external/xla/xla/service/gpu/gpu_compiler.cc:555] GpuCompilationEnvironment of hlo_module jit_fn:\n", "2024-05-21 11:50:09.060858: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_backend_optimization_level: 3\n", "2024-05-21 11:50:09.060863: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_eliminate_hlo_implicit_broadcast: true\n", "2024-05-21 11:50:09.060868: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_multi_thread_eigen: true\n", "2024-05-21 11:50:09.060872: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cuda_data_dir: \"./cuda_sdk_lib\"\n", "2024-05-21 11:50:09.060876: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_alias_scope_metadata: true\n", "2024-05-21 11:50:09.060880: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_noalias_metadata: true\n", "2024-05-21 11:50:09.060884: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_llvm_enable_invariant_load_metadata: true\n", "2024-05-21 11:50:09.060888: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_force_host_platform_device_count: 1\n", "2024-05-21 11:50:09.060893: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_nans: true\n", "2024-05-21 11:50:09.060896: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_infs: true\n", "2024-05-21 11:50:09.060900: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_allow_excess_precision: true\n", "2024-05-21 11:50:09.060904: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_autotune_level: 4\n", "2024-05-21 11:50:09.060908: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_division: true\n", "2024-05-21 11:50:09.060912: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_fast_math_honor_functions: true\n", "2024-05-21 11:50:09.060915: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_max_hlo_modules: -1\n", "2024-05-21 11:50:09.060919: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_multiheap_size_constraint_per_heap: -1\n", "2024-05-21 11:50:09.060923: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_async_all_reduce: true\n", "2024-05-21 11:50:09.060926: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_strict_conv_algorithm_picker: true\n", "2024-05-21 11:50:09.060930: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_reduce_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:09.060934: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_frontend: true\n", "2024-05-21 11:50:09.060938: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_nccl_termination_timeout_seconds: -1\n", "2024-05-21 11:50:09.060943: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_shared_constants: true\n", "2024-05-21 11:50:09.060946: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_scratch_max_megabytes: 4096\n", "2024-05-21 11:50:09.060950: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_simplify_all_fp_conversions: true\n", "2024-05-21 11:50:09.060954: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_xla_runtime_executable: true\n", "2024-05-21 11:50:09.060957: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_shape_checks: RUNTIME\n", "2024-05-21 11:50:09.060961: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_normalize_layouts: true\n", "2024-05-21 11:50:09.060965: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_tiling_and_fusion: true\n", "2024-05-21 11:50:09.060969: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_dump_enable_mlir_pretty_form: true\n", "2024-05-21 11:50:09.060973: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_triton_gemm: true\n", "2024-05-21 11:50:09.060977: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cudnn_int8x32_convolution_reordering: true\n", "2024-05-21 11:50:09.060981: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_experimental_deallocation: true\n", "2024-05-21 11:50:09.060984: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_enable_mlir_fusion_outlining: true\n", "2024-05-21 11:50:09.060988: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_m_dim: 8\n", "2024-05-21 11:50:09.060992: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_n_dim: 8\n", "2024-05-21 11:50:09.061004: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_cpu_matmul_tiling_k_dim: 8\n", "2024-05-21 11:50:09.061010: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_num_runs_to_instantiate: -1\n", "2024-05-21 11:50:09.061016: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_lhs_enable_gpu_async_tracker: true\n", "2024-05-21 11:50:09.061021: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_inflation_factor: 1\n", "2024-05-21 11:50:09.061026: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_min_graph_size: 5\n", "2024-05-21 11:50:09.061031: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reassociation_for_converted_ar: true\n", "2024-05-21 11:50:09.061037: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_all_gather_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:09.061042: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_reduce_scatter_combine_threshold_bytes: 31457280\n", "2024-05-21 11:50:09.061048: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_highest_priority_async_stream: true\n", "2024-05-21 11:50:09.061054: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_auto_spmd_partitioning_memory_budget_ratio: 1.1\n", "2024-05-21 11:50:09.061059: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_redzone_padding_bytes: 8388608\n", "2024-05-21 11:50:09.061065: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_triton_fusion_level: 2\n", "2024-05-21 11:50:09.061071: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_graph_eviction_timeout_seconds: 60\n", "2024-05-21 11:50:09.061078: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_gpu2_hal: true\n", "2024-05-21 11:50:09.061084: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_copy_insertion_use_region_analysis: true\n", "2024-05-21 11:50:09.061089: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_collective_permute_decomposer_threshold: 9223372036854775807\n", "2024-05-21 11:50:09.061094: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_split_k_autotuning: true\n", "2024-05-21 11:50:09.061101: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduction_epilogue_fusion: true\n", "2024-05-21 11:50:09.061108: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_cublas_fallback: true\n", "2024-05-21 11:50:09.061113: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_filter_kernels_spilling_registers_on_autotuning: true\n", "2024-05-21 11:50:09.061119: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_debug_buffer_assignment_show_max: 15\n", "2024-05-21 11:50:09.061124: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_enable_dumping: true\n", "2024-05-21 11:50:09.061130: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_all_gather_combine_by_dim: true\n", "2024-05-21 11:50:09.061136: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_reduce_scatter_combine_by_dim: true\n", "2024-05-21 11:50:09.061141: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: FUSION\n", "2024-05-21 11:50:09.061145: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_command_buffer: CUBLAS\n", "2024-05-21 11:50:09.061148: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_enable_cub_radix_sort: true\n", "2024-05-21 11:50:09.061152: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_memory_limit_slop_factor: 95\n", "2024-05-21 11:50:09.061156: W external/xla/xla/service/gpu/gpu_compiler.cc:555] xla_gpu_threshold_for_windowed_einsum_mib: 100000\n" ] } ], "source": [ "# load into xarray for visualization and analysis\n", "ds = xarray.Dataset(\n", " {\n", " 'u': (('time', 'x', 'y'), trajectory[0].data),\n", " 'v': (('time', 'x', 'y'), trajectory[1].data),\n", " },\n", " coords={\n", " 'x': grid.axes()[0],\n", " 'y': grid.axes()[1],\n", " 'time': dt * inner_steps * np.arange(outer_steps)\n", " }\n", ")" ] }, { "cell_type": "code", "execution_count": 6, "metadata": { "colab": { "height": 263 }, "executionInfo": { "elapsed": 60, "status": "ok", "timestamp": 1635284966443, "user": { "displayName": "", "photoUrl": "", "userId": "" }, "user_tz": 420 }, "id": "p4VzDmxoEuha", "outputId": "25639ac6-1386-48ed-8270-05e063a69823" }, "outputs": [ { "data": { "text/html": [ "
<xarray.Dataset> Size: 105MB\n",
"Dimensions: (time: 200, x: 256, y: 256)\n",
"Coordinates:\n",
" * x (x) float32 1kB 0.01227 0.03682 0.06136 ... 6.222 6.246 6.271\n",
" * y (y) float32 1kB 0.01227 0.03682 0.06136 ... 6.222 6.246 6.271\n",
" * time (time) float64 2kB 0.0 0.1534 0.3068 0.4602 ... 30.22 30.37 30.53\n",
"Data variables:\n",
" u (time, x, y) float32 52MB -0.8935 -0.9323 ... -0.1087 -0.08821\n",
" v (time, x, y) float32 52MB 0.1429 0.1357 0.1294 ... 0.2716 0.2729