Skip to content

Commit

Permalink
Remove --xla_gpu_simplify_all_fp_conversions in commands where it is set to the default value of `true`.
Browse files Browse the repository at this point in the history

PiperOrigin-RevId: 605311817
  • Loading branch information
dimitar-asenov authored and pax authors committed Feb 8, 2024
1 parent 9a8cd95 commit be9c405
Show file tree
Hide file tree
Showing 4 changed files with 4 additions and 4 deletions.
2 changes: 1 addition & 1 deletion paxml/contrib/gpu/scripts_gpu/benchmark_gpt_multinode.sh
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ LOG_DIR=${5:-"test_logdir"}
export VOCAB_PATH=None
export XLA_PYTHON_CLIENT_MEM_FRACTION=${XLA_PYTHON_CLIENT_MEM_FRACTION:-0.85}
BASE_XLA_FLAGS=${BASE_XLA_FLAGS:-"--xla_gpu_enable_latency_hiding_scheduler=true --xla_gpu_enable_triton_gemm=false
- --xla_gpu_simplify_all_fp_conversions --xla_gpu_enable_async_all_gather=true
+ --xla_gpu_enable_async_all_gather=true
--xla_gpu_enable_async_reduce_scatter=true --xla_gpu_enable_highest_priority_async_stream=true
--xla_gpu_enable_triton_softmax_fusion=false --xla_gpu_all_reduce_combine_threshold_bytes=51200
--xla_gpu_graph_level=0 --xla_gpu_enable_async_all_reduce=true"}
Expand Down
2 changes: 1 addition & 1 deletion paxml/contrib/gpu/scripts_gpu/run_lambada_singlenode.sh
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ LOG_DIR=$6

export VOCAB_PATH=$VOCAB_PATH
BASE_XLA_FLAGS=${BASE_XLA_FLAGS:-"--xla_gpu_enable_latency_hiding_scheduler=true --xla_gpu_enable_triton_gemm=false
- --xla_gpu_simplify_all_fp_conversions --xla_gpu_enable_async_all_gather=true
+ --xla_gpu_enable_async_all_gather=true
--xla_gpu_enable_async_reduce_scatter=true --xla_gpu_enable_highest_priority_async_stream=true
--xla_gpu_enable_triton_softmax_fusion=false --xla_gpu_all_reduce_combine_threshold_bytes=51200
--xla_gpu_graph_level=0 --xla_gpu_enable_async_all_reduce=true"}
Expand Down
2 changes: 1 addition & 1 deletion paxml/contrib/gpu/scripts_gpu/run_pile_multinode.sh
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ LOG_DIR=${6:-"test_logdir"}
export VOCAB_PATH=$VOCAB_PATH
export XLA_PYTHON_CLIENT_MEM_FRACTION=${XLA_PYTHON_CLIENT_MEM_FRACTION:-0.85}
BASE_XLA_FLAGS=${BASE_XLA_FLAGS:-"--xla_gpu_enable_latency_hiding_scheduler=true --xla_gpu_enable_triton_gemm=false
- --xla_gpu_simplify_all_fp_conversions --xla_gpu_enable_async_all_gather=true
+ --xla_gpu_enable_async_all_gather=true
--xla_gpu_enable_async_reduce_scatter=true --xla_gpu_enable_highest_priority_async_stream=true
--xla_gpu_enable_triton_softmax_fusion=false --xla_gpu_all_reduce_combine_threshold_bytes=51200
--xla_gpu_graph_level=0 --xla_gpu_enable_async_all_reduce=true"}
Expand Down
2 changes: 1 addition & 1 deletion paxml/contrib/gpu/scripts_gpu/run_pile_singlenode.sh
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ LOG_DIR=${6:-"test_logdir"}
export VOCAB_PATH=$VOCAB_PATH

BASE_XLA_FLAGS=${BASE_XLA_FLAGS:-"--xla_gpu_enable_latency_hiding_scheduler=true --xla_gpu_enable_triton_gemm=false
- --xla_gpu_simplify_all_fp_conversions --xla_gpu_enable_async_all_gather=true
+ --xla_gpu_enable_async_all_gather=true
--xla_gpu_enable_async_reduce_scatter=true --xla_gpu_enable_highest_priority_async_stream=true
--xla_gpu_enable_triton_softmax_fusion=false --xla_gpu_all_reduce_combine_threshold_bytes=51200
--xla_gpu_graph_level=0 --xla_gpu_enable_async_all_reduce=true"}
Expand Down

0 comments on commit be9c405

Please sign in to comment.