Skip to content

Commit 8cec24d

Browse files
committed
chore: remove deprecated flags from model xla flag configs
Signed-off-by: Terry Kong <[email protected]>
1 parent d1ff3c8 commit 8cec24d

File tree

4 files changed

+0
-8
lines changed

4 files changed

+0
-8
lines changed

rosetta/rosetta/projects/maxtext/xla_flags/llama2-7b-1N8G.env

-2
Original file line number | Diff line number | Diff line change
@@ -6,15 +6,13 @@ export XLA_FLAGS="\
66
--xla_gpu_enable_latency_hiding_scheduler=true \
77
--xla_gpu_enable_triton_gemm=false \
88
--xla_gpu_graph_level=0 \
9-
--xla_gpu_enable_highest_priority_async_stream=true \
109
--xla_gpu_all_reduce_combine_threshold_bytes=${THRESHOLD_BYTES} \
1110
--xla_gpu_all_gather_combine_threshold_bytes=$((THRESHOLD_BYTES/(NUM_NODES*NUM_GPUS))) \
1211
--xla_gpu_reduce_scatter_combine_threshold_bytes=$((THRESHOLD_BYTES/(NUM_NODES*NUM_GPUS*2))) \
1312
--xla_gpu_enable_pipelined_all_gather=true \
1413
--xla_gpu_enable_pipelined_reduce_scatter=true \
1514
--xla_gpu_enable_pipelined_all_reduce=true \
1615
--xla_gpu_enable_while_loop_double_buffering=true \
17-
--xla_gpu_enable_triton_softmax_fusion=false \
1816
--xla_gpu_enable_all_gather_combine_by_dim=false \
1917
--xla_gpu_enable_reduce_scatter_combine_by_dim=false \
2018
--xla_disable_hlo_passes=rematerialization \

rosetta/rosetta/projects/pax/xla_flags/common.env

-2
Original file line number | Diff line number | Diff line change
@@ -3,8 +3,6 @@ THRESHOLD_BYTES=51200
33
export XLA_FLAGS="\
44
--xla_gpu_enable_latency_hiding_scheduler=true \
55
--xla_allow_excess_precision \
6-
--xla_gpu_enable_highest_priority_async_stream=true \
7-
--xla_gpu_enable_triton_softmax_fusion=false \
86
--xla_gpu_all_reduce_combine_threshold_bytes=${THRESHOLD_BYTES} \
97
--xla_gpu_graph_level=0 \
108
"

rosetta/rosetta/projects/pax/xla_flags/gpt-126m.env

-2
Original file line number | Diff line number | Diff line change
@@ -3,8 +3,6 @@ THRESHOLD_BYTES=33554432
33
export XLA_FLAGS="\
44
--xla_gpu_enable_latency_hiding_scheduler=true \
55
--xla_allow_excess_precision \
6-
--xla_gpu_enable_highest_priority_async_stream=true \
7-
--xla_gpu_enable_triton_softmax_fusion=false \
86
--xla_gpu_all_reduce_combine_threshold_bytes=${THRESHOLD_BYTES} \
97
--xla_gpu_graph_level=0 \
108
--xla_gpu_enable_cudnn_fmha=false \

rosetta/rosetta/projects/pax/xla_flags/grok-proxy.env

-2
Original file line number | Diff line number | Diff line change
@@ -5,8 +5,6 @@ REDUCE_SCATTER_THRESHOLD_BYTES=402653184
55
export XLA_FLAGS="\
66
--xla_gpu_enable_latency_hiding_scheduler=true \
77
--xla_allow_excess_precision \
8-
--xla_gpu_enable_highest_priority_async_stream=true \
9-
--xla_gpu_enable_triton_softmax_fusion=false \
108
--xla_gpu_all_reduce_combine_threshold_bytes=${ALL_REDUCE_THRESHOLD_BYTES} \
119
--xla_gpu_graph_level=0 \
1210
--xla_gpu_all_gather_combine_threshold_bytes=${ALL_GATHER_THRESHOLD_BYTES} \

0 commit comments

Comments (0)