@@ -68,8 +68,13 @@ def execute():
6868 "--sglang-mem-fraction-static 0.6 "
6969 "--sglang-decode-log-interval 1000 "
7070 "--sglang-enable-metrics "
71+ # "--sglang-enable-deterministic-inference "
72+ # "--sglang-rl-on-policy-target fsdp "
7173 "--sglang-attention-backend fa3 "
7274 "--attn-implementation flash_attention_3 "
75+ "--sglang-cuda-graph-bs 1 2 4 8 16 24 32 40 48 56 64 "
76+ # "--deterministic-mode "
77+ # "--true-on-policy-mode "
7378 )
7479
7580 ci_args = "--ci-test "
@@ -91,6 +96,9 @@ def execute():
9196 )
9297
9398 extra_env_vars = {
99+ # "NCCL_ALGO": "allreduce:tree",
100+ # "NVTE_ALLOW_NONDETERMINISTIC_ALGO": "0",
101+ # "CUBLAS_WORKSPACE_CONFIG": ":4096:8",
94102 "CUDA_DEVICE_MAX_CONNECTIONS" : "1" ,
95103 }
96104
@@ -104,8 +112,6 @@ def execute():
104112
105113if __name__ == "__main__" :
106114 prepare ()
107- os .environ .pop ("http_proxy" , None )
108- os .environ .pop ("https_proxy" , None )
109- os .environ .pop ("HTTP_PROXY" , None )
110- os .environ .pop ("HTTPS_PROXY" , None )
115+ for proxy_var in ("http_proxy" , "https_proxy" , "HTTP_PROXY" , "HTTPS_PROXY" ):
116+ os .environ .pop (proxy_var , None )
111117 execute ()
0 commit comments