diff --git a/etc/mcts_1gpu.conf b/etc/mcts_1gpu.conf index f4628b3..75c47b1 100644 --- a/etc/mcts_1gpu.conf +++ b/etc/mcts_1gpu.conf @@ -9,7 +9,7 @@ eval_wait_batch_timeout_us: 100 model_config { train_dir: "ckpt" enable_tensorrt: 1 - tensorrt_model_path: "zero.ckpt-m8.FP32.PLAN" + tensorrt_model_path: "zero.ckpt-20b-v1.FP32.PLAN" } gpu_list: "0" c_puct: 2.5 diff --git a/etc/mcts_2gpu.conf b/etc/mcts_2gpu.conf index b430d45..f854bee 100644 --- a/etc/mcts_2gpu.conf +++ b/etc/mcts_2gpu.conf @@ -9,7 +9,7 @@ eval_wait_batch_timeout_us: 100 model_config { train_dir: "ckpt" enable_tensorrt: 1 - tensorrt_model_path: "zero.ckpt-m8.FP32.PLAN" + tensorrt_model_path: "zero.ckpt-20b-v1.FP32.PLAN" } gpu_list: "0,1" c_puct: 2.5 diff --git a/etc/mcts_4gpu.conf b/etc/mcts_4gpu.conf index ed1d950..5fb0833 100644 --- a/etc/mcts_4gpu.conf +++ b/etc/mcts_4gpu.conf @@ -9,7 +9,7 @@ eval_wait_batch_timeout_us: 100 model_config { train_dir: "ckpt" enable_tensorrt: 1 - tensorrt_model_path: "zero.ckpt-m8.FP32.PLAN" + tensorrt_model_path: "zero.ckpt-20b-v1.FP32.PLAN" } gpu_list: "0,1,2,3" c_puct: 2.5 diff --git a/etc/mcts_8gpu.conf b/etc/mcts_8gpu.conf index b646ec7..e18b031 100644 --- a/etc/mcts_8gpu.conf +++ b/etc/mcts_8gpu.conf @@ -9,7 +9,7 @@ eval_wait_batch_timeout_us: 100 model_config { train_dir: "ckpt" enable_tensorrt: 1 - tensorrt_model_path: "zero.ckpt-m8.FP32.PLAN" + tensorrt_model_path: "zero.ckpt-20b-v1.FP32.PLAN" } gpu_list: "0,1,2,3,4,5,6,7" c_puct: 2.5 diff --git a/etc/mcts_async_dist.conf b/etc/mcts_async_dist.conf index 7592fb8..dc15a12 100644 --- a/etc/mcts_async_dist.conf +++ b/etc/mcts_async_dist.conf @@ -11,7 +11,7 @@ eval_wait_batch_timeout_us: 100 model_config { train_dir: "ckpt" enable_tensorrt: 1 - tensorrt_model_path: "zero.ckpt-m8.FP32.PLAN" + tensorrt_model_path: "zero.ckpt-20b-v1.FP32.PLAN" } enable_dist: 1 dist_svr_addrs: "ip:port,ip:port,ip:port,ip:port" @@ -85,7 +85,7 @@ dist_config { leaky_bucket_refill_period_ms: 5000 } c_puct: 2.5 -virtual_loss: 1.0 +virtual_loss: 0.5 enable_resign: 1 v_resign: -0.9 enable_dirichlet_noise: 0 @@ -101,7 +101,7 @@ early_stop { enable: 1 check_every_ms: 100 sims_factor: 1.0 - sims_threshold: 2000 + sims_threshold: 100000 } unstable_overtime { enable: 1 diff --git a/etc/mcts_dist.conf b/etc/mcts_dist.conf index cf5702f..9ad5b1d 100644 --- a/etc/mcts_dist.conf +++ b/etc/mcts_dist.conf @@ -9,7 +9,7 @@ eval_wait_batch_timeout_us: 100 model_config { train_dir: "ckpt" enable_tensorrt: 1 - tensorrt_model_path: "zero.ckpt-m8.FP32.PLAN" + tensorrt_model_path: "zero.ckpt-20b-v1.FP32.PLAN" } enable_dist: 1 dist_svr_addrs: "ip:port" @@ -67,7 +67,7 @@ early_stop { enable: 1 check_every_ms: 100 sims_factor: 1.0 - sims_threshold: 2000 + sims_threshold: 10000 } unstable_overtime { enable: 1