
Commit f38c389

add glm-4.7 and mistral-large-2512
1 parent 29f97ea commit f38c389

File tree

2 files changed: +117 -0 lines changed

configs/config-glm-4.7.yaml

Lines changed: 88 additions & 0 deletions
@@ -0,0 +1,88 @@
wandb:
  run_name: zai-org/GLM-4.7
# api: vllm-docker
api: openai-compatible
base_url: http://gb-nvl-059-compute03:8000/v1
num_gpus: 8
batch_size: 128
model:
  use_wandb_artifacts: false
  pretrained_model_name_or_path: zai-org/GLM-4.7
  bfcl_model_id: "unified-oss-fc"
  size_category: "Large (30B+)"
  size: 358337791296
  release_date: 12/22/2025

vllm: # This config not used because vLLM launched manually, but for record
  vllm_tag: nightly-f1c2c20136cca6ea8798a64855eaf52ee9a42210
  lifecycle: always_on
  gpu_memory_utilization: 0.95
  reasoning_parser: glm45
  tool_call_parser: glm47
  enable_auto_tool_choice: true
  trust_remote_code: true

generator:
  max_tokens: 202752
  temperature: 1.0
  top_p: 0.95

jaster:
  override_max_tokens: 202752

jbbq:
  generator_config:
    max_tokens: 202752
    temperature: 1.0
    top_p: 0.95

toxicity:
  generator_config:
    max_tokens: 202752
    temperature: 1.0
    top_p: 0.95

jtruthfulqa:
  generator_config:
    max_tokens: 202752
    temperature: 1.0
    top_p: 0.95

swebench:
  max_tokens: 202752

mtbench:
  generator_config:
    max_tokens: 202752
    temperature: 1.0
    top_p: 0.95
  temperature_override:
    writing: 1.0
    roleplay: 1.0
    extraction: 1.0
    math: 1.0
    coding: 1.0
    reasoning: 1.0
    stem: 1.0
    humanities: 1.0

bfcl:
  generator_config:
    max_tokens: 202752
    temperature: 1.0
    top_p: 0.95

hallulens:
  generator_config:
    max_tokens: 202752
    temperature: 1.0
    top_p: 0.95

hle:
  generator_config:
    max_tokens: 202752
    temperature: 1.0
    top_p: 0.95

arc_agi:
  max_output_tokens: 202752
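
For reference, a minimal Python sketch (not part of the commit) of how an evaluation client might call this OpenAI-compatible endpoint with the generator settings above. The prompt and the api_key value are placeholders; the assumption is that the local vLLM server ignores the key.

# Minimal sketch: query the manually launched vLLM server through its
# OpenAI-compatible API using the GLM-4.7 generator settings from the config.
from openai import OpenAI

client = OpenAI(
    base_url="http://gb-nvl-059-compute03:8000/v1",  # base_url from the config
    api_key="EMPTY",  # placeholder; assumption that the local server needs no real key
)

response = client.chat.completions.create(
    model="zai-org/GLM-4.7",  # pretrained_model_name_or_path from the config
    messages=[{"role": "user", "content": "Hello"}],  # placeholder prompt
    max_tokens=202752,   # generator.max_tokens
    temperature=1.0,     # generator.temperature
    top_p=0.95,          # generator.top_p
)
print(response.choices[0].message.content)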
Lines changed: 29 additions & 0 deletions
@@ -0,0 +1,29 @@
wandb:
  run_name: mistralai/Mistral-Large-3-675B-Instruct-2512
# api: vllm-docker
api: openai-compatible
base_url: http://gb-nvl-059-compute03:8000/v1
num_gpus: 8
batch_size: 256
model:
  use_wandb_artifacts: false
  pretrained_model_name_or_path: mistralai/Mistral-Large-3-675B-Instruct-2512
  bfcl_model_id: "unified-oss-fc"
  size_category: "Large (30B+)"
  size: 676032104960
  release_date: 12/03/2025

vllm: # This config not used because vLLM launched manually, but for record
  vllm_tag: v0.12.0
  lifecycle: always_on
  gpu_memory_utilization: 0.95
  enable_auto_tool_choice: true
  tool_call_parser: mistral
  extra_args:
    - "--config_format=mistral"
    - "--load_format=mistral"
    - "--tokenizer_mode=mistral"

generator:
  max_tokens: 262144
  temperature: 0.0
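
Both configs note that vLLM is launched manually and that the vllm section is kept only for record. A rough Python sketch of how that section could be turned into a vllm serve command line follows; the flag mapping and the config file path are assumptions (the second file's name is not visible in this extract), not the launcher actually used for these runs.

# Sketch: map the record-keeping "vllm" section of one of these configs to a
# manual `vllm serve` invocation. Flag names follow standard vLLM CLI options;
# the exact launch procedure used for these runs is not part of this commit.
import yaml

# hypothetical path; the second file's name is not shown in this extract
with open("configs/config-mistral-large-2512.yaml") as f:
    cfg = yaml.safe_load(f)

vllm_cfg = cfg["vllm"]
cmd = [
    "vllm", "serve", cfg["model"]["pretrained_model_name_or_path"],
    "--tensor-parallel-size", str(cfg["num_gpus"]),
    "--gpu-memory-utilization", str(vllm_cfg["gpu_memory_utilization"]),
]
if vllm_cfg.get("enable_auto_tool_choice"):
    cmd.append("--enable-auto-tool-choice")
if "tool_call_parser" in vllm_cfg:
    cmd += ["--tool-call-parser", vllm_cfg["tool_call_parser"]]
cmd += vllm_cfg.get("extra_args", [])  # e.g. --config_format=mistral for this model
print(" ".join(cmd))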

0 commit comments