Upload inference/runner_config/tp32.yaml with huggingface_hub

Files changed (1) hide show

inference/runner_config/tp32.yaml ADDED Viewed

+# coding=utf-8
+# Copyright (c) 2025 Huawei Technologies Co., Ltd. All rights reserved.
+model_name: "pangu_ultra_moe"  # runner settings for this model; every *_tp_size below is 32
+model_path: "./model"  # relative path; NOTE(review): presumably resolved against the launch directory - confirm
+exe_mode: "eager"        # ["dynamo", "eager"]
+model_config:
+  tokenizer_mode: default # ["default", "chat"]
+  mm_quant_mode: None  # NOTE(review): plain `None` is the string "None" in YAML, not null - confirm the loader expects that
+  mla_backend: absorb     # [native, absorb]
+  with_ckpt: 1            # [0, 1]
+  enable_profiler: 0      # [0, 1]
+data_config:
+  input_max_len: 4096
+  max_new_tokens: 28000  # 4096 + 28000 = 32096, under max_position_embeddings (32768); NOTE(review): presumably prompt + output must fit - confirm
+  batch_size: 1
+  max_position_embeddings: 32768
+parallel_config:  # all three sizes are 32, matching the file name tp32.yaml
+  attn_tp_size: 32
+  moe_tp_size: 32
+  embed_tp_size: 32
+sampling_config:
+  top_n_sigma: 0.05
+  top_p: 1.0
+  temperature: 0.7
+  top_k: -1  # NOTE(review): -1 presumably disables top-k filtering - confirm against the sampler