File size: 575 Bytes
a96bc78
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
from transformers import PretrainedConfig

class Qwen3MoEConfig(PretrainedConfig):
    """Configuration record for a router-plus-experts Qwen3 setup.

    On top of whatever ``PretrainedConfig`` consumes through ``**kwargs``,
    this class stores five extra attributes on the instance.

    Args:
        router_model_path: Stored unchanged. Presumably the location of the
            router model -- confirm against the code that loads it.
        expert_model_paths: Stored as given when truthy; any falsy value
            (``None``, empty container) is replaced by a new empty dict.
            Presumably maps a label to an expert model location -- confirm
            against the caller.
        labels: Stored as given when truthy; any falsy value is replaced by
            a new empty list.
        torch_dtype: Stored unchanged; defaults to the string ``"auto"``.
        tokenizer_path: Stored unchanged.
        **kwargs: Forwarded untouched to ``PretrainedConfig.__init__``.
    """

    model_type = "qwen3moe"

    def __init__(
        self,
        router_model_path=None,
        expert_model_paths=None,
        labels=None,
        torch_dtype="auto",
        tokenizer_path=None,
        **kwargs,
    ):
        # The base class is initialised first; the attributes below are set
        # afterwards, so they override anything it set under the same names.
        super().__init__(**kwargs)

        # Substitute fresh containers for missing/empty inputs so that each
        # instance gets its own dict/list rather than a shared default.
        if not expert_model_paths:
            expert_model_paths = {}
        if not labels:
            labels = []

        self.router_model_path = router_model_path
        self.expert_model_paths = expert_model_paths
        self.labels = labels
        self.torch_dtype = torch_dtype
        self.tokenizer_path = tokenizer_path