config.json
4.3 KB · 164 lines · json Raw
1 {
2 "architectures": [
3 "Qwen3TTSForConditionalGeneration"
4 ],
5 "assistant_token_id": 77091,
6 "im_end_token_id": 151645,
7 "im_start_token_id": 151644,
8 "tts_bos_token_id": 151672,
9 "tts_eos_token_id": 151673,
10 "tts_pad_token_id": 151671,
11 "model_type": "qwen3_tts",
12 "tokenizer_type": "qwen3_tts_tokenizer_12hz",
13 "tts_model_size": "1b7",
14 "tts_model_type": "voice_design",
15 "talker_config": {
16 "attention_bias": false,
17 "attention_dropout": 0,
18 "code_predictor_config": {
19 "_name_or_path": "",
20 "add_cross_attention": false,
21 "architectures": null,
22 "attention_bias": false,
23 "attention_dropout": 0,
24 "bad_words_ids": null,
25 "begin_suppress_tokens": null,
26 "bos_token_id": null,
27 "chunk_size_feed_forward": 0,
28 "cross_attention_hidden_size": null,
29 "decoder_start_token_id": null,
30 "diversity_penalty": 0.0,
31 "do_sample": false,
32 "early_stopping": false,
33 "encoder_no_repeat_ngram_size": 0,
34 "eos_token_id": null,
35 "exponential_decay_length_penalty": null,
36 "finetuning_task": null,
37 "forced_bos_token_id": null,
38 "forced_eos_token_id": null,
39 "head_dim": 128,
40 "hidden_act": "silu",
41 "hidden_size": 1024,
42 "id2label": {
43 "0": "LABEL_0",
44 "1": "LABEL_1"
45 },
46 "initializer_range": 0.02,
47 "intermediate_size": 3072,
48 "is_decoder": false,
49 "is_encoder_decoder": false,
50 "label2id": {
51 "LABEL_0": 0,
52 "LABEL_1": 1
53 },
54 "layer_types": [
55 "full_attention",
56 "full_attention",
57 "full_attention",
58 "full_attention",
59 "full_attention"
60 ],
61 "length_penalty": 1.0,
62 "max_length": 20,
63 "max_position_embeddings": 65536,
64 "max_window_layers": 28,
65 "min_length": 0,
66 "model_type": "qwen3_tts_talker_code_predictor",
67 "no_repeat_ngram_size": 0,
68 "num_attention_heads": 16,
69 "num_beam_groups": 1,
70 "num_beams": 1,
71 "num_code_groups": 16,
72 "num_hidden_layers": 5,
73 "num_key_value_heads": 8,
74 "num_return_sequences": 1,
75 "output_attentions": false,
76 "output_hidden_states": false,
77 "output_scores": false,
78 "pad_token_id": null,
79 "prefix": null,
80 "problem_type": null,
81 "pruned_heads": {},
82 "remove_invalid_values": false,
83 "repetition_penalty": 1.0,
84 "return_dict": true,
85 "return_dict_in_generate": false,
86 "rms_norm_eps": 1e-06,
87 "rope_scaling": null,
88 "rope_theta": 1000000,
89 "sep_token_id": null,
90 "sliding_window": null,
91 "suppress_tokens": null,
92 "task_specific_params": null,
93 "temperature": 1.0,
94 "tf_legacy_loss": false,
95 "tie_encoder_decoder": false,
96 "tie_word_embeddings": false,
97 "tokenizer_class": null,
98 "top_k": 50,
99 "top_p": 1.0,
100 "dtype": null,
101 "torchscript": false,
102 "typical_p": 1.0,
103 "use_bfloat16": false,
104 "use_cache": true,
105 "use_sliding_window": false,
106 "vocab_size": 2048
107 },
108 "codec_bos_id": 2149,
109 "codec_eos_token_id": 2150,
110 "codec_think_id": 2154,
111 "codec_language_id": {
112 "chinese": 2055,
113 "english": 2050,
114 "german": 2053,
115 "italian": 2070,
116 "portuguese": 2071,
117 "spanish": 2054,
118 "japanese": 2058,
119 "korean": 2064,
120 "french": 2061,
121 "russian": 2069
122 },
123 "codec_nothink_id": 2155,
124 "codec_pad_id": 2148,
125 "codec_think_bos_id": 2156,
126 "codec_think_eos_id": 2157,
127 "spk_id": {
128 },
129 "spk_is_dialect": {
130 },
131 "head_dim": 128,
132 "hidden_act": "silu",
133 "hidden_size": 2048,
134 "initializer_range": 0.02,
135 "intermediate_size": 6144,
136 "max_position_embeddings": 32768,
137 "model_type": "qwen3_tts_talker",
138 "num_attention_heads": 16,
139 "num_code_groups": 16,
140 "num_hidden_layers": 28,
141 "num_key_value_heads": 8,
142 "position_id_per_seconds": 13,
143 "rms_norm_eps": 1e-06,
144 "rope_scaling": {
145 "interleaved": true,
146 "mrope_section": [
147 24,
148 20,
149 20
150 ],
151 "rope_type": "default",
152 "type": "default"
153 },
154 "rope_theta": 1000000,
155 "sliding_window": null,
156 "text_hidden_size": 2048,
157 "text_vocab_size": 151936,
158 "use_cache": true,
159 "use_sliding_window": false,
160 "vocab_size": 3072
161 },
162 "transformers_version": "4.57.3"
163 }
164