pengzhendong committed on
Commit
1b10e1d
·
1 Parent(s): ef76ad9

update model

Browse files
.gitattributes CHANGED
@@ -1,35 +1,48 @@
1
  *.7z filter=lfs diff=lfs merge=lfs -text
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
 
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
 
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
  *.model filter=lfs diff=lfs merge=lfs -text
13
  *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
  *.onnx filter=lfs diff=lfs merge=lfs -text
17
  *.ot filter=lfs diff=lfs merge=lfs -text
18
  *.parquet filter=lfs diff=lfs merge=lfs -text
19
  *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
  *.pt filter=lfs diff=lfs merge=lfs -text
23
  *.pth filter=lfs diff=lfs merge=lfs -text
24
  *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
  *.tflite filter=lfs diff=lfs merge=lfs -text
30
  *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
  *.xz filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
  *.7z filter=lfs diff=lfs merge=lfs -text
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bin.* filter=lfs diff=lfs merge=lfs -text
5
  *.bz2 filter=lfs diff=lfs merge=lfs -text
 
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.json filter=lfs diff=lfs merge=lfs -text
11
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
 
12
  *.model filter=lfs diff=lfs merge=lfs -text
13
  *.msgpack filter=lfs diff=lfs merge=lfs -text
 
 
14
  *.onnx filter=lfs diff=lfs merge=lfs -text
15
  *.ot filter=lfs diff=lfs merge=lfs -text
16
  *.parquet filter=lfs diff=lfs merge=lfs -text
17
  *.pb filter=lfs diff=lfs merge=lfs -text
 
 
18
  *.pt filter=lfs diff=lfs merge=lfs -text
19
  *.pth filter=lfs diff=lfs merge=lfs -text
20
  *.rar filter=lfs diff=lfs merge=lfs -text
 
21
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
22
  *.tar.* filter=lfs diff=lfs merge=lfs -text
 
23
  *.tflite filter=lfs diff=lfs merge=lfs -text
24
  *.tgz filter=lfs diff=lfs merge=lfs -text
 
25
  *.xz filter=lfs diff=lfs merge=lfs -text
26
  *.zip filter=lfs diff=lfs merge=lfs -text
27
+ *.zstandard filter=lfs diff=lfs merge=lfs -text
28
+ *.tfevents* filter=lfs diff=lfs merge=lfs -text
29
+ *.db* filter=lfs diff=lfs merge=lfs -text
30
+ *.ark* filter=lfs diff=lfs merge=lfs -text
31
+ **/*ckpt*data* filter=lfs diff=lfs merge=lfs -text
32
+ **/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text
33
+ **/*ckpt*.index filter=lfs diff=lfs merge=lfs -text
34
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
35
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
36
+ *.gguf* filter=lfs diff=lfs merge=lfs -text
37
+ *.ggml filter=lfs diff=lfs merge=lfs -text
38
+ *.llamafile* filter=lfs diff=lfs merge=lfs -text
39
+ *.pt2 filter=lfs diff=lfs merge=lfs -text
40
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
41
+ *.npy filter=lfs diff=lfs merge=lfs -text
42
+ *.npz filter=lfs diff=lfs merge=lfs -text
43
+ *.pickle filter=lfs diff=lfs merge=lfs -text
44
+ *.pkl filter=lfs diff=lfs merge=lfs -text
45
+ *.tar filter=lfs diff=lfs merge=lfs -text
46
+ *.wasm filter=lfs diff=lfs merge=lfs -text
47
  *.zst filter=lfs diff=lfs merge=lfs -text
48
  *tfevents* filter=lfs diff=lfs merge=lfs -text
Qwen3-0.6B/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660db3b73d788119c04535e48cf9be5f55bc3100841a718637ae695b442f27dd
3
+ size 726
Qwen3-0.6B/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2325da0f15bb848e018c5ae071b7943332e9f871d6b60e2ed22ca97d4cb993d2
3
+ size 239
Qwen3-0.6B/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
Qwen3-0.6B/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed272ca0a40aa011306dd28becd14c32eeb75cba01db658d3bd5ead894007edd
3
+ size 1503300296
Qwen3-0.6B/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
3
+ size 11422654
Qwen3-0.6B/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5d09f07b48c3086c508b30d1c9114bd1189145b74e982a265350c923acd8101
3
+ size 9732
Qwen3-0.6B/vocab.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910
3
+ size 2776833
config.yaml ADDED
@@ -0,0 +1,136 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model: FunASRNano
2
+ model_conf:
3
+ lsm_weight: 0.1
4
+ length_normalized_loss: true
5
+ audio_encoder: iic/SenseVoiceSmall
6
+ audio_encoder_conf:
7
+ hub: ms
8
+ freeze: true
9
+ freeze_layer_num: -1
10
+ feat_permute: true
11
+ llm: Qwen3-0.6b
12
+ llm_conf:
13
+ hub: hf
14
+ freeze: true
15
+ llm_dtype: bf16
16
+ init_param_path: Qwen3-0.6B
17
+ use_lora: false
18
+ lora_conf:
19
+ freeze_lora: true
20
+ task_type: CAUSAL_LM
21
+ r: 16
22
+ lora_alpha: 32
23
+ lora_dropout: 0.05
24
+ bias: none
25
+ target_modules:
26
+ - q_proj
27
+ - v_proj
28
+ init_param_path: ""
29
+ audio_adaptor: Transformer
30
+ audio_adaptor_conf:
31
+ downsample_rate: 1
32
+ ffn_dim: 2048
33
+ llm_dim: 1024
34
+ encoder_dim: 512
35
+ n_layer: 2
36
+ freeze: true
37
+ ctc_decoder: Transformer
38
+ detach_ctc_decoder: true
39
+ ctc_decoder_conf:
40
+ downsample_rate: 1
41
+ ffn_dim: 2048
42
+ llm_dim: 512
43
+ encoder_dim: 512
44
+ n_layer: 5
45
+ freeze: false
46
+ ctc_weight: 1.0
47
+ ctc_conf:
48
+ dropout_rate: 0.0
49
+ ctc_type: builtin
50
+ reduce: true
51
+ ignore_nan_grad: true
52
+ frontend: WavFrontend
53
+ frontend_conf:
54
+ fs: 16000
55
+ window: hamming
56
+ n_mels: 80
57
+ frame_length: 25
58
+ frame_shift: 10
59
+ lfr_m: 7
60
+ lfr_n: 6
61
+ cmvn_file: null
62
+ train_conf:
63
+ use_lora: ${llm_conf.use_lora}
64
+ accum_grad: 1
65
+ grad_clip: 5
66
+ max_epoch: 2
67
+ keep_nbest_models: 200
68
+ log_interval: 100
69
+ effective_save_name_excludes:
70
+ - llm.
71
+ resume: true
72
+ validate_interval: 2000
73
+ save_checkpoint_interval: 2000
74
+ avg_nbest_model: 100
75
+ use_bf16: false
76
+ use_deepspeed: true
77
+ deepspeed_config: null
78
+ save_init_model: false
79
+ optim: adamw
80
+ optim_conf:
81
+ lr: 5.0e-06
82
+ weight_decay: 0.0
83
+ scheduler: warmuplr
84
+ scheduler_conf:
85
+ warmup_steps: 2500
86
+ dataset: FunASRNano
87
+ dataset_conf:
88
+ index_ds: FunASRNano
89
+ batch_sampler: BatchSampler
90
+ batch_type: token
91
+ batch_size: 6000
92
+ max_token_length: 3500
93
+ shuffle: true
94
+ sort_size: 1024
95
+ batch_size_scale_ratio_max: 2
96
+ num_workers: 4
97
+ audio_adaptor_downsample_rate: ${audio_adaptor_conf.downsample_rate}
98
+ audio_encoder_downsample_rate: 6
99
+ data_split_num: 256
100
+ batch_size_sample_max: 10
101
+ retry: 2000
102
+ batch_size_token_max: 6000
103
+ max_source_length: 12000
104
+ max_target_length: 2048
105
+ preprocessor_text: TextPreprocessHasRepeatedWords
106
+ preprocessor_text_conf:
107
+ max_ngram_length: 15
108
+ max_occurrences: 10
109
+ prompt_classes: MultiContextPrompt
110
+ prompt_conf:
111
+ max_neg_hotwords_num: 0
112
+ min_neg_hotwords_num: 0
113
+ use_hist: false
114
+ use_one_pass_result: true
115
+ use_hotwords: true
116
+ use_asr_hotwords: true
117
+ chinese_hotwords_list: null
118
+ english_hotwords_list: null
119
+ ctc_tokenizer: SenseVoiceTokenizer
120
+ ctc_target_normalize: true
121
+ ctc_tokenizer_conf:
122
+ vocab_path: null
123
+ is_multilingual: true
124
+ num_languages: 8749
125
+ min_source_length: 10
126
+ batch_size_scale_threshold: 3000
127
+ use_dynamic_output_ratio: 0.0
128
+ tokenizer: HuggingfaceTokenizer
129
+ tokenizer_conf:
130
+ init_param_path: ${llm_conf.init_param_path}
131
+ enable_tf32: true
132
+ debug: false
133
+ train_data_set_list: null
134
+ valid_data_set_list: null
135
+ init_param: null
136
+ output_dir: null
configuration.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b64a3a55d35bcbe2cf4d31f2d3ef25a423d3ba2ebff203298c27fa055f3c7612
3
+ size 398
example/en.mp3 ADDED
Binary file (57.4 kB). View file
 
example/ja.mp3 ADDED
Binary file (57.8 kB). View file
 
example/ko.mp3 ADDED
Binary file (27.9 kB). View file
 
example/yue.mp3 ADDED
Binary file (31.2 kB). View file
 
example/zh.mp3 ADDED
Binary file (45 kB). View file
 
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90f2548b670216f6ff9828f6b5148dc1cd4dd9a0bb6e3905c58d265212460afb
3
+ size 467729307
multilingual.tiktoken ADDED
The diff for this file is too large to render. See raw diff