shangeth committed on
Commit
7eacacf
1 Parent(s): 64a7de7

Upload model

Browse files
Files changed (2) hide show
  1. README.md +44 -45
  2. config.json +1 -6
README.md CHANGED
@@ -1,58 +1,57 @@
1
  ---
 
 
2
  license: apache-2.0
 
3
  datasets:
4
  - mozilla-foundation/common_voice_16_1
5
  - openslr/librispeech_asr
6
- language:
7
- - en
8
  metrics:
9
  - wer
10
- library_name: transformers
11
  model-index:
12
  - name: SpeechLLM
13
  results:
14
- - task:
15
- name: Automatic Speech Recognition
16
- type: automatic-speech-recognition
17
- dataset:
18
- name: LibriSpeech (clean)
19
- type: librispeech_asr
20
- config: clean
21
- split: test
22
- args:
23
- language: en
24
- metrics:
25
- - name: Test WER
26
- type: wer
27
- value: 12.3
28
- - task:
29
- name: Automatic Speech Recognition
30
- type: automatic-speech-recognition
31
- dataset:
32
- name: LibriSpeech (other)
33
- type: librispeech_asr
34
- config: other
35
- split: test
36
- args:
37
- language: en
38
- metrics:
39
- - name: Test WER
40
- type: wer
41
- value: 18.9
42
-
43
- - task:
44
- name: Automatic Speech Recognition
45
- type: automatic-speech-recognition
46
- dataset:
47
- name: Common Voice 16.1
48
- type: common_voice_16_1
49
- split: test
50
- args:
51
- language: en
52
- metrics:
53
- - name: Test WER
54
- type: wer
55
- value: 25.01
56
  ---
57
 
58
  # SpeechLLM
 
1
  ---
2
+ language:
3
+ - en
4
  license: apache-2.0
5
+ library_name: transformers
6
  datasets:
7
  - mozilla-foundation/common_voice_16_1
8
  - openslr/librispeech_asr
 
 
9
  metrics:
10
  - wer
 
11
  model-index:
12
  - name: SpeechLLM
13
  results:
14
+ - task:
15
+ type: automatic-speech-recognition
16
+ name: Automatic Speech Recognition
17
+ dataset:
18
+ name: LibriSpeech (clean)
19
+ type: librispeech_asr
20
+ config: clean
21
+ split: test
22
+ args:
23
+ language: en
24
+ metrics:
25
+ - type: wer
26
+ value: 12.3
27
+ name: Test WER
28
+ - task:
29
+ type: automatic-speech-recognition
30
+ name: Automatic Speech Recognition
31
+ dataset:
32
+ name: LibriSpeech (other)
33
+ type: librispeech_asr
34
+ config: other
35
+ split: test
36
+ args:
37
+ language: en
38
+ metrics:
39
+ - type: wer
40
+ value: 18.9
41
+ name: Test WER
42
+ - task:
43
+ type: automatic-speech-recognition
44
+ name: Automatic Speech Recognition
45
+ dataset:
46
+ name: Common Voice 16.1
47
+ type: common_voice_16_1
48
+ split: test
49
+ args:
50
+ language: en
51
+ metrics:
52
+ - type: wer
53
+ value: 25.01
54
+ name: Test WER
 
55
  ---
56
 
57
  # SpeechLLM
config.json CHANGED
@@ -1,14 +1,9 @@
1
  {
2
- "architectures": [
3
- "SpeechLLMModel"
4
- ],
5
  "audio_enc_dim": 1280,
6
  "auto_map": {
7
- "AutoConfig": "config.SpeechLLMModelConfig",
8
- "AutoModel": "model.SpeechLLMModel"
9
  },
10
  "llm_dim": 2048,
11
  "model_type": "custom_model",
12
- "torch_dtype": "float32",
13
  "transformers_version": "4.38.2"
14
  }
 
1
  {
 
 
 
2
  "audio_enc_dim": 1280,
3
  "auto_map": {
4
+ "AutoConfig": "config.SpeechLLMModelConfig"
 
5
  },
6
  "llm_dim": 2048,
7
  "model_type": "custom_model",
 
8
  "transformers_version": "4.38.2"
9
  }