skit-ai
/

speechllm-2B

Feature Extraction

speech-language

Model card Files Files and versions Community

shangeth committed on Jun 25, 2024

Commit

8252cc5

·

verified ·

1 Parent(s): fbdf999

generate_meta update

Files changed (2) hide show

README.md +3 -3
config.json +1 -6

README.md CHANGED Viewed

@@ -3,6 +3,9 @@ language:
 - en
 license: apache-2.0
 library_name: transformers
 datasets:
 - mozilla-foundation/common_voice_16_1
 - openslr/librispeech_asr
@@ -97,9 +100,6 @@ model-index:
     - type: accuracy
       value: 64.57
       name: Test Accent Accuracy
-tags:
-- multi-modal
-- speech-language
 ---
 # SpeechLLM

 - en
 license: apache-2.0
 library_name: transformers
+tags:
+- multi-modal
+- speech-language
 datasets:
 - mozilla-foundation/common_voice_16_1
 - openslr/librispeech_asr
     - type: accuracy
       value: 64.57
       name: Test Accent Accuracy
 ---
 # SpeechLLM

config.json CHANGED Viewed

@@ -1,18 +1,13 @@
 {
-  "architectures": [
-    "SpeechLLMModel"
-  ],
   "audio_enc_dim": 1280,
   "audio_encoder_name": "facebook/hubert-xlarge-ll60k",
   "audio_processor_name": "facebook/hubert-large-ls960-ft",
   "auto_map": {
-    "AutoConfig": "config.SpeechLLMModelConfig",
-    "AutoModel": "model.SpeechLLMModel"
   },
   "llm_dim": 2048,
   "llm_model_checkpoint": "hf_repo/llm_model_checkpoint",
   "llm_model_name": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
   "model_type": "custom_model",
-  "torch_dtype": "float32",
   "transformers_version": "4.38.2"
 }

 {
   "audio_enc_dim": 1280,
   "audio_encoder_name": "facebook/hubert-xlarge-ll60k",
   "audio_processor_name": "facebook/hubert-large-ls960-ft",
   "auto_map": {
+    "AutoConfig": "config.SpeechLLMModelConfig"
   },
   "llm_dim": 2048,
   "llm_model_checkpoint": "hf_repo/llm_model_checkpoint",
   "llm_model_name": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
   "model_type": "custom_model",
   "transformers_version": "4.38.2"
 }