Update modeling_typhoon2audio.py
modeling_typhoon2audio.py CHANGED
@@ -18,6 +18,7 @@ from transformers import (
     WhisperModel,
     PreTrainedModel,
     AutoTokenizer,
+    AutoConfig,
     AutoModelForCausalLM,
 )
 from transformers.cache_utils import Cache, StaticCache
@@ -63,6 +64,7 @@ from transformers.modeling_utils import (
     apply_chunking_to_forward,
     find_pruneable_heads_and_indices,
     prune_linear_layer,
+    no_init_weights
 )
 from transformers.models.bert.configuration_bert import BertConfig
 
@@ -841,9 +843,9 @@ class Typhoon2AudioForConditionalGeneration(PreTrainedModel, GenerationMixin):
         self.second_stride = config.second_stride
 
         # 2. LLM (e.g., Llama3)
-        self.llama_model = AutoModelForCausalLM.from_pretrained(
-            config.llama_base_model
-        )
+        with no_init_weights(_enable=True):
+            llm_config = AutoConfig.from_pretrained(config.llama_base_model)
+            self.llama_model = AutoModelForCausalLM.from_config(llm_config, attn_implementation=attn_implementation)
         # tokenizer
         self.llama_tokenizer = AutoTokenizer.from_pretrained(
             config.llama_base_model, use_fast=False