Update app.py
app.py CHANGED
@@ -18,12 +18,12 @@ model_single = model_single.to("cuda")
 
 generation_config_single = model_single.default_generation_config
 
-
-
-
-
-
-
+model_think = PeftModel.from_pretrained(
+    model_single,
+    MODEL_BASE_THINK,
+    device_map="auto",
+    torch_dtype=torch.float16,
+)
 
 # # ---------------------------------
 # # MULTI-TURN MODEL SETUP
@@ -58,7 +58,7 @@ def think_infer(audio_file, prompt_text):
     try:
         sound = llava.Sound(audio_file)
         full_prompt = f"<sound>\n{prompt_text}"
-        response =
+        response = model_think.generate_content([sound, full_prompt], generation_config=generation_config_single)
         return response
     except Exception as e:
         return f"❌ Error: {str(e)}"
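In context, the commit loads a PEFT adapter on top of the already-initialised single-turn model and routes think_infer through the wrapped model. The sketch below shows one way the surrounding app.py could fit together; the import lines, the llava.load call, the placeholder MODEL_BASE_* values, and the Gradio wiring are assumptions for illustration, not part of this diff.

import torch
import gradio as gr
import llava                      # audio-language model package used by this app
from peft import PeftModel

# Placeholder identifiers; the real values are defined earlier in app.py and are not shown in this diff.
MODEL_BASE_SINGLE = "base-model-id-or-path"
MODEL_BASE_THINK = "think-adapter-id-or-path"

# Assumed single-turn setup, mirroring the context lines of the first hunk.
model_single = llava.load(MODEL_BASE_SINGLE)          # assumed loader
model_single = model_single.to("cuda")
generation_config_single = model_single.default_generation_config

# The change: wrap the base model with the "think" PEFT adapter instead of loading a second full model.
model_think = PeftModel.from_pretrained(
    model_single,
    MODEL_BASE_THINK,
    device_map="auto",
    torch_dtype=torch.float16,
)

def think_infer(audio_file, prompt_text):
    try:
        sound = llava.Sound(audio_file)
        full_prompt = f"<sound>\n{prompt_text}"
        # The second hunk points generation at the adapter-wrapped model.
        response = model_think.generate_content(
            [sound, full_prompt], generation_config=generation_config_single
        )
        return response
    except Exception as e:
        return f"❌ Error: {str(e)}"

# Hypothetical Gradio wiring for the Space; the actual UI layout is not part of this diff.
demo = gr.Interface(
    fn=think_infer,
    inputs=[gr.Audio(type="filepath"), gr.Textbox(label="Prompt")],
    outputs=gr.Textbox(label="Response"),
)
demo.launch()

Because PeftModel.from_pretrained attaches only the adapter weights to the model_single instance already on the GPU, the "think" variant adds little memory on top of the base model, which is presumably why the change reuses model_single rather than loading a second checkpoint.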