avinash committed
Commit · 299633b
1 Parent(s): d425d6c

added tiny llama

Files changed:
- app.py +14 -8
- asr.py +1 -2
- llm_agent.py +19 -0
- requirements.txt +1 -1
app.py
CHANGED
@@ -1,17 +1,23 @@
 import gradio as gr
 from asr import transcribe_audio
+from llm_agent import get_llm_reply
 
-def …
+def voice_to_reply(audio):
     if audio is None:
-        return "No audio received!"
-    …
+        return "No audio received!", "..."
+    text = transcribe_audio(audio)
+    reply = get_llm_reply(text)
+    return text, reply
 
 ui = gr.Interface(
-    fn=…
-    inputs=gr.Audio(type="filepath", label="Upload…
-    outputs=…
-    …
-    …
+    fn=voice_to_reply,
+    inputs=gr.Audio(type="filepath", label="Upload voice (.wav or .mp3)"),
+    outputs=[
+        gr.Textbox(label="📝 Transcribed Text"),
+        gr.Textbox(label="🤖 LLM Reply")
+    ],
+    title="VoiceFreight AI v1: ASR + LLM",
+    description="Upload a voice file. ASR + TinyLlama gives you a response!"
 )
 
 if __name__ == "__main__":
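The diff view cuts off both panes at the __main__ guard, so the launch line itself is not visible. A minimal sketch of the likely ending, assuming the standard Gradio entry point; the exact launch arguments are an assumption, not part of the visible commit:

# Assumed continuation of app.py (truncated in the diff view above):
if __name__ == "__main__":
    ui.launch()  # standard Gradio launch; any arguments are not visible in the commit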
asr.py
CHANGED
@@ -1,7 +1,6 @@
-# asr.py
 import whisper
 
-model = whisper.load_model("tiny")
+model = whisper.load_model("tiny")
 
 def transcribe_audio(file_path: str) -> str:
     result = model.transcribe(file_path)
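The function body is truncated in both panes of this diff. For orientation, a minimal sketch of the complete module as the diff implies it, assuming the standard openai-whisper API; the final return line is a guess, not part of the visible commit:

# asr.py sketch: only the trailing return is assumed, the rest mirrors the diff
import whisper

model = whisper.load_model("tiny")  # smallest Whisper checkpoint: fastest, least accurate

def transcribe_audio(file_path: str) -> str:
    result = model.transcribe(file_path)
    return result["text"]  # assumption: transcribe() returns a dict with a "text" key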
llm_agent.py
ADDED
@@ -0,0 +1,19 @@
+from transformers import AutoTokenizer, AutoModelForCausalLM
+import torch
+
+# Load the model (TinyLlama)
+model_name = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name)
+
+def get_llm_reply(user_input: str) -> str:
+    prompt = f"User: {user_input}\nAssistant:"
+    inputs = tokenizer(prompt, return_tensors="pt")
+    output = model.generate(
+        **inputs,
+        max_new_tokens=100,
+        do_sample=True,
+        temperature=0.7
+    )
+    response = tokenizer.decode(output[0], skip_special_tokens=True)
+    return response.replace(prompt, "").strip()
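Two caveats about this file: TinyLlama-1.1B-Chat ships with a chat template, so the bare "User:/Assistant:" prompt works but may sit off-distribution, and stripping the prompt with replace() breaks if the model echoes it with different whitespace. A hedged alternative, not part of this commit, that reuses the tokenizer and model objects above, applies the built-in chat template, and decodes only the newly generated tokens:

# Hypothetical variant of get_llm_reply; name and approach are illustrative.
def get_llm_reply_templated(user_input: str) -> str:
    messages = [{"role": "user", "content": user_input}]
    input_ids = tokenizer.apply_chat_template(
        messages, add_generation_prompt=True, return_tensors="pt"
    )
    output = model.generate(input_ids, max_new_tokens=100, do_sample=True, temperature=0.7)
    # Slice off the prompt tokens instead of string-replacing the prompt text
    return tokenizer.decode(output[0][input_ids.shape[-1]:], skip_special_tokens=True).strip()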
requirements.txt
CHANGED
@@ -3,4 +3,4 @@ openai-whisper
 transformers
 torch
 TTS
-accelerate
+accelerate
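One common reason to keep accelerate in the dependency set is that it lets transformers place model weights automatically. A hedged sketch of how llm_agent.py could take advantage of that; this tweak is an assumption, not part of the commit:

# Hypothetical change to the from_pretrained call in llm_agent.py:
import torch
from transformers import AutoModelForCausalLM

model = AutoModelForCausalLM.from_pretrained(
    "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
    device_map="auto",          # requires the accelerate package; picks GPU/CPU automatically
    torch_dtype=torch.float16,  # assumption: halves memory on GPU; omit on CPU-only hosts
)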