avinash committed on
Commit
e792350
·
1 Parent(s): bf6f7a9

updated ui2

Browse files
Files changed (4) hide show
  1. loader.py +10 -0
  2. rag_chain.py +20 -0
  3. tts.py +0 -8
  4. tts_engine.py +7 -0
loader.py ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ # loader.py
2
+ from langchain.document_loaders import PyPDFLoader
3
+ from langchain.text_splitter import RecursiveCharacterTextSplitter
4
+
5
def load_and_split_pdf(pdf_path, chunk_size=1000, chunk_overlap=200):
    """Load a PDF and split its contents into overlapping chunks.

    Args:
        pdf_path: Path of the PDF file handed to ``PyPDFLoader``.
        chunk_size: Maximum size of each chunk, forwarded to
            ``RecursiveCharacterTextSplitter`` (default 1000, the value
            that was previously hard-coded).
        chunk_overlap: Overlap between consecutive chunks, forwarded to
            ``RecursiveCharacterTextSplitter`` (default 200, the value
            that was previously hard-coded).

    Returns:
        The result of ``RecursiveCharacterTextSplitter.split_documents``
        applied to the documents loaded from the PDF.
    """
    docs = PyPDFLoader(pdf_path).load()

    splitter = RecursiveCharacterTextSplitter(
        chunk_size=chunk_size,
        chunk_overlap=chunk_overlap,
    )
    return splitter.split_documents(docs)
rag_chain.py ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # rag_chain.py
2
+ from langchain.vectorstores import Chroma
3
+ from langchain.embeddings import HuggingFaceEmbeddings
4
+ from langchain.chains import RetrievalQA
5
+ from langchain.llms import HuggingFaceHub
6
+
7
def setup_rag_chain(docs):
    """Build a retrieval QA chain over ``docs``.

    The documents are embedded with the
    ``sentence-transformers/all-MiniLM-L6-v2`` model, indexed in a Chroma
    vector store, and exposed through a retriever that feeds a Hugging Face
    Hub LLM via ``RetrievalQA``.

    Args:
        docs: Documents to index, passed straight to
            ``Chroma.from_documents``.

    Returns:
        The chain created by ``RetrievalQA.from_chain_type``.
    """
    embeddings = HuggingFaceEmbeddings(
        model_name="sentence-transformers/all-MiniLM-L6-v2"
    )
    vectorstore = Chroma.from_documents(docs, embedding=embeddings)

    retriever = vectorstore.as_retriever()

    # Replace this with your own hosted LLaMA 3.1 if needed
    llm = HuggingFaceHub(
        repo_id="meta-llama/Meta-Llama-3-8B-Instruct",
        # The Hugging Face text-generation task limits output length with
        # ``max_new_tokens``; ``max_tokens`` is not one of its parameters.
        model_kwargs={"temperature": 0.3, "max_new_tokens": 512},
    )

    qa_chain = RetrievalQA.from_chain_type(llm=llm, retriever=retriever)
    return qa_chain
tts.py DELETED
@@ -1,8 +0,0 @@
1
- from TTS.api import TTS
2
-
3
-
4
- tts = TTS(model_name="tts_models/en/ljspeech/tacotron2-DDC", progress_bar=False, gpu=False)
5
-
6
- def generate_speech(text, filename="output.wav"):
7
- tts.tts_to_file(text=text, file_path=filename)
8
- return filename
 
 
 
 
 
 
 
 
 
tts_engine.py ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ from TTS.api import TTS
2
+
3
# Shared synthesizer, created once when this module is imported (gpu=False).
tts = TTS(gpu=False, model_name="tts_models/en/ljspeech/tacotron2-DDC")


def generate_voice(text, path="podcast.wav"):
    """Synthesize ``text`` into an audio file at ``path`` and return ``path``."""
    tts.tts_to_file(file_path=path, text=text)
    return path