Update app.py
app.py
CHANGED
@@ -182,7 +182,7 @@ def document_storage_chroma(splits):

#Prepare the vector store...
#prepare the DB so that documents can be stored vectorized in the Chroma DB
-def document_retrieval_chroma(
+def document_retrieval_chroma():
    #OpenAI embeddings -------------------------------
    embeddings = OpenAIEmbeddings()

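In the new version `document_retrieval_chroma()` takes no arguments and, judging by the later call `db = document_retrieval_chroma()`, returns the Chroma vector store that `document_storage_chroma(splits)` filled earlier. A minimal sketch of such a function, assuming the LangChain `Chroma` wrapper; the persist directory name is an assumption and does not come from this diff:

from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.vectorstores import Chroma

def document_retrieval_chroma():
    #OpenAI embeddings - must be the same embedding model that was used
    #when the documents were written by document_storage_chroma()
    embeddings = OpenAIEmbeddings()
    #re-open the persisted collection; "./chroma_db" is an assumed path
    db = Chroma(embedding_function=embeddings, persist_directory="./chroma_db")
    return db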
@@ -259,24 +259,25 @@ def generate_prompt_with_history_openai(prompt, history):
##############################################
def generate(text, history, rag_option, model_option, temperature=0.5, max_new_tokens=4048, top_p=0.6, repetition_penalty=1.3):
    #with RAG
-
-
-
-
-    #{context} Question: {text}"""
+    if (rag_option is None):
+        raise gr.Error("Retrieval Augmented Generation ist erforderlich.")
+    if (prompt == ""):
+        raise gr.Error("Prompt ist erforderlich.")

    try:
-
-
-
-
-
-
-
-
-
-
-
+        if (rag_option == "An"):
+            #only needs to be run once...
+            if not splittet:
+                splits = document_loading_splitting()
+                document_storage_chroma(splits)
+            db = document_retrieval_chroma()
+            #with RAG:
+            neu_text_mit_chunks = rag_chain(text, db)
+            prompt = generate_prompt_with_history_openai(neu_text_mit_chunks, history)
+        else:
+            prompt = generate_prompt_with_history_openai(text, history)
+
+        #query the model (with RAG: with the chunks from the vector store, without: only prompt and history)
        #payload = tokenizer.apply_chat_template([{"role":"user","content":prompt}],tokenize=False)
        payload = tokenizer.apply_chat_template(prompt,tokenize=False)
        result = client.text_generation(
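The removed fragment `#{context} Question: {text}"""` suggests the context-plus-question prompt used to be assembled inline; in the new code that work is delegated to `rag_chain(text, db)` and its result is passed to `generate_prompt_with_history_openai`. A rough sketch of what such a helper could look like, assuming a plain similarity search on the Chroma store; the number of chunks and the template wording are assumptions, not taken from the diff:

def rag_chain(text, db, k=3):
    #fetch the k most similar chunks from the vector store (k=3 is an assumption)
    docs = db.similarity_search(text, k=k)
    context = "\n\n".join(doc.page_content for doc in docs)
    #prepend the retrieved chunks to the question, mirroring the removed
    #"{context} Question: {text}" template
    return f"Answer using only the following context:\n\n{context}\n\nQuestion: {text}"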
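One detail of the new guard clauses: inside `generate()` the variable `prompt` is only assigned further down (the user input arrives as the `text` parameter), so `if (prompt == ""):` would raise an UnboundLocalError before the intended `gr.Error`, unless the function also declares `prompt` global somewhere not shown here. A sketch of the same guard with the check applied to the parameter instead:

    if (text == ""):
        raise gr.Error("Prompt ist erforderlich.")

Likewise, `splittet` is presumably a module-level flag set elsewhere in app.py that keeps the load/split/store pass from running on every request; it is not visible in this diff.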
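The trailing context lines show the other half of the change: the commented-out payload line wrapped `prompt` in a single user message, while the new call passes `prompt` straight to `tokenizer.apply_chat_template(..., tokenize=False)`, which works if `generate_prompt_with_history_openai` already returns a list of {"role": ..., "content": ...} messages. The hunk cuts off right after `result = client.text_generation(`, so the arguments are not visible; a hedged sketch of how the call presumably continues, wiring the `generate()` parameters through to `huggingface_hub.InferenceClient.text_generation` (the keyword set is an assumption):

result = client.text_generation(
    payload,
    #pass-through of the generate() parameters is assumed; only the
    #truncated first line of this call appears in the diff
    max_new_tokens=max_new_tokens,
    temperature=temperature,
    top_p=top_p,
    repetition_penalty=repetition_penalty,
)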