Update app.py
app.py
CHANGED
@@ -27,8 +27,8 @@ _ = load_dotenv(find_dotenv())
 
 
 # access token with permission to access the model and PRO subscription
-HUGGINGFACEHUB_API_TOKEN = os.getenv("HF_ACCESS_READ")
-
+#HUGGINGFACEHUB_API_TOKEN = os.getenv("HF_ACCESS_READ")
+login(token=os.environ["HF_ACCESS_READ"])
 
 OAI_API_KEY=os.getenv("OPENAI_API_KEY")
 
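The first hunk replaces the unused token variable with an explicit login() call. A minimal sketch of the resulting auth flow, assuming the HF_ACCESS_READ secret is configured for the Space (as the diff implies):

import os
from huggingface_hub import login

# login() registers the token process-wide, so subsequent huggingface_hub
# calls (InferenceClient requests, downloads of gated models) authenticate
# automatically instead of the token being passed to each call.
login(token=os.environ["HF_ACCESS_READ"])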
@@ -72,14 +72,9 @@ splittet = False
 ##############################################
 print ("Inf.Client")
 #client = InferenceClient("https://api-inference.huggingface.co/models/meta-llama/Llama-2-70b-chat-hf")
-
+client = InferenceClient("https://ybdhvwle4ksrawzo.eu-west-1.aws.endpoints.huggingface.cloud")
 #client = InferenceClient(model="TheBloke/Yi-34B-Chat-GGUF")
 
-#list of models available
-client = InferenceClient()
-print("List of models ......................:")
-print(client.list_deployed_models("text-generation-inference"))
-
 ##############################################
 # tokenizer for generating prompt
 ##############################################
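The second hunk removes the ad-hoc model listing and points the client at a dedicated Inference Endpoint instead of the serverless API. A hedged sketch of querying such an endpoint; the URL is taken from the diff, while the prompt and parameters are illustrative:

from huggingface_hub import InferenceClient

# The client posts to the endpoint's text-generation-inference server.
client = InferenceClient("https://ybdhvwle4ksrawzo.eu-west-1.aws.endpoints.huggingface.cloud")

# text_generation() returns the generated continuation as a plain string.
answer = client.text_generation("What is a dedicated Inference Endpoint?",
                                max_new_tokens=256)
print(answer)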
@@ -87,7 +82,21 @@ print ("Tokenizer")
 #tokenizer = AutoTokenizer.from_pretrained("meta-llama/Llama-2-70b-chat-hf")
 #tokenizer = AutoTokenizer.from_pretrained("TheBloke/Yi-34B-Chat-GGUF")
 #tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
-tokenizer =
+tokenizer = AutoTokenizer.from_pretrained("mistralai/Mixtral-8x7B-Instruct-v0.1")
+
+##############################################
+# For testing:
+#list of models available
+#client = InferenceClient()
+#print("List of models ......................:")
+#print(client.list_deployed_models("text-generation-inference"))
+
+#displayed on 17.12.2023:
+#{'text-generation': ['bigcode/starcoder','bigscience/bloom','codellama/CodeLlama-13b-hf','codellama/CodeLlama-34b-Instruct-hf','HuggingFaceH4/zephyr-7b-beta','HuggingFaceM4/idefics-80b-instruct', 'meta-llama/Llama-2-70b-chat-hf',
+#'mistralai/Mistral-7B-Instruct-v0.1','mistralai/Mistral-7B-v0.1', 'OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5','openchat/openchat_3.5','TheBloke/vicuna-7B-v1.5-GPTQ','tiiuae/falcon-180B-chat','tiiuae/falcon-7b',
+#'tiiuae/falcon-7b-instruct'],'text2text-generation': ['google/flan-t5-xxl']}
+
+
 
 
 #################################################
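The third hunk sets the tokenizer to Mixtral-8x7B-Instruct and keeps the model-listing snippet only as a commented-out test block. Since the section is headed "tokenizer for generating prompt", a plausible sketch of that usage, with an illustrative chat history (the real app would build it from user input):

from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("mistralai/Mixtral-8x7B-Instruct-v0.1")

# Illustrative single-turn conversation.
history = [{"role": "user", "content": "What is an Inference Endpoint?"}]

# apply_chat_template() renders the messages into Mixtral's expected
# [INST] ... [/INST] prompt format; tokenize=False returns a string.
prompt = tokenizer.apply_chat_template(history, tokenize=False,
                                       add_generation_prompt=True)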