Spaces:

dodd869
/

ai

Sleeping

ai / app.py

Update app.py

4c03b44 verified 2 months ago

1.47 kB

	import os
	import gradio as gr
	from huggingface_hub import InferenceClient
	import requests

	# Catalogue query: models with at least 64B parameters served by the
	# "novita" inference provider, sorted by last modification.
	url = "https://huggingface.co/models-json?num_parameters=min%3A64B&inference_provider=novita&sort=modified&withCount=true"

	# Fetch the model list once at startup. The timeout keeps a stalled
	# connection from hanging the app forever; on any network or decoding
	# failure we fall back to an empty list, which the dropdown already
	# tolerates, instead of crashing before the UI is built.
	try:
	    res = requests.get(url, timeout=10).json()
	except (requests.RequestException, ValueError) as err:
	    print(f"Could not load the model list from {url}: {err}")
	    res = {}

	# Guard against an unexpected payload shape (e.g. a JSON list or entries
	# without an id) so a catalogue change cannot break startup either.
	models = res.get('models', []) if isinstance(res, dict) else []
	model_ids = [m['id'] for m in models if isinstance(m, dict) and 'id' in m]

	# HF_TOKEN must be set in the environment; a missing token raises KeyError
	# here, at startup, rather than on the first chat request.
	client = InferenceClient(provider="novita", api_key=os.environ["HF_TOKEN"])

	def _build_messages(history, message):
	    """Turn prior chat turns plus the new prompt into chat-completion messages.

	    Assumes each history entry is a ``(user_text, bot_text)`` pair, which is
	    the shape ``respond`` itself appends. Parts that are empty or not plain
	    strings are skipped.
	    """
	    messages = []
	    for user_text, bot_text in history:
	        if isinstance(user_text, str) and user_text:
	            messages.append({"role": "user", "content": user_text})
	        if isinstance(bot_text, str) and bot_text:
	            messages.append({"role": "assistant", "content": bot_text})
	    messages.append({"role": "user", "content": message})
	    return messages


	def respond(message, history, model):
	    """Stream the model's reply to *message* into the chat history.

	    Args:
	        message: Text the user submitted.
	        history: List of ``(user_text, bot_text)`` pairs shown so far; it is
	            extended in place. ``None`` is treated as an empty history.
	        model: Model id passed to the inference client.

	    Yields:
	        ``("", history)`` pairs. The empty string is the new value for the
	        first output (the input textbox) and ``history`` carries the reply
	        accumulated so far.
	    """
	    if history is None:
	        history = []

	    # Nothing to ask: leave the conversation untouched and skip the API call.
	    if not message or not message.strip():
	        yield "", history
	        return

	    # Build the request before appending the pending turn so the new prompt
	    # is not included twice. Earlier turns are sent along so the model keeps
	    # the conversation context.
	    messages = _build_messages(history, message)

	    # Show the user's message immediately, with an empty reply placeholder.
	    history.append((message, ""))
	    yield "", history

	    full_reply = ""
	    stream = client.chat.completions.create(
	        model=model,
	        messages=messages,
	        stream=True,
	    )
	    for chunk in stream:
	        # Some chunks carry no choices; skip them.
	        if not chunk.choices:
	            continue
	        piece = getattr(chunk.choices[0].delta, "content", None)
	        if piece:
	            full_reply += piece
	            # Replace the last turn so the UI shows the text received so far.
	            history[-1] = (message, full_reply)
	            yield "", history

	# Chat page layout: heading, transcript, prompt box, model picker, then a
	# row holding the Send and Clear buttons.
	with gr.Blocks() as demo:
	    gr.Markdown("## AI")
	    chatbot = gr.Chatbot(height=400)
	    msg = gr.Textbox(label="Ask me smth")

	    # Preselect the first listed model; use an empty value when none exist.
	    if model_ids:
	        initial_model = model_ids[0]
	    else:
	        initial_model = ""
	    model_dd = gr.Dropdown(model_ids, label="Model", value=initial_model)

	    with gr.Row():
	        submit_btn = gr.Button("Send")
	        clear = gr.Button("Clear")

	    # Pressing Enter in the textbox and clicking Send run the same handler
	    # with the same inputs and outputs.
	    handler_inputs = [msg, chatbot, model_dd]
	    handler_outputs = [msg, chatbot]
	    for register in (msg.submit, submit_btn.click):
	        register(respond, handler_inputs, handler_outputs)

	    # Clear sends None to the chatbot component; registered with queue=False.
	    clear.click(fn=lambda: None, inputs=None, outputs=chatbot, queue=False)

	# Enable queuing, then start the app.
	demo.queue().launch()