Spaces:

UCODE
/

agent

Sleeping

abenkbp committed on Sep 15, 2024

Commit

5180d45

1 Parent(s): 23afa91

rollback

Files changed (1) hide show

data/models/llama3-1-8b.py CHANGED Viewed

@@ -16,12 +16,12 @@ pipeline = transformers.pipeline(
     "text-generation",
     model=model_id,
     model_kwargs={"torch_dtype": torch.bfloat16},
-    device="cpu",
     token=api_key
 )
 @app.route('/chat', methods=['POST'])
-#@spaces.GPU(enable_queue=True)
 def chat_completion():
     data = request.json

     "text-generation",
     model=model_id,
     model_kwargs={"torch_dtype": torch.bfloat16},
+    device="gpu",
     token=api_key
 )
 @app.route('/chat', methods=['POST'])
+@spaces.GPU(enable_queue=True)
 def chat_completion():
     data = request.json