abenkbp commited on
Commit
5180d45
·
1 Parent(s): 23afa91
Files changed (1) hide show
  1. data/models/llama3-1-8b.py +2 -2
data/models/llama3-1-8b.py CHANGED
@@ -16,12 +16,12 @@ pipeline = transformers.pipeline(
16
  "text-generation",
17
  model=model_id,
18
  model_kwargs={"torch_dtype": torch.bfloat16},
19
- device="cpu",
20
  token=api_key
21
  )
22
 
23
  @app.route('/chat', methods=['POST'])
24
- #@spaces.GPU(enable_queue=True)
25
  def chat_completion():
26
  data = request.json
27
 
 
16
  "text-generation",
17
  model=model_id,
18
  model_kwargs={"torch_dtype": torch.bfloat16},
19
+ device="gpu",
20
  token=api_key
21
  )
22
 
23
  @app.route('/chat', methods=['POST'])
24
+ @spaces.GPU(enable_queue=True)
25
  def chat_completion():
26
  data = request.json
27