Spaces:

pinyuchen
/

Gradient-Cuff-Jailbreak-Detector-Granite-2B

Sleeping

gregH committed on Dec 7, 2024

Commit

c3f6d74

verified ·

1 Parent(s): 96cb79d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -110,7 +110,7 @@ def engine(input_embeds):
             batch_input_embeds = input_embeds[start:start+batch_size]
             outputs = m.generate(
                 inputs_embeds = batch_input_embeds.to("cuda"),
-                max_new_tokens = 512,
                 do_sample = True,
                 temperature = 0.6,
                 top_p = 0.9,
@@ -126,7 +126,7 @@ def chat_engine(input_ids):
     with torch.no_grad():
         outputs = m.generate(
             input_ids = input_ids.to("cuda"),
-            max_new_tokens = 64,
             do_sample = True,
             temperature = 0.6,
             top_p = 0.9,

             batch_input_embeds = input_embeds[start:start+batch_size]
             outputs = m.generate(
                 inputs_embeds = batch_input_embeds.to("cuda"),
+                max_new_tokens = 16,
                 do_sample = True,
                 temperature = 0.6,
                 top_p = 0.9,
     with torch.no_grad():
         outputs = m.generate(
             input_ids = input_ids.to("cuda"),
+            max_new_tokens = 512,
             do_sample = True,
             temperature = 0.6,
             top_p = 0.9,