lmassaron
/

gemma-3-4b-finsentiment

Image-Text-to-Text

text-generation-inference

4-bit precision

Model card · Files and versions

lmassaron committed on Sep 25

Commit

4af2778

·

verified ·

1 Parent(s): d2dc234

Upload Gemma3ForConditionalGeneration

Files changed (3) hide show

config.json +1 -1
generation_config.json +1 -0
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -15,7 +15,7 @@
   "quantization_config": {
     "_load_in_4bit": true,
     "_load_in_8bit": false,
-    "bnb_4bit_compute_dtype": "float16",
     "bnb_4bit_quant_storage": "uint8",
     "bnb_4bit_quant_type": "nf4",
     "bnb_4bit_use_double_quant": true,

   "quantization_config": {
     "_load_in_4bit": true,
     "_load_in_8bit": false,
+    "bnb_4bit_compute_dtype": "bfloat16",
     "bnb_4bit_quant_storage": "uint8",
     "bnb_4bit_quant_type": "nf4",
     "bnb_4bit_use_double_quant": true,

generation_config.json CHANGED Viewed

@@ -1,5 +1,6 @@
 {
   "bos_token_id": 2,
   "do_sample": true,
   "eos_token_id": [
     1,

 {
   "bos_token_id": 2,
+  "cache_implementation": "hybrid",
   "do_sample": true,
   "eos_token_id": [
     1,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b6c01cfa2528370548ee058dd6856aefb55b9b32645b158986ac6722207c1a8f
-size 4589674328

 version https://git-lfs.github.com/spec/v1
+oid sha256:2d3f44a10c2f50aeb6fbde5d654b6045350c1c5d14c37c3e185107eab2602d07
+size 3247160009