Upload Gemma3ForConditionalGeneration (#3)

- Upload Gemma3ForConditionalGeneration (5b3dad501ce477b2820f9508a750b990af5df4e7)

Files changed (3)

config.json (changed)

@@ -3,6 +3,7 @@
     "Gemma3ForConditionalGeneration"
   ],
   "boi_token_index": 255999,
   "eoi_token_index": 256000,
   "eos_token_id": [
     1,
@@ -24,38 +25,6 @@
     "initializer_range": 0.02,
     "intermediate_size": 10240,
     "layer_types": [
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "full_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "full_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "full_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "full_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "sliding_attention",
-      "full_attention",
-      "sliding_attention",
-      "sliding_attention",
       "sliding_attention",
       "sliding_attention"
     ],
@@ -76,8 +45,7 @@
     "use_cache": true,
     "vocab_size": 262208
   },
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.56.0.dev0",
   "vision_config": {
     "attention_dropout": 0.0,
     "hidden_act": "gelu_pytorch_tanh",

     "Gemma3ForConditionalGeneration"
   ],
   "boi_token_index": 255999,
+  "dtype": "bfloat16",
   "eoi_token_index": 256000,
   "eos_token_id": [
     1,
     "initializer_range": 0.02,
     "intermediate_size": 10240,
     "layer_types": [
       "sliding_attention",
       "sliding_attention"
     ],
     "use_cache": true,
     "vocab_size": 262208
   },
+  "transformers_version": "4.56.1",
   "vision_config": {
     "attention_dropout": 0.0,
     "hidden_act": "gelu_pytorch_tanh",

generation_config.json (changed)

@@ -6,5 +6,5 @@
     106
   ],
   "pad_token_id": 0,
-  "transformers_version": "4.56.0.dev0"
 }

     106
   ],
   "pad_token_id": 0,
+  "transformers_version": "4.56.1"
 }

model.safetensors (changed)

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cf90459fa823642f18860212325d52bc76a2e0e520e70ab88d56d132396d673f
 size 11287536

 version https://git-lfs.github.com/spec/v1
+oid sha256:56dc37066c675420391d220a2ed601068b2eb092ed96d8e8d2ba4cd1f9de8e97
 size 11287536