saddam213 committed on
Commit
5ae4186
·
verified ·
1 Parent(s): 41d3bb9

Upload 8 files

Browse files
Gemma-3-12B-IT/config.json CHANGED
@@ -3,7 +3,6 @@
3
  "Gemma3ForConditionalGeneration"
4
  ],
5
  "boi_token_index": 255999,
6
- "dtype": "float32",
7
  "eoi_token_index": 256000,
8
  "eos_token_id": [
9
  1,
@@ -13,13 +12,13 @@
13
  "initializer_range": 0.02,
14
  "mm_tokens_per_image": 256,
15
  "model_type": "gemma3",
 
16
  "text_config": {
17
  "_sliding_window_pattern": 6,
18
  "attention_bias": false,
19
  "attention_dropout": 0.0,
20
  "attn_logit_softcapping": null,
21
  "cache_implementation": "hybrid",
22
- "dtype": "float32",
23
  "final_logit_softcapping": null,
24
  "head_dim": 256,
25
  "hidden_activation": "gelu_pytorch_tanh",
@@ -98,7 +97,6 @@
98
  "transformers_version": "4.57.3",
99
  "vision_config": {
100
  "attention_dropout": 0.0,
101
- "dtype": "float32",
102
  "hidden_act": "gelu_pytorch_tanh",
103
  "hidden_size": 1152,
104
  "image_size": 896,
@@ -111,4 +109,4 @@
111
  "patch_size": 14,
112
  "vision_use_head": false
113
  }
114
- }
 
3
  "Gemma3ForConditionalGeneration"
4
  ],
5
  "boi_token_index": 255999,
 
6
  "eoi_token_index": 256000,
7
  "eos_token_id": [
8
  1,
 
12
  "initializer_range": 0.02,
13
  "mm_tokens_per_image": 256,
14
  "model_type": "gemma3",
15
+ "torch_dtype": "bfloat16",
16
  "text_config": {
17
  "_sliding_window_pattern": 6,
18
  "attention_bias": false,
19
  "attention_dropout": 0.0,
20
  "attn_logit_softcapping": null,
21
  "cache_implementation": "hybrid",
 
22
  "final_logit_softcapping": null,
23
  "head_dim": 256,
24
  "hidden_activation": "gelu_pytorch_tanh",
 
97
  "transformers_version": "4.57.3",
98
  "vision_config": {
99
  "attention_dropout": 0.0,
 
100
  "hidden_act": "gelu_pytorch_tanh",
101
  "hidden_size": 1152,
102
  "image_size": 896,
 
109
  "patch_size": 14,
110
  "vision_use_head": false
111
  }
112
+ }
Gemma-3-12B-IT/generation_config.json CHANGED
@@ -8,4 +8,4 @@
8
  "top_k": 64,
9
  "top_p": 0.95,
10
  "transformers_version": "4.57.3"
11
- }
 
8
  "top_k": 64,
9
  "top_p": 0.95,
10
  "transformers_version": "4.57.3"
11
+ }
Gemma-3-12B-IT/model-00001-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4847447e92599833e8dbaa3067cd201c3bb5c052efa91f11ba891e43234f7832
3
+ size 4979902192
Gemma-3-12B-IT/model-00002-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:891bd54eed03cba9ee1e705533a02a8217fcc29f356e4a1f53e5fd0d178883ad
3
+ size 4931296592
Gemma-3-12B-IT/model-00003-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cee411d9d57324e50ce064a192cc5a858276d508611b12fc599e0c9767112e0
3
+ size 4931296656
Gemma-3-12B-IT/model-00004-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bc75a29a730c9e743cad013feda3b0991a913fafe787c58a1c6e20afad97723
3
+ size 4931296656
Gemma-3-12B-IT/model-00005-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed14bd4908c98fed9f61e8cd410167e0846de9abd78e0452ab092072e5d9252d
3
+ size 4601000928
Gemma-3-12B-IT/model.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff