gimarchetti committed on
Commit
8c75a6f
·
verified ·
1 Parent(s): 3c8125d

Upload PaliGemmaForConditionalGeneration

Browse files

PaliGemma 3B trained on ROCO datasets for 6 epochs

README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
 
2
  library_name: transformers
3
  license: gemma
4
- base_model: google/paligemma-3b-pt-448
5
  tags:
6
  - generated_from_trainer
7
  model-index:
 
1
  ---
2
+ base_model: google/paligemma-3b-pt-448
3
  library_name: transformers
4
  license: gemma
 
5
  tags:
6
  - generated_from_trainer
7
  model-index:
config.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "_name_or_path": "google/paligemma-3b-pt-448",
 
3
  "architectures": [
4
  "PaliGemmaForConditionalGeneration"
5
  ],
6
  "bos_token_id": 2,
7
  "eos_token_id": 1,
8
  "hidden_size": 2048,
9
- "ignore_index": -100,
10
  "image_token_index": 257152,
11
  "model_type": "paligemma",
12
  "pad_token_id": 0,
@@ -22,8 +22,8 @@
22
  "torch_dtype": "float32",
23
  "vocab_size": 257216
24
  },
25
- "torch_dtype": "bfloat16",
26
- "transformers_version": "4.44.2",
27
  "vision_config": {
28
  "hidden_size": 1152,
29
  "image_size": 448,
 
1
  {
2
+ "_name_or_path": "content/paligemma_rocov2/checkpoint-95000",
3
+ "_vocab_size": 257216,
4
  "architectures": [
5
  "PaliGemmaForConditionalGeneration"
6
  ],
7
  "bos_token_id": 2,
8
  "eos_token_id": 1,
9
  "hidden_size": 2048,
 
10
  "image_token_index": 257152,
11
  "model_type": "paligemma",
12
  "pad_token_id": 0,
 
22
  "torch_dtype": "float32",
23
  "vocab_size": 257216
24
  },
25
+ "torch_dtype": "float32",
26
+ "transformers_version": "4.45.1",
27
  "vision_config": {
28
  "hidden_size": 1152,
29
  "image_size": 448,
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 2,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.44.2"
7
  }
 
3
  "bos_token_id": 2,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.45.1"
7
  }
model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4caea4eb1a8ff0de1be4ae08def46c8c6f79a9faa74d333e40fda1f5ddabad8f
3
+ size 4956951424
model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b68b180520b4ae71341479b03e4cc698f44d057594ec397fc26e3e06e7beb8c5
3
+ size 4999820608
model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2396be16e026cdc11486af3f9a59282916e15c208b0e9740e60a6f39a40dad13
3
+ size 1740714288
model.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff