Divyasreepat committed on
Commit
4a67c64
·
verified ·
1 Parent(s): ab2b75c

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ assets/tokenizer/vocabulary.spm filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: keras-hub
3
+ ---
4
+ This is a [`SigLIP` model](https://keras.io/api/keras_hub/models/sig_lip) uploaded using the KerasHub library. It can be used with the JAX, TensorFlow, and PyTorch backends.
5
+ Model config:
6
+ * **name:** sig_lip_backbone
7
+ * **trainable:** True
8
+ * **vision_encoder:** {'module': 'keras_hub.src.models.siglip.siglip_vision_encoder', 'class_name': 'SigLIPVisionEncoder', 'config': {'name': 'sig_lip_vision_encoder', 'trainable': True, 'patch_size': 16, 'hidden_dim': 1024, 'num_layers': 24, 'num_heads': 16, 'intermediate_dim': 4096, 'intermediate_activation': 'gelu_approximate', 'layer_norm_epsilon': 1e-06, 'image_shape': [384, 384, 3]}, 'registered_name': 'keras_hub>SigLIPVisionEncoder'}
9
+ * **text_encoder:** {'module': 'keras_hub.src.models.siglip.siglip_text_encoder', 'class_name': 'SigLIPTextEncoder', 'config': {'name': 'sig_lip_text_encoder', 'trainable': True, 'vocabulary_size': 32000, 'embedding_dim': 1024, 'hidden_dim': 1024, 'num_layers': 24, 'num_heads': 16, 'intermediate_dim': 4096, 'intermediate_activation': 'gelu_approximate', 'layer_norm_epsilon': 1e-06, 'max_sequence_length': 64}, 'registered_name': 'keras_hub>SigLIPTextEncoder'}
10
+
11
+ This model card has been generated automatically and should be completed by the model author. See [Model Cards documentation](https://huggingface.co/docs/hub/model-cards) for more information.
assets/tokenizer/vocabulary.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e5036bed065526c3c212dfbe288752391797c4bb1a284aa18c9a0b23fcaf8ec
3
+ size 798330
config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_hub.src.models.siglip.siglip_backbone",
3
+ "class_name": "SigLIPBackbone",
4
+ "config": {
5
+ "name": "sig_lip_backbone",
6
+ "trainable": true,
7
+ "vision_encoder": {
8
+ "module": "keras_hub.src.models.siglip.siglip_vision_encoder",
9
+ "class_name": "SigLIPVisionEncoder",
10
+ "config": {
11
+ "name": "sig_lip_vision_encoder",
12
+ "trainable": true,
13
+ "patch_size": 16,
14
+ "hidden_dim": 1024,
15
+ "num_layers": 24,
16
+ "num_heads": 16,
17
+ "intermediate_dim": 4096,
18
+ "intermediate_activation": "gelu_approximate",
19
+ "layer_norm_epsilon": 1e-06,
20
+ "image_shape": [
21
+ 384,
22
+ 384,
23
+ 3
24
+ ]
25
+ },
26
+ "registered_name": "keras_hub>SigLIPVisionEncoder"
27
+ },
28
+ "text_encoder": {
29
+ "module": "keras_hub.src.models.siglip.siglip_text_encoder",
30
+ "class_name": "SigLIPTextEncoder",
31
+ "config": {
32
+ "name": "sig_lip_text_encoder",
33
+ "trainable": true,
34
+ "vocabulary_size": 32000,
35
+ "embedding_dim": 1024,
36
+ "hidden_dim": 1024,
37
+ "num_layers": 24,
38
+ "num_heads": 16,
39
+ "intermediate_dim": 4096,
40
+ "intermediate_activation": "gelu_approximate",
41
+ "layer_norm_epsilon": 1e-06,
42
+ "max_sequence_length": 64
43
+ },
44
+ "registered_name": "keras_hub>SigLIPTextEncoder"
45
+ }
46
+ },
47
+ "registered_name": "keras_hub>SigLIPBackbone"
48
+ }
image_converter.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_hub.src.models.siglip.siglip_image_converter",
3
+ "class_name": "SigLIPImageConverter",
4
+ "config": {
5
+ "name": "sig_lip_image_converter",
6
+ "trainable": true,
7
+ "dtype": {
8
+ "module": "keras",
9
+ "class_name": "DTypePolicy",
10
+ "config": {
11
+ "name": "float32"
12
+ },
13
+ "registered_name": null
14
+ },
15
+ "image_size": [
16
+ 384,
17
+ 384
18
+ ],
19
+ "scale": [
20
+ 0.00784313725490196,
21
+ 0.00784313725490196,
22
+ 0.00784313725490196
23
+ ],
24
+ "offset": [
25
+ -1.0,
26
+ -1.0,
27
+ -1.0
28
+ ],
29
+ "interpolation": "bicubic",
30
+ "antialias": true,
31
+ "crop_to_aspect_ratio": false,
32
+ "pad_to_aspect_ratio": false,
33
+ "bounding_box_format": "yxyx"
34
+ },
35
+ "registered_name": "keras_hub>SigLIPImageConverter"
36
+ }
metadata.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "keras_version": "3.8.0",
3
+ "keras_hub_version": "0.19.0",
4
+ "parameter_count": 652479106,
5
+ "date_saved": "2025-03-01@12:11:53",
6
+ "tasks": []
7
+ }
model.weights.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d22fc2b7123b2eea356fbf9e43460a613b598593c75b99ab09f2f993954f3c1
3
+ size 2611500208
tokenizer.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_hub.src.models.siglip.siglip_tokenizer",
3
+ "class_name": "SigLIPTokenizer",
4
+ "config": {
5
+ "name": "sig_lip_tokenizer",
6
+ "trainable": true,
7
+ "dtype": {
8
+ "module": "keras",
9
+ "class_name": "DTypePolicy",
10
+ "config": {
11
+ "name": "int32"
12
+ },
13
+ "registered_name": null
14
+ },
15
+ "config_file": "tokenizer.json",
16
+ "proto": null,
17
+ "sequence_length": null,
18
+ "add_bos": false,
19
+ "add_eos": true
20
+ },
21
+ "registered_name": "keras_hub>SigLIPTokenizer"
22
+ }