ManishThota committed on
Commit
f72f988
1 Parent(s): 35a5984

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -39,3 +39,6 @@ LLaVA-NeXT-Video-7B-DPO-7B-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
39
  llava.clip filter=lfs diff=lfs merge=lfs -text
40
  llava.projector filter=lfs diff=lfs merge=lfs -text
41
  vit/mmproj-model-f16.gguf filter=lfs diff=lfs merge=lfs -text
 
 
 
 
39
  llava.clip filter=lfs diff=lfs merge=lfs -text
40
  llava.projector filter=lfs diff=lfs merge=lfs -text
41
  vit/mmproj-model-f16.gguf filter=lfs diff=lfs merge=lfs -text
42
+ mmproj-model-f16.gguf filter=lfs diff=lfs merge=lfs -text
43
+ mmproj-model-f32.gguf filter=lfs diff=lfs merge=lfs -text
44
+ mmproj-model-q8_0.gguf filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -1,16 +1,25 @@
1
  {
2
- "_name_or_path": "model_zoo/LLM/vicuna/7B-V1.5",
3
  "architectures": [
4
- "LlavaLlamaForCausalLM"
5
  ],
6
- "attention_bias": false,
7
  "attention_dropout": 0.0,
8
- "bos_token_id": 1,
9
- "eos_token_id": 2,
10
- "freeze_mm_mlp_adapter": true,
11
- "freeze_mm_vision_resampler": false,
12
- "hidden_act": "silu",
13
- "hidden_size": 4096,
 
 
 
 
 
 
 
 
 
 
14
  "image_aspect_ratio": "anyres",
15
  "image_crop_resolution": 224,
16
  "image_grid_pinpoints": [
@@ -37,41 +46,17 @@
37
  ],
38
  "image_split_resolution": 224,
39
  "initializer_range": 0.02,
40
- "intermediate_size": 11008,
41
  "max_position_embeddings": 4096,
42
  "mm_hidden_size": 1024,
43
  "mm_patch_merge_type": "spatial_unpad",
44
  "mm_projector_lr": null,
45
  "mm_projector_type": "mlp2x_gelu",
46
- "mm_resampler_type": "spatial_pool",
47
- "mm_spatial_pool_mode": "average",
48
- "mm_spatial_pool_out_channels": 1024,
49
- "mm_spatial_pool_stride": 2,
50
  "mm_use_im_patch_token": false,
51
  "mm_use_im_start_end": false,
52
  "mm_vision_select_feature": "patch",
53
  "mm_vision_select_layer": -2,
54
- "mm_vision_tower": "openai/clip-vit-large-patch14-336",
55
- "mm_vision_tower_lr": null,
56
- "model_type": "llava",
57
- "num_attention_heads": 32,
58
- "num_hidden_layers": 32,
59
- "num_key_value_heads": 32,
60
- "pad_token_id": 0,
61
- "patchify_video_feature": false,
62
- "pretraining_tp": 1,
63
- "rms_norm_eps": 1e-05,
64
- "rope_scaling": null,
65
- "rope_theta": 10000.0,
66
- "tie_word_embeddings": false,
67
- "tokenizer_model_max_length": 4096,
68
- "tokenizer_padding_side": "right",
69
- "torch_dtype": "bfloat16",
70
- "transformers_version": "4.39.2",
71
- "tune_mm_mlp_adapter": false,
72
- "tune_mm_vision_resampler": false,
73
- "unfreeze_mm_vision_tower": false,
74
- "use_cache": true,
75
- "use_mm_proj": true,
76
- "vocab_size": 32000
77
  }
 
1
  {
2
+ "_name_or_path": "vit-large336-custom",
3
  "architectures": [
4
+ "CLIPVisionModel"
5
  ],
 
6
  "attention_dropout": 0.0,
7
+ "dropout": 0.0,
8
+ "hidden_act": "quick_gelu",
9
+ "hidden_size": 1024,
10
+ "image_size": 336,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 4096,
14
+ "layer_norm_eps": 1e-05,
15
+ "model_type": "clip_vision_model",
16
+ "num_attention_heads": 16,
17
+ "num_channels": 3,
18
+ "num_hidden_layers": 24,
19
+ "patch_size": 14,
20
+ "projection_dim": 768,
21
+ "torch_dtype": "bfloat16",
22
+ "transformers_version": "4.31.0",
23
  "image_aspect_ratio": "anyres",
24
  "image_crop_resolution": 224,
25
  "image_grid_pinpoints": [
 
46
  ],
47
  "image_split_resolution": 224,
48
  "initializer_range": 0.02,
49
+ "max_length": 4096,
50
  "max_position_embeddings": 4096,
51
  "mm_hidden_size": 1024,
52
  "mm_patch_merge_type": "spatial_unpad",
53
  "mm_projector_lr": null,
54
  "mm_projector_type": "mlp2x_gelu",
55
+ "mm_resampler_type": null,
 
 
 
56
  "mm_use_im_patch_token": false,
57
  "mm_use_im_start_end": false,
58
  "mm_vision_select_feature": "patch",
59
  "mm_vision_select_layer": -2,
60
+ "mm_vision_tower__": "openai/clip-vit-large-patch14-336",
61
+ "mm_vision_tower_lr": 2e-06
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
62
  }
mmproj-model-f16.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f870142318cb91f83448d7c8382b6f9136e160cfeca0ddce252d1e7a63deb357
3
+ size 624451168
mmproj-model-f32.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b1477e04fed50d26a03dc7faf8847a4db9ce9296285f2b8a90f37f55cb134f6
3
+ size 1204446816
mmproj-model-q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe7b67aa135e0a95a85c8765a59b035b425478bae0c1d7a6a2e6a9c5e073ad20
3
+ size 1204446816
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d99f87cc57e547eb3a0287b753ca6500aa4e1505c3ead22066f48360bfd485c6
3
+ size 607116558