File size: 3,540 Bytes
2bc621c
 
 
 
37abbb9
2bc621c
 
 
 
 
37abbb9
372cef4
 
2bc621c
 
 
46a8dd2
8ad600e
 
372cef4
 
2bc621c
372cef4
2bc621c
a208037
2bc621c
 
372cef4
 
e38527c
6c6d04d
 
a208037
85c4619
46a8dd2
685879b
8ad600e
685879b
 
 
 
a208037
 
 
 
685879b
 
 
 
a208037
 
 
 
685879b
 
 
 
a208037
 
 
 
685879b
 
 
a208037
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46a8dd2
2bc621c
fcf0427
2bc621c
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
{
    "vit_hidden_dim": 768,
    "vit_inter_dim": 3072,
    "vit_patch_size": 16,
    "vit_img_size": 512,
    "vit_n_heads": 12,
    "vit_dropout": 0.0,
    "vit_n_blocks": 12,
    "vit_ln_eps": 1e-06,
    "vit_cls_flag": false,
    "vit_model_type": "google/siglip2-base-patch16-512",
    "lm_hidden_dim": 576,
    "lm_inter_dim": 1536,
    "lm_rms_eps": 1e-05,
    "lm_re_base": 100000,
    "lm_max_position_embeddings": 8192,
    "lm_base_vocab_size": 49152,
    "extra_token_amount": 66,
    "lm_vocab_size": 49218,
    "lm_n_heads": 9,
    "lm_n_kv_heads": 3,
    "lm_dropout": 0.0,
    "lm_n_blocks": 30,
    "lm_attn_scaling": 1.0,
    "lm_max_length": 4096,
    "lm_use_tokens": false,
    "lm_tie_weights": true,
    "lm_model_type": "HuggingFaceTB/SmolLM2-135M-Instruct",
    "lm_tokenizer": "HuggingFaceTB/SmolLM2-135M-Instruct",
    "lm_chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
    "mp_pixel_shuffle_factor": 4,
    "mp_image_token_length": 64,
    "max_img_size": 2048,
    "resize_to_max_side_len": true,
    "vlm_extra_tokens": {
        "image_token": "<|image|>",
        "global_image_token": "<|global_image|>",
        "r1c1": "<row_1_col_1>",
        "r1c2": "<row_1_col_2>",
        "r1c3": "<row_1_col_3>",
        "r1c4": "<row_1_col_4>",
        "r1c5": "<row_1_col_5>",
        "r1c6": "<row_1_col_6>",
        "r1c7": "<row_1_col_7>",
        "r1c8": "<row_1_col_8>",
        "r2c1": "<row_2_col_1>",
        "r2c2": "<row_2_col_2>",
        "r2c3": "<row_2_col_3>",
        "r2c4": "<row_2_col_4>",
        "r2c5": "<row_2_col_5>",
        "r2c6": "<row_2_col_6>",
        "r2c7": "<row_2_col_7>",
        "r2c8": "<row_2_col_8>",
        "r3c1": "<row_3_col_1>",
        "r3c2": "<row_3_col_2>",
        "r3c3": "<row_3_col_3>",
        "r3c4": "<row_3_col_4>",
        "r3c5": "<row_3_col_5>",
        "r3c6": "<row_3_col_6>",
        "r3c7": "<row_3_col_7>",
        "r3c8": "<row_3_col_8>",
        "r4c1": "<row_4_col_1>",
        "r4c2": "<row_4_col_2>",
        "r4c3": "<row_4_col_3>",
        "r4c4": "<row_4_col_4>",
        "r4c5": "<row_4_col_5>",
        "r4c6": "<row_4_col_6>",
        "r4c7": "<row_4_col_7>",
        "r4c8": "<row_4_col_8>",
        "r5c1": "<row_5_col_1>",
        "r5c2": "<row_5_col_2>",
        "r5c3": "<row_5_col_3>",
        "r5c4": "<row_5_col_4>",
        "r5c5": "<row_5_col_5>",
        "r5c6": "<row_5_col_6>",
        "r5c7": "<row_5_col_7>",
        "r5c8": "<row_5_col_8>",
        "r6c1": "<row_6_col_1>",
        "r6c2": "<row_6_col_2>",
        "r6c3": "<row_6_col_3>",
        "r6c4": "<row_6_col_4>",
        "r6c5": "<row_6_col_5>",
        "r6c6": "<row_6_col_6>",
        "r6c7": "<row_6_col_7>",
        "r6c8": "<row_6_col_8>",
        "r7c1": "<row_7_col_1>",
        "r7c2": "<row_7_col_2>",
        "r7c3": "<row_7_col_3>",
        "r7c4": "<row_7_col_4>",
        "r7c5": "<row_7_col_5>",
        "r7c6": "<row_7_col_6>",
        "r7c7": "<row_7_col_7>",
        "r7c8": "<row_7_col_8>",
        "r8c1": "<row_8_col_1>",
        "r8c2": "<row_8_col_2>",
        "r8c3": "<row_8_col_3>",
        "r8c4": "<row_8_col_4>",
        "r8c5": "<row_8_col_5>",
        "r8c6": "<row_8_col_6>",
        "r8c7": "<row_8_col_7>",
        "r8c8": "<row_8_col_8>"
    },
    "vlm_load_backbone_weights": true,
    "vlm_checkpoint_path": "checkpoints",
    "hf_repo_name": "nanoVLM"
}