Skip to content

Commit 263d3e7

Browse files
committed
upload configs
1 parent 6dd2ae6 commit 263d3e7

File tree

50 files changed

+4118
-0
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

50 files changed

+4118
-0
lines changed
Lines changed: 94 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,94 @@
1+
{
2+
"model": {
3+
"Base_SmolVLM2_2B": {
4+
"class": "SmolVLM2",
5+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
6+
},
7+
"TTAugAdapter_SmolVLM2_2B_8_SimplePara_average": {
8+
"class": "TTAugAdapter_SmolVLM2",
9+
"model_args": {
10+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
11+
},
12+
"text_aug_args": {
13+
"gpt_paraphraser_strategy": "simple_paraphraser",
14+
"save_or_load": null,
15+
"path_text_aug_to_file": null
16+
},
17+
"image_aug_args": {
18+
"aug_strength": "high",
19+
"save_or_load_generativeimg": null,
20+
"strength_gen_aug": 0.25,
21+
"path_generativeimg_to_directory": null
22+
},
23+
"token_selection_aggregation_method": "average",
24+
"number_of_versions": 8,
25+
"save_inputs_for_debugging": false
26+
},
27+
"TTAugAdapter_SmolVLM2_2B_8_SimplePara_mostconf": {
28+
"class": "TTAugAdapter_SmolVLM2",
29+
"model_args": {
30+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
31+
},
32+
"text_aug_args": {
33+
"gpt_paraphraser_strategy": "simple_paraphraser",
34+
"save_or_load": null,
35+
"path_text_aug_to_file": null
36+
},
37+
"image_aug_args": {
38+
"aug_strength": "high",
39+
"save_or_load_generativeimg": null,
40+
"strength_gen_aug": 0.25,
41+
"path_generativeimg_to_directory": null
42+
},
43+
"token_selection_aggregation_method": "mostconfident",
44+
"number_of_versions": 8,
45+
"save_inputs_for_debugging": false
46+
}
47+
},
48+
"data": {
49+
"OCRBench": {
50+
"class": "OCRBench",
51+
"dataset": "OCRBench"
52+
},
53+
"MME-RealWorld-Lite": {
54+
"class": "MMERealWorld",
55+
"dataset": "MME-RealWorld-Lite"
56+
},
57+
"AMBER": {
58+
"class": "ImageYORNDataset",
59+
"dataset": "AMBER"
60+
},
61+
"TextVQA_VAL": {
62+
"class": "ImageVQADataset",
63+
"dataset": "TextVQA_VAL"
64+
},
65+
"TableVQABench": {
66+
"class": "TableVQABench",
67+
"dataset": "TableVQABench"
68+
},
69+
"AI2D_TEST": {
70+
"class": "ImageMCQDataset",
71+
"dataset": "AI2D_TEST"
72+
},
73+
"OCRVQA_TEST": {
74+
"class": "ImageVQADataset",
75+
"dataset": "OCRVQA_TEST"
76+
},
77+
"ChartQA_TEST": {
78+
"class": "ImageVQADataset",
79+
"dataset": "ChartQA_TEST"
80+
},
81+
"GQA_TestDev_Balanced": {
82+
"class": "ImageVQADataset",
83+
"dataset": "GQA_TestDev_Balanced"
84+
},
85+
"COCO_VAL": {
86+
"class": "ImageCaptionDataset",
87+
"dataset": "COCO_VAL"
88+
},
89+
"CCBench": {
90+
"class": "ImageMCQDataset",
91+
"dataset": "CCBench"
92+
}
93+
}
94+
}
Lines changed: 231 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,231 @@
1+
{
2+
"model": {
3+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer4": {
4+
"class": "TTAugAdapter_SmolVLM2",
5+
"model_args": {
6+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
7+
},
8+
"text_aug_args": {
9+
"gpt_paraphraser_strategy": "simple_paraphraser",
10+
"save_or_load": null,
11+
"path_text_aug_to_file": null
12+
},
13+
"image_aug_args": {
14+
"aug_strength": "high",
15+
"save_or_load_generativeimg": null,
16+
"strength_gen_aug": 0.25,
17+
"path_generativeimg_to_directory": null
18+
},
19+
"token_selection_aggregation_method": "average_features_early_layer",
20+
"average_features_early_layer": 4,
21+
"number_of_versions": 16,
22+
"save_inputs_for_debugging": false
23+
},
24+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer8": {
25+
"class": "TTAugAdapter_SmolVLM2",
26+
"model_args": {
27+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
28+
},
29+
"text_aug_args": {
30+
"gpt_paraphraser_strategy": "simple_paraphraser",
31+
"save_or_load": null,
32+
"path_text_aug_to_file": null
33+
},
34+
"image_aug_args": {
35+
"aug_strength": "high",
36+
"save_or_load_generativeimg": null,
37+
"strength_gen_aug": 0.25,
38+
"path_generativeimg_to_directory": null
39+
},
40+
"token_selection_aggregation_method": "average_features_early_layer",
41+
"average_features_early_layer": 8,
42+
"number_of_versions": 16,
43+
"save_inputs_for_debugging": false
44+
},
45+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer10": {
46+
"class": "TTAugAdapter_SmolVLM2",
47+
"model_args": {
48+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
49+
},
50+
"text_aug_args": {
51+
"gpt_paraphraser_strategy": "simple_paraphraser",
52+
"save_or_load": null,
53+
"path_text_aug_to_file": null
54+
},
55+
"image_aug_args": {
56+
"aug_strength": "high",
57+
"save_or_load_generativeimg": null,
58+
"strength_gen_aug": 0.25,
59+
"path_generativeimg_to_directory": null
60+
},
61+
"token_selection_aggregation_method": "average_features_early_layer",
62+
"average_features_early_layer": 10,
63+
"number_of_versions": 16,
64+
"save_inputs_for_debugging": false
65+
},
66+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer12": {
67+
"class": "TTAugAdapter_SmolVLM2",
68+
"model_args": {
69+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
70+
},
71+
"text_aug_args": {
72+
"gpt_paraphraser_strategy": "simple_paraphraser",
73+
"save_or_load": null,
74+
"path_text_aug_to_file": null
75+
},
76+
"image_aug_args": {
77+
"aug_strength": "high",
78+
"save_or_load_generativeimg": null,
79+
"strength_gen_aug": 0.25,
80+
"path_generativeimg_to_directory": null
81+
},
82+
"token_selection_aggregation_method": "average_features_early_layer",
83+
"average_features_early_layer": 12,
84+
"number_of_versions": 16,
85+
"save_inputs_for_debugging": false
86+
},
87+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer16": {
88+
"class": "TTAugAdapter_SmolVLM2",
89+
"model_args": {
90+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
91+
},
92+
"text_aug_args": {
93+
"gpt_paraphraser_strategy": "simple_paraphraser",
94+
"save_or_load": null,
95+
"path_text_aug_to_file": null
96+
},
97+
"image_aug_args": {
98+
"aug_strength": "high",
99+
"save_or_load_generativeimg": null,
100+
"strength_gen_aug": 0.25,
101+
"path_generativeimg_to_directory": null
102+
},
103+
"token_selection_aggregation_method": "average_features_early_layer",
104+
"average_features_early_layer": 16,
105+
"number_of_versions": 16,
106+
"save_inputs_for_debugging": false
107+
},
108+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer20": {
109+
"class": "TTAugAdapter_SmolVLM2",
110+
"model_args": {
111+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
112+
},
113+
"text_aug_args": {
114+
"gpt_paraphraser_strategy": "simple_paraphraser",
115+
"save_or_load": null,
116+
"path_text_aug_to_file": null
117+
},
118+
"image_aug_args": {
119+
"aug_strength": "high",
120+
"save_or_load_generativeimg": null,
121+
"strength_gen_aug": 0.25,
122+
"path_generativeimg_to_directory": null
123+
},
124+
"token_selection_aggregation_method": "average_features_early_layer",
125+
"average_features_early_layer": 20,
126+
"number_of_versions": 16,
127+
"save_inputs_for_debugging": false
128+
},
129+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer22": {
130+
"class": "TTAugAdapter_SmolVLM2",
131+
"model_args": {
132+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
133+
},
134+
"text_aug_args": {
135+
"gpt_paraphraser_strategy": "simple_paraphraser",
136+
"save_or_load": null,
137+
"path_text_aug_to_file": null
138+
},
139+
"image_aug_args": {
140+
"aug_strength": "high",
141+
"save_or_load_generativeimg": null,
142+
"strength_gen_aug": 0.25,
143+
"path_generativeimg_to_directory": null
144+
},
145+
"token_selection_aggregation_method": "average_features_early_layer",
146+
"average_features_early_layer": 22,
147+
"number_of_versions": 16,
148+
"save_inputs_for_debugging": false
149+
},
150+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer23": {
151+
"class": "TTAugAdapter_SmolVLM2",
152+
"model_args": {
153+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
154+
},
155+
"text_aug_args": {
156+
"gpt_paraphraser_strategy": "simple_paraphraser",
157+
"save_or_load": null,
158+
"path_text_aug_to_file": null
159+
},
160+
"image_aug_args": {
161+
"aug_strength": "high",
162+
"save_or_load_generativeimg": null,
163+
"strength_gen_aug": 0.25,
164+
"path_generativeimg_to_directory": null
165+
},
166+
"token_selection_aggregation_method": "average_features_early_layer",
167+
"average_features_early_layer": 23,
168+
"number_of_versions": 16,
169+
"save_inputs_for_debugging": false
170+
},
171+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_AverageEarlyLayer24": {
172+
"class": "TTAugAdapter_SmolVLM2",
173+
"model_args": {
174+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
175+
},
176+
"text_aug_args": {
177+
"gpt_paraphraser_strategy": "simple_paraphraser",
178+
"save_or_load": null,
179+
"path_text_aug_to_file": null
180+
},
181+
"image_aug_args": {
182+
"aug_strength": "high",
183+
"save_or_load_generativeimg": null,
184+
"strength_gen_aug": 0.25,
185+
"path_generativeimg_to_directory": null
186+
},
187+
"token_selection_aggregation_method": "average_features_early_layer",
188+
"average_features_early_layer": 24,
189+
"number_of_versions": 16,
190+
"save_inputs_for_debugging": false
191+
}
192+
},
193+
"data": {
194+
"OCRBench": {
195+
"class": "OCRBench",
196+
"dataset": "OCRBench"
197+
},
198+
"AMBER": {
199+
"class": "ImageYORNDataset",
200+
"dataset": "AMBER"
201+
},
202+
"TextVQA_VAL": {
203+
"class": "ImageVQADataset",
204+
"dataset": "TextVQA_VAL"
205+
},
206+
"AI2D_TEST": {
207+
"class": "ImageMCQDataset",
208+
"dataset": "AI2D_TEST"
209+
},
210+
"OCRVQA_TEST": {
211+
"class": "ImageVQADataset",
212+
"dataset": "OCRVQA_TEST"
213+
},
214+
"ChartQA_TEST": {
215+
"class": "ImageVQADataset",
216+
"dataset": "ChartQA_TEST"
217+
},
218+
"GQA_TestDev_Balanced": {
219+
"class": "ImageVQADataset",
220+
"dataset": "GQA_TestDev_Balanced"
221+
},
222+
"COCO_VAL": {
223+
"class": "ImageCaptionDataset",
224+
"dataset": "COCO_VAL"
225+
},
226+
"MME-RealWorld-Lite": {
227+
"class": "MMERealWorld",
228+
"dataset": "MME-RealWorld-Lite"
229+
}
230+
}
231+
}
Lines changed: 62 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,62 @@
1+
{
2+
"model": {
3+
"TTAugAdapter_SmolVLM2_2B_16_SimplePara_LearnedModel": {
4+
"class": "TTAugAdapter_SmolVLM2",
5+
"model_args": {
6+
"model_path": "HuggingFaceTB/SmolVLM2-2.2B-Instruct"
7+
},
8+
"text_aug_args": {
9+
"gpt_paraphraser_strategy": "simple_paraphraser",
10+
"save_or_load": null,
11+
"path_text_aug_to_file": null
12+
},
13+
"image_aug_args": {
14+
"aug_strength": "high",
15+
"save_or_load_generativeimg": null,
16+
"strength_gen_aug": 0.25,
17+
"path_generativeimg_to_directory": null
18+
},
19+
"token_selection_aggregation_method": "learned_model",
20+
"number_of_versions": 16,
21+
"save_inputs_for_debugging": false
22+
}
23+
},
24+
"data": {
25+
"OCRBench": {
26+
"class": "OCRBench",
27+
"dataset": "OCRBench"
28+
},
29+
"AMBER": {
30+
"class": "ImageYORNDataset",
31+
"dataset": "AMBER"
32+
},
33+
"TextVQA_VAL": {
34+
"class": "ImageVQADataset",
35+
"dataset": "TextVQA_VAL"
36+
},
37+
"AI2D_TEST": {
38+
"class": "ImageMCQDataset",
39+
"dataset": "AI2D_TEST"
40+
},
41+
"OCRVQA_TEST": {
42+
"class": "ImageVQADataset",
43+
"dataset": "OCRVQA_TEST"
44+
},
45+
"ChartQA_TEST": {
46+
"class": "ImageVQADataset",
47+
"dataset": "ChartQA_TEST"
48+
},
49+
"GQA_TestDev_Balanced": {
50+
"class": "ImageVQADataset",
51+
"dataset": "GQA_TestDev_Balanced"
52+
},
53+
"COCO_VAL": {
54+
"class": "ImageCaptionDataset",
55+
"dataset": "COCO_VAL"
56+
},
57+
"MME-RealWorld-Lite": {
58+
"class": "MMERealWorld",
59+
"dataset": "MME-RealWorld-Lite"
60+
}
61+
}
62+
}

0 commit comments

Comments
 (0)