alana89 committed on
Commit
cb041f3
·
verified ·
1 Parent(s): 28c86fa

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. .DS_Store +0 -0
  2. config.json +24 -0
  3. model.safetensors +3 -0
  4. pretrain_args.json +415 -0
.DS_Store ADDED
Binary file (6.15 kB). View file
 
config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "TabStarModel"
4
+ ],
5
+ "batch_size": 32,
6
+ "bert_lr_factor": 1.0,
7
+ "d_model": 384,
8
+ "downstream_mode": null,
9
+ "e5_model": "intfloat/e5-small-v2",
10
+ "is_pretrain": true,
11
+ "lr": 5e-05,
12
+ "macro_batch_size": 128,
13
+ "model_type": "tabstar",
14
+ "num_layers": 6,
15
+ "numbers_fusion": "attention",
16
+ "p_mask": 0,
17
+ "scheduler": "cycle",
18
+ "tabular_encoder_type": "d1",
19
+ "torch_dtype": "float32",
20
+ "transformers_version": "4.49.0",
21
+ "unfreeze_layers": 6,
22
+ "weight_balance": "uniform",
23
+ "weight_decay": 0.001
24
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92ff18fa412a375b5a91a22d01480fb25e3833a6e0f522b28c22a6fe6e596b0
3
+ size 189091544
pretrain_args.json ADDED
@@ -0,0 +1,415 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "raw_exp_name": "tabstar_sota_k3",
3
+ "tabular_layers": 6,
4
+ "e5": "intfloat/e5-small-v2",
5
+ "tabular_encoder_type": "d1",
6
+ "numbers_fusion": "attention",
7
+ "base_lr": 5e-05,
8
+ "bert_lr_factor": 1.0,
9
+ "weight_decay": 0.001,
10
+ "weight": "uniform",
11
+ "numbers_verbalization": "full",
12
+ "unfreeze_layers": 6,
13
+ "light": false,
14
+ "debug": false,
15
+ "max_epoch_examples": 2048,
16
+ "datasets": [
17
+ 41164,
18
+ 48,
19
+ 46684,
20
+ 41142,
21
+ 40753,
22
+ 23381,
23
+ "sukritchatterjee/used-cars-dataset-cardekho/cars_details_merges.csv",
24
+ 46674,
25
+ 507,
26
+ 541,
27
+ 185,
28
+ 44957,
29
+ 41156,
30
+ 46441,
31
+ 1480,
32
+ 40927,
33
+ 44969,
34
+ 42343,
35
+ 5,
36
+ 1487,
37
+ 1503,
38
+ 558,
39
+ 1464,
40
+ 300,
41
+ 46701,
42
+ 44974,
43
+ 44975,
44
+ "stefanoleone992/filmtv-movies-dataset/filmtv_movies.csv",
45
+ 46606,
46
+ 1049,
47
+ 46708,
48
+ 44964,
49
+ 458,
50
+ 46584,
51
+ "ajinkyablaze/football-manager-data/dataset.csv",
52
+ 40693,
53
+ 1459,
54
+ 42729,
55
+ 45567,
56
+ 42734,
57
+ 43748,
58
+ 46659,
59
+ 40975,
60
+ 40900,
61
+ 28,
62
+ 40672,
63
+ "imuhammad/us-2020-presidential-election-speeches/us_2020_election_speeches.csv",
64
+ 44970,
65
+ 505,
66
+ 1485,
67
+ 41169,
68
+ 40677,
69
+ 42806,
70
+ 1567,
71
+ 57,
72
+ 1099,
73
+ 525,
74
+ 46678,
75
+ 45577,
76
+ 1483,
77
+ 25,
78
+ 24,
79
+ 46,
80
+ "noorrizki/top-korean-drama-list-1500/kdrama_list.csv",
81
+ 2,
82
+ 26,
83
+ 1466,
84
+ 40996,
85
+ 566,
86
+ "limtis/wikiliq-dataset/spirits_data.csv",
87
+ 560,
88
+ 43743,
89
+ 45064,
90
+ 43822,
91
+ 44973,
92
+ 563,
93
+ 41161,
94
+ 40985,
95
+ 46719,
96
+ 44146,
97
+ "http://pages.cs.wisc.edu/~anhai/data/784_data/movies1/csv_files/rotten_tomatoes.csv",
98
+ 940,
99
+ 42731,
100
+ 1046,
101
+ 43660,
102
+ 41159,
103
+ 42570,
104
+ 42563,
105
+ 1510,
106
+ 11,
107
+ 43712,
108
+ 40701,
109
+ 307,
110
+ 43420,
111
+ 45012,
112
+ 554,
113
+ 43595,
114
+ 44231,
115
+ 43435,
116
+ 43344,
117
+ 41162,
118
+ 1457,
119
+ 42712,
120
+ 40983,
121
+ 1111,
122
+ 46359,
123
+ 41990,
124
+ 41143,
125
+ 43643,
126
+ 43766,
127
+ "ruthgn/beer-profile-and-ratings-data-set/beer_profile_and_ratings.csv",
128
+ 46656,
129
+ 1486,
130
+ 46654,
131
+ 42225,
132
+ 41167,
133
+ "mattop/nba-draft-basketball-player-data-19892021/nbaplayersdraft.csv",
134
+ 44976,
135
+ 40984,
136
+ 45062,
137
+ 42345,
138
+ 215,
139
+ 46607,
140
+ 41147,
141
+ 44125,
142
+ 546,
143
+ 40922,
144
+ 46669,
145
+ 223,
146
+ "http://pages.cs.wisc.edu/~anhai/data/784_data/books2/csv_files/goodreads.csv",
147
+ "mustafaimam/used-car-prices-in-pakistan-2021/Used_car_prices_in_Pakistan_cleaned.csv",
148
+ 4549,
149
+ 4538,
150
+ 516,
151
+ 15,
152
+ 43071,
153
+ 45039,
154
+ 46762,
155
+ "joshuakalobbowles/vivino-wine-data/vivino.csv",
156
+ 43397,
157
+ 4134,
158
+ 43502,
159
+ 422,
160
+ 46430,
161
+ 3050,
162
+ 41150,
163
+ 46444,
164
+ 1116,
165
+ 44963,
166
+ 4541,
167
+ 201,
168
+ 503,
169
+ 41157,
170
+ 41168,
171
+ 42732,
172
+ 43687,
173
+ 377,
174
+ 42165,
175
+ 1515,
176
+ 666,
177
+ 43342,
178
+ 44156,
179
+ 1169,
180
+ 41165,
181
+ 44227,
182
+ 46646,
183
+ 470,
184
+ 41021,
185
+ 504,
186
+ 574,
187
+ 42895,
188
+ 45560,
189
+ 13,
190
+ 46610,
191
+ "http://pages.cs.wisc.edu/~anhai/data/784_data/bikes/csv_files/bikewale.csv",
192
+ 1493,
193
+ 1475,
194
+ 451,
195
+ 43588,
196
+ 42194,
197
+ 44962,
198
+ 4534,
199
+ 42746,
200
+ 44994,
201
+ 529,
202
+ 32,
203
+ 40966,
204
+ 40971,
205
+ 181,
206
+ 1494,
207
+ 43838,
208
+ 43389,
209
+ 46660,
210
+ 42125,
211
+ 334,
212
+ 1067,
213
+ 188,
214
+ 46603,
215
+ 40705,
216
+ 45547,
217
+ 45038,
218
+ 40945,
219
+ 1495,
220
+ 7,
221
+ 43635,
222
+ 41158,
223
+ 46709,
224
+ 41163,
225
+ 6,
226
+ 564,
227
+ 416,
228
+ 46467,
229
+ 45950,
230
+ 46667,
231
+ 41138,
232
+ 43157,
233
+ 372,
234
+ "ngshiheng/michelin-guide-restaurants-2021/michelin_my_maps.csv",
235
+ 43160,
236
+ 43454,
237
+ "https://opendata.vancouver.ca/api/records/1.0/download/?dataset=employee-remuneration-and-expenses-earning-over-75000&format=csv",
238
+ 46726,
239
+ 40978,
240
+ 42572,
241
+ 46372,
242
+ 1461,
243
+ 44228,
244
+ 42571,
245
+ 46664,
246
+ 46328,
247
+ 54,
248
+ 40498,
249
+ 42730,
250
+ 43337,
251
+ 1489,
252
+ "markusschmitz/museums/museums_prep.csv",
253
+ 1507,
254
+ 43544,
255
+ 46681,
256
+ 469,
257
+ 531,
258
+ "himanshupoddar/zomato-bangalore-restaurants/zomato.csv",
259
+ 42727,
260
+ 46676,
261
+ 42705,
262
+ 42733,
263
+ 40650,
264
+ 44960,
265
+ 46686,
266
+ 44157,
267
+ 43044,
268
+ 44983,
269
+ "https://ai-jobs.net/salaries/download/salaries.csv",
270
+ 44984,
271
+ "peopledatalabssf/free-7-million-company-dataset/companies_sorted.csv",
272
+ 1596,
273
+ "omkarsabnis/yelp-reviews-dataset/yelp.csv",
274
+ 40981,
275
+ 56,
276
+ 344,
277
+ 44978,
278
+ 1039,
279
+ 311,
280
+ 46661,
281
+ 46604,
282
+ 549,
283
+ 4552,
284
+ 1128,
285
+ 44959,
286
+ 1547,
287
+ 40685,
288
+ 43826,
289
+ 41540,
290
+ 14,
291
+ 43622,
292
+ 46369,
293
+ 41210,
294
+ 42688,
295
+ 46605,
296
+ 40670,
297
+ 46280,
298
+ 40994,
299
+ 951,
300
+ 46640,
301
+ 43479,
302
+ 44993,
303
+ 44230,
304
+ 43573,
305
+ 455,
306
+ 46653,
307
+ 41991,
308
+ 46683,
309
+ 41144,
310
+ 40536,
311
+ 44981,
312
+ 41146,
313
+ 46655,
314
+ 46662,
315
+ 22,
316
+ 46721,
317
+ 31,
318
+ 41972,
319
+ 43672,
320
+ 216,
321
+ 43721,
322
+ 44965,
323
+ 46648,
324
+ 310,
325
+ 1471,
326
+ "http://pages.cs.wisc.edu/~anhai/data/784_data/baby_products/csv_files/babies_r_us.csv",
327
+ 23,
328
+ 46665,
329
+ 46592,
330
+ 23517,
331
+ "eilamshapira/human-choice-prediction-in-language-based-games/OPE_train.csv",
332
+ 46598,
333
+ 279,
334
+ 44145,
335
+ 42164,
336
+ 44,
337
+ 43648,
338
+ 40668,
339
+ 45545,
340
+ 547,
341
+ 43618,
342
+ "neilcosgrove/scotch-whiskey-reviews-update-2020/scotch_review2020.csv",
343
+ 10,
344
+ "maharshipandya/-spotify-tracks-dataset/dataset.csv",
345
+ 44958,
346
+ 30,
347
+ 46254,
348
+ 1479,
349
+ "albenft/game-of-thrones-script-all-seasons/Game_of_Thrones_Script.csv",
350
+ 42726,
351
+ 46585,
352
+ 45554,
353
+ 44226,
354
+ 44980,
355
+ 679,
356
+ 43463,
357
+ 45955,
358
+ 50,
359
+ 375,
360
+ 23380,
361
+ 1497,
362
+ 1509,
363
+ 41980,
364
+ 1542,
365
+ "ankanhore545/top-ramen-ratings-2022/Top Ramen Ratings .csv",
366
+ 44992,
367
+ 40982,
368
+ 44966,
369
+ 1590,
370
+ 43551,
371
+ 550,
372
+ 42769,
373
+ 44977,
374
+ 43584,
375
+ 3,
376
+ 41166,
377
+ 43072,
378
+ 1511,
379
+ 4135,
380
+ 46668,
381
+ "hanifalirsyad/coffee-scrap-coffeereview/coffee_clean.csv",
382
+ 46677,
383
+ 44223,
384
+ "https://www.scimagojr.com/journalrank.php?out=xls",
385
+ 46597,
386
+ 1502,
387
+ 43395,
388
+ 41027,
389
+ 46692,
390
+ 1468,
391
+ 43466,
392
+ 42,
393
+ 60,
394
+ "hernan4444/animeplanet-recommendation-database-2020/anime.csv",
395
+ 42972,
396
+ 46652,
397
+ 41145,
398
+ 3277,
399
+ 43893,
400
+ 6332,
401
+ 46651,
402
+ 44967,
403
+ 42931,
404
+ 42742,
405
+ 12,
406
+ 43653
407
+ ],
408
+ "scheduler": "cycle",
409
+ "fold": 3,
410
+ "num_folds": 5,
411
+ "p_mask": 0,
412
+ "full_exp_name": "2025_05_03__tabstar_sota_k3__data_390__tab_6__e5_small__axial_d1__fusion_attention__layers_6__num_verb_full__scheduler_cycle__lr_5e-05__bert_lr_10__wd_0001__mask_0__weight_uniform__git_9019a12__fold_3from5",
413
+ "cached": false,
414
+ "num_datasets": 390
415
+ }