tensorboy commited on
Commit
c52a547
·
verified ·
1 Parent(s): 8b14c33

Upload folder using huggingface_hub

Browse files
0.codes.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6664b514fa0778d4932917e165421c5689daf2fbde0a6f9c52eca9e764b56c80
3
+ size 111004
0.metadata.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "passage_offset": 0,
3
+ "num_passages": 247,
4
+ "num_embeddings": 27460,
5
+ "embedding_offset": 0
6
+ }
0.residuals.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfbd8098e8d1552cc29908ac3654b120f7e911f96b35d036563b337ff6b62423
3
+ size 1758640
1.codes.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53e810b6eefe41a74c4b29d42ae8038c6e7a14ba0a539a65c3d7f6cfbb18a3cf
3
+ size 94876
1.metadata.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "passage_offset": 247,
3
+ "num_passages": 245,
4
+ "num_embeddings": 23429,
5
+ "embedding_offset": 27460
6
+ }
1.residuals.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffdd5a9c04aaa82047e635d4f4afa322ce093a1bf37c8c14f9114f804b8d6eeb
3
+ size 1500656
avg_residual.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d10a46236c65fab3b4f06c69e1b3c13997255fbbd372c09dfef5c5d4f19716b4
3
+ size 1205
buckets.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70cd8898111101d50a06fb691cd43fe7717d7d137d9e0e23c570fc2a5f9e81c0
3
+ size 1432
centroids.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6ee8215c83ad635e9d3d51605ecb9154ca7f03996d428581b385e5714ce9548
3
+ size 525478
collection.json ADDED
The diff for this file is too large to render. See raw diff
 
doclens.0.json ADDED
@@ -0,0 +1 @@
 
 
1
+ [135,130,100,123,98,93,29,102,90,93,44,119,79,131,123,64,130,108,145,143,149,134,71,135,127,153,130,144,147,133,128,131,108,126,63,101,56,50,127,119,114,136,119,103,99,147,133,94,95,146,85,139,139,146,135,132,45,125,133,110,96,122,117,123,96,122,121,102,117,88,131,52,115,52,89,126,112,123,137,52,126,107,137,134,44,121,125,129,132,130,76,93,71,134,96,124,134,120,125,120,128,67,118,131,57,96,123,129,131,101,120,76,119,137,51,107,129,75,21,22,105,124,59,129,77,115,129,129,82,122,97,101,132,69,138,104,89,75,121,113,140,135,143,144,116,88,137,131,138,100,101,129,99,103,141,140,125,129,153,110,91,122,126,150,109,142,117,138,85,142,94,122,126,65,117,85,105,99,136,141,133,94,143,112,111,124,106,99,136,22,120,52,141,95,43,96,107,139,138,144,131,103,85,130,131,92,114,129,134,141,148,133,117,143,146,62,90,109,123,113,100,122,101,116,127,128,97,121,80,96,99,92,115,121,101,141,109,124,126,83,86,124,87,109,131,69,107]
doclens.1.json ADDED
@@ -0,0 +1 @@
 
 
1
+ [136,138,43,138,124,105,133,130,118,131,131,38,130,71,138,116,120,148,67,45,148,89,142,126,130,137,125,143,125,110,126,83,75,84,129,124,83,136,57,136,128,46,117,117,141,135,63,139,149,120,137,122,4,38,134,44,113,126,112,129,122,102,102,118,64,117,111,111,128,109,116,50,88,142,149,146,121,138,116,118,110,109,139,123,56,113,142,45,104,114,64,106,129,142,142,135,125,80,40,134,122,111,140,129,118,115,113,122,86,70,74,98,47,68,132,51,120,88,66,138,57,90,148,24,138,109,116,106,103,115,113,60,105,89,110,104,109,48,118,121,144,135,144,75,141,58,59,73,67,70,126,65,21,131,124,96,48,81,72,131,94,126,65,96,67,48,70,126,65,131,124,72,21,131,124,96,21,70,48,81,81,96,72,131,30,31,16,26,5,25,4,126,65,96,76,67,48,70,126,65,131,124,131,124,96,15,52,21,10,70,48,81,147,5,81,96,72,131,94,126,65,96,76,67,48,70,126,65,131,124,72,21,131,124,96,15,21,70,48,81,147,5,81,96,72]
ivf.pid.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bdb246d18e8e8fc44c4073b14a5b54c875dfd828b1a6f610b89621a9bcc82f3
3
+ size 110040
metadata.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config":{
3
+ "query_token_id":"[unused0]",
4
+ "doc_token_id":"[unused1]",
5
+ "query_token":"[Q]",
6
+ "doc_token":"[D]",
7
+ "ncells":null,
8
+ "centroid_score_threshold":null,
9
+ "ndocs":null,
10
+ "load_index_with_mmap":false,
11
+ "index_path":null,
12
+ "index_bsize":32,
13
+ "nbits":4,
14
+ "kmeans_niters":20,
15
+ "resume":false,
16
+ "pool_factor":1,
17
+ "clustering_mode":"hierarchical",
18
+ "protected_tokens":0,
19
+ "similarity":"cosine",
20
+ "bsize":64,
21
+ "accumsteps":1,
22
+ "lr":0.000005,
23
+ "maxsteps":3000,
24
+ "save_every":9,
25
+ "warmup":9,
26
+ "warmup_bert":null,
27
+ "relu":false,
28
+ "nway":2,
29
+ "use_ib_negatives":true,
30
+ "reranker":false,
31
+ "distillation_alpha":1.0,
32
+ "ignore_scores":false,
33
+ "model_name":"chunks_colbert_v2",
34
+ "query_maxlen":32,
35
+ "attend_to_mask_tokens":false,
36
+ "interaction":"colbert",
37
+ "dim":128,
38
+ "doc_maxlen":180,
39
+ "mask_punctuation":true,
40
+ "checkpoint":".ragatouille/colbert/none/2024-09/26/13.47.00/checkpoints/colbert",
41
+ "triples":"/kaggle/working/train/triples.train.colbert.jsonl",
42
+ "collection":[
43
+ "list with 492 elements starting with...",
44
+ [
45
+ "'Probation \\\\\\\\nEvery new team member will be put on probation for the first 3 months of their service in the \\\\\\\\norganization counted from the date of joining. At the end of the third month, the team member will be \\\\\\\\ninformed whether or not s/he has successfully crossed the probation period based on his/her \\\\\\\\nperformance. \\\\\\\\nThe team member can take upto 3 leaves during the probation period, the remaining leaves will be \\\\\\\\naccrued and can be availed post the probation. The 3 leaves will include planned / emergency/ sick \\\\\\\\nleaves etc but will not include wedding/maternity/paternity leaves. Leaves are to be planned in advance \\\\\\\\nin consultation with the concerned manager to the extent possible.",
46
+ "Leaves are to be planned in advance \\\\\\\\nin consultation with the concerned manager to the extent possible. Leave encashment is not applicable if \\\\\\\\nexit takes place within the probation period. \\\\\\\\nIncase of termination or resignation during/at the end of probation period, the applicable notice period \\\\\\\\nwill be of 1 week (5 working days). No leaves will be permitted during notice period.' /n/nLink to policy document: https://docs.google.com/document/d/1Fqa1FBqUVFJGq0uDqwFqF3rW_t7_zu4xXC9KMKY_lIM/edit#heading=h.5kumi7cfdp5o.'",
47
+ "'1. Self-initiated: The team member voluntarily resigns from the organization. \\\\\\\\n2. Firm-initiated: The firm initiates the termination of a team member on account of \\\\\\\\nnon-performance, unauthorized absence (absconding) or on behavioral grounds.' /n/nLink to policy document: https://docs.google.com/document/d/1Fqa1FBqUVFJGq0uDqwFqF3rW_t7_zu4xXC9KMKY_lIM/edit#heading=h.5kumi7cfdp5o.'"
48
+ ]
49
+ ],
50
+ "queries":"/kaggle/working/train/queries.train.colbert.tsv",
51
+ "index_name":"chunks_colbertv2_3000_steps_index",
52
+ "overwrite":false,
53
+ "root":".ragatouille/",
54
+ "experiment":"colbert",
55
+ "index_root":null,
56
+ "name":"2024-09/26/13.47.00",
57
+ "rank":0,
58
+ "nranks":2,
59
+ "amp":true,
60
+ "gpus":2,
61
+ "avoid_fork_if_possible":false
62
+ },
63
+ "num_chunks":2,
64
+ "num_partitions":2048,
65
+ "num_embeddings":50889,
66
+ "avg_doclen":103.4329268293,
67
+ "RAGatouille":{
68
+ "index_config":{
69
+ "index_type":"PLAID",
70
+ "index_name":"chunks_colbertv2_3000_steps_index"
71
+ }
72
+ }
73
+ }
pid_docid_map.json ADDED
@@ -0,0 +1,494 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "0":"1",
3
+ "1":"1",
4
+ "2":"2",
5
+ "3":"3",
6
+ "4":"3",
7
+ "5":"4",
8
+ "6":"4",
9
+ "7":"5",
10
+ "8":"5",
11
+ "9":"6",
12
+ "10":"6",
13
+ "11":"7",
14
+ "12":"7",
15
+ "13":"8",
16
+ "14":"8",
17
+ "15":"8",
18
+ "16":"8",
19
+ "17":"9",
20
+ "18":"10",
21
+ "19":"10",
22
+ "20":"10",
23
+ "21":"10",
24
+ "22":"10",
25
+ "23":"11",
26
+ "24":"11",
27
+ "25":"11",
28
+ "26":"11",
29
+ "27":"11",
30
+ "28":"11",
31
+ "29":"11",
32
+ "30":"12",
33
+ "31":"12",
34
+ "32":"13",
35
+ "33":"14",
36
+ "34":"14",
37
+ "35":"14",
38
+ "36":"14",
39
+ "37":"15",
40
+ "38":"15",
41
+ "39":"16",
42
+ "40":"17",
43
+ "41":"17",
44
+ "42":"18",
45
+ "43":"18",
46
+ "44":"19",
47
+ "45":"19",
48
+ "46":"19",
49
+ "47":"19",
50
+ "48":"20",
51
+ "49":"21",
52
+ "50":"21",
53
+ "51":"22",
54
+ "52":"23",
55
+ "53":"23",
56
+ "54":"24",
57
+ "55":"24",
58
+ "56":"24",
59
+ "57":"25",
60
+ "58":"26",
61
+ "59":"27",
62
+ "60":"27",
63
+ "61":"28",
64
+ "62":"28",
65
+ "63":"29",
66
+ "64":"29",
67
+ "65":"30",
68
+ "66":"31",
69
+ "67":"31",
70
+ "68":"32",
71
+ "69":"32",
72
+ "70":"32",
73
+ "71":"32",
74
+ "72":"33",
75
+ "73":"33",
76
+ "74":"34",
77
+ "75":"34",
78
+ "76":"35",
79
+ "77":"36",
80
+ "78":"36",
81
+ "79":"36",
82
+ "80":"37",
83
+ "81":"37",
84
+ "82":"38",
85
+ "83":"39",
86
+ "84":"40",
87
+ "85":"40",
88
+ "86":"41",
89
+ "87":"42",
90
+ "88":"43",
91
+ "89":"43",
92
+ "90":"44",
93
+ "91":"44",
94
+ "92":"45",
95
+ "93":"45",
96
+ "94":"46",
97
+ "95":"46",
98
+ "96":"47",
99
+ "97":"48",
100
+ "98":"48",
101
+ "99":"48",
102
+ "100":"49",
103
+ "101":"49",
104
+ "102":"50",
105
+ "103":"51",
106
+ "104":"52",
107
+ "105":"53",
108
+ "106":"53",
109
+ "107":"54",
110
+ "108":"55",
111
+ "109":"56",
112
+ "110":"56",
113
+ "111":"56",
114
+ "112":"57",
115
+ "113":"58",
116
+ "114":"59",
117
+ "115":"60",
118
+ "116":"61",
119
+ "117":"62",
120
+ "118":"63",
121
+ "119":"64",
122
+ "120":"65",
123
+ "121":"66",
124
+ "122":"66",
125
+ "123":"67",
126
+ "124":"67",
127
+ "125":"68",
128
+ "126":"68",
129
+ "127":"69",
130
+ "128":"69",
131
+ "129":"70",
132
+ "130":"70",
133
+ "131":"71",
134
+ "132":"72",
135
+ "133":"73",
136
+ "134":"74",
137
+ "135":"75",
138
+ "136":"75",
139
+ "137":"76",
140
+ "138":"76",
141
+ "139":"77",
142
+ "140":"77",
143
+ "141":"77",
144
+ "142":"77",
145
+ "143":"77",
146
+ "144":"77",
147
+ "145":"78",
148
+ "146":"78",
149
+ "147":"79",
150
+ "148":"80",
151
+ "149":"81",
152
+ "150":"81",
153
+ "151":"82",
154
+ "152":"83",
155
+ "153":"83",
156
+ "154":"84",
157
+ "155":"85",
158
+ "156":"85",
159
+ "157":"85",
160
+ "158":"85",
161
+ "159":"85",
162
+ "160":"85",
163
+ "161":"86",
164
+ "162":"86",
165
+ "163":"87",
166
+ "164":"87",
167
+ "165":"87",
168
+ "166":"87",
169
+ "167":"88",
170
+ "168":"88",
171
+ "169":"88",
172
+ "170":"88",
173
+ "171":"89",
174
+ "172":"89",
175
+ "173":"89",
176
+ "174":"89",
177
+ "175":"90",
178
+ "176":"90",
179
+ "177":"91",
180
+ "178":"91",
181
+ "179":"92",
182
+ "180":"93",
183
+ "181":"93",
184
+ "182":"94",
185
+ "183":"95",
186
+ "184":"95",
187
+ "185":"96",
188
+ "186":"96",
189
+ "187":"97",
190
+ "188":"97",
191
+ "189":"98",
192
+ "190":"98",
193
+ "191":"98",
194
+ "192":"99",
195
+ "193":"100",
196
+ "194":"100",
197
+ "195":"101",
198
+ "196":"101",
199
+ "197":"102",
200
+ "198":"103",
201
+ "199":"104",
202
+ "200":"105",
203
+ "201":"106",
204
+ "202":"107",
205
+ "203":"107",
206
+ "204":"108",
207
+ "205":"108",
208
+ "206":"108",
209
+ "207":"109",
210
+ "208":"110",
211
+ "209":"110",
212
+ "210":"110",
213
+ "211":"110",
214
+ "212":"110",
215
+ "213":"110",
216
+ "214":"110",
217
+ "215":"110",
218
+ "216":"111",
219
+ "217":"112",
220
+ "218":"113",
221
+ "219":"113",
222
+ "220":"114",
223
+ "221":"114",
224
+ "222":"114",
225
+ "223":"115",
226
+ "224":"115",
227
+ "225":"115",
228
+ "226":"115",
229
+ "227":"116",
230
+ "228":"116",
231
+ "229":"117",
232
+ "230":"117",
233
+ "231":"117",
234
+ "232":"117",
235
+ "233":"118",
236
+ "234":"119",
237
+ "235":"119",
238
+ "236":"120",
239
+ "237":"120",
240
+ "238":"120",
241
+ "239":"120",
242
+ "240":"121",
243
+ "241":"121",
244
+ "242":"121",
245
+ "243":"122",
246
+ "244":"123",
247
+ "245":"123",
248
+ "246":"124",
249
+ "247":"125",
250
+ "248":"125",
251
+ "249":"125",
252
+ "250":"126",
253
+ "251":"126",
254
+ "252":"126",
255
+ "253":"126",
256
+ "254":"127",
257
+ "255":"127",
258
+ "256":"127",
259
+ "257":"127",
260
+ "258":"127",
261
+ "259":"127",
262
+ "260":"128",
263
+ "261":"129",
264
+ "262":"130",
265
+ "263":"130",
266
+ "264":"131",
267
+ "265":"131",
268
+ "266":"132",
269
+ "267":"132",
270
+ "268":"132",
271
+ "269":"133",
272
+ "270":"134",
273
+ "271":"134",
274
+ "272":"134",
275
+ "273":"134",
276
+ "274":"135",
277
+ "275":"136",
278
+ "276":"136",
279
+ "277":"136",
280
+ "278":"136",
281
+ "279":"137",
282
+ "280":"138",
283
+ "281":"138",
284
+ "282":"138",
285
+ "283":"138",
286
+ "284":"139",
287
+ "285":"139",
288
+ "286":"140",
289
+ "287":"141",
290
+ "288":"141",
291
+ "289":"142",
292
+ "290":"143",
293
+ "291":"143",
294
+ "292":"143",
295
+ "293":"144",
296
+ "294":"145",
297
+ "295":"145",
298
+ "296":"145",
299
+ "297":"145",
300
+ "298":"146",
301
+ "299":"146",
302
+ "300":"146",
303
+ "301":"146",
304
+ "302":"146",
305
+ "303":"147",
306
+ "304":"147",
307
+ "305":"147",
308
+ "306":"148",
309
+ "307":"148",
310
+ "308":"149",
311
+ "309":"150",
312
+ "310":"151",
313
+ "311":"151",
314
+ "312":"152",
315
+ "313":"152",
316
+ "314":"152",
317
+ "315":"152",
318
+ "316":"153",
319
+ "317":"154",
320
+ "318":"155",
321
+ "319":"156",
322
+ "320":"156",
323
+ "321":"157",
324
+ "322":"157",
325
+ "323":"158",
326
+ "324":"158",
327
+ "325":"158",
328
+ "326":"159",
329
+ "327":"159",
330
+ "328":"160",
331
+ "329":"161",
332
+ "330":"161",
333
+ "331":"161",
334
+ "332":"162",
335
+ "333":"162",
336
+ "334":"162",
337
+ "335":"163",
338
+ "336":"163",
339
+ "337":"163",
340
+ "338":"164",
341
+ "339":"164",
342
+ "340":"165",
343
+ "341":"165",
344
+ "342":"165",
345
+ "343":"166",
346
+ "344":"166",
347
+ "345":"167",
348
+ "346":"167",
349
+ "347":"168",
350
+ "348":"168",
351
+ "349":"169",
352
+ "350":"169",
353
+ "351":"169",
354
+ "352":"170",
355
+ "353":"171",
356
+ "354":"171",
357
+ "355":"172",
358
+ "356":"173",
359
+ "357":"174",
360
+ "358":"175",
361
+ "359":"176",
362
+ "360":"177",
363
+ "361":"178",
364
+ "362":"178",
365
+ "363":"179",
366
+ "364":"180",
367
+ "365":"181",
368
+ "366":"182",
369
+ "367":"182",
370
+ "368":"183",
371
+ "369":"184",
372
+ "370":"185",
373
+ "371":"186",
374
+ "372":"186",
375
+ "373":"186",
376
+ "374":"186",
377
+ "375":"186",
378
+ "376":"187",
379
+ "377":"187",
380
+ "378":"187",
381
+ "379":"187",
382
+ "380":"188",
383
+ "381":"188",
384
+ "382":"189",
385
+ "383":"189",
386
+ "384":"189",
387
+ "385":"189",
388
+ "386":"190",
389
+ "387":"190",
390
+ "388":"191",
391
+ "389":"192",
392
+ "390":"192",
393
+ "391":"192",
394
+ "392":"193",
395
+ "393":"194",
396
+ "394":"195",
397
+ "395":"196",
398
+ "396":"197",
399
+ "397":"198",
400
+ "398":"198",
401
+ "399":"199",
402
+ "400":"200",
403
+ "401":"200",
404
+ "402":"201",
405
+ "403":"202",
406
+ "404":"203",
407
+ "405":"204",
408
+ "406":"205",
409
+ "407":"206",
410
+ "408":"207",
411
+ "409":"207",
412
+ "410":"208",
413
+ "411":"209",
414
+ "412":"210",
415
+ "413":"211",
416
+ "414":"212",
417
+ "415":"212",
418
+ "416":"213",
419
+ "417":"213",
420
+ "418":"214",
421
+ "419":"215",
422
+ "420":"216",
423
+ "421":"216",
424
+ "422":"217",
425
+ "423":"218",
426
+ "424":"219",
427
+ "425":"220",
428
+ "426":"221",
429
+ "427":"222",
430
+ "428":"223",
431
+ "429":"224",
432
+ "430":"225",
433
+ "431":"226",
434
+ "432":"227",
435
+ "433":"228",
436
+ "434":"229",
437
+ "435":"230",
438
+ "436":"231",
439
+ "437":"232",
440
+ "438":"233",
441
+ "439":"233",
442
+ "440":"234",
443
+ "441":"235",
444
+ "442":"236",
445
+ "443":"237",
446
+ "444":"238",
447
+ "445":"239",
448
+ "446":"239",
449
+ "447":"240",
450
+ "448":"240",
451
+ "449":"241",
452
+ "450":"241",
453
+ "451":"242",
454
+ "452":"243",
455
+ "453":"244",
456
+ "454":"245",
457
+ "455":"246",
458
+ "456":"247",
459
+ "457":"248",
460
+ "458":"249",
461
+ "459":"250",
462
+ "460":"251",
463
+ "461":"252",
464
+ "462":"253",
465
+ "463":"254",
466
+ "464":"255",
467
+ "465":"256",
468
+ "466":"257",
469
+ "467":"257",
470
+ "468":"258",
471
+ "469":"259",
472
+ "470":"260",
473
+ "471":"261",
474
+ "472":"262",
475
+ "473":"263",
476
+ "474":"263",
477
+ "475":"264",
478
+ "476":"264",
479
+ "477":"265",
480
+ "478":"266",
481
+ "479":"267",
482
+ "480":"267",
483
+ "481":"268",
484
+ "482":"269",
485
+ "483":"270",
486
+ "484":"271",
487
+ "485":"272",
488
+ "486":"273",
489
+ "487":"274",
490
+ "488":"275",
491
+ "489":"276",
492
+ "490":"277",
493
+ "491":"278"
494
+ }
plan.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "query_token_id": "[unused0]",
4
+ "doc_token_id": "[unused1]",
5
+ "query_token": "[Q]",
6
+ "doc_token": "[D]",
7
+ "ncells": null,
8
+ "centroid_score_threshold": null,
9
+ "ndocs": null,
10
+ "load_index_with_mmap": false,
11
+ "index_path": null,
12
+ "index_bsize": 32,
13
+ "nbits": 4,
14
+ "kmeans_niters": 20,
15
+ "resume": false,
16
+ "pool_factor": 1,
17
+ "clustering_mode": "hierarchical",
18
+ "protected_tokens": 0,
19
+ "similarity": "cosine",
20
+ "bsize": 64,
21
+ "accumsteps": 1,
22
+ "lr": 5e-6,
23
+ "maxsteps": 3000,
24
+ "save_every": 9,
25
+ "warmup": 9,
26
+ "warmup_bert": null,
27
+ "relu": false,
28
+ "nway": 2,
29
+ "use_ib_negatives": true,
30
+ "reranker": false,
31
+ "distillation_alpha": 1.0,
32
+ "ignore_scores": false,
33
+ "model_name": "chunks_colbert_v2",
34
+ "query_maxlen": 32,
35
+ "attend_to_mask_tokens": false,
36
+ "interaction": "colbert",
37
+ "dim": 128,
38
+ "doc_maxlen": 180,
39
+ "mask_punctuation": true,
40
+ "checkpoint": ".ragatouille\/colbert\/none\/2024-09\/26\/13.47.00\/checkpoints\/colbert",
41
+ "triples": "\/kaggle\/working\/train\/triples.train.colbert.jsonl",
42
+ "collection": [
43
+ "list with 492 elements starting with...",
44
+ [
45
+ "'Probation \\\\\\\\nEvery new team member will be put on probation for the first 3 months of their service in the \\\\\\\\norganization counted from the date of joining. At the end of the third month, the team member will be \\\\\\\\ninformed whether or not s\/he has successfully crossed the probation period based on his\/her \\\\\\\\nperformance. \\\\\\\\nThe team member can take upto 3 leaves during the probation period, the remaining leaves will be \\\\\\\\naccrued and can be availed post the probation. The 3 leaves will include planned \/ emergency\/ sick \\\\\\\\nleaves etc but will not include wedding\/maternity\/paternity leaves. Leaves are to be planned in advance \\\\\\\\nin consultation with the concerned manager to the extent possible.",
46
+ "Leaves are to be planned in advance \\\\\\\\nin consultation with the concerned manager to the extent possible. Leave encashment is not applicable if \\\\\\\\nexit takes place within the probation period. \\\\\\\\nIncase of termination or resignation during\/at the end of probation period, the applicable notice period \\\\\\\\nwill be of 1 week (5 working days). No leaves will be permitted during notice period.' \/n\/nLink to policy document: https:\/\/docs.google.com\/document\/d\/1Fqa1FBqUVFJGq0uDqwFqF3rW_t7_zu4xXC9KMKY_lIM\/edit#heading=h.5kumi7cfdp5o.'",
47
+ "'1. Self-initiated: The team member voluntarily resigns from the organization. \\\\\\\\n2. Firm-initiated: The firm initiates the termination of a team member on account of \\\\\\\\nnon-performance, unauthorized absence (absconding) or on behavioral grounds.' \/n\/nLink to policy document: https:\/\/docs.google.com\/document\/d\/1Fqa1FBqUVFJGq0uDqwFqF3rW_t7_zu4xXC9KMKY_lIM\/edit#heading=h.5kumi7cfdp5o.'"
48
+ ]
49
+ ],
50
+ "queries": "\/kaggle\/working\/train\/queries.train.colbert.tsv",
51
+ "index_name": "chunks_colbertv2_3000_steps_index",
52
+ "overwrite": false,
53
+ "root": ".ragatouille\/",
54
+ "experiment": "colbert",
55
+ "index_root": null,
56
+ "name": "2024-09\/26\/13.47.00",
57
+ "rank": 0,
58
+ "nranks": 2,
59
+ "amp": true,
60
+ "gpus": 2,
61
+ "avoid_fork_if_possible": false
62
+ },
63
+ "num_chunks": 2,
64
+ "num_partitions": 2048,
65
+ "num_embeddings_est": 50873.45388793945,
66
+ "avg_doclen_est": 103.40132904052734
67
+ }