OSainz committed on
Commit
d4d0c64
•
1 Parent(s): 4a1e5cc
Files changed (2) hide show
  1. contamination_report.csv +30 -30
  2. postprocessing.py +1 -1
contamination_report.csv CHANGED
@@ -244,43 +244,19 @@ natural_questions;;FLAN;;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652
244
  natural_questions;;GLaM;;model;;3.9;;data-based;https://arxiv.org/abs/2112.06905;13
245
  natural_questions;;GPT-3;;model;;;1.0;data-based;https://arxiv.org/abs/2005.14165;13
246
 
247
- nyu-mll/glue;BoolQ;allenai/c4;;corpus;;;2.4;data-based;https://arxiv.org/abs/2104.08758;6
248
-
249
- nyu-mll/glue;CoLA;allenai/c4;;corpus;;;14.4;data-based;https://arxiv.org/abs/2104.08758;6
250
-
251
- nyu-mll/glue;MNLI-hypothesis;allenai/c4;;corpus;;;14.2;data-based;https://arxiv.org/abs/2104.08758;6
252
-
253
- nyu-mll/glue;MNLI-premise;allenai/c4;;corpus;;;15.2;data-based;https://arxiv.org/abs/2104.08758;6
254
-
255
- nyu-mll/glue;MRPC-sentence-1;allenai/c4;;corpus;;;2.7;data-based;https://arxiv.org/abs/2104.08758;6
256
-
257
- nyu-mll/glue;MRPC-sentence-2;allenai/c4;;corpus;;;2.7;data-based;https://arxiv.org/abs/2104.08758;6
258
-
259
- nyu-mll/glue;QNLI-question;allenai/c4;;corpus;;;1.8;data-based;https://arxiv.org/abs/2104.08758;6
260
-
261
- nyu-mll/glue;QNLI-sentence;allenai/c4;;corpus;;;53.6;data-based;https://arxiv.org/abs/2104.08758;6
262
-
263
- nyu-mll/glue;RTE-sentence-1;allenai/c4;;corpus;;;6;data-based;https://arxiv.org/abs/2104.08758;6
264
-
265
- nyu-mll/glue;RTE-sentence-2;allenai/c4;;corpus;;;10.8;data-based;https://arxiv.org/abs/2104.08758;6
266
-
267
- nyu-mll/glue;SST-2;allenai/c4;;corpus;;;11;data-based;https://arxiv.org/abs/2104.08758;6
268
-
269
- nyu-mll/glue;STS-B-sentence-1;allenai/c4;;corpus;;;18.3;data-based;https://arxiv.org/abs/2104.08758;6
270
-
271
- nyu-mll/glue;STS-B-sentence-2;allenai/c4;;corpus;;;18.6;data-based;https://arxiv.org/abs/2104.08758;6
272
-
273
- nyu-mll/glue;WNLI-sentence-1;allenai/c4;;corpus;;;4.8;data-based;https://arxiv.org/abs/2104.08758;6
274
-
275
- nyu-mll/glue;WNLI-sentence-2;allenai/c4;;corpus;;;2.1;data-based;https://arxiv.org/abs/2104.08758;6
276
-
277
  nyu-mll/glue;ax;EleutherAI/pile;;corpus;;;5.07;data-based;https://arxiv.org/abs/2310.20707;2
278
  nyu-mll/glue;ax;allenai/c4;;corpus;;;1.99;data-based;https://arxiv.org/abs/2310.20707;2
279
  nyu-mll/glue;ax;oscar-corpus/OSCAR-2301;;corpus;;;1.45;data-based;https://arxiv.org/abs/2310.20707;2
280
  nyu-mll/glue;ax;togethercomputer/RedPajama-Data-V2;;corpus;;;6.16;data-based;https://arxiv.org/abs/2310.20707;2
281
 
 
 
 
 
282
  nyu-mll/glue;mnli;GPT-3.5;;model;100.0;100.0;;model-based;https://hitz-zentroa.github.io/lm-contamination/blog/;7
283
 
 
 
284
  nyu-mll/glue;mnli-matched;EleutherAI/pile;;corpus;;;2.17;data-based;https://arxiv.org/abs/2310.20707;2
285
  nyu-mll/glue;mnli-matched;allenai/c4;;corpus;;;1.65;data-based;https://arxiv.org/abs/2310.20707;2
286
  nyu-mll/glue;mnli-matched;oscar-corpus/OSCAR-2301;;corpus;;;1.77;data-based;https://arxiv.org/abs/2310.20707;2
@@ -291,16 +267,26 @@ nyu-mll/glue;mnli-mismatched;allenai/c4;;corpus;;;1.73;data-based;https://arxiv.
291
  nyu-mll/glue;mnli-mismatched;oscar-corpus/OSCAR-2301;;corpus;;;1.91;data-based;https://arxiv.org/abs/2310.20707;2
292
  nyu-mll/glue;mnli-mismatched;togethercomputer/RedPajama-Data-V2;;corpus;;;2.17;data-based;https://arxiv.org/abs/2310.20707;2
293
 
 
 
294
  nyu-mll/glue;mrpc;EleutherAI/pile;;corpus;;;0.64;data-based;https://arxiv.org/abs/2310.20707;2
295
  nyu-mll/glue;mrpc;allenai/c4;;corpus;;;0.06;data-based;https://arxiv.org/abs/2310.20707;2
296
  nyu-mll/glue;mrpc;oscar-corpus/OSCAR-2301;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
297
  nyu-mll/glue;mrpc;togethercomputer/RedPajama-Data-V2;;corpus;;;1.16;data-based;https://arxiv.org/abs/2310.20707;2
298
 
 
 
 
 
299
  nyu-mll/glue;qnli;EleutherAI/pile;;corpus;;;1.48;data-based;https://arxiv.org/abs/2310.20707;2
300
  nyu-mll/glue;qnli;allenai/c4;;corpus;;;0.13;data-based;https://arxiv.org/abs/2310.20707;2
301
  nyu-mll/glue;qnli;oscar-corpus/OSCAR-2301;;corpus;;;0.04;data-based;https://arxiv.org/abs/2310.20707;2
302
  nyu-mll/glue;qnli;togethercomputer/RedPajama-Data-V2;;corpus;;;1.21;data-based;https://arxiv.org/abs/2310.20707;2
303
 
 
 
 
 
304
  nyu-mll/glue;rte;EleutherAI/pile;;corpus;;;0.13;data-based;https://arxiv.org/abs/2310.20707;2
305
  nyu-mll/glue;rte;GPT-3.5;;model;0.0;;0.0;model-based;https://arxiv.org/abs/2308.08493;3
306
  nyu-mll/glue;rte;GPT-3.5;;model;;71.00;;model-based;https://arxiv.org/abs/2311.06233;8
@@ -310,11 +296,21 @@ nyu-mll/glue;rte;allenai/c4;;corpus;;;0.2;data-based;https://arxiv.org/abs/2310.
310
  nyu-mll/glue;rte;oscar-corpus/OSCAR-2301;;corpus;;;0.17;data-based;https://arxiv.org/abs/2310.20707;2
311
  nyu-mll/glue;rte;togethercomputer/RedPajama-Data-V2;;corpus;;;67.47;data-based;https://arxiv.org/abs/2310.20707;2
312
 
 
 
 
 
 
 
313
  nyu-mll/glue;stsb;EleutherAI/pile;;corpus;;;11.09;data-based;https://arxiv.org/abs/2310.20707;2
314
  nyu-mll/glue;stsb;allenai/c4;;corpus;;;3.48;data-based;https://arxiv.org/abs/2310.20707;2
315
  nyu-mll/glue;stsb;oscar-corpus/OSCAR-2301;;corpus;;;3.12;data-based;https://arxiv.org/abs/2310.20707;2
316
  nyu-mll/glue;stsb;togethercomputer/RedPajama-Data-V2;;corpus;;;9.86;data-based;https://arxiv.org/abs/2310.20707;2
317
 
 
 
 
 
318
  nyu-mll/glue;wnli;EleutherAI/pile;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
319
  nyu-mll/glue;wnli;GPT-3.5;;model;0.0;;0.0;model-based;https://arxiv.org/abs/2308.08493;3
320
  nyu-mll/glue;wnli;GPT-3.5;;model;;12.68;;model-based;https://arxiv.org/abs/2311.06233;8
@@ -324,6 +320,10 @@ nyu-mll/glue;wnli;allenai/c4;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310
324
  nyu-mll/glue;wnli;oscar-corpus/OSCAR-2301;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
325
  nyu-mll/glue;wnli;togethercomputer/RedPajama-Data-V2;;corpus;;;2.05;data-based;https://arxiv.org/abs/2310.20707;2
326
 
 
 
 
 
327
  openai_humaneval;;EleutherAI/pile;;corpus;;;12.2;data-based;https://arxiv.org/abs/2403.04811;12
328
  openai_humaneval;;EleutherAI/pile;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
329
  openai_humaneval;;GPT-3.5-turbo;0613;model;;;23.79;model-based;https://arxiv.org/abs/2402.15938;16
 
244
  natural_questions;;GLaM;;model;;3.9;;data-based;https://arxiv.org/abs/2112.06905;13
245
  natural_questions;;GPT-3;;model;;;1.0;data-based;https://arxiv.org/abs/2005.14165;13
246
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
247
  nyu-mll/glue;ax;EleutherAI/pile;;corpus;;;5.07;data-based;https://arxiv.org/abs/2310.20707;2
248
  nyu-mll/glue;ax;allenai/c4;;corpus;;;1.99;data-based;https://arxiv.org/abs/2310.20707;2
249
  nyu-mll/glue;ax;oscar-corpus/OSCAR-2301;;corpus;;;1.45;data-based;https://arxiv.org/abs/2310.20707;2
250
  nyu-mll/glue;ax;togethercomputer/RedPajama-Data-V2;;corpus;;;6.16;data-based;https://arxiv.org/abs/2310.20707;2
251
 
252
+ nyu-mll/glue;boolq;allenai/c4;;corpus;;;2.4;data-based;https://arxiv.org/abs/2104.08758;6
253
+
254
+ nyu-mll/glue;cola;allenai/c4;;corpus;;;14.4;data-based;https://arxiv.org/abs/2104.08758;6
255
+
256
  nyu-mll/glue;mnli;GPT-3.5;;model;100.0;100.0;;model-based;https://hitz-zentroa.github.io/lm-contamination/blog/;7
257
 
258
+ nyu-mll/glue;mnli-hypothesis;allenai/c4;;corpus;;;14.2;data-based;https://arxiv.org/abs/2104.08758;6
259
+
260
  nyu-mll/glue;mnli-matched;EleutherAI/pile;;corpus;;;2.17;data-based;https://arxiv.org/abs/2310.20707;2
261
  nyu-mll/glue;mnli-matched;allenai/c4;;corpus;;;1.65;data-based;https://arxiv.org/abs/2310.20707;2
262
  nyu-mll/glue;mnli-matched;oscar-corpus/OSCAR-2301;;corpus;;;1.77;data-based;https://arxiv.org/abs/2310.20707;2
 
267
  nyu-mll/glue;mnli-mismatched;oscar-corpus/OSCAR-2301;;corpus;;;1.91;data-based;https://arxiv.org/abs/2310.20707;2
268
  nyu-mll/glue;mnli-mismatched;togethercomputer/RedPajama-Data-V2;;corpus;;;2.17;data-based;https://arxiv.org/abs/2310.20707;2
269
 
270
+ nyu-mll/glue;mnli-premise;allenai/c4;;corpus;;;15.2;data-based;https://arxiv.org/abs/2104.08758;6
271
+
272
  nyu-mll/glue;mrpc;EleutherAI/pile;;corpus;;;0.64;data-based;https://arxiv.org/abs/2310.20707;2
273
  nyu-mll/glue;mrpc;allenai/c4;;corpus;;;0.06;data-based;https://arxiv.org/abs/2310.20707;2
274
  nyu-mll/glue;mrpc;oscar-corpus/OSCAR-2301;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
275
  nyu-mll/glue;mrpc;togethercomputer/RedPajama-Data-V2;;corpus;;;1.16;data-based;https://arxiv.org/abs/2310.20707;2
276
 
277
+ nyu-mll/glue;mrpc-sentence-1;allenai/c4;;corpus;;;2.7;data-based;https://arxiv.org/abs/2104.08758;6
278
+
279
+ nyu-mll/glue;mrpc-sentence-2;allenai/c4;;corpus;;;2.7;data-based;https://arxiv.org/abs/2104.08758;6
280
+
281
  nyu-mll/glue;qnli;EleutherAI/pile;;corpus;;;1.48;data-based;https://arxiv.org/abs/2310.20707;2
282
  nyu-mll/glue;qnli;allenai/c4;;corpus;;;0.13;data-based;https://arxiv.org/abs/2310.20707;2
283
  nyu-mll/glue;qnli;oscar-corpus/OSCAR-2301;;corpus;;;0.04;data-based;https://arxiv.org/abs/2310.20707;2
284
  nyu-mll/glue;qnli;togethercomputer/RedPajama-Data-V2;;corpus;;;1.21;data-based;https://arxiv.org/abs/2310.20707;2
285
 
286
+ nyu-mll/glue;qnli-question;allenai/c4;;corpus;;;1.8;data-based;https://arxiv.org/abs/2104.08758;6
287
+
288
+ nyu-mll/glue;qnli-sentence;allenai/c4;;corpus;;;53.6;data-based;https://arxiv.org/abs/2104.08758;6
289
+
290
  nyu-mll/glue;rte;EleutherAI/pile;;corpus;;;0.13;data-based;https://arxiv.org/abs/2310.20707;2
291
  nyu-mll/glue;rte;GPT-3.5;;model;0.0;;0.0;model-based;https://arxiv.org/abs/2308.08493;3
292
  nyu-mll/glue;rte;GPT-3.5;;model;;71.00;;model-based;https://arxiv.org/abs/2311.06233;8
 
296
  nyu-mll/glue;rte;oscar-corpus/OSCAR-2301;;corpus;;;0.17;data-based;https://arxiv.org/abs/2310.20707;2
297
  nyu-mll/glue;rte;togethercomputer/RedPajama-Data-V2;;corpus;;;67.47;data-based;https://arxiv.org/abs/2310.20707;2
298
 
299
+ nyu-mll/glue;rte-sentence-1;allenai/c4;;corpus;;;6;data-based;https://arxiv.org/abs/2104.08758;6
300
+
301
+ nyu-mll/glue;rte-sentence-2;allenai/c4;;corpus;;;10.8;data-based;https://arxiv.org/abs/2104.08758;6
302
+
303
+ nyu-mll/glue;sst2;allenai/c4;;corpus;;;11;data-based;https://arxiv.org/abs/2104.08758;6
304
+
305
  nyu-mll/glue;stsb;EleutherAI/pile;;corpus;;;11.09;data-based;https://arxiv.org/abs/2310.20707;2
306
  nyu-mll/glue;stsb;allenai/c4;;corpus;;;3.48;data-based;https://arxiv.org/abs/2310.20707;2
307
  nyu-mll/glue;stsb;oscar-corpus/OSCAR-2301;;corpus;;;3.12;data-based;https://arxiv.org/abs/2310.20707;2
308
  nyu-mll/glue;stsb;togethercomputer/RedPajama-Data-V2;;corpus;;;9.86;data-based;https://arxiv.org/abs/2310.20707;2
309
 
310
+ nyu-mll/glue;stsb-sentence-1;allenai/c4;;corpus;;;18.3;data-based;https://arxiv.org/abs/2104.08758;6
311
+
312
+ nyu-mll/glue;stsb-sentence-2;allenai/c4;;corpus;;;18.6;data-based;https://arxiv.org/abs/2104.08758;6
313
+
314
  nyu-mll/glue;wnli;EleutherAI/pile;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
315
  nyu-mll/glue;wnli;GPT-3.5;;model;0.0;;0.0;model-based;https://arxiv.org/abs/2308.08493;3
316
  nyu-mll/glue;wnli;GPT-3.5;;model;;12.68;;model-based;https://arxiv.org/abs/2311.06233;8
 
320
  nyu-mll/glue;wnli;oscar-corpus/OSCAR-2301;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
321
  nyu-mll/glue;wnli;togethercomputer/RedPajama-Data-V2;;corpus;;;2.05;data-based;https://arxiv.org/abs/2310.20707;2
322
 
323
+ nyu-mll/glue;wnli-sentence-1;allenai/c4;;corpus;;;4.8;data-based;https://arxiv.org/abs/2104.08758;6
324
+
325
+ nyu-mll/glue;wnli-sentence-2;allenai/c4;;corpus;;;2.1;data-based;https://arxiv.org/abs/2104.08758;6
326
+
327
  openai_humaneval;;EleutherAI/pile;;corpus;;;12.2;data-based;https://arxiv.org/abs/2403.04811;12
328
  openai_humaneval;;EleutherAI/pile;;corpus;;;0.0;data-based;https://arxiv.org/abs/2310.20707;2
329
  openai_humaneval;;GPT-3.5-turbo;0613;model;;;23.79;model-based;https://arxiv.org/abs/2402.15938;16
postprocessing.py CHANGED
@@ -35,7 +35,7 @@ def main():
35
  if key != past_key:
36
  f.write("\n")
37
  past_key = key
38
- line = line[:3] + [""] + line[3:]
39
  f.write(";".join(line) + "\n")
40
 
41
 
 
35
  if key != past_key:
36
  f.write("\n")
37
  past_key = key
38
+ line = line[:3] + line[3:]
39
  f.write(";".join(line) + "\n")
40
 
41