Muennighoff committed on Feb 13, 2023

Commit

076928f

1 Parent(s): afa9fd2

Add babi

Browse files

Files changed (30) hide show

2b855b50c4py/evaluation/2b855b50c4py_0_babi.json +22 -0
2b855b50c4py/evaluation/2b855b50c4py_1_babi.json +22 -0
2b855b50c4py/evaluation/2b855b50c4py_2_babi.json +22 -0
2b855b50c4py/evaluation/2b855b50c4py_3_babi.json +22 -0
2b855b50c4py/evaluation/2b855b50c4py_4_babi.json +22 -0
2b855b50c4py/evaluation/2b855b50c4py_5_babi.json +4 -4
2b855b60c4py/evaluation/2b855b60c4py_0_babi.json +22 -0
2b855b60c4py/evaluation/2b855b60c4py_1_babi.json +22 -0
2b855b60c4py/evaluation/2b855b60c4py_2_babi.json +22 -0
2b855b60c4py/evaluation/2b855b60c4py_3_babi.json +22 -0
2b855b60c4py/evaluation/2b855b60c4py_4_babi.json +22 -0
2b855b60c4py/evaluation/2b855b60c4py_5_babi.json +4 -4
2b855b70c4py/evaluation/2b855b70c4py_0_babi.json +22 -0
2b855b70c4py/evaluation/2b855b70c4py_1_babi.json +22 -0
2b855b70c4py/evaluation/2b855b70c4py_2_babi.json +22 -0
2b855b70c4py/evaluation/2b855b70c4py_3_babi.json +22 -0
2b855b70c4py/evaluation/2b855b70c4py_4_babi.json +22 -0
2b855b70c4py/evaluation/2b855b70c4py_5_babi.json +4 -4
2b855b80c4py/evaluation/2b855b80c4py_0_babi.json +22 -0
2b855b80c4py/evaluation/2b855b80c4py_1_babi.json +22 -0
2b855b80c4py/evaluation/2b855b80c4py_2_babi.json +22 -0
2b855b80c4py/evaluation/2b855b80c4py_3_babi.json +22 -0
2b855b80c4py/evaluation/2b855b80c4py_4_babi.json +22 -0
2b855b80c4py/evaluation/2b855b80c4py_5_babi.json +4 -4
2b855b90c4py/evaluation/2b855b90c4py_0_babi.json +22 -0
2b855b90c4py/evaluation/2b855b90c4py_1_babi.json +22 -0
2b855b90c4py/evaluation/2b855b90c4py_2_babi.json +22 -0
2b855b90c4py/evaluation/2b855b90c4py_3_babi.json +22 -0
2b855b90c4py/evaluation/2b855b90c4py_4_babi.json +22 -0
2b855b90c4py/evaluation/2b855b90c4py_5_babi.json +4 -4

2b855b50c4py/evaluation/2b855b50c4py_0_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.0,
+      "em_stderr": 0.0
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b50c4py/transformers",
+    "num_fewshot": 0,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b50c4py/evaluation/2b855b50c4py_1_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.06666666666666667,
+      "em_stderr": 0.004554959563627512
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b50c4py/transformers",
+    "num_fewshot": 1,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b50c4py/evaluation/2b855b50c4py_2_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.14633333333333334,
+      "em_stderr": 0.006453979205019232
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b50c4py/transformers",
+    "num_fewshot": 2,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b50c4py/evaluation/2b855b50c4py_3_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.2,
+      "em_stderr": 0.007304184899016065
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b50c4py/transformers",
+    "num_fewshot": 3,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b50c4py/evaluation/2b855b50c4py_4_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.235,
+      "em_stderr": 0.007742414459363012
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b50c4py/transformers",
+    "num_fewshot": 4,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b50c4py/evaluation/2b855b50c4py_5_babi.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "results": {
     "babi": {
-      "em": 0.26600441501103755,
-      "em_stderr": 0.014688141802812468
+      "em": 0.25866666666666666,
+      "em_stderr": 0.007996294203008543
     }
   },
   "versions": {
@@ -14,8 +14,8 @@
     "num_fewshot": 5,
     "batch_size": null,
     "device": null,
-    "no_cache": false,
-    "limit": 906,
+    "no_cache": true,
+    "limit": 3000,
     "bootstrap_iters": 100000,
     "description_dict": {}
   }

2b855b60c4py/evaluation/2b855b60c4py_0_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.0,
+      "em_stderr": 0.0
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b60c4py/transformers",
+    "num_fewshot": 0,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b60c4py/evaluation/2b855b60c4py_1_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.07366666666666667,
+      "em_stderr": 0.0047701377724078675
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b60c4py/transformers",
+    "num_fewshot": 1,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b60c4py/evaluation/2b855b60c4py_2_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.14433333333333334,
+      "em_stderr": 0.00641722689389614
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b60c4py/transformers",
+    "num_fewshot": 2,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b60c4py/evaluation/2b855b60c4py_3_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.193,
+      "em_stderr": 0.007206546429264379
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b60c4py/transformers",
+    "num_fewshot": 3,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b60c4py/evaluation/2b855b60c4py_4_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.23066666666666666,
+      "em_stderr": 0.007692392962423979
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b60c4py/transformers",
+    "num_fewshot": 4,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b60c4py/evaluation/2b855b60c4py_5_babi.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "results": {
     "babi": {
-      "em": 0.2560706401766004,
-      "em_stderr": 0.014508464567494349
+      "em": 0.24633333333333332,
+      "em_stderr": 0.00786797575120501
     }
   },
   "versions": {
@@ -14,8 +14,8 @@
     "num_fewshot": 5,
     "batch_size": null,
     "device": null,
-    "no_cache": false,
-    "limit": 906,
+    "no_cache": true,
+    "limit": 3000,
     "bootstrap_iters": 100000,
     "description_dict": {}
   }

2b855b70c4py/evaluation/2b855b70c4py_0_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.0,
+      "em_stderr": 0.0
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 0,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b70c4py/evaluation/2b855b70c4py_1_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.071,
+      "em_stderr": 0.004689740350472808
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 1,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b70c4py/evaluation/2b855b70c4py_2_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.149,
+      "em_stderr": 0.006502340102527321
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 2,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b70c4py/evaluation/2b855b70c4py_3_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.19233333333333333,
+      "em_stderr": 0.007197060045498059
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 3,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b70c4py/evaluation/2b855b70c4py_4_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.21133333333333335,
+      "em_stderr": 0.007454911831939557
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 4,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b70c4py/evaluation/2b855b70c4py_5_babi.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "results": {
     "babi": {
-      "em": 0.2229580573951435,
-      "em_stderr": 0.013835967302718943
+      "em": 0.22633333333333333,
+      "em_stderr": 0.007641224680860716
     }
   },
   "versions": {
@@ -14,8 +14,8 @@
     "num_fewshot": 5,
     "batch_size": null,
     "device": null,
-    "no_cache": false,
-    "limit": 906,
+    "no_cache": true,
+    "limit": 3000,
     "bootstrap_iters": 100000,
     "description_dict": {}
   }

2b855b80c4py/evaluation/2b855b80c4py_0_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.0,
+      "em_stderr": 0.0
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 0,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b80c4py/evaluation/2b855b80c4py_1_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.071,
+      "em_stderr": 0.004689740350472808
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 1,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b80c4py/evaluation/2b855b80c4py_2_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.149,
+      "em_stderr": 0.006502340102527321
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 2,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b80c4py/evaluation/2b855b80c4py_3_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.19233333333333333,
+      "em_stderr": 0.007197060045498059
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 3,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b80c4py/evaluation/2b855b80c4py_4_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.21133333333333335,
+      "em_stderr": 0.007454911831939557
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b70c4py/transformers",
+    "num_fewshot": 4,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b80c4py/evaluation/2b855b80c4py_5_babi.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "results": {
     "babi": {
-      "em": 0.2229580573951435,
-      "em_stderr": 0.013835967302718943
+      "em": 0.22633333333333333,
+      "em_stderr": 0.007641224680860716
     }
   },
   "versions": {
@@ -14,8 +14,8 @@
     "num_fewshot": 5,
     "batch_size": null,
     "device": null,
-    "no_cache": false,
-    "limit": 906,
+    "no_cache": true,
+    "limit": 3000,
     "bootstrap_iters": 100000,
     "description_dict": {}
   }

2b855b90c4py/evaluation/2b855b90c4py_0_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.0,
+      "em_stderr": 0.0
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b90c4py/transformers",
+    "num_fewshot": 0,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b90c4py/evaluation/2b855b90c4py_1_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.012,
+      "em_stderr": 0.0019882951925181257
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b90c4py/transformers",
+    "num_fewshot": 1,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b90c4py/evaluation/2b855b90c4py_2_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.03866666666666667,
+      "em_stderr": 0.0035206036511572203
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b90c4py/transformers",
+    "num_fewshot": 2,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b90c4py/evaluation/2b855b90c4py_3_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.06566666666666666,
+      "em_stderr": 0.004523089426985369
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b90c4py/transformers",
+    "num_fewshot": 3,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b90c4py/evaluation/2b855b90c4py_4_babi.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "results": {
+    "babi": {
+      "em": 0.07433333333333333,
+      "em_stderr": 0.004789948938479642
+    }
+  },
+  "versions": {
+    "babi": 0
+  },
+  "config": {
+    "model": "gpt2",
+    "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-c4py/2b855b90c4py/transformers",
+    "num_fewshot": 4,
+    "batch_size": null,
+    "device": null,
+    "no_cache": true,
+    "limit": 3000,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

2b855b90c4py/evaluation/2b855b90c4py_5_babi.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "results": {
     "babi": {
-      "em": 0.07836644591611479,
-      "em_stderr": 0.008933464682765763
+      "em": 0.08333333333333333,
+      "em_stderr": 0.005046925147795103
     }
   },
   "versions": {
@@ -14,8 +14,8 @@
     "num_fewshot": 5,
     "batch_size": null,
     "device": null,
-    "no_cache": false,
-    "limit": 906,
+    "no_cache": true,
+    "limit": 3000,
     "bootstrap_iters": 100000,
     "description_dict": {}
   }