cassanof committed on
Commit
7ac0864
1 Parent(s): 06ad8a5

r_full_1b-epoch1

Browse files
Files changed (4) hide show
  1. README.md +12 -28
  2. config.json +2 -2
  3. generation_config.json +1 -2
  4. model.safetensors +3 -0
README.md CHANGED
@@ -1,49 +1,33 @@
1
  ---
2
  license: bigscience-openrail-m
3
- datasets:
4
- - nuprl/MultiPL-T
5
- metrics:
6
- - code_eval
7
  library_name: transformers
8
  tags:
9
  - code
10
  - gpt_bigcode
 
 
 
 
11
  model-index:
12
- - name: MultiPLCoder-1b-Lua
13
  results:
14
  - task:
15
  type: text-generation
16
  dataset:
17
- type: nuprl/MultiPL-E
18
  name: MultiPL-HumanEval (Lua)
 
19
  metrics:
20
- - name: pass@1
21
- type: pass@1
22
  value: 0.173
 
23
  verified: true
24
- - name: MultiPLCoder-1b-Racket
25
- results:
26
- - task:
27
- type: text-generation
28
- dataset:
29
- type: nuprl/MultiPL-E
30
- name: MultiPL-HumanEval (Racket)
31
- metrics:
32
- - name: pass@1
33
- type: pass@1
34
  value: 0.113
 
35
  verified: true
36
- - name: MultiPLCoder-1b-OCaml
37
- results:
38
- - task:
39
- type: text-generation
40
- dataset:
41
- type: nuprl/MultiPL-E
42
- name: MultiPL-HumanEval (OCaml)
43
- metrics:
44
- - name: pass@1
45
- type: pass@1
46
  value: 0.097
 
47
  verified: true
48
  ---
49
  # MultiPLCoder-1b
 
1
  ---
2
  license: bigscience-openrail-m
 
 
 
 
3
  library_name: transformers
4
  tags:
5
  - code
6
  - gpt_bigcode
7
+ datasets:
8
+ - nuprl/MultiPL-T
9
+ metrics:
10
+ - code_eval
11
  model-index:
12
+ - name: MultiPLCoder-1b-OCaml
13
  results:
14
  - task:
15
  type: text-generation
16
  dataset:
 
17
  name: MultiPL-HumanEval (Lua)
18
+ type: nuprl/MultiPL-E
19
  metrics:
20
+ - type: pass@1
 
21
  value: 0.173
22
+ name: pass@1
23
  verified: true
24
+ - type: pass@1
 
 
 
 
 
 
 
 
 
25
  value: 0.113
26
+ name: pass@1
27
  verified: true
28
+ - type: pass@1
 
 
 
 
 
 
 
 
 
29
  value: 0.097
30
+ name: pass@1
31
  verified: true
32
  ---
33
  # MultiPLCoder-1b
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "jl_full_1b/checkpoint_16590",
3
  "activation_function": "gelu_pytorch_tanh",
4
  "architectures": [
5
  "GPTBigCodeForCausalLM"
@@ -32,7 +32,7 @@
32
  "summary_type": "cls_index",
33
  "summary_use_proj": true,
34
  "torch_dtype": "bfloat16",
35
- "transformers_version": "4.34.0",
36
  "use_cache": false,
37
  "validate_runner_input": true,
38
  "vocab_size": 49152
 
1
  {
2
+ "_name_or_path": "r_full_1b/checkpoint_2233",
3
  "activation_function": "gelu_pytorch_tanh",
4
  "architectures": [
5
  "GPTBigCodeForCausalLM"
 
32
  "summary_type": "cls_index",
33
  "summary_use_proj": true,
34
  "torch_dtype": "bfloat16",
35
+ "transformers_version": "4.37.2",
36
  "use_cache": false,
37
  "validate_runner_input": true,
38
  "vocab_size": 49152
generation_config.json CHANGED
@@ -2,6 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
- "transformers_version": "4.34.0",
6
- "use_cache": false
7
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
+ "transformers_version": "4.37.2"
 
6
  }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bdb35a2470d9f59dba53e2d81ba74dcbeba525bdd0ed0c431cc514323582b91
3
+ size 2274445296