veronica-girolimetti committed on
Commit
21a3881
1 Parent(s): d6f4f7e

Training in progress, step 150

Browse files
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "epfl-llm/meditron-7b",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "gate_proj",
 
 
24
  "k_proj",
25
  "o_proj",
26
- "down_proj",
27
- "v_proj",
28
- "q_proj",
29
- "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "unsloth/mistral-7b-v0.3-bnb-4bit",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "q_proj",
24
  "gate_proj",
25
+ "up_proj",
26
+ "v_proj",
27
  "k_proj",
28
  "o_proj",
29
+ "down_proj"
 
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0862f2be3a18c7c81a0c2496e90314de79df36adfc02aa503929484095abc990
3
- size 5117112704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82006092c7bc42be2d059e6e8787ea77406e49ecbfb11e3f2cf2124901f5019b
3
+ size 5368770952
runs/Nov20_21-16-49_d45c3fdb09f3/events.out.tfevents.1732137418.d45c3fdb09f3.3419.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b43bcfed2dd2d62e41e439f0796771cb18c33d08199bb361f8171861e36b08ea
3
+ size 11602
special_tokens_map.json CHANGED
@@ -1,28 +1,7 @@
1
  {
2
- "additional_special_tokens": [
3
- "[bib_ref]",
4
- "[/bib_ref]",
5
- "[fig_ref]",
6
- "[/fig_ref]",
7
- "[bib]",
8
- "[/bib]",
9
- "[fig]",
10
- "[/fig]",
11
- "[table]",
12
- "[/table]",
13
- "[formula]",
14
- "[/formula]"
15
- ],
16
  "bos_token": {
17
  "content": "<s>",
18
  "lstrip": false,
19
- "normalized": true,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "cls_token": {
24
- "content": "<CLS>",
25
- "lstrip": false,
26
  "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
@@ -30,26 +9,12 @@
30
  "eos_token": {
31
  "content": "</s>",
32
  "lstrip": false,
33
- "normalized": true,
34
- "rstrip": false,
35
- "single_word": false
36
- },
37
- "mask_token": {
38
- "content": "<MASK>",
39
- "lstrip": false,
40
  "normalized": false,
41
  "rstrip": false,
42
  "single_word": false
43
  },
44
  "pad_token": {
45
- "content": "<PAD>",
46
- "lstrip": false,
47
- "normalized": false,
48
- "rstrip": false,
49
- "single_word": false
50
- },
51
- "sep_token": {
52
- "content": "<SEP>",
53
  "lstrip": false,
54
  "normalized": false,
55
  "rstrip": false,
@@ -58,7 +23,7 @@
58
  "unk_token": {
59
  "content": "<unk>",
60
  "lstrip": false,
61
- "normalized": true,
62
  "rstrip": false,
63
  "single_word": false
64
  }
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "bos_token": {
3
  "content": "<s>",
4
  "lstrip": false,
 
 
 
 
 
 
 
5
  "normalized": false,
6
  "rstrip": false,
7
  "single_word": false
 
9
  "eos_token": {
10
  "content": "</s>",
11
  "lstrip": false,
 
 
 
 
 
 
 
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "pad_token": {
17
+ "content": "[control_768]",
 
 
 
 
 
 
 
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
 
23
  "unk_token": {
24
  "content": "<unk>",
25
  "lstrip": false,
26
+ "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
29
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
- size 499723
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37f00374dea48658ee8f5d0f21895b9bc55cb0103939607c8185bfd1c6ca1f89
3
+ size 587404
tokenizer_config.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:969128597ef42987d3235a68a16a144ffc4a6ff652783340129f5ee05e74e8b5
3
- size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ab2f7d06536b58b2556ecd875ce696f671e42bf94eb055a13e6b60f76500493
3
+ size 5560