cnatale/Mistral-7B-Instruct-v0.1-Txt-2-Presto-SQL

Files changed (7) hide show

README.md CHANGED Viewed

@@ -20,7 +20,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.1](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1) on the generator dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.6078
 ## Model description
@@ -53,12 +53,12 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 0.8119        | 1.33  | 20   | 0.7276          |
-| 0.6364        | 2.67  | 40   | 0.6203          |
-| 0.5394        | 4.0   | 60   | 0.5812          |
-| 0.4848        | 5.33  | 80   | 0.5949          |
-| 0.4164        | 6.67  | 100  | 0.6019          |
-| 0.385         | 8.0   | 120  | 0.6078          |
 ### Framework versions

 This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.1](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1) on the generator dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.6143
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 0.8588        | 1.33  | 20   | 0.7602          |
+| 0.6494        | 2.67  | 40   | 0.6310          |
+| 0.5549        | 4.0   | 60   | 0.5919          |
+| 0.4855        | 5.33  | 80   | 0.6051          |
+| 0.4283        | 6.67  | 100  | 0.6050          |
+| 0.3904        | 8.0   | 120  | 0.6143          |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -19,8 +19,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "q_proj"
   ],
   "task_type": "CAUSAL_LM"
 }

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
+    "v_proj"
   ],
   "task_type": "CAUSAL_LM"
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:92dfefee380c7cc88a07e57586271a03466e5b59126e326892b8b810babc4821
 size 109069176

 version https://git-lfs.github.com/spec/v1
+oid sha256:1abbe85561b652b5746f919cb017f565519376439ecfe3740d496dfe8c3dd600
 size 109069176

runs/Jan02_00-57-36_c16c6898537f/events.out.tfevents.1704157057.c16c6898537f.1158.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b6b6de26b6da2df5c2dbbad3640481fa529143612092a932311e966b30f6146
+size 8617

special_tokens_map.json CHANGED Viewed

@@ -13,6 +13,7 @@
     "rstrip": false,
     "single_word": false
   },
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

     "rstrip": false,
     "single_word": false
   },
+  "pad_token": "</s>",
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

tokenizer_config.json CHANGED Viewed

@@ -33,7 +33,7 @@
   "eos_token": "</s>",
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
-  "pad_token": null,
   "sp_model_kwargs": {},
   "spaces_between_special_tokens": false,
   "tokenizer_class": "LlamaTokenizer",

   "eos_token": "</s>",
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "</s>",
   "sp_model_kwargs": {},
   "spaces_between_special_tokens": false,
   "tokenizer_class": "LlamaTokenizer",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd5223a55753e94567b8eb2e919eec3d9a40cc5b2d056802d9259112f247e0ed
 size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:31696b5a25f77c15b40627919ea506fa6982e8d8c8ad696eecdb750ddaf0ac09
 size 4728