inflaton committed on
Commit
f584ea4
·
1 Parent(s): 88d67f6

Qwen2.5 fine-tuned

Browse files
data/Mistral-7B-v0.3-Chinese-Chat_results.csv CHANGED
The diff for this file is too large to render. See raw diff
 
data/Qwen2.5-3B-Instruct_results.csv ADDED
The diff for this file is too large to render. See raw diff
 
scripts/eval-mgtv-qwen2.5.sh ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/sh
2
+
3
+ BASEDIR=$(dirname "$0")
4
+ cd $BASEDIR/..
5
+ echo Current Directory:
6
+ pwd
7
+
8
+ BASEDIR=`pwd`
9
+
10
+ nvidia-smi
11
+ uname -a
12
+ cat /etc/os-release
13
+ lscpu
14
+ grep MemTotal /proc/meminfo
15
+
16
+ export LOGICAL_REASONING_DATA_PATH=datasets/mgtv
17
+ export RESIZE_TOKEN_EMBEDDINGS=true
18
+ export USING_LLAMA_FACTORY=true
19
+ export USING_P1_PROMPT_TEMPLATE=false
20
+ #export LOAD_IN_4BIT=true
21
+
22
+ export MODEL_PREFIX=Qwen2.5-3B-Instruct
23
+ export MODEL_NAME=qwen/$MODEL_PREFIX
24
+
25
+ export LOGICAL_REASONING_RESULTS_PATH=data/${MODEL_PREFIX}_results.csv
26
+ export ADAPTER_PATH_BASE=llama-factory/saves/$MODEL_PREFIX
27
+
28
+ echo "Eval $MODEL_NAME with $ADAPTER_PATH_BASE"
29
+ python llm_toolkit/eval_logical_reasoning_all_epochs.py
scripts/eval-mgtv-shots-qwen2.5.sh ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/sh
2
+
3
+ BASEDIR=$(dirname "$0")
4
+ cd $BASEDIR/..
5
+ echo Current Directory:
6
+ pwd
7
+
8
+ BASEDIR=`pwd`
9
+
10
+ nvidia-smi
11
+ uname -a
12
+ cat /etc/os-release
13
+ lscpu
14
+ grep MemTotal /proc/meminfo
15
+
16
+ export START_NUM_SHOTS=5
17
+
18
+ $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-3B-Instruct
19
+
20
+ #$BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-7B-Instruct
scripts/tune-mgtv-bf16.sh CHANGED
@@ -25,8 +25,10 @@ export LOGICAL_REASONING_RESULTS_PATH=results/mgtv-results_bf16.csv
25
 
26
  # $BASEDIR/scripts/tune-lf_v2.sh internlm internlm2_5-7b-chat intern2
27
 
28
- $BASEDIR/scripts/tune-lf_v2.sh Qwen Qwen2.5-3B-Instruct qwen
29
 
30
- $BASEDIR/scripts/tune-lf_v2.sh Qwen Qwen2.5-1.5B-Instruct qwen
31
 
32
- $BASEDIR/scripts/tune-lf_v2.sh Qwen Qwen2.5-0.5B-Instruct qwen
 
 
 
25
 
26
  # $BASEDIR/scripts/tune-lf_v2.sh internlm internlm2_5-7b-chat intern2
27
 
28
+ $BASEDIR/scripts/tune-lf_v2.sh Qwen Qwen2.5-7B-Instruct qwen
29
 
30
+ #$BASEDIR/scripts/tune-lf_v2.sh Qwen Qwen2.5-3B-Instruct qwen
31
 
32
+ #$BASEDIR/scripts/tune-lf_v2.sh Qwen Qwen2.5-1.5B-Instruct qwen
33
+
34
+ #$BASEDIR/scripts/tune-lf_v2.sh Qwen Qwen2.5-0.5B-Instruct qwen