inflaton committed on
Commit
e9947be
·
1 Parent(s): fbf56c6

generic prompt results

Browse files
logs/internlm-7b.txt ADDED
The diff for this file is too large to render. See raw diff
 
results/mac-results_rpp_with_mnt_2048_generic_prompt.csv CHANGED
The diff for this file is too large to render. See raw diff
 
scripts/eval-4gpu.sh CHANGED
@@ -11,6 +11,8 @@ cat /etc/os-release
11
  lscpu
12
  grep MemTotal /proc/meminfo
13
 
 
 
14
  #pip install torch torchvision torchaudio
15
 
16
  # pip install -r requirements.txt
@@ -38,6 +40,6 @@ export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048_generic_prompt.csv
38
  # export USING_CHAT_TEMPLATE=true
39
  # export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048.csv
40
 
41
- ./scripts/eval-rpp.sh shenzhi-wang Llama3.1-70B-Chinese-Chat checkpoint-210
42
 
43
  ./scripts/eval-rpp.sh Qwen Qwen2-72B-Instruct checkpoint-560
 
11
  lscpu
12
  grep MemTotal /proc/meminfo
13
 
14
+ cd ../rapget-v2; python eval_modules/calc_bert_scores.py; cd -
15
+
16
  #pip install torch torchvision torchaudio
17
 
18
  # pip install -r requirements.txt
 
40
  # export USING_CHAT_TEMPLATE=true
41
  # export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048.csv
42
 
43
+ #./scripts/eval-rpp.sh shenzhi-wang Llama3.1-70B-Chinese-Chat checkpoint-210
44
 
45
  ./scripts/eval-rpp.sh Qwen Qwen2-72B-Instruct checkpoint-560
scripts/eval-h100.sh ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/sh
2
+
3
+ BASEDIR=$(dirname "$0")
4
+ cd $BASEDIR/..
5
+ echo Current Directory:
6
+ pwd
7
+
8
+ nvidia-smi
9
+ uname -a
10
+ cat /etc/os-release
11
+ lscpu
12
+ grep MemTotal /proc/meminfo
13
+
14
+ # pip install torch torchvision torchaudio
15
+ # pip install -r requirements.txt
16
+
17
+ # export START_NUM_SHOTS=50
18
+
19
+ export RESULTS_PATH=results/mac-results_few_shots.csv
20
+
21
+ # ./scripts/eval-model.sh internlm/internlm2_5-7b-chat
22
+
23
+ # ./scripts/eval-model.sh Qwen/Qwen2-7B-Instruct
24
+
25
+ # ./scripts/eval-model.sh shenzhi-wang/Mistral-7B-v0.3-Chinese-Chat
26
+
27
+ # ./scripts/eval-model.sh shenzhi-wang/Llama3.1-8B-Chinese-Chat
28
+
29
+ # ./scripts/eval-model.sh microsoft/Phi-3.5-mini-instruct
30
+
31
+ export RESULTS_PATH=results/mac-results_fine_tuned.csv
32
+
33
+ # ./scripts/eval-epochs.sh internlm internlm2_5-7b-chat
34
+
35
+ # ./scripts/eval-epochs.sh Qwen Qwen2-7B-Instruct
36
+
37
+ # ./scripts/eval-epochs.sh shenzhi-wang Mistral-7B-v0.3-Chinese-Chat
38
+
39
+ # ./scripts/eval-epochs.sh shenzhi-wang Llama3.1-8B-Chinese-Chat
40
+
41
+ # ./scripts/eval-epochs.sh microsoft Phi-3.5-mini-instruct
42
+
43
+ export MAX_NEW_TOKENS=2048
44
+ export START_REPETITION_PENALTY=1.0
45
+ export END_REPETITION_PENALTY=1.1
46
+
47
+ export USING_CHAT_TEMPLATE=false
48
+ export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048_generic_prompt.csv
49
+
50
+ # export USING_CHAT_TEMPLATE=true
51
+ # export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048.csv
52
+
53
+ #./scripts/eval-rpp.sh internlm internlm2_5-7b-chat checkpoint-140
54
+
55
+ #./scripts/eval-rpp.sh Qwen Qwen2-7B-Instruct checkpoint-105
56
+
57
+ export BATCH_SIZE=1
58
+ export LOAD_IN_4BIT=true
59
+
60
+ ./scripts/eval-rpp.sh Qwen Qwen2-72B-Instruct checkpoint-105
61
+
62
+
63
+ export BATCH_SIZE=4
64
+ export LOAD_IN_4BIT=false
65
+
66
+ ./scripts/eval-rpp.sh shenzhi-wang Mistral-7B-v0.3-Chinese-Chat checkpoint-70
67
+
68
+ ./scripts/eval-rpp.sh shenzhi-wang Llama3.1-8B-Chinese-Chat checkpoint-105
69
+
70
+ ./scripts/eval-rpp.sh microsoft Phi-3.5-mini-instruct checkpoint-210
scripts/eval-mac.sh CHANGED
@@ -50,9 +50,11 @@ export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048_generic_prompt.csv
50
  # export USING_CHAT_TEMPLATE=true
51
  # export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048.csv
52
 
53
- ./scripts/eval-rpp.sh internlm internlm2_5-7b-chat checkpoint-140
54
 
55
- ./scripts/eval-rpp.sh Qwen Qwen2-7B-Instruct checkpoint-105
 
 
56
 
57
  ./scripts/eval-rpp.sh shenzhi-wang Mistral-7B-v0.3-Chinese-Chat checkpoint-70
58
 
 
50
  # export USING_CHAT_TEMPLATE=true
51
  # export RESULTS_PATH=results/mac-results_rpp_with_mnt_2048.csv
52
 
53
+ #./scripts/eval-rpp.sh internlm internlm2_5-7b-chat checkpoint-140
54
 
55
+ #./scripts/eval-rpp.sh Qwen Qwen2-7B-Instruct checkpoint-105
56
+
57
+ cd ../rapget-v2; pip install -r requirements.txt; python eval_modules/calc_bert_scores.py; cd -
58
 
59
  ./scripts/eval-rpp.sh shenzhi-wang Mistral-7B-v0.3-Chinese-Chat checkpoint-70
60