dh-mc committed on
Commit
031ff20
·
1 Parent(s): 20bd1d6

re-run qwen2.5 smaller models

Browse files
llm_toolkit/eval_shots.py CHANGED
@@ -30,6 +30,7 @@ batch_size = int(os.getenv("BATCH_SIZE", 1))
30
  using_llama_factory = os.getenv("USING_LLAMA_FACTORY") == "true"
31
  max_new_tokens = int(os.getenv("MAX_NEW_TOKENS", 2048))
32
  start_num_shots = int(os.getenv("START_NUM_SHOTS", 0))
 
33
 
34
  print(
35
  model_name,
@@ -99,6 +100,7 @@ def evaluate_model_with_num_shots(
99
  model_name,
100
  data_path,
101
  start_num_shots=0,
 
102
  range_num_shots=[0, 5, 10, 20, 30, 40, 50],
103
  batch_size=1,
104
  max_new_tokens=2048,
@@ -109,6 +111,9 @@ def evaluate_model_with_num_shots(
109
  for num_shots in range_num_shots:
110
  if num_shots < start_num_shots:
111
  continue
 
 
 
112
 
113
  print(f"*** Evaluating with num_shots: {num_shots}")
114
 
@@ -157,6 +162,7 @@ evaluate_model_with_num_shots(
157
  max_new_tokens=max_new_tokens,
158
  device=device,
159
  start_num_shots=start_num_shots,
 
160
  )
161
 
162
  if is_cuda:
 
30
  using_llama_factory = os.getenv("USING_LLAMA_FACTORY") == "true"
31
  max_new_tokens = int(os.getenv("MAX_NEW_TOKENS", 2048))
32
  start_num_shots = int(os.getenv("START_NUM_SHOTS", 0))
33
+ end_num_shots = int(os.getenv("END_NUM_SHOTS", 50))
34
 
35
  print(
36
  model_name,
 
100
  model_name,
101
  data_path,
102
  start_num_shots=0,
103
+ end_num_shots=50,
104
  range_num_shots=[0, 5, 10, 20, 30, 40, 50],
105
  batch_size=1,
106
  max_new_tokens=2048,
 
111
  for num_shots in range_num_shots:
112
  if num_shots < start_num_shots:
113
  continue
114
+
115
+ if num_shots > end_num_shots:
116
+ break
117
 
118
  print(f"*** Evaluating with num_shots: {num_shots}")
119
 
 
162
  max_new_tokens=max_new_tokens,
163
  device=device,
164
  start_num_shots=start_num_shots,
165
+ end_num_shots=end_num_shots,
166
  )
167
 
168
  if is_cuda:
scripts/eval-mgtv-qwen2.5_3b.sh CHANGED
@@ -13,18 +13,18 @@ cat /etc/os-release
13
  lscpu
14
  grep MemTotal /proc/meminfo
15
 
16
- # $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-3B-Instruct
 
17
 
18
- # $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-1.5B-Instruct
19
 
20
- # $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-0.5B-Instruct
21
 
22
- # $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-3B-Instruct
23
 
24
- # $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-1.5B-Instruct
25
 
26
- # $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-0.5B-Instruct
27
 
28
- export START_NUM_SHOTS=40
29
  $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-0.5B-Instruct
30
 
 
13
  lscpu
14
  grep MemTotal /proc/meminfo
15
 
16
+ export USING_LLAMA_FACTORY=true
17
+ export LOAD_IN_4BIT=false
18
 
19
+ $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-3B-Instruct
20
 
21
+ $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-3B-Instruct
22
 
23
+ $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-1.5B-Instruct
24
 
25
+ $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-1.5B-Instruct
26
 
27
+ $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-0.5B-Instruct
28
 
 
29
  $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-0.5B-Instruct
30
 
scripts/eval-mgtv.sh CHANGED
@@ -1 +1 @@
1
- eval-mgtv-qwen2.5_4bit.sh
 
1
+ eval-mgtv-qwen2.5_3b.sh