update
Browse files
- .run_experiment2.sh.un~ +0 -0
- =0.26.0 +35 -0
- nb-distil-whisper-large-flax7 +1 -0
- run_experiment2.sh +2 -2
.run_experiment2.sh.un~
CHANGED
Binary files a/.run_experiment2.sh.un~ and b/.run_experiment2.sh.un~ differ
|
|
=0.26.0
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Requirement already satisfied: accelerate in /home/perk/distil-env/lib/python3.10/site-packages (1.1.1)
|
2 |
+
Requirement already satisfied: huggingface-hub>=0.21.0 in /home/perk/distil-env/lib/python3.10/site-packages (from accelerate) (0.26.2)
|
3 |
+
Requirement already satisfied: numpy<3.0.0,>=1.17 in /home/perk/distil-env/lib/python3.10/site-packages (from accelerate) (1.26.4)
|
4 |
+
Requirement already satisfied: packaging>=20.0 in /home/perk/distil-env/lib/python3.10/site-packages (from accelerate) (24.2)
|
5 |
+
Requirement already satisfied: psutil in /home/perk/distil-env/lib/python3.10/site-packages (from accelerate) (6.1.0)
|
6 |
+
Requirement already satisfied: pyyaml in /home/perk/distil-env/lib/python3.10/site-packages (from accelerate) (6.0.2)
|
7 |
+
Requirement already satisfied: safetensors>=0.4.3 in /home/perk/distil-env/lib/python3.10/site-packages (from accelerate) (0.4.5)
|
8 |
+
Requirement already satisfied: torch>=1.10.0 in /home/perk/distil-env/lib/python3.10/site-packages (from accelerate) (2.5.1)
|
9 |
+
Requirement already satisfied: filelock in /home/perk/distil-env/lib/python3.10/site-packages (from huggingface-hub>=0.21.0->accelerate) (3.16.1)
|
10 |
+
Requirement already satisfied: fsspec>=2023.5.0 in /home/perk/distil-env/lib/python3.10/site-packages (from huggingface-hub>=0.21.0->accelerate) (2024.9.0)
|
11 |
+
Requirement already satisfied: requests in /home/perk/distil-env/lib/python3.10/site-packages (from huggingface-hub>=0.21.0->accelerate) (2.32.3)
|
12 |
+
Requirement already satisfied: tqdm>=4.42.1 in /home/perk/distil-env/lib/python3.10/site-packages (from huggingface-hub>=0.21.0->accelerate) (4.67.0)
|
13 |
+
Requirement already satisfied: typing-extensions>=3.7.4.3 in /home/perk/distil-env/lib/python3.10/site-packages (from huggingface-hub>=0.21.0->accelerate) (4.12.2)
|
14 |
+
Requirement already satisfied: networkx in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (3.4.2)
|
15 |
+
Requirement already satisfied: jinja2 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (3.1.4)
|
16 |
+
Requirement already satisfied: nvidia-cuda-nvrtc-cu12==12.4.127 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (12.4.127)
|
17 |
+
Requirement already satisfied: nvidia-cuda-runtime-cu12==12.4.127 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (12.4.127)
|
18 |
+
Requirement already satisfied: nvidia-cuda-cupti-cu12==12.4.127 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (12.4.127)
|
19 |
+
Requirement already satisfied: nvidia-cudnn-cu12==9.1.0.70 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (9.1.0.70)
|
20 |
+
Requirement already satisfied: nvidia-cublas-cu12==12.4.5.8 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (12.4.5.8)
|
21 |
+
Requirement already satisfied: nvidia-cufft-cu12==11.2.1.3 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (11.2.1.3)
|
22 |
+
Requirement already satisfied: nvidia-curand-cu12==10.3.5.147 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (10.3.5.147)
|
23 |
+
Requirement already satisfied: nvidia-cusolver-cu12==11.6.1.9 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (11.6.1.9)
|
24 |
+
Requirement already satisfied: nvidia-cusparse-cu12==12.3.1.170 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (12.3.1.170)
|
25 |
+
Requirement already satisfied: nvidia-nccl-cu12==2.21.5 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (2.21.5)
|
26 |
+
Requirement already satisfied: nvidia-nvtx-cu12==12.4.127 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (12.4.127)
|
27 |
+
Requirement already satisfied: nvidia-nvjitlink-cu12==12.4.127 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (12.4.127)
|
28 |
+
Requirement already satisfied: triton==3.1.0 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (3.1.0)
|
29 |
+
Requirement already satisfied: sympy==1.13.1 in /home/perk/distil-env/lib/python3.10/site-packages (from torch>=1.10.0->accelerate) (1.13.1)
|
30 |
+
Requirement already satisfied: mpmath<1.4,>=1.1.0 in /home/perk/distil-env/lib/python3.10/site-packages (from sympy==1.13.1->torch>=1.10.0->accelerate) (1.3.0)
|
31 |
+
Requirement already satisfied: MarkupSafe>=2.0 in /home/perk/distil-env/lib/python3.10/site-packages (from jinja2->torch>=1.10.0->accelerate) (3.0.2)
|
32 |
+
Requirement already satisfied: charset-normalizer<4,>=2 in /home/perk/distil-env/lib/python3.10/site-packages (from requests->huggingface-hub>=0.21.0->accelerate) (3.4.0)
|
33 |
+
Requirement already satisfied: idna<4,>=2.5 in /home/perk/distil-env/lib/python3.10/site-packages (from requests->huggingface-hub>=0.21.0->accelerate) (3.10)
|
34 |
+
Requirement already satisfied: urllib3<3,>=1.21.1 in /home/perk/distil-env/lib/python3.10/site-packages (from requests->huggingface-hub>=0.21.0->accelerate) (2.2.3)
|
35 |
+
Requirement already satisfied: certifi>=2017.4.17 in /home/perk/distil-env/lib/python3.10/site-packages (from requests->huggingface-hub>=0.21.0->accelerate) (2024.8.30)
|
nb-distil-whisper-large-flax7
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
Subproject commit aae0a3f56d9db255e9f41ba6958dfaccf3cfdccf
|
run_experiment2.sh
CHANGED
@@ -21,7 +21,7 @@ TOKENIZERS_PARALLELISM=false python3 run_distillation.py \
|
|
21 |
--per_device_eval_batch_size 4 \
|
22 |
--dataloader_num_workers 8 \
|
23 |
--dtype "bfloat16" \
|
24 |
-
--output_dir "./nb-distil-whisper-
|
25 |
--do_train \
|
26 |
--do_eval \
|
27 |
--use_scan \
|
@@ -36,6 +36,6 @@ TOKENIZERS_PARALLELISM=false python3 run_distillation.py \
|
|
36 |
--wandb_name "flax_experiment1_bs4_v5_1e4_wer10" \
|
37 |
--save_code_to_wandb \
|
38 |
--save_train_state \
|
39 |
-
--hub_model_id "NbAiLab/nb-distil-whisper-large-
|
40 |
--push_to_hub
|
41 |
|
|
|
21 |
--per_device_eval_batch_size 4 \
|
22 |
--dataloader_num_workers 8 \
|
23 |
--dtype "bfloat16" \
|
24 |
+
--output_dir "./nb-distil-whisper-large-flax7" \
|
25 |
--do_train \
|
26 |
--do_eval \
|
27 |
--use_scan \
|
|
|
36 |
--wandb_name "flax_experiment1_bs4_v5_1e4_wer10" \
|
37 |
--save_code_to_wandb \
|
38 |
--save_train_state \
|
39 |
+
--hub_model_id "NbAiLab/nb-distil-whisper-large-flax7" \
|
40 |
--push_to_hub
|
41 |
|