bjelkenhed committed on
Commit
6664ab6
1 Parent(s): b70d900
Files changed (2) hide show
  1. README.md +61 -0
  2. run.sh +2 -1
README.md ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+
3
+ ----------------------------------------------------------------
4
+ Clone the Whisper small or medium model project
5
+ ----------------------------------------------------------------
6
+
7
+ git clone https://huggingface.co/bjelkenhed/whisper-small-sv
8
+ git clone https://huggingface.co/bjelkenhed/whisper-medium-sv
9
+
10
+
11
+ ----------------------------------------------------------------
12
+ Install requirements
13
+ ----------------------------------------------------------------
14
+
15
+ sudo add-apt-repository -y ppa:jonathonf/ffmpeg-4
16
+ sudo apt update
17
+ sudo apt install -y ffmpeg
18
+ sudo apt-get install git-lfs
19
+
20
+ ----------------------------------------------------------------
21
+ Install python libraries
22
+ ----------------------------------------------------------------
23
+
24
+ env_name=babelbox
25
+
26
+ python3 -m venv $env_name
27
+
28
+ source ~/$env_name/bin/activate
29
+
30
+ git clone https://github.com/huggingface/community-events.git
31
+
32
+ pip install -r community-events/whisper-fine-tuning-event/requirements.txt
33
+
34
+ python -c "import torch; print(torch.cuda.is_available())"
35
+
36
+
37
+ ----------------------------------------------------------------
38
+ Log in to Hugging Face
39
+ ----------------------------------------------------------------
40
+
41
+ git config --global credential.helper store
42
+ huggingface-cli login
43
+
44
+ Enter your Hugging Face access token when prompted
45
+
46
+
47
+ ----------------------------------------------------------------
48
+ Create a new HF model repo or clone an existing one
49
+ ----------------------------------------------------------------
50
+
51
+ #huggingface-cli repo create whisper-small-sv
52
+
53
+ git clone https://huggingface.co/bjelkenhed/whisper-small-sv
54
+
55
+ git config --global user.email "bjelkenhed@gmail.com"
56
+ git config --global user.name "Magnus Bjelkenhed"
57
+
58
+ tmux new -s mysession
59
+
60
+
61
+ tmux a -t mysession
run.sh CHANGED
@@ -10,8 +10,9 @@ python run_speech_recognition_seq2seq_streaming.py \
10
  --model_index_name="Whisper Small Swedish" \
11
  --max_steps="5000" \
12
  --output_dir="./" \
13
- --per_device_train_batch_size="64" \
14
  --per_device_eval_batch_size="32" \
 
15
  --logging_steps="25" \
16
  --learning_rate="1e-5" \
17
  --warmup_steps="500" \
 
10
  --model_index_name="Whisper Small Swedish" \
11
  --max_steps="5000" \
12
  --output_dir="./" \
13
+ --per_device_train_batch_size="32" \
14
  --per_device_eval_batch_size="32" \
15
+ --gradient_accumulation_steps="2" \
16
  --logging_steps="25" \
17
  --learning_rate="1e-5" \
18
  --warmup_steps="500" \