bjelkenhed
committed on
Commit
·
6664ab6
1
Parent(s):
b70d900
README
Browse files
README.md
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
|
3 |
+
----------------------------------------------------------------
|
4 |
+
Clone the Whisper small or medium model project
|
5 |
+
----------------------------------------------------------------
|
6 |
+
|
7 |
+
git clone https://huggingface.co/bjelkenhed/whisper-small-sv
|
8 |
+
git clone https://huggingface.co/bjelkenhed/whisper-medium-sv
|
9 |
+
|
10 |
+
|
11 |
+
----------------------------------------------------------------
|
12 |
+
Install requirements
|
13 |
+
----------------------------------------------------------------
|
14 |
+
|
15 |
+
sudo add-apt-repository -y ppa:jonathonf/ffmpeg-4
|
16 |
+
sudo apt update
|
17 |
+
sudo apt install -y ffmpeg
|
18 |
+
sudo apt-get install git-lfs
|
19 |
+
|
20 |
+
----------------------------------------------------------------
|
21 |
+
Install python libraries
|
22 |
+
----------------------------------------------------------------
|
23 |
+
|
24 |
+
env_name=babelbox
|
25 |
+
|
26 |
+
python3 -m venv $env_name
|
27 |
+
|
28 |
+
source ~/$env_name/bin/activate
|
29 |
+
|
30 |
+
git clone https://github.com/huggingface/community-events.git
|
31 |
+
|
32 |
+
pip install -r community-events/whisper-fine-tuning-event/requirements.txt
|
33 |
+
|
34 |
+
python -c "import torch; print(torch.cuda.is_available())"
|
35 |
+
|
36 |
+
|
37 |
+
----------------------------------------------------------------
|
38 |
+
Log in to Huggingface
|
39 |
+
----------------------------------------------------------------
|
40 |
+
|
41 |
+
git config --global credential.helper store
|
42 |
+
huggingface-cli login
|
43 |
+
|
44 |
+
Type your Huggingface access token
|
45 |
+
|
46 |
+
|
47 |
+
----------------------------------------------------------------
|
48 |
+
Create an HF model or clone an existing one
|
49 |
+
----------------------------------------------------------------
|
50 |
+
|
51 |
+
#huggingface-cli repo create whisper-small-sv
|
52 |
+
|
53 |
+
git clone https://huggingface.co/bjelkenhed/whisper-small-sv
|
54 |
+
|
55 |
+
git config --global user.email "[email protected]"
|
56 |
+
git config --global user.name "Magnus Bjelkenhed"
|
57 |
+
|
58 |
+
tmux new -s mysession
|
59 |
+
|
60 |
+
|
61 |
+
tmux a -t mysession
|
run.sh
CHANGED
@@ -10,8 +10,9 @@ python run_speech_recognition_seq2seq_streaming.py \
|
|
10 |
--model_index_name="Whisper Small Swedish" \
|
11 |
--max_steps="5000" \
|
12 |
--output_dir="./" \
|
13 |
-
--per_device_train_batch_size="
|
14 |
--per_device_eval_batch_size="32" \
|
|
|
15 |
--logging_steps="25" \
|
16 |
--learning_rate="1e-5" \
|
17 |
--warmup_steps="500" \
|
|
|
10 |
--model_index_name="Whisper Small Swedish" \
|
11 |
--max_steps="5000" \
|
12 |
--output_dir="./" \
|
13 |
+
--per_device_train_batch_size="32" \
|
14 |
--per_device_eval_batch_size="32" \
|
15 |
+
--gradient_accumulation_steps="2" \
|
16 |
--logging_steps="25" \
|
17 |
--learning_rate="1e-5" \
|
18 |
--warmup_steps="500" \
|