Lguyogiro committed on
Commit
1556da5
·
verified ·
1 Parent(s): 7140b0b

Upload tokenizer

Browse files
Files changed (2) hide show
  1. README.md +4 -4
  2. vocab.json +33 -33
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
  license: cc-by-nc-4.0
3
- base_model: facebook/mms-1b-all
4
  tags:
5
  - generated_from_trainer
 
6
  datasets:
7
  - audiofolder
8
  metrics:
@@ -11,8 +11,8 @@ model-index:
11
  - name: wav2vec2-large-mms-1b-nhi-adapterft-orig-ortho_fold1
12
  results:
13
  - task:
14
- name: Automatic Speech Recognition
15
  type: automatic-speech-recognition
 
16
  dataset:
17
  name: audiofolder
18
  type: audiofolder
@@ -20,9 +20,9 @@ model-index:
20
  split: test
21
  args: default
22
  metrics:
23
- - name: Wer
24
- type: wer
25
  value: 0.4133971291866029
 
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
1
  ---
2
  license: cc-by-nc-4.0
 
3
  tags:
4
  - generated_from_trainer
5
+ base_model: facebook/mms-1b-all
6
  datasets:
7
  - audiofolder
8
  metrics:
 
11
  - name: wav2vec2-large-mms-1b-nhi-adapterft-orig-ortho_fold1
12
  results:
13
  - task:
 
14
  type: automatic-speech-recognition
15
+ name: Automatic Speech Recognition
16
  dataset:
17
  name: audiofolder
18
  type: audiofolder
 
20
  split: test
21
  args: default
22
  metrics:
23
+ - type: wer
 
24
  value: 0.4133971291866029
25
+ name: Wer
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
vocab.json CHANGED
@@ -1,40 +1,40 @@
1
  {
2
  "nhi": {
3
- "2": 1,
4
- "8": 2,
5
  "[PAD]": 35,
6
  "[UNK]": 34,
7
- "_": 3,
8
- "a": 4,
9
- "b": 5,
10
- "c": 6,
11
- "d": 7,
12
- "e": 8,
13
- "f": 9,
14
- "g": 10,
15
- "h": 11,
16
- "i": 12,
17
- "j": 13,
18
- "k": 14,
19
- "l": 15,
20
- "m": 16,
21
- "n": 17,
22
- "o": 18,
23
- "p": 19,
24
- "q": 20,
25
- "r": 21,
26
- "s": 22,
27
- "t": 23,
28
- "u": 24,
29
- "v": 25,
30
- "w": 26,
31
- "x": 27,
32
- "y": 28,
33
- "z": 29,
34
  "|": 0,
35
- "¨": 30,
36
- "´": 31,
37
- "¿": 32,
38
- "ñ": 33
 
 
 
39
  }
40
  }
 
1
  {
2
  "nhi": {
 
 
3
  "[PAD]": 35,
4
  "[UNK]": 34,
5
+ "a": 1,
6
+ "b": 2,
7
+ "c": 3,
8
+ "d": 4,
9
+ "e": 5,
10
+ "f": 6,
11
+ "g": 7,
12
+ "h": 8,
13
+ "i": 9,
14
+ "j": 10,
15
+ "k": 11,
16
+ "l": 12,
17
+ "m": 13,
18
+ "n": 14,
19
+ "o": 15,
20
+ "p": 16,
21
+ "q": 17,
22
+ "r": 18,
23
+ "s": 19,
24
+ "t": 20,
25
+ "u": 21,
26
+ "v": 22,
27
+ "w": 23,
28
+ "x": 24,
29
+ "y": 25,
30
+ "z": 26,
 
31
  "|": 0,
32
+ "á": 27,
33
+ "é": 28,
34
+ "ì": 29,
35
+ "í": 30,
36
+ "ñ": 31,
37
+ "ó": 32,
38
+ "ú": 33
39
  }
40
  }