tanthinhdt
committed on
Upload folder using huggingface_hub
Browse files
- .gitattributes +4 -0
- test/vasr/audio/cer.132842 +25 -0
- test/vasr/audio/decode.log +0 -0
- test/vasr/audio/decode_test.log +3 -0
- test/vasr/audio/hypo-132842.json +3 -0
- test/vasr/audio/wer.132842 +25 -0
- test/vasr/audio_visual/cer.132842 +25 -0
- test/vasr/audio_visual/decode.log +0 -0
- test/vasr/audio_visual/decode_test.log +3 -0
- test/vasr/audio_visual/hypo-132842.json +3 -0
- test/vasr/audio_visual/wer.132842 +25 -0
.gitattributes
CHANGED
@@ -35,3 +35,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
test/decode_test.log filter=lfs diff=lfs merge=lfs -text
|
37 |
test/hypo-132842.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
test/decode_test.log filter=lfs diff=lfs merge=lfs -text
|
37 |
test/hypo-132842.json filter=lfs diff=lfs merge=lfs -text
|
38 |
+
test/vasr/audio/decode_test.log filter=lfs diff=lfs merge=lfs -text
|
39 |
+
test/vasr/audio/hypo-132842.json filter=lfs diff=lfs merge=lfs -text
|
40 |
+
test/vasr/audio_visual/decode_test.log filter=lfs diff=lfs merge=lfs -text
|
41 |
+
test/vasr/audio_visual/hypo-132842.json filter=lfs diff=lfs merge=lfs -text
|
test/vasr/audio/cer.132842
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
CER: 8.092690478125157
|
2 |
+
err / num_ref_chars = 156363 / 1932151
|
3 |
+
|
4 |
+
_name: null
|
5 |
+
max_length: 300
|
6 |
+
max_new_tokens: null
|
7 |
+
min_length: 0
|
8 |
+
min_new_tokens: null
|
9 |
+
max_time: null
|
10 |
+
do_sample: false
|
11 |
+
num_beams: 20
|
12 |
+
num_beam_groups: 1
|
13 |
+
temperature: 1.0
|
14 |
+
top_k: 50
|
15 |
+
top_p: 1.0
|
16 |
+
min_p: null
|
17 |
+
typical_p: 1.0
|
18 |
+
epsilon_cutoff: 0.0
|
19 |
+
eta_cutoff: 0.0
|
20 |
+
diversity_penalty: 0.0
|
21 |
+
repetition_penalty: 1.0
|
22 |
+
encoder_repetition_penalty: 1.0
|
23 |
+
length_penalty: 1.0
|
24 |
+
no_repeat_ngram_size: 0.0
|
25 |
+
exponential_decay_length_penalty: null
|
test/vasr/audio/decode.log
ADDED
File without changes
|
test/vasr/audio/decode_test.log
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38be3c45a4fce70c3c4f03e8f7b80d994aa680f4efe1ff1aaa4d3f105f784545
|
3 |
+
size 17238337
|
test/vasr/audio/hypo-132842.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0fc737bfeede00e79d13f762babf2a409d991ebaec6f62299c77832d018f091
|
3 |
+
size 12000529
|
test/vasr/audio/wer.132842
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
WER: 13.254824520514276
|
2 |
+
err / num_ref_words = 62558 / 471964
|
3 |
+
|
4 |
+
_name: null
|
5 |
+
max_length: 300
|
6 |
+
max_new_tokens: null
|
7 |
+
min_length: 0
|
8 |
+
min_new_tokens: null
|
9 |
+
max_time: null
|
10 |
+
do_sample: false
|
11 |
+
num_beams: 20
|
12 |
+
num_beam_groups: 1
|
13 |
+
temperature: 1.0
|
14 |
+
top_k: 50
|
15 |
+
top_p: 1.0
|
16 |
+
min_p: null
|
17 |
+
typical_p: 1.0
|
18 |
+
epsilon_cutoff: 0.0
|
19 |
+
eta_cutoff: 0.0
|
20 |
+
diversity_penalty: 0.0
|
21 |
+
repetition_penalty: 1.0
|
22 |
+
encoder_repetition_penalty: 1.0
|
23 |
+
length_penalty: 1.0
|
24 |
+
no_repeat_ngram_size: 0.0
|
25 |
+
exponential_decay_length_penalty: null
|
test/vasr/audio_visual/cer.132842
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
CER: 7.241048965634674
|
2 |
+
err / num_ref_chars = 139908 / 1932151
|
3 |
+
|
4 |
+
_name: null
|
5 |
+
max_length: 300
|
6 |
+
max_new_tokens: null
|
7 |
+
min_length: 0
|
8 |
+
min_new_tokens: null
|
9 |
+
max_time: null
|
10 |
+
do_sample: false
|
11 |
+
num_beams: 20
|
12 |
+
num_beam_groups: 1
|
13 |
+
temperature: 1.0
|
14 |
+
top_k: 50
|
15 |
+
top_p: 1.0
|
16 |
+
min_p: null
|
17 |
+
typical_p: 1.0
|
18 |
+
epsilon_cutoff: 0.0
|
19 |
+
eta_cutoff: 0.0
|
20 |
+
diversity_penalty: 0.0
|
21 |
+
repetition_penalty: 1.0
|
22 |
+
encoder_repetition_penalty: 1.0
|
23 |
+
length_penalty: 1.0
|
24 |
+
no_repeat_ngram_size: 0.0
|
25 |
+
exponential_decay_length_penalty: null
|
test/vasr/audio_visual/decode.log
ADDED
File without changes
|
test/vasr/audio_visual/decode_test.log
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1e88618adbd58943a01f40c7b61e0ef64647ea96a4c950f605ec27f282ccd29
|
3 |
+
size 17267482
|
test/vasr/audio_visual/hypo-132842.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86a8444a245523bab1bb21611afa2d543f4b5e1eb63a389689e05c7977274774
|
3 |
+
size 12026967
|
test/vasr/audio_visual/wer.132842
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
WER: 12.029095439482672
|
2 |
+
err / num_ref_words = 56773 / 471964
|
3 |
+
|
4 |
+
_name: null
|
5 |
+
max_length: 300
|
6 |
+
max_new_tokens: null
|
7 |
+
min_length: 0
|
8 |
+
min_new_tokens: null
|
9 |
+
max_time: null
|
10 |
+
do_sample: false
|
11 |
+
num_beams: 20
|
12 |
+
num_beam_groups: 1
|
13 |
+
temperature: 1.0
|
14 |
+
top_k: 50
|
15 |
+
top_p: 1.0
|
16 |
+
min_p: null
|
17 |
+
typical_p: 1.0
|
18 |
+
epsilon_cutoff: 0.0
|
19 |
+
eta_cutoff: 0.0
|
20 |
+
diversity_penalty: 0.0
|
21 |
+
repetition_penalty: 1.0
|
22 |
+
encoder_repetition_penalty: 1.0
|
23 |
+
length_penalty: 1.0
|
24 |
+
no_repeat_ngram_size: 0.0
|
25 |
+
exponential_decay_length_penalty: null
|