Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
Torchaudio
Commits
0a5e29db
"src/git@developer.sourcefind.cn:renzhc/diffusers_dcu.git" did not exist on "f69511ecc618330212e7148265e1c0323d2fa5cf"
Unverified
Commit
0a5e29db
authored
Jul 27, 2020
by
Brandon Lin
Committed by
GitHub
Jul 27, 2020
Browse files
Add test for Speech Commands dataset (#824)
parent
6fcbff9c
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
109 additions
and
5 deletions
+109
-5
test/assets/SpeechCommands/speech_commands_v0.02/go/0a9f9af7_nohash_0.wav
...chCommands/speech_commands_v0.02/go/0a9f9af7_nohash_0.wav
+0
-0
test/datasets/datasets_test.py
test/datasets/datasets_test.py
+0
-5
test/datasets/speechcommands_test.py
test/datasets/speechcommands_test.py
+109
-0
No files found.
test/assets/SpeechCommands/speech_commands_v0.02/go/0a9f9af7_nohash_0.wav
deleted
100644 → 0
View file @
6fcbff9c
File deleted
test/datasets/datasets_test.py
View file @
0a5e29db
from
torchaudio.datasets.commonvoice
import
COMMONVOICE
from
torchaudio.datasets.commonvoice
import
COMMONVOICE
from
torchaudio.datasets.speechcommands
import
SPEECHCOMMANDS
from
torchaudio.datasets.utils
import
diskcache_iterator
,
bg_iterator
from
torchaudio.datasets.utils
import
diskcache_iterator
,
bg_iterator
from
torchaudio.datasets.vctk
import
VCTK
from
torchaudio.datasets.vctk
import
VCTK
from
torchaudio.datasets.cmuarctic
import
CMUARCTIC
from
torchaudio.datasets.cmuarctic
import
CMUARCTIC
...
@@ -18,10 +17,6 @@ class TestDatasets(TorchaudioTestCase):
...
@@ -18,10 +17,6 @@ class TestDatasets(TorchaudioTestCase):
data
=
VCTK
(
self
.
path
)
data
=
VCTK
(
self
.
path
)
data
[
0
]
data
[
0
]
def
test_speechcommands
(
self
):
data
=
SPEECHCOMMANDS
(
self
.
path
)
data
[
0
]
def
test_cmuarctic
(
self
):
def
test_cmuarctic
(
self
):
data
=
CMUARCTIC
(
self
.
path
)
data
=
CMUARCTIC
(
self
.
path
)
data
[
0
]
data
[
0
]
...
...
test/datasets/speechcommands_test.py
0 → 100644
View file @
0a5e29db
import
os
from
torchaudio.datasets
import
speechcommands
from
..common_utils
import
(
TempDirMixin
,
TorchaudioTestCase
,
get_whitenoise
,
normalize_wav
,
save_wav
,
)
LABELS
=
[
"bed"
,
"bird"
,
"cat"
,
"dog"
,
"down"
,
"eight"
,
"five"
,
"follow"
,
"forward"
,
"four"
,
"go"
,
"happy"
,
"house"
,
"learn"
,
"left"
,
"marvin"
,
"nine"
,
"no"
,
"off"
,
"on"
,
"one"
,
"right"
,
"seven"
,
"sheila"
,
"six"
,
"stop"
,
"three"
,
"tree"
,
"two"
,
"up"
,
"visual"
,
"wow"
,
"yes"
,
"zero"
,
]
class
TestSpeechCommands
(
TempDirMixin
,
TorchaudioTestCase
):
backend
=
"default"
root_dir
=
None
samples
=
[]
@
classmethod
def
setUp
(
cls
):
cls
.
root_dir
=
cls
.
get_base_temp_dir
()
dataset_dir
=
os
.
path
.
join
(
cls
.
root_dir
,
speechcommands
.
FOLDER_IN_ARCHIVE
,
speechcommands
.
URL
)
os
.
makedirs
(
dataset_dir
,
exist_ok
=
True
)
sample_rate
=
16000
# 16kHz sample rate
seed
=
0
for
label
in
LABELS
:
path
=
os
.
path
.
join
(
dataset_dir
,
label
)
os
.
makedirs
(
path
,
exist_ok
=
True
)
for
j
in
range
(
2
):
# generate hash ID for speaker
speaker
=
"{:08x}"
.
format
(
j
)
for
utterance
in
range
(
3
):
filename
=
f
"
{
speaker
}{
speechcommands
.
HASH_DIVIDER
}{
utterance
}
.wav"
file_path
=
os
.
path
.
join
(
path
,
filename
)
seed
+=
1
data
=
get_whitenoise
(
sample_rate
=
sample_rate
,
duration
=
0.01
,
n_channels
=
1
,
dtype
=
"int16"
,
seed
=
seed
,
)
save_wav
(
file_path
,
data
,
sample_rate
)
sample
=
(
normalize_wav
(
data
),
sample_rate
,
label
,
speaker
,
utterance
,
)
cls
.
samples
.
append
(
sample
)
def
testSpeechCommands
(
self
):
dataset
=
speechcommands
.
SPEECHCOMMANDS
(
self
.
root_dir
)
print
(
dataset
.
_path
)
num_samples
=
0
for
i
,
(
data
,
sample_rate
,
label
,
speaker_id
,
utterance_number
)
in
enumerate
(
dataset
):
self
.
assertEqual
(
data
,
self
.
samples
[
i
][
0
],
atol
=
5e-5
,
rtol
=
1e-8
)
assert
sample_rate
==
self
.
samples
[
i
][
1
]
assert
label
==
self
.
samples
[
i
][
2
]
assert
speaker_id
==
self
.
samples
[
i
][
3
]
assert
utterance_number
==
self
.
samples
[
i
][
4
]
num_samples
+=
1
assert
num_samples
==
len
(
self
.
samples
)
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment