Spaces:
Runtime error
Runtime error
anonymoussubmitter222
commited on
Commit
•
3485e08
1
Parent(s):
bf7e6b5
now handles stereo input
Browse files- TunisianASR/results/14epoch_tunisian/1234/app.py +6 -10
- TunisianASR/results/14epoch_tunisian/1234/env.log +1 -1
- TunisianASR/results/14epoch_tunisian/1234/log.txt +491 -0
- app.py +6 -10
- results/non_semi_final_stac/app.py +6 -10
- results/non_semi_final_stac/env.log +1 -1
- results/non_semi_final_stac/log.txt +0 -0
TunisianASR/results/14epoch_tunisian/1234/app.py
CHANGED
@@ -744,18 +744,9 @@ mixer.checkpointer.recover_if_possible(device="cpu")
|
|
744 |
mixer.modules.eval()
|
745 |
|
746 |
|
747 |
-
label_encoder = sb.dataio.encoder.CTCTextEncoder()
|
748 |
|
749 |
|
750 |
-
# We dynamicaly add the tokenizer to our brain class.
|
751 |
-
# NB: This tokenizer corresponds to the one used for the LM!!
|
752 |
|
753 |
-
decoder = build_ctcdecoder(
|
754 |
-
labels,
|
755 |
-
kenlm_model_path= "arpas/everything.arpa", # either .arpa or .bin file
|
756 |
-
alpha=0.5, # tuned on a val set
|
757 |
-
beta=1, # tuned on a val set
|
758 |
-
)
|
759 |
|
760 |
|
761 |
|
@@ -785,7 +776,12 @@ def treat_wav_file(file_mic,file_upload ,asr=mixer, device="cpu") :
|
|
785 |
wav = file_mic
|
786 |
else:
|
787 |
wav = file_upload
|
788 |
-
|
|
|
|
|
|
|
|
|
|
|
789 |
tensor_wav = sig.to(device)
|
790 |
resampled = torchaudio.functional.resample( tensor_wav, sr, 16000)
|
791 |
sentence = asr.treat_wav(resampled)
|
|
|
744 |
mixer.modules.eval()
|
745 |
|
746 |
|
|
|
747 |
|
748 |
|
|
|
|
|
749 |
|
|
|
|
|
|
|
|
|
|
|
|
|
750 |
|
751 |
|
752 |
|
|
|
776 |
wav = file_mic
|
777 |
else:
|
778 |
wav = file_upload
|
779 |
+
info = torchaudio.info(wav)
|
780 |
+
sr = info.sample_rate
|
781 |
+
sig = sb.dataio.dataio.read_audio(wav)
|
782 |
+
if len(sig.shape)>1 :
|
783 |
+
sig = torch.mean(sig, dim=1)
|
784 |
+
sig = torch.unsqueeze(sig, 0)
|
785 |
tensor_wav = sig.to(device)
|
786 |
resampled = torchaudio.functional.resample( tensor_wav, sr, 16000)
|
787 |
sentence = asr.treat_wav(resampled)
|
TunisianASR/results/14epoch_tunisian/1234/env.log
CHANGED
@@ -473,7 +473,7 @@ youtube-dl==2021.6.6
|
|
473 |
zipp==3.6.0
|
474 |
==============================
|
475 |
Git revision:
|
476 |
-
|
477 |
==============================
|
478 |
CUDA version:
|
479 |
11.7
|
|
|
473 |
zipp==3.6.0
|
474 |
==============================
|
475 |
Git revision:
|
476 |
+
bf7e6b5
|
477 |
==============================
|
478 |
CUDA version:
|
479 |
11.7
|
TunisianASR/results/14epoch_tunisian/1234/log.txt
CHANGED
@@ -1830,3 +1830,494 @@ zipp==3.6.0
|
|
1830 |
2023-09-25 12:30:16,221 - speechbrain.core - INFO - 314.4M trainable parameters in ASR
|
1831 |
2023-09-25 12:30:16,224 - speechbrain.utils.checkpoints - INFO - Loading a checkpoint from TunisianASR/results/14epoch_tunisian/1234/save/CKPT+2023-08-03+01-38-38+00
|
1832 |
2023-09-25 12:30:16,534 - speechbrain.utils.distributed - INFO - distributed_launch flag is disabled, this experiment will be executed without DDP.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1830 |
2023-09-25 12:30:16,221 - speechbrain.core - INFO - 314.4M trainable parameters in ASR
|
1831 |
2023-09-25 12:30:16,224 - speechbrain.utils.checkpoints - INFO - Loading a checkpoint from TunisianASR/results/14epoch_tunisian/1234/save/CKPT+2023-08-03+01-38-38+00
|
1832 |
2023-09-25 12:30:16,534 - speechbrain.utils.distributed - INFO - distributed_launch flag is disabled, this experiment will be executed without DDP.
|
1833 |
+
2023-09-25 15:14:42,745 - speechbrain.core - INFO - Beginning experiment!
|
1834 |
+
2023-09-25 15:14:42,745 - speechbrain.core - INFO - Experiment folder: TunisianASR/results/14epoch_tunisian/1234/
|
1835 |
+
2023-09-25 15:14:43,231 - speechbrain.utils.superpowers - DEBUG - abkhazia==1.0
|
1836 |
+
absl-py==0.11.0
|
1837 |
+
aiofiles==23.2.1
|
1838 |
+
aiohttp==3.8.0
|
1839 |
+
aiosignal==1.2.0
|
1840 |
+
alabaster==0.7.12
|
1841 |
+
alembic==1.7.4
|
1842 |
+
altair==4.2.0
|
1843 |
+
altgraph==0.17
|
1844 |
+
antlr4-python3-runtime==4.9.3
|
1845 |
+
anyio==3.6.2
|
1846 |
+
appdirs==1.4.4
|
1847 |
+
argcomplete==1.12.2
|
1848 |
+
argon2-cffi==20.1.0
|
1849 |
+
arrow==1.2.3
|
1850 |
+
asgiref==3.6.0
|
1851 |
+
asteroid-filterbanks==0.4.0
|
1852 |
+
astunparse==1.6.3
|
1853 |
+
async-generator==1.10
|
1854 |
+
async-timeout==4.0.0
|
1855 |
+
attrdict==2.0.1
|
1856 |
+
attrs==20.3.0
|
1857 |
+
audeer==1.16.0
|
1858 |
+
audformat==0.11.5
|
1859 |
+
audinterface==0.7.0
|
1860 |
+
audiofile==1.0.0
|
1861 |
+
audiomentations==0.25.0
|
1862 |
+
audioread==2.1.9
|
1863 |
+
audobject==0.4.14
|
1864 |
+
audresample==0.1.6
|
1865 |
+
-e git+https://github.com/facebookresearch/WavAugment.git@54afcdb00ccc852c2f030f239f8532c9562b550e#egg=augment
|
1866 |
+
autopage==0.4.0
|
1867 |
+
Babel==2.9.0
|
1868 |
+
backcall==0.2.0
|
1869 |
+
backports.cached-property==1.0.2
|
1870 |
+
beautifulsoup4==4.10.0
|
1871 |
+
black==19.10b0
|
1872 |
+
bleach==3.3.0
|
1873 |
+
blessed==1.20.0
|
1874 |
+
boto3==1.20.2
|
1875 |
+
botocore==1.23.2
|
1876 |
+
bpemb==0.3.4
|
1877 |
+
braceexpand==0.1.7
|
1878 |
+
cachetools==4.2.0
|
1879 |
+
certifi @ file:///croot/certifi_1671487769961/work/certifi
|
1880 |
+
cffi==1.14.3
|
1881 |
+
cfgv==3.2.0
|
1882 |
+
chardet==3.0.4
|
1883 |
+
charset-normalizer==2.0.7
|
1884 |
+
click==7.1.2
|
1885 |
+
cliff==3.9.0
|
1886 |
+
clldutils==3.5.4
|
1887 |
+
cloudpickle==2.2.1
|
1888 |
+
cmaes==0.8.2
|
1889 |
+
cmake==3.18.4.post1
|
1890 |
+
cmd2==2.2.0
|
1891 |
+
colorama==0.4.4
|
1892 |
+
colorlog==4.6.2
|
1893 |
+
configparser==5.1.0
|
1894 |
+
conllu==4.5.3
|
1895 |
+
croniter==1.3.15
|
1896 |
+
cryptography==38.0.4
|
1897 |
+
csrgraph==0.1.28
|
1898 |
+
csvw==1.8.1
|
1899 |
+
cycler==0.10.0
|
1900 |
+
Cython==0.29.21
|
1901 |
+
dataclasses==0.6
|
1902 |
+
dateutils==0.6.12
|
1903 |
+
decorator==4.4.2
|
1904 |
+
deepdiff==6.3.0
|
1905 |
+
deepspeech==0.9.1
|
1906 |
+
defusedxml==0.7.1
|
1907 |
+
Deprecated==1.2.14
|
1908 |
+
dill==0.3.3
|
1909 |
+
Distance==0.1.3
|
1910 |
+
distlib==0.3.1
|
1911 |
+
Django==3.2.16
|
1912 |
+
django-auditlog==2.2.1
|
1913 |
+
django-filter==22.1
|
1914 |
+
django-js-asset==1.2.2
|
1915 |
+
django-mptt==0.14.0
|
1916 |
+
djangorestframework==3.14.0
|
1917 |
+
docker-pycreds==0.4.0
|
1918 |
+
docopt==0.6.2
|
1919 |
+
docutils==0.16
|
1920 |
+
drf-excel==2.2.0
|
1921 |
+
drf-flex-fields==1.0.0
|
1922 |
+
drf-renderer-xlsx==0.4.1
|
1923 |
+
easyocr==1.2.1
|
1924 |
+
editdistance==0.6.0
|
1925 |
+
einops==0.3.2
|
1926 |
+
emoji==2.2.0
|
1927 |
+
entrypoints==0.3
|
1928 |
+
et-xmlfile==1.1.0
|
1929 |
+
exceptiongroup==1.1.0
|
1930 |
+
farasapy==0.0.14
|
1931 |
+
fastapi==0.98.0
|
1932 |
+
fastjsonschema==2.17.1
|
1933 |
+
fasttext==0.9.2
|
1934 |
+
ffmpeg-python==0.2.0
|
1935 |
+
ffmpy==0.3.0
|
1936 |
+
filelock==3.0.12
|
1937 |
+
flair==0.12.2
|
1938 |
+
flake8==3.7.9
|
1939 |
+
flatbuffers==1.12
|
1940 |
+
frozendict==2.0.7
|
1941 |
+
frozenlist==1.2.0
|
1942 |
+
fsspec==2021.11.0
|
1943 |
+
ftfy==6.1.1
|
1944 |
+
future==0.18.2
|
1945 |
+
g2p-en==2.1.0
|
1946 |
+
gast==0.3.3
|
1947 |
+
gdown==4.4.0
|
1948 |
+
gdrive==0.1.5
|
1949 |
+
gensim==4.0.1
|
1950 |
+
gitdb==4.0.9
|
1951 |
+
GitPython==3.1.24
|
1952 |
+
google-api-core==2.11.1
|
1953 |
+
google-api-python-client==2.43.0
|
1954 |
+
google-auth==1.24.0
|
1955 |
+
google-auth-httplib2==0.1.0
|
1956 |
+
google-auth-oauthlib==0.5.3
|
1957 |
+
google-pasta==0.2.0
|
1958 |
+
googleapis-common-protos==1.59.1
|
1959 |
+
gradio==3.44.4
|
1960 |
+
gradio-client==0.5.1
|
1961 |
+
greenlet==1.1.2
|
1962 |
+
grpcio==1.32.0
|
1963 |
+
h11==0.14.0
|
1964 |
+
h5features==1.3.2
|
1965 |
+
h5py==2.10.0
|
1966 |
+
hierarchy==0.4.0
|
1967 |
+
hmmlearn==0.2.8
|
1968 |
+
htk-io==0.5
|
1969 |
+
httpcore==0.16.3
|
1970 |
+
httplib2==0.22.0
|
1971 |
+
httpx==0.23.3
|
1972 |
+
huggingface-hub==0.15.1
|
1973 |
+
hydra-colorlog==0.1.4
|
1974 |
+
hydra-core==1.3.2
|
1975 |
+
hyperopt==0.2.7
|
1976 |
+
HyperPyYAML==1.1.0
|
1977 |
+
hypothesis==6.61.2
|
1978 |
+
identify==1.5.10
|
1979 |
+
idna==2.10
|
1980 |
+
imageio==2.9.0
|
1981 |
+
imagesize==1.2.0
|
1982 |
+
importlib-metadata==4.8.1
|
1983 |
+
importlib-resources==5.2.2
|
1984 |
+
inflect==5.3.0
|
1985 |
+
inquirer==3.1.3
|
1986 |
+
ipadic==1.0.0
|
1987 |
+
ipyevents==2.0.1
|
1988 |
+
ipykernel==5.3.4
|
1989 |
+
ipython==7.19.0
|
1990 |
+
ipython-genutils==0.2.0
|
1991 |
+
ipywebrtc==0.6.0
|
1992 |
+
ipywidgets==7.6.3
|
1993 |
+
iso-639==0.4.5
|
1994 |
+
isodate==0.6.0
|
1995 |
+
isort==4.3.21
|
1996 |
+
itsdangerous==2.1.2
|
1997 |
+
Janome==0.5.0
|
1998 |
+
jedi==0.17.2
|
1999 |
+
jeepney==0.8.0
|
2000 |
+
jieba==0.42.1
|
2001 |
+
Jinja2==3.0.3
|
2002 |
+
jiwer==2.2.0
|
2003 |
+
jmespath==0.10.0
|
2004 |
+
joblib==0.17.0
|
2005 |
+
jsonschema==3.2.0
|
2006 |
+
julius==0.2.7
|
2007 |
+
jupyter-client==6.1.7
|
2008 |
+
jupyter-core==4.7.0
|
2009 |
+
jupyterlab-pygments==0.1.2
|
2010 |
+
jupyterlab-widgets==1.0.0
|
2011 |
+
kaitaistruct==0.9
|
2012 |
+
kaldi-io==0.9.4
|
2013 |
+
kaldi-python-io==1.2.2
|
2014 |
+
kaldiio==2.17.2
|
2015 |
+
kenlm @ https://github.com/kpu/kenlm/archive/master.zip
|
2016 |
+
Keras-Preprocessing==1.1.2
|
2017 |
+
kiwisolver==1.3.1
|
2018 |
+
lang-trans==0.6.0
|
2019 |
+
langdetect==1.0.9
|
2020 |
+
latexcodec==2.0.1
|
2021 |
+
ldap3==2.9.1
|
2022 |
+
librosa==0.9.0
|
2023 |
+
lightning-cloud==0.5.37
|
2024 |
+
lightning-utilities==0.8.0
|
2025 |
+
linkify-it-py==1.0.3
|
2026 |
+
lit==16.0.6
|
2027 |
+
llvmlite==0.35.0
|
2028 |
+
lxml==4.9.0
|
2029 |
+
Mako==1.1.5
|
2030 |
+
Markdown==3.3.3
|
2031 |
+
markdown-it-py==3.0.0
|
2032 |
+
MarkupSafe==2.1.3
|
2033 |
+
marshmallow==3.14.0
|
2034 |
+
matplotlib==3.3.3
|
2035 |
+
mccabe==0.6.1
|
2036 |
+
mcd==0.4
|
2037 |
+
mdit-py-plugins==0.3.3
|
2038 |
+
mdurl==0.1.2
|
2039 |
+
mecab-python3==1.0.3
|
2040 |
+
megatron-lm==2.2.0
|
2041 |
+
metrics==0.3.3
|
2042 |
+
mido==1.2.10
|
2043 |
+
mistune==0.8.4
|
2044 |
+
more-itertools==8.6.0
|
2045 |
+
mpld3==0.3
|
2046 |
+
mpmath==1.2.1
|
2047 |
+
multidict==5.2.0
|
2048 |
+
multiprocess==0.70.11.1
|
2049 |
+
nbclient==0.5.3
|
2050 |
+
nbconvert==5.6.1
|
2051 |
+
nbformat==5.9.0
|
2052 |
+
NEMO==4.3.2
|
2053 |
+
nemo-toolkit==1.4.0
|
2054 |
+
nest-asyncio==1.5.1
|
2055 |
+
networkx==2.8.8
|
2056 |
+
nltk==3.2.4
|
2057 |
+
nodeenv==1.5.0
|
2058 |
+
normalize==2.0.2
|
2059 |
+
notebook==6.3.0
|
2060 |
+
numba==0.52.0
|
2061 |
+
numpy==1.19.4
|
2062 |
+
nvidia-cublas-cu11==11.10.3.66
|
2063 |
+
nvidia-cuda-cupti-cu11==11.7.101
|
2064 |
+
nvidia-cuda-nvrtc-cu11==11.7.99
|
2065 |
+
nvidia-cuda-runtime-cu11==11.7.99
|
2066 |
+
nvidia-cudnn-cu11==8.5.0.96
|
2067 |
+
nvidia-cufft-cu11==10.9.0.58
|
2068 |
+
nvidia-curand-cu11==10.2.10.91
|
2069 |
+
nvidia-cusolver-cu11==11.4.0.1
|
2070 |
+
nvidia-cusparse-cu11==11.7.4.91
|
2071 |
+
nvidia-nccl-cu11==2.14.3
|
2072 |
+
nvidia-nvtx-cu11==11.7.91
|
2073 |
+
oauthlib==3.1.0
|
2074 |
+
omegaconf==2.3.0
|
2075 |
+
onnx==1.10.2
|
2076 |
+
OpenCC==1.1.2
|
2077 |
+
opencv-python==4.4.0.46
|
2078 |
+
openpyxl==3.0.9
|
2079 |
+
opensmile==2.2.0
|
2080 |
+
opt-einsum==3.3.0
|
2081 |
+
optuna==2.10.0
|
2082 |
+
ordered-set==4.1.0
|
2083 |
+
orjson==3.8.4
|
2084 |
+
oyaml==1.0
|
2085 |
+
packaging==22.0
|
2086 |
+
pandas==1.2.5
|
2087 |
+
pandocfilters==1.4.3
|
2088 |
+
pangu==4.0.6.1
|
2089 |
+
parameterized==0.8.1
|
2090 |
+
parso==0.7.1
|
2091 |
+
pathlib2==2.3.7.post1
|
2092 |
+
pathspec==0.5.5
|
2093 |
+
pathtools==0.1.2
|
2094 |
+
pbr==5.6.0
|
2095 |
+
pefile==2019.4.18
|
2096 |
+
pescador==2.1.0
|
2097 |
+
pesq==0.0.3
|
2098 |
+
pexpect==4.8.0
|
2099 |
+
phonemizer==2.2.1
|
2100 |
+
pickleshare==0.7.5
|
2101 |
+
Pillow==9.3.0
|
2102 |
+
pip-api==0.0.23
|
2103 |
+
pipreqs==0.4.11
|
2104 |
+
pluggy==0.13.1
|
2105 |
+
pooch==1.3.0
|
2106 |
+
portalocker==2.3.2
|
2107 |
+
pptree==3.1
|
2108 |
+
pre-commit==2.9.0
|
2109 |
+
preprocessing==0.1.13
|
2110 |
+
pretty-midi==0.2.9
|
2111 |
+
prettytable==2.2.1
|
2112 |
+
primePy==1.3
|
2113 |
+
progressbar2==3.53.1
|
2114 |
+
prometheus-client==0.10.1
|
2115 |
+
promise==2.3
|
2116 |
+
prompt-toolkit==3.0.8
|
2117 |
+
protobuf==3.20.3
|
2118 |
+
psutil==5.6.6
|
2119 |
+
ptyprocess==0.6.0
|
2120 |
+
py==1.9.0
|
2121 |
+
py-espeak-ng==0.1.8
|
2122 |
+
py4j==0.10.9.7
|
2123 |
+
pyannote.audio==2.1.1
|
2124 |
+
pyannote.core==4.5
|
2125 |
+
pyannote.database==4.1.3
|
2126 |
+
pyannote.metrics==3.2.1
|
2127 |
+
pyannote.pipeline==2.3
|
2128 |
+
pyannotebook==0.1.0.dev0
|
2129 |
+
PyArabic==0.6.15
|
2130 |
+
pyarrow==3.0.0
|
2131 |
+
pyasn1==0.4.8
|
2132 |
+
pyasn1-modules==0.2.8
|
2133 |
+
pybind11==2.8.1
|
2134 |
+
pybtex==0.24.0
|
2135 |
+
pybtex-docutils==1.0.1
|
2136 |
+
pycodestyle==2.5.0
|
2137 |
+
pycparser==2.20
|
2138 |
+
pycryptodome==3.16.0
|
2139 |
+
pyctcdecode==0.4.0
|
2140 |
+
pydantic==1.10.4
|
2141 |
+
pyDeprecate==0.3.1
|
2142 |
+
pydub==0.25.1
|
2143 |
+
pyflakes==2.1.1
|
2144 |
+
Pygments==2.15.1
|
2145 |
+
pygtrie==2.5.0
|
2146 |
+
PyJWT==2.7.0
|
2147 |
+
pymodbus==2.5.3
|
2148 |
+
pyparsing==2.4.7
|
2149 |
+
pyperclip==1.8.2
|
2150 |
+
pypinyin==0.43.0
|
2151 |
+
pyrsistent==0.17.3
|
2152 |
+
pyserial==3.5
|
2153 |
+
PySocks==1.7.1
|
2154 |
+
pystoi==0.3.3
|
2155 |
+
pytest==5.4.1
|
2156 |
+
pytest-runner==5.3.1
|
2157 |
+
python-bidi==0.4.2
|
2158 |
+
python-crfsuite==0.9.7
|
2159 |
+
python-dateutil==2.8.2
|
2160 |
+
python-editor==1.0.4
|
2161 |
+
python-Levenshtein==0.12.2
|
2162 |
+
python-multipart==0.0.5
|
2163 |
+
python-utils==2.4.0
|
2164 |
+
pytorch-lightning==1.6.5
|
2165 |
+
pytorch-metric-learning==1.7.3
|
2166 |
+
pytorch-revgrad==0.2.0
|
2167 |
+
pytube==11.0.1
|
2168 |
+
pytz==2022.6
|
2169 |
+
PyWavelets==1.1.1
|
2170 |
+
PyYAML==6.0
|
2171 |
+
pyzmq==20.0.0
|
2172 |
+
rapidfuzz==1.8.2
|
2173 |
+
readchar==4.0.5
|
2174 |
+
regex==2020.11.13
|
2175 |
+
requests==2.28.1
|
2176 |
+
requests-oauthlib==1.3.0
|
2177 |
+
resampy==0.2.2
|
2178 |
+
rfc3986==1.4.0
|
2179 |
+
rich==13.4.2
|
2180 |
+
richenum==1.3.1
|
2181 |
+
rsa==4.7
|
2182 |
+
ruamel.yaml==0.17.21
|
2183 |
+
ruamel.yaml.clib==0.2.7
|
2184 |
+
s3m==1.1.0
|
2185 |
+
s3transfer==0.5.0
|
2186 |
+
sacrebleu==2.0.0
|
2187 |
+
sacremoses==0.0.44
|
2188 |
+
safetensors==0.3.1
|
2189 |
+
scikit-image==0.18.1
|
2190 |
+
scikit-learn==0.23.2
|
2191 |
+
scipy==1.5.4
|
2192 |
+
-e git+https://github.com/sanghack81/SDCIT@00d060dde733fde9345154a494f81e97fb395ca7#egg=SDCIT
|
2193 |
+
seaborn==0.11.1
|
2194 |
+
SecretStorage==3.3.3
|
2195 |
+
segments==2.1.3
|
2196 |
+
segtok==1.5.11
|
2197 |
+
semantic-version==2.10.0
|
2198 |
+
semver==2.13.0
|
2199 |
+
Send2Trash==1.5.0
|
2200 |
+
sentencepiece==0.1.99
|
2201 |
+
sentry-sdk==1.4.3
|
2202 |
+
shellingham==1.4.0
|
2203 |
+
shortuuid==1.0.7
|
2204 |
+
SIDEKIT==1.3.8.5.2
|
2205 |
+
simplejson==3.17.5
|
2206 |
+
singledispatchmethod==1.0
|
2207 |
+
six==1.15.0
|
2208 |
+
smart-open==5.0.0
|
2209 |
+
smmap==5.0.0
|
2210 |
+
sniffio==1.3.0
|
2211 |
+
snowballstemmer==2.0.0
|
2212 |
+
sortedcollections==2.1.0
|
2213 |
+
sortedcontainers==2.4.0
|
2214 |
+
sounddevice==0.4.5
|
2215 |
+
SoundFile==0.10.3.post1
|
2216 |
+
soupsieve==2.3
|
2217 |
+
sox==1.4.1
|
2218 |
+
sparsemax==0.1.9
|
2219 |
+
speechbrain==0.5.14
|
2220 |
+
sphfile==1.0.3
|
2221 |
+
Sphinx==3.3.1
|
2222 |
+
sphinx-rtd-theme==0.2.4
|
2223 |
+
sphinxcontrib-applehelp==1.0.2
|
2224 |
+
sphinxcontrib-bibtex==2.4.1
|
2225 |
+
sphinxcontrib-devhelp==1.0.2
|
2226 |
+
sphinxcontrib-htmlhelp==1.0.3
|
2227 |
+
sphinxcontrib-jsmath==1.0.1
|
2228 |
+
sphinxcontrib-qthelp==1.0.3
|
2229 |
+
sphinxcontrib-serializinghtml==1.1.4
|
2230 |
+
SQLAlchemy==1.4.25
|
2231 |
+
sqlitedict==2.1.0
|
2232 |
+
sqlparse==0.4.2
|
2233 |
+
stanza==1.4.2
|
2234 |
+
starlette==0.27.0
|
2235 |
+
starsessions==1.3.0
|
2236 |
+
stevedore==3.4.0
|
2237 |
+
subprocess32==3.5.4
|
2238 |
+
sympy==1.9
|
2239 |
+
tabulate==0.8.9
|
2240 |
+
tensorboard==2.4.0
|
2241 |
+
tensorboard-plugin-wit==1.7.0
|
2242 |
+
tensorboardX==2.6.1
|
2243 |
+
tensorflow==2.4.0
|
2244 |
+
tensorflow-estimator==2.4.0
|
2245 |
+
termcolor==1.1.0
|
2246 |
+
terminado==0.9.4
|
2247 |
+
testpath==0.4.4
|
2248 |
+
threadpoolctl==2.1.0
|
2249 |
+
tifffile==2020.12.8
|
2250 |
+
tikzplotlib==0.9.8
|
2251 |
+
tinycss2==1.2.1
|
2252 |
+
tkseem==0.0.3
|
2253 |
+
tokenizers==0.13.3
|
2254 |
+
toml==0.10.2
|
2255 |
+
toolz==0.12.0
|
2256 |
+
torch==1.13.1
|
2257 |
+
torch-audiomentations==0.11.0
|
2258 |
+
torch-pitch-shift==1.2.4
|
2259 |
+
torch-stft==0.1.4
|
2260 |
+
torchaudio==0.13.1
|
2261 |
+
torchmetrics==0.11.4
|
2262 |
+
torchvision==0.14.1
|
2263 |
+
tornado==6.1
|
2264 |
+
tqdm==4.61.1
|
2265 |
+
trackrip==1.2.1
|
2266 |
+
traitlets==5.9.0
|
2267 |
+
transformer-smaller-training-vocab==0.3.1
|
2268 |
+
transformers==4.30.2
|
2269 |
+
triton==2.0.0
|
2270 |
+
typed-ast==1.4.1
|
2271 |
+
typer==0.4.0
|
2272 |
+
typing-extensions==4.4.0
|
2273 |
+
uc-micro-py==1.0.1
|
2274 |
+
Unidecode==1.3.2
|
2275 |
+
uritemplate==3.0.1
|
2276 |
+
urllib3==1.26.2
|
2277 |
+
uvicorn==0.20.0
|
2278 |
+
versioneer==0.28
|
2279 |
+
virtualenv==20.2.1
|
2280 |
+
wandb==0.12.6
|
2281 |
+
wcwidth==0.2.5
|
2282 |
+
webdataset==0.1.62
|
2283 |
+
webencodings==0.5.1
|
2284 |
+
websocket-client==1.6.1
|
2285 |
+
websockets==10.4
|
2286 |
+
Werkzeug==1.0.1
|
2287 |
+
wget==3.2
|
2288 |
+
widgetsnbextension==3.5.1
|
2289 |
+
Wikipedia-API==0.6.0
|
2290 |
+
wordninja==2.0.0
|
2291 |
+
wrapt==1.12.1
|
2292 |
+
xmltodict==0.13.0
|
2293 |
+
xxhash==2.0.0
|
2294 |
+
yamllint==1.23.0
|
2295 |
+
yarg==0.1.9
|
2296 |
+
yarl==1.7.2
|
2297 |
+
yaspin==2.1.0
|
2298 |
+
youtokentome==1.0.6
|
2299 |
+
youtube-dl==2021.6.6
|
2300 |
+
zipp==3.6.0
|
2301 |
+
|
2302 |
+
|
2303 |
+
2023-09-25 15:14:43,263 - speechbrain.utils.superpowers - DEBUG - bf7e6b5
|
2304 |
+
|
2305 |
+
|
2306 |
+
2023-09-25 15:14:43,325 - speechbrain.pretrained.fetching - INFO - Fetch hyperparams.yaml: Using existing file/symlink in pretrained_models/asr-wav2vec2-commonvoice-fr/hyperparams.yaml.
|
2307 |
+
2023-09-25 15:14:43,325 - speechbrain.pretrained.fetching - INFO - Fetch custom.py: Linking to local file in /home/salah/Code-Switched-Tunisian-SpeechToText/asr-wav2vec2-commonvoice-fr/custom.py.
|
2308 |
+
2023-09-25 15:14:46,203 - speechbrain.lobes.models.huggingface_wav2vec - WARNING - speechbrain.lobes.models.huggingface_wav2vec - wav2vec 2.0 is frozen.
|
2309 |
+
2023-09-25 15:14:46,206 - speechbrain.utils.parameter_transfer - DEBUG - Collecting files (or symlinks) for pretraining in pretrained_models/asr-wav2vec2-commonvoice-fr.
|
2310 |
+
2023-09-25 15:14:46,207 - speechbrain.pretrained.fetching - INFO - Fetch wav2vec2.ckpt: Using existing file/symlink in pretrained_models/asr-wav2vec2-commonvoice-fr/wav2vec2.ckpt.
|
2311 |
+
2023-09-25 15:14:46,207 - speechbrain.pretrained.fetching - INFO - Fetch asr.ckpt: Using existing file/symlink in pretrained_models/asr-wav2vec2-commonvoice-fr/asr.ckpt.
|
2312 |
+
2023-09-25 15:14:46,207 - speechbrain.pretrained.fetching - INFO - Fetch tokenizer.ckpt: Using existing file/symlink in pretrained_models/asr-wav2vec2-commonvoice-fr/tokenizer.ckpt.
|
2313 |
+
2023-09-25 15:14:46,208 - speechbrain.utils.parameter_transfer - INFO - Loading pretrained files for: wav2vec2, asr, tokenizer
|
2314 |
+
2023-09-25 15:14:50,143 - speechbrain.lobes.models.huggingface_wav2vec - WARNING - speechbrain.lobes.models.huggingface_wav2vec - wav2vec 2.0 feature extractor is frozen.
|
2315 |
+
2023-09-25 15:14:50,144 - speechbrain.core - INFO - Info: auto_mix_prec arg from hparam file is used
|
2316 |
+
2023-09-25 15:14:50,145 - speechbrain.core - INFO - Info: ckpt_interval_minutes arg from hparam file is used
|
2317 |
+
2023-09-25 15:14:50,148 - speechbrain.core - INFO - 314.4M trainable parameters in ASRCV
|
2318 |
+
2023-09-25 15:14:50,157 - speechbrain.utils.checkpoints - INFO - Loading a checkpoint from EnglishCV/results/wav2vec2_ctc_en/1234/save/CKPT+2023-09-06+22-56-31+00
|
2319 |
+
2023-09-25 15:14:51,202 - speechbrain.core - INFO - Info: auto_mix_prec arg from hparam file is used
|
2320 |
+
2023-09-25 15:14:51,202 - speechbrain.core - INFO - Info: ckpt_interval_minutes arg from hparam file is used
|
2321 |
+
2023-09-25 15:14:51,207 - speechbrain.core - INFO - 314.4M trainable parameters in ASR
|
2322 |
+
2023-09-25 15:14:51,211 - speechbrain.utils.checkpoints - INFO - Loading a checkpoint from TunisianASR/results/14epoch_tunisian/1234/save/CKPT+2023-08-03+01-38-38+00
|
2323 |
+
2023-09-25 15:14:52,244 - speechbrain.utils.distributed - INFO - distributed_launch flag is disabled, this experiment will be executed without DDP.
|
app.py
CHANGED
@@ -744,18 +744,9 @@ mixer.checkpointer.recover_if_possible(device="cpu")
|
|
744 |
mixer.modules.eval()
|
745 |
|
746 |
|
747 |
-
label_encoder = sb.dataio.encoder.CTCTextEncoder()
|
748 |
|
749 |
|
750 |
-
# We dynamicaly add the tokenizer to our brain class.
|
751 |
-
# NB: This tokenizer corresponds to the one used for the LM!!
|
752 |
|
753 |
-
decoder = build_ctcdecoder(
|
754 |
-
labels,
|
755 |
-
kenlm_model_path= "arpas/everything.arpa", # either .arpa or .bin file
|
756 |
-
alpha=0.5, # tuned on a val set
|
757 |
-
beta=1, # tuned on a val set
|
758 |
-
)
|
759 |
|
760 |
|
761 |
|
@@ -785,7 +776,12 @@ def treat_wav_file(file_mic,file_upload ,asr=mixer, device="cpu") :
|
|
785 |
wav = file_mic
|
786 |
else:
|
787 |
wav = file_upload
|
788 |
-
|
|
|
|
|
|
|
|
|
|
|
789 |
tensor_wav = sig.to(device)
|
790 |
resampled = torchaudio.functional.resample( tensor_wav, sr, 16000)
|
791 |
sentence = asr.treat_wav(resampled)
|
|
|
744 |
mixer.modules.eval()
|
745 |
|
746 |
|
|
|
747 |
|
748 |
|
|
|
|
|
749 |
|
|
|
|
|
|
|
|
|
|
|
|
|
750 |
|
751 |
|
752 |
|
|
|
776 |
wav = file_mic
|
777 |
else:
|
778 |
wav = file_upload
|
779 |
+
info = torchaudio.info(wav)
|
780 |
+
sr = info.sample_rate
|
781 |
+
sig = sb.dataio.dataio.read_audio(wav)
|
782 |
+
if len(sig.shape)>1 :
|
783 |
+
sig = torch.mean(sig, dim=1)
|
784 |
+
sig = torch.unsqueeze(sig, 0)
|
785 |
tensor_wav = sig.to(device)
|
786 |
resampled = torchaudio.functional.resample( tensor_wav, sr, 16000)
|
787 |
sentence = asr.treat_wav(resampled)
|
results/non_semi_final_stac/app.py
CHANGED
@@ -744,18 +744,9 @@ mixer.checkpointer.recover_if_possible(device="cpu")
|
|
744 |
mixer.modules.eval()
|
745 |
|
746 |
|
747 |
-
label_encoder = sb.dataio.encoder.CTCTextEncoder()
|
748 |
|
749 |
|
750 |
-
# We dynamicaly add the tokenizer to our brain class.
|
751 |
-
# NB: This tokenizer corresponds to the one used for the LM!!
|
752 |
|
753 |
-
decoder = build_ctcdecoder(
|
754 |
-
labels,
|
755 |
-
kenlm_model_path= "arpas/everything.arpa", # either .arpa or .bin file
|
756 |
-
alpha=0.5, # tuned on a val set
|
757 |
-
beta=1, # tuned on a val set
|
758 |
-
)
|
759 |
|
760 |
|
761 |
|
@@ -785,7 +776,12 @@ def treat_wav_file(file_mic,file_upload ,asr=mixer, device="cpu") :
|
|
785 |
wav = file_mic
|
786 |
else:
|
787 |
wav = file_upload
|
788 |
-
|
|
|
|
|
|
|
|
|
|
|
789 |
tensor_wav = sig.to(device)
|
790 |
resampled = torchaudio.functional.resample( tensor_wav, sr, 16000)
|
791 |
sentence = asr.treat_wav(resampled)
|
|
|
744 |
mixer.modules.eval()
|
745 |
|
746 |
|
|
|
747 |
|
748 |
|
|
|
|
|
749 |
|
|
|
|
|
|
|
|
|
|
|
|
|
750 |
|
751 |
|
752 |
|
|
|
776 |
wav = file_mic
|
777 |
else:
|
778 |
wav = file_upload
|
779 |
+
info = torchaudio.info(wav)
|
780 |
+
sr = info.sample_rate
|
781 |
+
sig = sb.dataio.dataio.read_audio(wav)
|
782 |
+
if len(sig.shape)>1 :
|
783 |
+
sig = torch.mean(sig, dim=1)
|
784 |
+
sig = torch.unsqueeze(sig, 0)
|
785 |
tensor_wav = sig.to(device)
|
786 |
resampled = torchaudio.functional.resample( tensor_wav, sr, 16000)
|
787 |
sentence = asr.treat_wav(resampled)
|
results/non_semi_final_stac/env.log
CHANGED
@@ -473,7 +473,7 @@ youtube-dl==2021.6.6
|
|
473 |
zipp==3.6.0
|
474 |
==============================
|
475 |
Git revision:
|
476 |
-
|
477 |
==============================
|
478 |
CUDA version:
|
479 |
11.7
|
|
|
473 |
zipp==3.6.0
|
474 |
==============================
|
475 |
Git revision:
|
476 |
+
bf7e6b5
|
477 |
==============================
|
478 |
CUDA version:
|
479 |
11.7
|
results/non_semi_final_stac/log.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|