# Web file-viewer header captured with this file (not part of the config):
#   uploader: karthik
#   commit: 940185f ("Add files")
#   size: 11.1 kB
#   scan status: No virus
# Run-level settings.
# NOTE(review): collect_stats is true and output_dir points into a
# "asr_stats" logdir shard (stats.33), so this looks like the dump of a
# statistics-collection job rather than of the training run itself - confirm.
config: conf/train_hubert.yaml
print_config: false
log_level: INFO
dry_run: false
iterator_type: sequence
output_dir: exp/asr_stats_raw_en_word/logdir/stats.33
# ngpu is 0 in this dump.
ngpu: 0
seed: 0
num_workers: 1
num_att_plot: 3
# Distributed settings: the world size, ranks, master address/port and
# launcher are all null, and multiprocessing_distributed is false.
dist_backend: nccl
dist_init_method: env://
dist_world_size: null
dist_rank: null
local_rank: null
dist_master_addr: null
dist_master_port: null
dist_launcher: null
multiprocessing_distributed: false
unused_parameters: false
sharded_ddp: false
cudnn_enabled: true
cudnn_benchmark: false
cudnn_deterministic: true
collect_stats: true
write_collected_feats: false
max_epoch: 50
patience: null
# Selection criteria. The entries read as phase, metric name and (where
# present) a min/max mode - NOTE(review): confirm against the trainer.
val_scheduler_criterion:
- valid
- loss
early_stopping_criterion:
- valid
- loss
- min
# best_model_criterion is a list of criteria, so its single entry must be a
# nested three-item list; the continuation items are indented under "- -".
best_model_criterion:
- - valid
  - acc
  - max
# Trainer options.
keep_nbest_models: 10
grad_clip: 5.0
grad_clip_type: 2.0
grad_noise: false
accum_grad: 1
no_forward_run: false
resume: false
train_dtype: float32
use_amp: false
log_interval: null
use_tensorboard: true
# Weights & Biases logging is off; the related wandb_* fields are null.
use_wandb: false
wandb_project: null
wandb_id: null
wandb_entity: null
wandb_name: null
wandb_model_log_interval: -1
detect_anomaly: false
pretrain_path: null
init_param: []
ignore_init_mismatch: false
# NOTE(review): presumably keeps the parameters under frontend.upstream
# frozen during training - confirm.
freeze_param:
- frontend.upstream
num_iters_per_epoch: null
# Batching options.
batch_size: 20
valid_batch_size: null
batch_bins: 1000000
valid_batch_bins: null
# Shape files use the same shard index (33) as output_dir earlier in the file.
train_shape_file:
- exp/asr_stats_raw_en_word/logdir/train.33.scp
valid_shape_file:
- exp/asr_stats_raw_en_word/logdir/valid.33.scp
batch_type: folded
valid_batch_type: null
fold_length: []
sort_in_batch: descending
sort_batch: descending
multiple_iterator: false
chunk_length: 500
chunk_shift_ratio: 0.5
num_cache_chunks: 1024
# Data inputs. As the key names say, every entry is a
# [path, name, type] triple, so each triple is its own nested list.
train_data_path_and_name_and_type:
- - dump/raw/train/wav.scp
  - speech
  - sound
- - dump/raw/train/text
  - text
  - text
valid_data_path_and_name_and_type:
- - dump/raw/valid/wav.scp
  - speech
  - sound
- - dump/raw/valid/text
  - text
  - text
allow_variable_data_keys: false
# Cache settings.
max_cache_size: 0.0
max_cache_fd: 32
valid_max_cache_size: null
# Optimizer and learning-rate scheduler. The *_conf mappings carry the
# options for the component named on the line above them, so their keys
# must be indented beneath them (otherwise the mapping parses as null).
optim: adam
optim_conf:
  lr: 0.0002
scheduler: warmuplr
scheduler_conf:
  warmup_steps: 25000
# Vocabulary, one token per list item; token_type further down is "word".
# The list mixes plain words with hyphenated labels (e.g. request-phone).
# NOTE(review): the angle-bracket entries look like special symbols rather
# than transcript words - confirm their roles against the tokenizer.
token_list:
- <blank>
- <unk>
- <utt>
- <sep>
- bye
- the
- food
- you
- thank
- thankyou
- good
- request-phone
- number
- phone
- request-addr
- address
- restaurant
- of
- i
- what
- is
- a
- in
- town
- reqalts
- part
- inform-this-dontcare
- for
- and
- looking
- im
- whats
- about
- inform-pricerange-moderate
- dont
- that
- care
- affirm
- cheap
- inform-pricerange-cheap
- south
- inform-area-south
- how
- serves
- have
- moderately
- 'yes'
- priced
- expensive
- north
- any
- inform-pricerange-expensive
- can
- request-postcode
- anything
- else
- inform-area-north
- code
- post
- it
- price
- west
- inform-area-west
- east
- type
- inform-area-east
- range
- there
- request-food
- okay
- oriental
- goodbye
- european
- request-pricerange
- area
- want
- an
- inform-food-indian
- indian
- matter
- doesnt
- uh
- thai
- serve
- request-area
- inform-food-thai
- inform-food-asian
- asian
- chinese
- like
- inform-area-centre
- find
- inform-food-chinese
- inform-food-italian
- italian
- negate
- center
- 'no'
- moderate
- please
- get
- to
- their
- inform-food-european
- serving
- may
- inform-area-dontcare
- do
- korean
- spanish
- inform-food-spanish
- vietnamese
- inform-food-vietnamese
- inform-food-korean
- id
- could
- american
- british
- inform-food-british
- kind
- need
- inform-food-turkish
- turkish
- um
- inform-food-portuguese
- gastropub
- portuguese
- does
- inform-food-gastropub
- inform-food-french
- french
- would
- inform-food-mediterranean
- mediterranean
- they
- modern
- hello
- inform-food-modern
- noise
- inform-pricerange-dontcare
- its
- inform-food-international
- international
- me
- should
- inform-food-north
- repeat
- right
- give
- inform-food-seafood
- inform-food-japanese
- japanese
- jamaican
- inform-food-jamaican
- inform-food-creative
- creative
- are
- inform-food-mexican
- mexican
- telephone
- another
- one
- hungarian
- ah
- something
- inform-food-dontcare
- inform-food-cantonese
- cantonese
- inform-food-cuban
- cuban
- inform-food-hungarian
- hi
- breath
- sea
- yea
- am
- inform-food-traditional
- traditional
- caribbean
- restaurants
- ack
- inform-food-world
- world
- with
- inform-food-caribbean
- barbecue
- inform-food-corsica
- corsica
- inform-food-lebanese
- lebanese
- be
- inform-food-basque
- postcode
- inform-food-romanian
- romanian
- inform-food-greek
- greek
- inform-food-barbeque
- inform-food-african
- african
- side
- other
- pan
- inform-food-english
- english
- inform-food-danish
- danish
- venue
- inform-food-malaysian
- australian
- inform-food-unusual
- unusual
- inform-food-moroccan
- inform-food-kosher
- kosher
- thats
- inform-food-scandinavian
- inform-food-afghan
- afghan
- inform-food-polynesian
- polynesian
- bout
- inform-food-german
- german
- not
- inform-food-vegetarian
- inform-food-persian
- persian
- scandinavian
- basque
- inform-food-belgian
- malaysian
- inform-food-australian
- moroccan
- christmas
- inform-food-catalan
- inform-food-canapes
- vegetarian
- 'on'
- swedish
- inform-food-irish
- irish
- canapes
- inform-food-christmas
- catalan
- inform-food-venetian
- inform-food-swedish
- where
- inform-food-tuscan
- tuscan
- inform-food-eritrean
- venetian
- inform-food-steakhouse
- fusion
- unintelligible
- inform-food-bistro
- bistro
- yeah
- alright
- inform-food-swiss
- swiss
- inform-food-singaporean
- seafood
- know
- confirm-pricerange-expensive
- confirm-pricerange-moderate
- next
- oh
- inform-food-brazilian
- brazilian
- inform-food-scottish
- scottish
- inform-food-fusion
- inform-food-russian
- russian
- singaporean
- kay
- fine
- inform-food-welsh
- welsh
- over
- belgium
- belgian
- great
- addre
- inform-food-crossover
- cool
- steakhouse
- confirm-food-chinese
- inform-food-austrian
- austrian
- inform-food-polish
- polish
- again
- centre
- then
- ok
- halal
- steak
- back
- thanks
- inform-food-indonesian
- indonesian
- correct
- well
- confirm-area-centre
- confirm-area-north
- inform-food-halal
- see
- welcome
- house
- postal
- pri
- more
- anywhere
- central
- crossover
- much
- very
- located
- my
- confirm-pricerange-cheap
- restart
- start
- go
- just
- iam
- confirm-food-thai
- confirm-food-korean
- city
- as
- wok
- option
- was
- two
- your
- confirm-food-gastropub
- time
- chiquito
- inform-name-prezzo
- prezzo
- fuck
- prices
- reqmore
- bask
- different
- cambridge
- turkiesh
- show
- chineese
- confirm-area-east
- rest
- request-name
- name
- try
- sorry
- foo
- ye
- ser
- sells
- change
- confirm-food-hungarian
- eritrean
- but
- eartrain
- options
- location
- served
- cross
- k
- inform-name-chiquito
- bar
- tv_noise
- confirm-food-canapes
- day
- parts
- malyasian
- airitran
- so
- new
- at
- confirm-food-indian
- confirm-food-portuguese
- place
- tell
- though
- choice
- awesome
- stop
- inform-food-australasian
- portugese
- missing
- sock
- deny-name-golden
- golden
- park
- tur
- vinci
- pizzeria
- endonesian
- needs
- deny-food-korean
- confirm-area-west
- t
- trying
- dear
- thatll
- excellent
- baskaye
- confirm-food-basque
- p
- if
- india
- some
- ran
- moroccon
- confirm-food-european
- hut
- all
- airatarin
- canope
- tailand
- vanessa
- earatrain
- shit
- ts
- confirm-food-steakhouse
- cantonates
- vegitarian
- knocking
- signaporian
- mail
- foods
- got
- us
- lets
- f
- medium
- un
- downtown
- portugeuse
- venues
- talking
- nymber
- every
- this
- moron
- says
- sucks
- itailian
- chinses
- elses
- request-signature
- special
- restaurnt
- confirm-food-fusion
- spensive
- scandinavia
- gastro
- pub
- anyone
- deny-food-chinese
- res
- derately
- down
- fancy
- wha
- alternative
- confirm-food-mediterranean
- confirm-food-caribbean
- first
- least
- bart
- selection
- finally
- somewhere
- ko
- sounds
- said
- eat
- huh
- searching
- s
- wrong
- cute
- ffood
- earetree
- earatree
- confirm-food-modern
- confirm-food-christmas
- long
- class
- restauran
- turk
- deny-name-the
- beside
- yourself
- hate
- signaporean
- restuarant
- did
- inform-name-da
- da
- only
- int
- inform-name-bloomsbury
- bloomsbury
- inaudible
- scandanavian
- done
- confirm-food-indonesian
- cancun
- gasper
- o
- meant
- plea
- halo
- inner
- confirm-food-swedish
- confirm-food-asian
- wanna
- catalanian
- darling
- canape
- baskey
- indians
- bat
- europ
- now
- canopy
- restaraunt
- medterranean
- cant
- deosnt
- ostro
- addrss
- damn
- deny-name-hk
- hk
- signapore
- probably
- ly
- moderat
- modereate
- let
- zip
- spani
- adddress
- ori
- euorpean
- confirm-food-seafood
- mistakes
- ooh
- confirm-food-spanish
- worth
- mediteranian
- music
- others
- b
- types
- thing
- fish
- besides
- confirm-food-halal
- inform-name-pizza
- pizza
- ever
- surprise
- ones
- train
- arotrian
- modertley
- calling
- minuet
- york
- sh
- cost
- confirm-area-south
- bristish
- confirm-food-british
- loo
- think
- medetanian
- wheres
- his
- confirm-food-turkish
- inform-name-restaurant
- euro
- wondering
- theres
- afternoon
- sure
- might
- umh
- deny-food-vietnamese
- art
- rerestaurant
- vietna
- ne
- take
- modreately
- air
- tran
- crosstalk
- mind
- ya
- god
- really
- believe
- confirm-food-italian
- confirm-food-jamaican
- preference
- <sos/eos>
init: null
input_size: null
# CTC options, nested so that dropout_rate here does not collide with the
# encoder/decoder dropout_rate keys later in the file.
ctc_conf:
  dropout_rate: 0.0
  ctc_type: builtin
  reduce: true
  ignore_nan_grad: true
# Model-level options.
# NOTE(review): extract_feats_in_collect_stats is placed under model_conf
# on the assumption that it is a model constructor argument - confirm.
model_conf:
  ctc_weight: 0.3
  lsm_weight: 0.1
  length_normalized_loss: false
  extract_feats_in_collect_stats: false
# Text / audio preprocessing options.
use_preprocessor: true
# Tokens are whole words and no BPE model is set.
token_type: word
bpemodel: null
non_linguistic_symbols: null
cleaner: null
g2p: null
speech_volume_normalize: null
# No RIR or noise scp files are set in this dump.
rir_scp: null
rir_apply_prob: 1.0
noise_scp: null
noise_apply_prob: 1.0
# Quoted so the value stays a string instead of being read as a number.
noise_db_range: '13_15'
# Frontend selection. The outer frontend_conf holds the frontend's own
# options; the inner frontend_conf is one of those options and carries the
# upstream model name. Without nesting the two keys are duplicates.
# NOTE(review): fs is placed under the outer frontend_conf on the assumption
# that it is a frontend argument - confirm.
frontend: s3prl
frontend_conf:
  frontend_conf:
    upstream: hubert_large_ll60k
  download_dir: ./hub
  multilayer_feature: true
  fs: 16k
# Spectrogram augmentation: time warp, frequency masks and time masks are
# all enabled. Each *_width_range is a two-item [min, max] list.
specaug: specaug
specaug_conf:
  apply_time_warp: true
  time_warp_window: 5
  time_warp_mode: bicubic
  apply_freq_mask: true
  freq_mask_width_range:
  - 0
  - 30
  num_freq_mask: 2
  apply_time_mask: true
  time_mask_width_range:
  - 0
  - 40
  num_time_mask: 2
normalize: utterance_mvn
normalize_conf: {}
# Linear pre-encoder mapping 1024-dim inputs to 80-dim outputs.
# NOTE(review): input_size presumably has to match the upstream frontend's
# feature dimension - confirm if the upstream model is changed.
preencoder: linear
preencoder_conf:
  input_size: 1024
  output_size: 80
# Encoder: 12 conformer blocks, 512-dim output, 8 attention heads.
# Options are nested so they do not collide with the decoder's keys of the
# same name (attention_heads, linear_units, num_blocks, dropout rates).
encoder: conformer
encoder_conf:
  output_size: 512
  attention_heads: 8
  linear_units: 2048
  num_blocks: 12
  dropout_rate: 0.1
  positional_dropout_rate: 0.1
  attention_dropout_rate: 0.1
  input_layer: conv2d
  normalize_before: true
  macaron_style: true
  pos_enc_layer_type: rel_pos
  selfattention_layer_type: rel_selfattn
  activation_type: swish
  use_cnn_module: true
  cnn_module_kernel: 31
# No post-encoder is configured.
postencoder: null
postencoder_conf: {}
# Decoder: 6 transformer blocks with 8 attention heads. Options are nested
# under decoder_conf so they do not overwrite the encoder's settings.
decoder: transformer
decoder_conf:
  attention_heads: 8
  linear_units: 2048
  num_blocks: 6
  dropout_rate: 0.1
  positional_dropout_rate: 0.1
  self_attention_dropout_rate: 0.1
  src_attention_dropout_rate: 0.1
# Both names listed here are keys that appear earlier in this file.
# NOTE(review): presumably the options the tool treats as mandatory - confirm.
required:
- output_dir
- token_list
# NOTE(review): presumably the toolkit version that wrote this dump - confirm.
version: 0.10.3a3
distributed: false