# Repository: nelfproject/ASR_verbatim_v1
# File: ASR_verbatim_v1/train_config.yaml (1.43 kB)
# Last commit: e2baad4, "First model version", by Jakob Poncelet (12 months ago)
# Repository virus scan: no virus

	batch_size: 32
	accum_grad: 32
	max_epoch: 350
	patience: none
	# The initialization method for model parameters
	init: xavier_uniform
	best_model_criterion:
	- - valid
	- acc
	- max
	keep_nbest_models: 10

	encoder: conformer
	encoder_conf:
	output_size: 256
	attention_heads: 4
	linear_units: 2048
	num_blocks: 12
	dropout_rate: 0.1
	positional_dropout_rate: 0.1
	attention_dropout_rate: 0.0
	input_layer: conv2d
	normalize_before: true
	macaron_style: true
	rel_pos_type: latest
	pos_enc_layer_type: rel_pos
	selfattention_layer_type: rel_selfattn
	activation_type: swish
	use_cnn_module: true
	cnn_module_kernel: 31
	interctc_layer_idx: [6]

	decoder: transformer
	decoder_conf:
	attention_heads: 4
	linear_units: 2048
	num_blocks: 6
	dropout_rate: 0.1
	positional_dropout_rate: 0.1
	self_attention_dropout_rate: 0.0
	src_attention_dropout_rate: 0.0

	model_conf:
	ctc_weight: 0.3
	lsm_weight: 0.1
	length_normalized_loss: false
	interctc_weight: 0.3

	optim: adam
	optim_conf:
	lr: 0.004
	scheduler: warmuplr
	scheduler_conf:
	warmup_steps: 25000

	specaug: specaug
	specaug_conf:
	apply_time_warp: true
	time_warp_window: 5
	time_warp_mode: bicubic
	apply_freq_mask: true
	freq_mask_width_range:
	- 0
	- 30
	num_freq_mask: 2
	apply_time_mask: true
	time_mask_width_range:
	- 0
	- 40
	num_time_mask: 2