Elyadata
/

ADI-whisper-ADI20

Audio Classification

Model card Files Files and versions

ADI-whisper-ADI20 / hyperparams.yaml

HarounElleuch's picture

Upload folder using huggingface_hub

bbbc9ba verified 3 months ago

history blame contribute delete

1.67 kB

	# ##########################################################################################
	# Model: Whisper-large-v3 Encoder + Attention pooling for Arabic Dialect Identification
	#
	# Author: Haroun Elleuch
	############################################################################################


	# Repository prefix under which the checkpoint files listed in the
	# pretrainer `paths` section are located.
	pretrained_path: Elyadata/ADI-whisper-ADI20
	# Hub identifier of the base Whisper model; referenced as both `source`
	# and `save_path` of the `whisper` component.
	whisper_hub: openai/whisper-large-v3

	# Number of output classes; used as `n_neurons` of `output_mlp`.
	n_languages: 20
	# Feature dimension shared by `attention_pooling` (input_dim) and
	# `output_mlp` (input_size).
	# NOTE(review): presumably the hidden size of the Whisper encoder output - confirm.
	features_dim: 1280

	# Whisper component built from the SpeechBrain Hugging Face wrapper.
	# The indented keys are the keyword arguments passed to the constructor:
	#   source         - model identifier to load (<whisper_hub>)
	#   encoder_only   - enabled
	#   freeze_encoder - disabled
	#   save_path      - receives the same value as `source`
	# NOTE(review): save_path reuses the hub identifier rather than a dedicated
	# local folder - confirm this is intended.
	whisper: !new:speechbrain.lobes.models.huggingface_transformers.whisper.Whisper
	    source: !ref <whisper_hub>
	    encoder_only: True
	    freeze_encoder: False
	    save_path: !ref <whisper_hub>

	# Attention pooling layer; its input dimension is tied to <features_dim>.
	attention_pooling: !new:speechbrain.nnet.pooling.AttentionPooling
	    input_dim: !ref <features_dim>

	# Linear output layer: <features_dim> inputs, <n_languages> output units,
	# no bias term.
	output_mlp: !new:speechbrain.nnet.linear.Linear
	    input_size: !ref <features_dim>
	    n_neurons: !ref <n_languages>
	    bias: False


	# Named collection of the three components defined in this file.
	# NOTE(review): presumably consumed by the SpeechBrain inference interface
	# that loads this file - confirm against the caller.
	modules:
	    whisper: !ref <whisper>
	    attention_pooling: !ref <attention_pooling>
	    output_mlp: !ref <output_mlp>

	# Softmax activation constructed with apply_log enabled
	# (log-domain output, going by the option and key names - confirm against the Softmax documentation).
	log_softmax: !new:speechbrain.nnet.activations.Softmax
	    apply_log: True

	# Categorical label encoder, constructed without arguments. It is listed in
	# the pretrainer's loadables with the file <pretrained_path>/dialect_encoder.txt.
	label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder

	# Pretrainer wiring.
	#   loadables - maps a name to the object defined in this file.
	#   paths     - maps the same name to its file under <pretrained_path>.
	# Note that the label encoder's file is named dialect_encoder.txt, i.e. it
	# does not follow the <name>.ckpt pattern used by the other three entries.
	pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
	    loadables:
	        whisper: !ref <whisper>
	        attention_pooling: !ref <attention_pooling>
	        output_mlp: !ref <output_mlp>
	        label_encoder: !ref <label_encoder>
	    paths:
	        whisper: !ref <pretrained_path>/whisper.ckpt
	        attention_pooling: !ref <pretrained_path>/attention_pooling.ckpt
	        output_mlp: !ref <pretrained_path>/output_mlp.ckpt
	        label_encoder: !ref <pretrained_path>/dialect_encoder.txt