salmanshahid
/

segmentation

Voice Activity Detection

speaker-segmentation

overlapped-speech-detection

Model card Files Files and versions Metrics Training metrics Community

segmentation / config.yaml

salmanshahid's picture

Upload folder using huggingface_hub

07d5bbe verified 6 days ago

history blame contribute delete

1.98 kB

	protocol: X.SpeakerDiarization.Custom
	patience: 20
	task:
	_target_: pyannote.audio.tasks.Segmentation
	duration: 5.0
	warm_up: 0.0
	balance: null
	overlap:
	probability: 0.5
	snr_min: 0.0
	snr_max: 10.0
	weight: null
	batch_size: 32
	num_workers: 10
	pin_memory: false
	loss: bce
	vad_loss: bce
	model:
	_target_: pyannote.audio.models.segmentation.PyanNet
	sincnet:
	stride: 10
	lstm:
	num_layers: 4
	monolithic: true
	dropout: 0.5
	linear:
	num_layers: 2
	optimizer:
	_target_: torch.optim.Adam
	lr: 0.001
	betas:
	- 0.9
	- 0.999
	eps: 1.0e-08
	weight_decay: 0
	amsgrad: false
	trainer:
	_target_: pytorch_lightning.Trainer
	accelerator: ddp
	accumulate_grad_batches: 1
	amp_backend: native
	amp_level: O2
	auto_lr_find: false
	auto_scale_batch_size: false
	auto_select_gpus: true
	benchmark: true
	check_val_every_n_epoch: 1
	checkpoint_callback: true
	deterministic: false
	fast_dev_run: false
	flush_logs_every_n_steps: 100
	gpus: -1
	gradient_clip_val: 0.5
	limit_test_batches: 1.0
	limit_train_batches: 1.0
	limit_val_batches: 1.0
	log_every_n_steps: 50
	log_gpu_memory: null
	max_epochs: 1000
	max_steps: null
	min_epochs: 1
	min_steps: null
	num_nodes: 1
	num_processes: 1
	num_sanity_val_steps: 2
	overfit_batches: 0.0
	precision: 32
	prepare_data_per_node: true
	process_position: 0
	profiler: null
	progress_bar_refresh_rate: 1
	reload_dataloaders_every_epoch: false
	replace_sampler_ddp: true
	sync_batchnorm: false
	terminate_on_nan: false
	tpu_cores: null
	track_grad_norm: -1
	truncated_bptt_steps: null
	val_check_interval: 1.0
	weights_save_path: null
	weights_summary: top
	augmentation:
	transform: Compose
	params:
	shuffle: false
	transforms:
	- transform: AddBackgroundNoise
	params:
	background_paths: /gpfswork/rech/eie/commun/data/background/musan
	min_snr_in_db: 5.0
	max_snr_in_db: 15.0
	mode: per_example
	p: 0.9