# @package _group_

# Training configuration, restored to block-style YAML. Each top-level key
# below is a separate config group; the values are unchanged.

# Run-wide settings: precision, log format/frequency, TensorBoard directory.
common:
  fp16: true
  log_format: json
  log_interval: 200
  tensorboard_logdir: tb

# Checkpoint saving cadence and retention.
checkpoint:
  save_interval: 5
  save_interval_updates: 25000
  keep_interval_updates: 1
  no_epoch_checkpoints: true

task:
  _name: audio_pretraining
  # `???` is a placeholder, not a usable value: OmegaConf treats it as a
  # mandatory field that must be supplied (e.g. by a command-line override).
  data: ???
  max_sample_size: 320000
  min_sample_size: 32000
  normalize: true

dataset:
  num_workers: 6
  max_tokens: 3800000
  skip_invalid_size_inputs_valid_test: true
  validate_interval: 5
  required_batch_size_multiple: 1
  disable_validation: false

distributed_training:
  distributed_world_size: 16
  ddp_backend: legacy_ddp

criterion:
  _name: model
  log_keys:
    - ema_decay
    - target_var
    - pred_var

optimization:
  max_update: 400000
  lr: [0.0005]

optimizer:
  _name: adam
  # Parentheses are not YAML collection syntax, so this loads as the plain
  # string "(0.9,0.98)". Presumably the consumer parses it into a pair of
  # floats -- TODO confirm before reformatting.
  adam_betas: (0.9,0.98)
  # NOTE(review): written without a decimal point; YAML 1.1 loaders such as
  # stock PyYAML resolve this form as a string rather than a float. Confirm
  # the loader used for this file reads it as a number.
  adam_eps: 1e-06
  weight_decay: 0.01

lr_scheduler:
  _name: tri_stage
  phase_ratio: [0.03, 0.9, 0.07]

model:
  _name: data2vec_audio
  extractor_mode: layer_norm
  encoder_layerdrop: 0.05
  dropout_input: 0.0
  dropout_features: 0.0
  feature_grad_mult: 1.0
  encoder_embed_dim: 768

  mask_prob: 0.65
  mask_length: 10

  loss_beta: 0
  loss_scale: null

  instance_norm_target_layer: true
  average_top_k_layers: 8

  pos_conv_depth: 5
  conv_pos: 95

  ema_decay: 0.999
  ema_end_decay: 0.9999
  ema_anneal_end_step: 30000
  ema_transformer_only: true
  ema_layers_only: true

  require_same_masks: true
  mask_dropout: 0

  # NOTE(review): these keys followed `mask_dropout` with no new group header
  # in the collapsed original, so they are kept under `model`. Confirm that
  # the model's config schema accepts them.
  final_proj_dim: 256
  cluster_factor: 16
  scale_factor: 0.3
  num_negatives: 100
  cross_sample_negatives: 0