| # Macros: |
| # ============================================================================== |
| batch_size = 384 |
| new_freq = 24000 |
|
|
| # Parameters for AllMPNetBaseV2: |
| # ============================================================================== |
| AllMPNetBaseV2.model_id |
|
|
| # Parameters for AudioDataModule: |
| # ============================================================================== |
| AudioDataModule.num_workers |
|
|
| # Parameters for AudioDataset: |
| # ============================================================================== |
| AudioDataset.half_precision |
| AudioDataset.mono |
| AudioDataset.new_freq |
| AudioDataset.num_frames |
| AudioDataset.orig_freq |
|
|
| # Parameters for build_dev_datamodule: |
| # ============================================================================== |
| build_dev_datamodule.datamodule |
|
|
| # Parameters for build_module: |
| # ============================================================================== |
| build_module.ckpt_path |
| '/home/jovyan/shared/palonso/data/logs/mtg-text-audio/dt86c2jx/checkpoints/epoch=287-step=148032.ckpt' |
| build_module.module |
| build_module.net |
| build_module.representation |
| [@nets.melspectrogram.MelSpectrogram, |
| @nets.waveform.Waveform, |
| @nets.cqt.CQT, |
| @nets.encodec.EnCodec] |
|
|
| # Parameters for CLAP: |
| # ============================================================================== |
| CLAP.aggregation_type |
| CLAP.audio_encoder |
| CLAP.loss_type |
| CLAP.lr |
| CLAP.n_pool_att_heads |
| CLAP.proj_size |
| CLAP.seed |
| CLAP.temp |
| CLAP.text_encoder |
| CLAP.tokenizers_parallelism |
| CLAP.train_audio_encoder |
| CLAP.train_text_encoder |
| CLAP.weight_decay |
|
|
| # Parameters for ConcatTextAudioDataModule: |
| # ============================================================================== |
| ConcatTextAudioDataModule.batch_size |
| ConcatTextAudioDataModule.datamodules |
| [@DiscotubeTextAudioCleanDataModule, |
| @MSDTextAudioDataModule, |
| @FreesoundTextAudioDataModule, |
| @PSETextAudioDataModule] |
| ConcatTextAudioDataModule.num_workers |
| ConcatTextAudioDataModule.ratios |
|
|
| # Parameters for Conformer: |
| # ============================================================================== |
| Conformer.alpha_deepnorm |
| Conformer.beta_deepnorm |
| Conformer.conv_kernel_size |
| Conformer.depth |
| Conformer.dropout |
| Conformer.embed_dim |
| Conformer.input_dropout |
| Conformer.mlp_ratio |
| Conformer.mlp_residual_factor |
| Conformer.num_heads |
| Conformer.num_patches |
| Conformer.use_deepnorm |
| Conformer.use_rope |
|
|
| # Parameters for CosineAnnealingCallback: |
| # ============================================================================== |
| CosineAnnealingCallback.eta_min |
| CosineAnnealingCallback.warmup_steps |
|
|
| # Parameters for CQT: |
| # ============================================================================== |
| CQT.bins_per_octave |
| CQT.f_min |
| CQT.hop_len |
| CQT.logC |
| CQT.magnitude |
| CQT.n_bins |
| CQT.norm_mean |
| CQT.norm_std |
| CQT.patch_size |
| CQT.power |
| CQT.sr |
|
|
| # Parameters for def_module: |
| # ============================================================================== |
| def_module.module |
|
|
| # Parameters for DiscotubeTextAudioCleanDataModule: |
| # ============================================================================== |
| DiscotubeTextAudioCleanDataModule.batch_size |
| DiscotubeTextAudioCleanDataModule.data_dir |
| DiscotubeTextAudioCleanDataModule.filelist_train |
| '/home/jovyan/shared/palonso/data/discotube/metadata/mmap_ids_train' |
| DiscotubeTextAudioCleanDataModule.filelist_val |
| '/home/jovyan/shared/palonso/data/discotube/metadata/mmap_ids_val' |
| DiscotubeTextAudioCleanDataModule.max_sentences |
| DiscotubeTextAudioCleanDataModule.num_workers |
| DiscotubeTextAudioCleanDataModule.text_file |
| '/home/jovyan/shared/palonso/data/discotube/metadata/Qwen_Qwen2.5-32B__chatgpt_v2__t0.5__1.1.jsonl' |
|
|
| # Parameters for DiscotubeTextAudioCleanDataset: |
| # ============================================================================== |
| DiscotubeTextAudioCleanDataset.num_frames |
|
|
| # Parameters for EnCodec: |
| # ============================================================================== |
| EnCodec.norm_type |
| EnCodec.orig_sr |
| EnCodec.patch_size |
| EnCodec.stats_path |
| EnCodec.weights_path |
|
|
| # Parameters for FreesoundTextAudioDataModule: |
| # ============================================================================== |
| FreesoundTextAudioDataModule.batch_size |
| FreesoundTextAudioDataModule.data_dir |
| '/home/jovyan/shared/palonso/data/freesound/mmaps/' |
| FreesoundTextAudioDataModule.description_prob |
| FreesoundTextAudioDataModule.filelist_train |
| '/home/jovyan/shared/palonso/data/freesound/filelist_full_train_mmap.txt' |
| FreesoundTextAudioDataModule.filelist_val |
| '/home/jovyan/shared/palonso/data/freesound/filelist_full_val_mmap.txt' |
| FreesoundTextAudioDataModule.num_workers |
| FreesoundTextAudioDataModule.text_file |
| '/home/jovyan/shared/palonso/data/freesound/freesound_metadata.jsonl' |
|
|
| # Parameters for FreesoundTextAudioDataset: |
| # ============================================================================== |
| FreesoundTextAudioDataset.num_frames |
|
|
| # Parameters for MaskingModel: |
| # ============================================================================== |
| MaskingModel.codebook_dim |
| MaskingModel.codebook_size |
| MaskingModel.diff_input |
| MaskingModel.input_representation |
| MaskingModel.lr |
| MaskingModel.mask_prob |
| MaskingModel.mask_seconds |
| MaskingModel.num_codebooks |
| MaskingModel.plot_tokens |
| MaskingModel.seed |
| MaskingModel.weight_decay |
|
|
| # Parameters for MelSpectrogram: |
| # ============================================================================== |
| MelSpectrogram.freq_mask_param |
| MelSpectrogram.hop_len |
| MelSpectrogram.mel_scale |
| MelSpectrogram.n_mel |
| MelSpectrogram.norm |
| MelSpectrogram.norm_mean |
| MelSpectrogram.norm_std |
| MelSpectrogram.patch_size |
| MelSpectrogram.power |
| MelSpectrogram.sr |
| MelSpectrogram.stretch_factor |
| MelSpectrogram.time_mask_param |
| MelSpectrogram.win_len |
|
|
| # Parameters for MSDTextAudioDataModule: |
| # ============================================================================== |
| MSDTextAudioDataModule.batch_size |
| MSDTextAudioDataModule.data_dir |
| MSDTextAudioDataModule.description_prob |
| MSDTextAudioDataModule.filelist_train |
| '/home/jovyan/shared/palonso/data/msd/filelist_train_mmap.txt' |
| MSDTextAudioDataModule.filelist_val |
| '/home/jovyan/shared/palonso/data/msd/filelist_val_mmap.txt' |
| MSDTextAudioDataModule.num_workers |
|
|
| # Parameters for MSDTextAudioDataset: |
| # ============================================================================== |
| MSDTextAudioDataset.num_frames |
|
|
| # Parameters for OMARRQ: |
| # ============================================================================== |
| OMARRQ.model_id |
|
|
| # Parameters for PSETextAudioDataModule: |
| # ============================================================================== |
| PSETextAudioDataModule.batch_size |
| PSETextAudioDataModule.data_dir |
| '/home/jovyan/shared/palonso/data/pse/mmaps/pse_data_december_2024/data/' |
| PSETextAudioDataModule.filelist_train |
| '/home/jovyan/shared/palonso/data/pse/filelist_train.txt' |
| PSETextAudioDataModule.filelist_val |
| '/home/jovyan/shared/palonso/data/pse/filelist_val.txt' |
| PSETextAudioDataModule.num_workers |
|
|
| # Parameters for PSETextAudioDataset: |
| # ============================================================================== |
| PSETextAudioDataset.num_frames |
|
|
| # Parameters for train: |
| # ============================================================================== |
| train.ckpt_save_every_n_epochs |
| train.datamodule |
| train.hf_ckpt |
| train.params |
| {'accelerator': 'gpu', |
| 'check_val_every_n_epoch': 8, |
| 'devices': 8, |
| 'log_every_n_steps': 50, |
| 'max_steps': 150000, |
| 'num_nodes': 1, |
| 'num_sanity_val_steps': -1, |
| 'precision': 'bf16-mixed', |
| 'strategy': 'ddp_find_unused_parameters_true'} |
| train.wandb_params |
| {'entity': 'mtg-upf', |
| 'group': 'vanilla_clap', |
| 'name': 'config_clap_mpnet_base_v2_ssl_mp_10s_small_clap_dt_msd_fs_pse_lr_5e-6', |
| 'offline': False, |
| 'project': 'mtg-text-audio', |
| 'save_dir': '/home/jovyan/shared/palonso/data/logs'} |
|
|
| # Parameters for Waveform: |
| # ============================================================================== |
| Waveform.norm_mean |
| Waveform.norm_std |
| Waveform.patch_size |
| Waveform.sr |
|
|