64 lines
1.1 KiB
INI
64 lines
1.1 KiB
INI
; Project-level settings: experiment-tracking credentials, run flags, and the
; names of the model and data module to use.
; NOTE(review): key meanings in this section are inferred from their names;
; confirm against the code that loads this file.
[project]
; SECURITY(review): this value is a base64-encoded Neptune API token stored in
; plain text. Anyone who can read this file can use it. Rotate the token and
; supply it from the environment or an untracked file instead.
; TODO confirm the consumer supports reading it from elsewhere before removing.
neptune_key = eyJhcGlfYWRkcmVzcyI6Imh0dHBzOi8vdWkubmVwdHVuZS5haSIsImFwaV91cmwiOiJodHRwczovL3VpLm5lcHR1bmUuYWkiLCJhcGlfa2V5IjoiZmI0OGMzNzUtOTg1NS00Yzg2LThjMzYtMWFiYjUwMDUyMjVlIn0=
; NOTE(review): debug is spelled 1 while eval is spelled True. Both spellings
; are kept as-is; confirm how the consumer parses them before normalising.
debug = 1
eval = True
seed = 69
owner = si11ium
; Presumably selects the model and data module by class name; the names
; suggest the model_cnn section applies to this run. Verify against the loader.
model_name = CNNBaseline
data_name = PrimatesLibrosaDatamodule

; Data settings, in two groups: loading / audio-feature parameters first,
; then the *_ratio and speed_* entries.
; NOTE(review): key meanings are inferred from their names (the second group
; looks like augmentation settings); confirm against the data module.
[data]
num_worker = 0
data_root = data
reset = False
; Presumably mel-spectrogram parameters (mel bands, sample rate in Hz, hop
; length and FFT size in samples) - TODO confirm units with the data module.
n_mels = 64
sr = 16000
hop_length = 256
n_fft = 512

; NOTE(review): noise_ratio is written 0 while the other ratios are written
; as floats (0.0, 0.3). Kept as-is; confirm the consumer treats them alike.
loudness_ratio = 0.0
shift_ratio = 0.0
noise_ratio = 0
mask_ratio = 0.3
speed_amount = 0
speed_min = 0
speed_max = 0

; Hyperparameters for the CNN model.
; NOTE(review): key meanings are inferred from their names; confirm against
; the model implementation.
[model_cnn]
weight_init = xavier_normal_
activation = gelu
use_bias = True
use_norm = True
dropout = 0.2
lat_dim = 128
features = 64
; INI has no native list type: this value is the literal string
; "[32, 64, 128, 64]" and must be converted by the consumer.
; TODO confirm how it is parsed.
filters = [32, 64, 128, 64]

; Hyperparameters for the attention-based model.
; NOTE(review): key meanings are inferred from their names; confirm against
; the model implementation. Several keys repeat those in model_cnn with the
; same values (weight_init, activation, use_bias, use_norm, dropout, lat_dim,
; features); each section carries its own copy.
[model_attn]
name = VerticalVisualTransformer
weight_init = xavier_normal_
activation = gelu
use_bias = True
use_norm = True
dropout = 0.2
lat_dim = 128
features = 64
patch_size = 3
attn_depth = 3
heads = 8
embedding_size = 64

; Training-loop settings: output location, hardware, optimiser and schedule.
; NOTE(review): key meanings are inferred from their names; confirm against
; the training script.
[train]
outpath = output
; The value is the literal string "None"; presumably the consumer maps it to
; "no explicit version" - TODO confirm.
version = None
gpus = 0
sto_weight_avg = False
weight_decay = 0
opt_reset_interval = 0
epochs = 100
batch_size = 30
lr = 0.01
lr_warmup_steps = 0
num_sanity_val_steps = 0