topkautoencoder_baseline / tiny_topk.json
cherrvak's picture
Upload 5 files
e21f84e verified
raw
history blame contribute delete
835 Bytes
{
  "whisper_config": {
    "model": "tiny",
    "layer_name": "encoder.blocks.2"
  },
  "autoencoder_variant": "topk",
  "autoencoder_config": {
    "expansion_factor": 16,
    "normalize_decoder": true,
    "k": 32,
    "multi_topk": false,
    "auxk_alpha": 0.03125,
    "dead_feature_threshold": 1000000.0
  },
  "seed": 0,
  "train_folder": "activations/tiny_block_2_train",
  "val_folder": "activations/tiny_block_2_dev",
  "device": "cuda",
  "run_dir": "runs/topkautoencoder_baseline",
  "lr": 1e-4,
  "weight_decay": 0.0,
  "steps": 100000,
  "clip_thresh": 1.0,
  "batch_size": 50,
  "dl_max_workers": 0,
  "log_tb_every": 10,
  "save_every": 1000,
  "val_every": 100,
  "optimizer": "adam",
  "scheduler": "linear",
  "scheduler_params": {
    "num_warmup_steps": 1000
  },
  "start_checkpoint": null,
  "from_disk": true
}