{ "bs_dim": 6, "feature_dim": 512, "period": 30, "max_seq_len": 5000, "batch_size": 128, "gpu0_bs": 32, "valid_batch_size": 4, "experiment_name": "pose2posi_hubertbase_tf", "data_root": "/mnt/ssd/PianoPose-new", "preload": true, "tiny": false, "adjust": true, "is_random": true, "return_beta": false, "up_list": [ "1467634", "66685747" ], "continue_train": false, "pretrained_model_path": "pretrained_model/EmoTalk.pth", "pretrained_mode": "wo_bs_map", "wav2vec_path": "./checkpoints/hubert-base-ls960", "fine_map": 0, "encoder_type": "transformer", "num_layer": 2, "pe": false, "latest_layer": "tanh", "loss_mode": "naive_l1", "weight_rec": 1.0, "weight_vel": 1.0, "iterations": 100000, "train_sec": 8, "fps": 30, "lr": 2e-05, "check_val_every_n_iteration": 1000, "limit_val_batches": 0.6, "save_every_n_iteration": 1000, "save_top_k": 5, "logdir": "logs" }