nethack-vae / training_data.json
CatkinChen's picture
Add training data
3bdd0a9 verified
{
"train_losses": [
2136.5024682617186,
1198.3308361816407,
1161.5707946777343,
1123.9894409179688,
1090.3879553222657,
1057.5052581787108,
1034.7834246826171,
1018.692387084961,
1008.2613201904297,
1000.2829901123047,
993.2367407226562,
987.9076995849609,
984.4344122314453,
982.5031854248047,
980.7457598876953
],
"test_losses": [
1273.5531799316407,
1226.4591247558594,
1197.41689453125,
1164.7423767089845,
1098.9119689941406,
1046.8178466796876,
1028.4834930419922,
1017.2713775634766,
1018.4531524658203,
1009.554721069336,
1002.5865447998046,
985.553515625,
986.9031860351563,
991.0865600585937,
990.1863067626953
],
"config": {
"epochs": 15,
"batch_size": 32,
"max_learning_rate": 0.001,
"sequence_size": 32,
"shuffle_batches": true,
"shuffle_within_batch": true,
"vae_config": {
"latent_dim": 96,
"encoder_dropout": 0.1,
"decoder_dropout": 0.1,
"initial_mi_beta": 1.0,
"final_mi_beta": 1.0,
"mi_beta_shape": "constant",
"initial_tc_beta": 0.0,
"final_tc_beta": 10.0,
"tc_beta_shape": "custom",
"initial_dw_beta": 0.2,
"final_dw_beta": 1.0,
"dw_beta_shape": "custom",
"warmup_epoch_ratio": 0.2,
"free_bits": 0.75,
"focal_loss_alpha": 0.5,
"focal_loss_gamma": 2.0
},
"adaptive_weighting": {
"initial_mi_beta": 1.0,
"final_mi_beta": 1.0,
"mi_beta_shape": "constant",
"initial_tc_beta": 0.0,
"final_tc_beta": 10.0,
"tc_beta_shape": "custom",
"initial_dw_beta": 0.2,
"final_dw_beta": 1.0,
"dw_beta_shape": "custom",
"warmup_epoch_ratio": 0.2
},
"regularization": {
"encoder_dropout": 0.1,
"decoder_dropout": 0.1,
"free_bits": 0.75,
"focal_loss_alpha": 0.5,
"focal_loss_gamma": 2.0
},
"early_stopping": {
"enabled": false,
"patience": 3,
"min_delta": 0.01,
"triggered": false,
"best_epoch": null
}
},
"final_train_loss": 980.7457598876953,
"final_test_loss": 990.1863067626953,
"total_epochs": 15,
"best_train_loss": 980.7457598876953,
"best_test_loss": 985.553515625
}