Skip to content
Snippets Groups Projects
Commit 915e419e authored by Léo Schneider's avatar Léo Schneider Committed by Schneider Leo
Browse files

res

parent a790c5c2
No related branches found
No related tags found
No related merge requests found
Showing
with 90 additions and 0 deletions
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2194.870497816191,1719550479,checkpoint_000000,True,False,1,e1c21a5b,2024-06-28_06-54-39,72.34097814559937,72.34097814559937,242786,r8i6n8,10.159.28.66,72.34097814559937,1
2184.85587340828,1719550537,checkpoint_000001,True,False,2,e1c21a5b,2024-06-28_06-55-37,58.70789837837219,131.04887652397156,242786,r8i6n8,10.159.28.66,131.04887652397156,2
2170.870687169353,1719550596,checkpoint_000002,True,False,3,e1c21a5b,2024-06-28_06-56-36,58.806477069854736,189.8553535938263,242786,r8i6n8,10.159.28.66,189.8553535938263,3
2174.422803503322,1719550655,checkpoint_000003,True,False,4,e1c21a5b,2024-06-28_06-57-35,59.22593355178833,249.08128714561462,242786,r8i6n8,10.159.28.66,249.08128714561462,4
2172.285528228039,1719550714,checkpoint_000004,True,False,5,e1c21a5b,2024-06-28_06-58-34,58.81974387168884,307.90103101730347,242786,r8i6n8,10.159.28.66,307.90103101730347,5
2169.101529819759,1719550773,checkpoint_000005,True,False,6,e1c21a5b,2024-06-28_06-59-33,58.76822781562805,366.6692588329315,242786,r8i6n8,10.159.28.66,366.6692588329315,6
2163.793571412094,1719550832,checkpoint_000006,True,False,7,e1c21a5b,2024-06-28_07-00-32,58.85833549499512,425.52759432792664,242786,r8i6n8,10.159.28.66,425.52759432792664,7
2165.50454832062,1719550891,checkpoint_000007,True,False,8,e1c21a5b,2024-06-28_07-01-31,58.795005321502686,484.3225996494293,242786,r8i6n8,10.159.28.66,484.3225996494293,8
2161.298410971334,1719550950,checkpoint_000008,True,False,9,e1c21a5b,2024-06-28_07-02-30,59.305978536605835,543.6285781860352,242786,r8i6n8,10.159.28.66,543.6285781860352,9
2166.0535782941683,1719551009,checkpoint_000009,True,False,10,e1c21a5b,2024-06-28_07-03-29,58.87797403335571,602.5065522193909,242786,r8i6n8,10.159.28.66,602.5065522193909,10
{"loss": 2194.870497816191, "timestamp": 1719550479, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "e1c21a5b", "date": "2024-06-28_06-54-39", "time_this_iter_s": 72.34097814559937, "time_total_s": 72.34097814559937, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 72.34097814559937, "iterations_since_restore": 1}
{"loss": 2184.85587340828, "timestamp": 1719550537, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "e1c21a5b", "date": "2024-06-28_06-55-37", "time_this_iter_s": 58.70789837837219, "time_total_s": 131.04887652397156, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 131.04887652397156, "iterations_since_restore": 2}
{"loss": 2170.870687169353, "timestamp": 1719550596, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "e1c21a5b", "date": "2024-06-28_06-56-36", "time_this_iter_s": 58.806477069854736, "time_total_s": 189.8553535938263, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 189.8553535938263, "iterations_since_restore": 3}
{"loss": 2174.422803503322, "timestamp": 1719550655, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "e1c21a5b", "date": "2024-06-28_06-57-35", "time_this_iter_s": 59.22593355178833, "time_total_s": 249.08128714561462, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 249.08128714561462, "iterations_since_restore": 4}
{"loss": 2172.285528228039, "timestamp": 1719550714, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "e1c21a5b", "date": "2024-06-28_06-58-34", "time_this_iter_s": 58.81974387168884, "time_total_s": 307.90103101730347, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 307.90103101730347, "iterations_since_restore": 5}
{"loss": 2169.101529819759, "timestamp": 1719550773, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "e1c21a5b", "date": "2024-06-28_06-59-33", "time_this_iter_s": 58.76822781562805, "time_total_s": 366.6692588329315, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 366.6692588329315, "iterations_since_restore": 6}
{"loss": 2163.793571412094, "timestamp": 1719550832, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "e1c21a5b", "date": "2024-06-28_07-00-32", "time_this_iter_s": 58.85833549499512, "time_total_s": 425.52759432792664, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 425.52759432792664, "iterations_since_restore": 7}
{"loss": 2165.50454832062, "timestamp": 1719550891, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "e1c21a5b", "date": "2024-06-28_07-01-31", "time_this_iter_s": 58.795005321502686, "time_total_s": 484.3225996494293, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 484.3225996494293, "iterations_since_restore": 8}
{"loss": 2161.298410971334, "timestamp": 1719550950, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "e1c21a5b", "date": "2024-06-28_07-02-30", "time_this_iter_s": 59.305978536605835, "time_total_s": 543.6285781860352, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 543.6285781860352, "iterations_since_restore": 9}
{"loss": 2166.0535782941683, "timestamp": 1719551009, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "e1c21a5b", "date": "2024-06-28_07-03-29", "time_this_iter_s": 58.87797403335571, "time_total_s": 602.5065522193909, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9609532957830483, "lr": 0.0003819692551562951, "batch_size": 2048}, "time_since_restore": 602.5065522193909, "iterations_since_restore": 10}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 2048,
"decoder_rt_num_layer": 8,
"drop_rate": 0.3870437260805145,
"embedding_dim": 64,
"encoder_ff": 512,
"encoder_num_layer": 1,
"lr": 0.00016963815672588173,
"n_head": 16
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
719.9917376660925,1719491430,checkpoint_000000,True,False,1,e4c88f47,2024-06-27_14-30-30,123.22117924690247,123.22117924690247,35196,r8i6n8,10.159.28.66,123.22117924690247,1
456.510295717735,1719494041,checkpoint_000001,True,False,2,e4c88f47,2024-06-27_15-14-01,123.05968236923218,246.28086161613464,69992,r8i6n8,10.159.28.66,123.05968236923218,1
361.41261712021713,1719495092,checkpoint_000002,True,False,3,e4c88f47,2024-06-27_15-31-32,123.89350652694702,370.17436814308167,69992,r8i6n8,10.159.28.66,123.89350652694702,1
282.4288875549797,1719495202,checkpoint_000003,True,False,4,e4c88f47,2024-06-27_15-33-22,110.45332741737366,480.6276955604553,69992,r8i6n8,10.159.28.66,234.34683394432068,2
{"loss": 719.9917376660925, "timestamp": 1719491430, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "e4c88f47", "date": "2024-06-27_14-30-30", "time_this_iter_s": 123.22117924690247, "time_total_s": 123.22117924690247, "pid": 35196, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3870437260805145, "lr": 0.00016963815672588173, "batch_size": 2048}, "time_since_restore": 123.22117924690247, "iterations_since_restore": 1}
{"loss": 456.510295717735, "timestamp": 1719494041, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "e4c88f47", "date": "2024-06-27_15-14-01", "time_this_iter_s": 123.05968236923218, "time_total_s": 246.28086161613464, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3870437260805145, "lr": 0.00016963815672588173, "batch_size": 2048}, "time_since_restore": 123.05968236923218, "iterations_since_restore": 1}
{"loss": 361.41261712021713, "timestamp": 1719495092, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "e4c88f47", "date": "2024-06-27_15-31-32", "time_this_iter_s": 123.89350652694702, "time_total_s": 370.17436814308167, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3870437260805145, "lr": 0.00016963815672588173, "batch_size": 2048}, "time_since_restore": 123.89350652694702, "iterations_since_restore": 1}
{"loss": 282.4288875549797, "timestamp": 1719495202, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "e4c88f47", "date": "2024-06-27_15-33-22", "time_this_iter_s": 110.45332741737366, "time_total_s": 480.6276955604553, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3870437260805145, "lr": 0.00016963815672588173, "batch_size": 2048}, "time_since_restore": 234.34683394432068, "iterations_since_restore": 2}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 4,
"drop_rate": 0.6516917077514637,
"embedding_dim": 64,
"encoder_ff": 512,
"encoder_num_layer": 1,
"lr": 0.00012016483134334655,
"n_head": 16
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1395.3380626768578,1719538220,checkpoint_000000,True,False,1,f1df685b,2024-06-28_03-30-20,74.64295077323914,74.64295077323914,242786,r8i6n8,10.159.28.66,74.64295077323914,1
843.0610409233514,1719538282,checkpoint_000001,True,False,2,f1df685b,2024-06-28_03-31-22,61.71093678474426,136.3538875579834,242786,r8i6n8,10.159.28.66,136.3538875579834,2
649.7034859244279,1719538343,checkpoint_000002,True,False,3,f1df685b,2024-06-28_03-32-23,61.319239377975464,197.67312693595886,242786,r8i6n8,10.159.28.66,197.67312693595886,3
538.8246248500553,1719538404,checkpoint_000003,True,False,4,f1df685b,2024-06-28_03-33-24,61.17716383934021,258.8502907752991,242786,r8i6n8,10.159.28.66,258.8502907752991,4
476.29196431317666,1719538465,checkpoint_000004,True,False,5,f1df685b,2024-06-28_03-34-25,61.00002908706665,319.8503198623657,242786,r8i6n8,10.159.28.66,319.8503198623657,5
434.38929231898993,1719538527,checkpoint_000005,True,False,6,f1df685b,2024-06-28_03-35-27,61.93894553184509,381.7892653942108,242786,r8i6n8,10.159.28.66,381.7892653942108,6
406.3274053138072,1719538590,checkpoint_000006,True,False,7,f1df685b,2024-06-28_03-36-30,62.708914041519165,444.49817943573,242786,r8i6n8,10.159.28.66,444.49817943573,7
384.7530104269193,1719538652,checkpoint_000007,True,False,8,f1df685b,2024-06-28_03-37-32,62.19302701950073,506.6912064552307,242786,r8i6n8,10.159.28.66,506.6912064552307,8
372.8606783649114,1719538714,checkpoint_000008,True,False,9,f1df685b,2024-06-28_03-38-34,62.220932483673096,568.9121389389038,242786,r8i6n8,10.159.28.66,568.9121389389038,9
349.91690856453005,1719538777,checkpoint_000009,True,False,10,f1df685b,2024-06-28_03-39-37,62.24173164367676,631.1538705825806,242786,r8i6n8,10.159.28.66,631.1538705825806,10
{"loss": 1395.3380626768578, "timestamp": 1719538220, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "f1df685b", "date": "2024-06-28_03-30-20", "time_this_iter_s": 74.64295077323914, "time_total_s": 74.64295077323914, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 74.64295077323914, "iterations_since_restore": 1}
{"loss": 843.0610409233514, "timestamp": 1719538282, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "f1df685b", "date": "2024-06-28_03-31-22", "time_this_iter_s": 61.71093678474426, "time_total_s": 136.3538875579834, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 136.3538875579834, "iterations_since_restore": 2}
{"loss": 649.7034859244279, "timestamp": 1719538343, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "f1df685b", "date": "2024-06-28_03-32-23", "time_this_iter_s": 61.319239377975464, "time_total_s": 197.67312693595886, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 197.67312693595886, "iterations_since_restore": 3}
{"loss": 538.8246248500553, "timestamp": 1719538404, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "f1df685b", "date": "2024-06-28_03-33-24", "time_this_iter_s": 61.17716383934021, "time_total_s": 258.8502907752991, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 258.8502907752991, "iterations_since_restore": 4}
{"loss": 476.29196431317666, "timestamp": 1719538465, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "f1df685b", "date": "2024-06-28_03-34-25", "time_this_iter_s": 61.00002908706665, "time_total_s": 319.8503198623657, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 319.8503198623657, "iterations_since_restore": 5}
{"loss": 434.38929231898993, "timestamp": 1719538527, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "f1df685b", "date": "2024-06-28_03-35-27", "time_this_iter_s": 61.93894553184509, "time_total_s": 381.7892653942108, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 381.7892653942108, "iterations_since_restore": 6}
{"loss": 406.3274053138072, "timestamp": 1719538590, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "f1df685b", "date": "2024-06-28_03-36-30", "time_this_iter_s": 62.708914041519165, "time_total_s": 444.49817943573, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 444.49817943573, "iterations_since_restore": 7}
{"loss": 384.7530104269193, "timestamp": 1719538652, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "f1df685b", "date": "2024-06-28_03-37-32", "time_this_iter_s": 62.19302701950073, "time_total_s": 506.6912064552307, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 506.6912064552307, "iterations_since_restore": 8}
{"loss": 372.8606783649114, "timestamp": 1719538714, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "f1df685b", "date": "2024-06-28_03-38-34", "time_this_iter_s": 62.220932483673096, "time_total_s": 568.9121389389038, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 568.9121389389038, "iterations_since_restore": 9}
{"loss": 349.91690856453005, "timestamp": 1719538777, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "f1df685b", "date": "2024-06-28_03-39-37", "time_this_iter_s": 62.24173164367676, "time_total_s": 631.1538705825806, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.6516917077514637, "lr": 0.00012016483134334655, "batch_size": 2048}, "time_since_restore": 631.1538705825806, "iterations_since_restore": 10}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.4230793088582453,
"embedding_dim": 16,
"encoder_ff": 1024,
"encoder_num_layer": 1,
"lr": 0.00288155269334617,
"n_head": 8
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment