Skip to content
Snippets Groups Projects
Commit a790c5c2 authored by Léo Schneider's avatar Léo Schneider Committed by Schneider Leo
Browse files

res

parent efd6839c
No related branches found
No related tags found
No related merge requests found
Showing
with 81 additions and 0 deletions
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 4,
"drop_rate": 0.22544213936627444,
"embedding_dim": 16,
"encoder_ff": 1024,
"encoder_num_layer": 1,
"lr": 0.0013157536168827595,
"n_head": 4
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
253.8278117743064,1719328526,checkpoint_000000,True,False,1,a00d3259,2024-06-25_17-15-26,70.23847699165344,70.23847699165344,2195253,r8i6n2,10.159.28.60,70.23847699165344,1
168.6947938813938,1719330587,checkpoint_000001,True,False,2,a00d3259,2024-06-25_17-49-47,69.5678973197937,139.80637431144714,2195253,r8i6n2,10.159.28.60,69.5678973197937,1
159.82500259519563,1719331219,checkpoint_000002,True,False,3,a00d3259,2024-06-25_18-00-19,88.16569352149963,227.97206783294678,2195253,r8i6n2,10.159.28.60,88.16569352149963,1
140.64553523626853,1719331282,checkpoint_000003,True,False,4,a00d3259,2024-06-25_18-01-22,62.607720375061035,290.5797882080078,2195253,r8i6n2,10.159.28.60,150.77341389656067,2
150.0000455060343,1719331896,checkpoint_000004,True,False,5,a00d3259,2024-06-25_18-11-36,72.27389621734619,362.853684425354,2195253,r8i6n2,10.159.28.60,72.27389621734619,1
130.9991111755371,1719331954,checkpoint_000005,True,False,6,a00d3259,2024-06-25_18-12-34,58.202213287353516,421.0558977127075,2195253,r8i6n2,10.159.28.60,130.4761095046997,2
124.42158469252699,1719332013,checkpoint_000006,True,False,7,a00d3259,2024-06-25_18-13-33,58.22797513008118,479.2838728427887,2195253,r8i6n2,10.159.28.60,188.70408463478088,3
119.19234625748761,1719332071,checkpoint_000007,True,False,8,a00d3259,2024-06-25_18-14-31,58.22098970413208,537.5048625469208,2195253,r8i6n2,10.159.28.60,246.92507433891296,4
{"loss": 253.8278117743064, "timestamp": 1719328526, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "a00d3259", "date": "2024-06-25_17-15-26", "time_this_iter_s": 70.23847699165344, "time_total_s": 70.23847699165344, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 70.23847699165344, "iterations_since_restore": 1}
{"loss": 168.6947938813938, "timestamp": 1719330587, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "a00d3259", "date": "2024-06-25_17-49-47", "time_this_iter_s": 69.5678973197937, "time_total_s": 139.80637431144714, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 69.5678973197937, "iterations_since_restore": 1}
{"loss": 159.82500259519563, "timestamp": 1719331219, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "a00d3259", "date": "2024-06-25_18-00-19", "time_this_iter_s": 88.16569352149963, "time_total_s": 227.97206783294678, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 88.16569352149963, "iterations_since_restore": 1}
{"loss": 140.64553523626853, "timestamp": 1719331282, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "a00d3259", "date": "2024-06-25_18-01-22", "time_this_iter_s": 62.607720375061035, "time_total_s": 290.5797882080078, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 150.77341389656067, "iterations_since_restore": 2}
{"loss": 150.0000455060343, "timestamp": 1719331896, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "a00d3259", "date": "2024-06-25_18-11-36", "time_this_iter_s": 72.27389621734619, "time_total_s": 362.853684425354, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 72.27389621734619, "iterations_since_restore": 1}
{"loss": 130.9991111755371, "timestamp": 1719331954, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "a00d3259", "date": "2024-06-25_18-12-34", "time_this_iter_s": 58.202213287353516, "time_total_s": 421.0558977127075, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 130.4761095046997, "iterations_since_restore": 2}
{"loss": 124.42158469252699, "timestamp": 1719332013, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "a00d3259", "date": "2024-06-25_18-13-33", "time_this_iter_s": 58.22797513008118, "time_total_s": 479.2838728427887, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 188.70408463478088, "iterations_since_restore": 3}
{"loss": 119.19234625748761, "timestamp": 1719332071, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "a00d3259", "date": "2024-06-25_18-14-31", "time_this_iter_s": 58.22098970413208, "time_total_s": 537.5048625469208, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.22544213936627444, "lr": 0.0013157536168827595, "batch_size": 1024}, "time_since_restore": 246.92507433891296, "iterations_since_restore": 4}
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.23338023981015343,
"embedding_dim": 16,
"encoder_ff": 1024,
"encoder_num_layer": 8,
"lr": 0.00010269515886648154,
"n_head": 4
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
983.9757466954509,1719330446,checkpoint_000000,True,False,1,a01c9b2d,2024-06-25_17-47-26,83.82870721817017,83.82870721817017,2195253,r8i6n2,10.159.28.60,83.82870721817017,1
501.4262033297321,1719330517,checkpoint_000001,True,False,2,a01c9b2d,2024-06-25_17-48-37,70.83729195594788,154.66599917411804,2195253,r8i6n2,10.159.28.60,154.66599917411804,2
362.6629641074834,1719331736,checkpoint_000002,True,False,3,a01c9b2d,2024-06-25_18-08-56,101.81216025352478,256.4781594276428,2195253,r8i6n2,10.159.28.60,101.81216025352478,1
290.2177711246521,1719331824,checkpoint_000003,True,True,4,a01c9b2d,2024-06-25_18-10-24,87.97965884208679,344.4578182697296,2195253,r8i6n2,10.159.28.60,189.79181909561157,2
{"loss": 983.9757466954509, "timestamp": 1719330446, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "a01c9b2d", "date": "2024-06-25_17-47-26", "time_this_iter_s": 83.82870721817017, "time_total_s": 83.82870721817017, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.23338023981015343, "lr": 0.00010269515886648154, "batch_size": 1024}, "time_since_restore": 83.82870721817017, "iterations_since_restore": 1}
{"loss": 501.4262033297321, "timestamp": 1719330517, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "a01c9b2d", "date": "2024-06-25_17-48-37", "time_this_iter_s": 70.83729195594788, "time_total_s": 154.66599917411804, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.23338023981015343, "lr": 0.00010269515886648154, "batch_size": 1024}, "time_since_restore": 154.66599917411804, "iterations_since_restore": 2}
{"loss": 362.6629641074834, "timestamp": 1719331736, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "a01c9b2d", "date": "2024-06-25_18-08-56", "time_this_iter_s": 101.81216025352478, "time_total_s": 256.4781594276428, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.23338023981015343, "lr": 0.00010269515886648154, "batch_size": 1024}, "time_since_restore": 101.81216025352478, "iterations_since_restore": 1}
{"loss": 290.2177711246521, "timestamp": 1719331824, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": true, "training_iteration": 4, "trial_id": "a01c9b2d", "date": "2024-06-25_18-10-24", "time_this_iter_s": 87.97965884208679, "time_total_s": 344.4578182697296, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.23338023981015343, "lr": 0.00010269515886648154, "batch_size": 1024}, "time_since_restore": 189.79181909561157, "iterations_since_restore": 2}
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 8,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.4534009171604666,
"embedding_dim": 256,
"encoder_ff": 2048,
"encoder_num_layer": 2,
"lr": 0.019472817375775914,
"n_head": 8
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2773.484795037217,1719324574,checkpoint_000000,True,False,1,a0e8b2af,2024-06-25_16-09-34,89.29933595657349,89.29933595657349,69318,r3i5n6,10.159.8.159,89.29933595657349,1
{"loss": 2773.484795037217, "timestamp": 1719324574, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "a0e8b2af", "date": "2024-06-25_16-09-34", "time_this_iter_s": 89.29933595657349, "time_total_s": 89.29933595657349, "pid": 69318, "hostname": "r3i5n6", "node_ip": "10.159.8.159", "config": {"encoder_num_layer": 2, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 8, "embedding_dim": 256, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.4534009171604666, "lr": 0.019472817375775914, "batch_size": 1024}, "time_since_restore": 89.29933595657349, "iterations_since_restore": 1}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.9358999268282086,
"embedding_dim": 1024,
"encoder_ff": 1024,
"encoder_num_layer": 1,
"lr": 0.00020838214141938324,
"n_head": 4
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment