Skip to content
Snippets Groups Projects
Commit a790c5c2 authored by Léo Schneider's avatar Léo Schneider Committed by Schneider Leo
Browse files

res

parent efd6839c
No related branches found
No related tags found
No related merge requests found
Showing
with 73 additions and 0 deletions
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 4,
"drop_rate": 0.8101220088903347,
"embedding_dim": 64,
"encoder_ff": 1024,
"encoder_num_layer": 4,
"lr": 0.0005780102991375737,
"n_head": 4
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2012.1837220680056,1719332857,checkpoint_000000,True,False,1,bea15841,2024-06-25_18-27-37,89.14307808876038,89.14307808876038,2195253,r8i6n2,10.159.28.60,89.14307808876038,1
2008.3096395177165,1719332932,checkpoint_000001,True,False,2,bea15841,2024-06-25_18-28-52,75.03496551513672,164.1780436038971,2195253,r8i6n2,10.159.28.60,164.1780436038971,2
{"loss": 2012.1837220680056, "timestamp": 1719332857, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "bea15841", "date": "2024-06-25_18-27-37", "time_this_iter_s": 89.14307808876038, "time_total_s": 89.14307808876038, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.8101220088903347, "lr": 0.0005780102991375737, "batch_size": 1024}, "time_since_restore": 89.14307808876038, "iterations_since_restore": 1}
{"loss": 2008.3096395177165, "timestamp": 1719332932, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "bea15841", "date": "2024-06-25_18-28-52", "time_this_iter_s": 75.03496551513672, "time_total_s": 164.1780436038971, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.8101220088903347, "lr": 0.0005780102991375737, "batch_size": 1024}, "time_since_restore": 164.1780436038971, "iterations_since_restore": 2}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.5887703154000944,
"embedding_dim": 1024,
"encoder_ff": 1024,
"encoder_num_layer": 4,
"lr": 0.0008721653331207079,
"n_head": 1
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1987.1915456216166,1719333389,checkpoint_000000,True,False,1,c2c99680,2024-06-25_18-36-29,456.8247263431549,456.8247263431549,2195253,r8i6n2,10.159.28.60,456.8247263431549,1
1982.5428274560163,1719333829,checkpoint_000001,True,False,2,c2c99680,2024-06-25_18-43-49,440.0058114528656,896.8305377960205,2195253,r8i6n2,10.159.28.60,896.8305377960205,2
2012.3732496847317,1719337749,checkpoint_000002,True,False,3,c2c99680,2024-06-25_19-49-10,454.0293221473694,1350.85985994339,2195253,r8i6n2,10.159.28.60,454.0293221473694,1
2023.2190220149482,1719338188,checkpoint_000003,True,False,4,c2c99680,2024-06-25_19-56-29,439.1456036567688,1790.0054636001587,2195253,r8i6n2,10.159.28.60,893.1749258041382,2
{"loss": 1987.1915456216166, "timestamp": 1719333389, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "c2c99680", "date": "2024-06-25_18-36-29", "time_this_iter_s": 456.8247263431549, "time_total_s": 456.8247263431549, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 456.8247263431549, "iterations_since_restore": 1}
{"loss": 1982.5428274560163, "timestamp": 1719333829, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "c2c99680", "date": "2024-06-25_18-43-49", "time_this_iter_s": 440.0058114528656, "time_total_s": 896.8305377960205, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 896.8305377960205, "iterations_since_restore": 2}
{"loss": 2012.3732496847317, "timestamp": 1719337749, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "c2c99680", "date": "2024-06-25_19-49-10", "time_this_iter_s": 454.0293221473694, "time_total_s": 1350.85985994339, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 454.0293221473694, "iterations_since_restore": 1}
{"loss": 2023.2190220149482, "timestamp": 1719338188, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "c2c99680", "date": "2024-06-25_19-56-29", "time_this_iter_s": 439.1456036567688, "time_total_s": 1790.0054636001587, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 893.1749258041382, "iterations_since_restore": 2}
{
"batch_size": 2048,
"decoder_int_ff": 2048,
"decoder_int_num_layer": 8,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.4176788223006639,
"embedding_dim": 256,
"encoder_ff": 1024,
"encoder_num_layer": 2,
"lr": 0.00038150746043137153,
"n_head": 2
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
357.444681242695,1719325234,checkpoint_000000,True,False,1,c4172973,2024-06-25_16-20-34,78.41421294212341,78.41421294212341,69318,r3i5n6,10.159.8.159,78.41421294212341,1
261.25574487400803,1719327690,checkpoint_000001,True,False,2,c4172973,2024-06-25_17-01-30,79.34292578697205,157.75713872909546,130020,r3i5n6,10.159.8.159,79.34292578697205,1
{"loss": 357.444681242695, "timestamp": 1719325234, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "c4172973", "date": "2024-06-25_16-20-34", "time_this_iter_s": 78.41421294212341, "time_total_s": 78.41421294212341, "pid": 69318, "hostname": "r3i5n6", "node_ip": "10.159.8.159", "config": {"encoder_num_layer": 2, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 8, "embedding_dim": 256, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 2048, "n_head": 2, "drop_rate": 0.4176788223006639, "lr": 0.00038150746043137153, "batch_size": 2048}, "time_since_restore": 78.41421294212341, "iterations_since_restore": 1}
{"loss": 261.25574487400803, "timestamp": 1719327690, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "c4172973", "date": "2024-06-25_17-01-30", "time_this_iter_s": 79.34292578697205, "time_total_s": 157.75713872909546, "pid": 130020, "hostname": "r3i5n6", "node_ip": "10.159.8.159", "config": {"encoder_num_layer": 2, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 8, "embedding_dim": 256, "encoder_ff": 1024, "decoder_rt_ff": 512, "decoder_int_ff": 2048, "n_head": 2, "drop_rate": 0.4176788223006639, "lr": 0.00038150746043137153, "batch_size": 2048}, "time_since_restore": 79.34292578697205, "iterations_since_restore": 1}
{
"batch_size": 2048,
"decoder_int_ff": 1024,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.7776595209025089,
"embedding_dim": 16,
"encoder_ff": 1024,
"encoder_num_layer": 8,
"lr": 0.0006106789085082022,
"n_head": 16
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2001.7704808993603,1719321692,checkpoint_000000,True,False,1,dd950274,2024-06-25_15-21-32,89.34920597076416,89.34920597076416,355319,r7i5n7,10.159.24.56,89.34920597076416,1
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment