Skip to content
Snippets Groups Projects
Commit 02f95633 authored by Schneider Leo's avatar Schneider Leo
Browse files

del raysesult

parent b844726e
No related branches found
No related tags found
No related merge requests found
Showing
with 0 additions and 85 deletions
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1977.4159521868849,1719491515,checkpoint_000000,True,False,1,c02405fc,2024-06-27_14-31-55,85.07843685150146,85.07843685150146,35196,r8i6n8,10.159.28.66,85.07843685150146,1
1978.1414919875738,1719494127,checkpoint_000001,True,False,2,c02405fc,2024-06-27_15-15-27,85.28851962089539,170.36695647239685,69992,r8i6n8,10.159.28.66,85.28851962089539,1
{"loss": 1977.4159521868849, "timestamp": 1719491515, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "c02405fc", "date": "2024-06-27_14-31-55", "time_this_iter_s": 85.07843685150146, "time_total_s": 85.07843685150146, "pid": 35196, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 256, "encoder_ff": 1024, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 2, "drop_rate": 0.5345579147076132, "lr": 0.0017624805585372257, "batch_size": 2048}, "time_since_restore": 85.07843685150146, "iterations_since_restore": 1}
{"loss": 1978.1414919875738, "timestamp": 1719494127, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "c02405fc", "date": "2024-06-27_15-15-27", "time_this_iter_s": 85.28851962089539, "time_total_s": 170.36695647239685, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 256, "encoder_ff": 1024, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 2, "drop_rate": 0.5345579147076132, "lr": 0.0017624805585372257, "batch_size": 2048}, "time_since_restore": 85.28851962089539, "iterations_since_restore": 1}
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.37340656523341487,
"embedding_dim": 64,
"encoder_ff": 512,
"encoder_num_layer": 1,
"lr": 0.0007457945749126396,
"n_head": 16
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
248.8490186075526,1719493632,checkpoint_000000,True,False,1,c04d8657,2024-06-27_15-07-12,69.30736112594604,69.30736112594604,69992,r8i6n8,10.159.28.66,69.30736112594604,1
176.55898278904712,1719494854,checkpoint_000001,True,False,2,c04d8657,2024-06-27_15-27-34,70.9636754989624,140.27103662490845,69992,r8i6n8,10.159.28.66,70.9636754989624,1
153.5841199018824,1719494911,checkpoint_000002,True,False,3,c04d8657,2024-06-27_15-28-31,56.80309820175171,197.07413482666016,69992,r8i6n8,10.159.28.66,127.76677370071411,2
141.87842869195413,1719494968,checkpoint_000003,True,False,4,c04d8657,2024-06-27_15-29-28,56.76813840866089,253.84227323532104,69992,r8i6n8,10.159.28.66,184.534912109375,3
132.76247937660517,1719496213,checkpoint_000004,True,False,5,c04d8657,2024-06-27_15-50-13,70.93559050559998,324.777863740921,69992,r8i6n8,10.159.28.66,70.93559050559998,1
127.65858931053342,1719496269,checkpoint_000005,True,False,6,c04d8657,2024-06-27_15-51-09,56.18658232688904,380.96444606781006,69992,r8i6n8,10.159.28.66,127.12217283248901,2
128.54880821047806,1719496325,checkpoint_000006,True,False,7,c04d8657,2024-06-27_15-52-05,55.70376706123352,436.6682131290436,69992,r8i6n8,10.159.28.66,182.82593989372253,3
121.30412758053757,1719496382,checkpoint_000007,True,False,8,c04d8657,2024-06-27_15-53-02,56.52959203720093,493.1978051662445,69992,r8i6n8,10.159.28.66,239.35553193092346,4
124.07332433865766,1719496438,checkpoint_000008,True,False,9,c04d8657,2024-06-27_15-53-58,56.19808506965637,549.3958902359009,69992,r8i6n8,10.159.28.66,295.55361700057983,5
115.79139270932656,1719496495,checkpoint_000009,True,False,10,c04d8657,2024-06-27_15-54-55,57.11151361465454,606.5074038505554,69992,r8i6n8,10.159.28.66,352.6651306152344,6
113.53236323078787,1719496551,checkpoint_000010,True,False,11,c04d8657,2024-06-27_15-55-51,56.11752891540527,662.6249327659607,69992,r8i6n8,10.159.28.66,408.78265953063965,7
112.30559909249854,1719496607,checkpoint_000011,True,False,12,c04d8657,2024-06-27_15-56-47,55.55129075050354,718.1762235164642,69992,r8i6n8,10.159.28.66,464.3339502811432,8
113.81121531809409,1719496663,checkpoint_000012,True,False,13,c04d8657,2024-06-27_15-57-43,56.53476905822754,774.7109925746918,69992,r8i6n8,10.159.28.66,520.8687193393707,9
110.44758017232098,1719496719,checkpoint_000013,True,False,14,c04d8657,2024-06-27_15-58-39,56.147799015045166,830.8587915897369,69992,r8i6n8,10.159.28.66,577.0165183544159,10
{"loss": 248.8490186075526, "timestamp": 1719493632, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "c04d8657", "date": "2024-06-27_15-07-12", "time_this_iter_s": 69.30736112594604, "time_total_s": 69.30736112594604, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 69.30736112594604, "iterations_since_restore": 1}
{"loss": 176.55898278904712, "timestamp": 1719494854, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "c04d8657", "date": "2024-06-27_15-27-34", "time_this_iter_s": 70.9636754989624, "time_total_s": 140.27103662490845, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 70.9636754989624, "iterations_since_restore": 1}
{"loss": 153.5841199018824, "timestamp": 1719494911, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "c04d8657", "date": "2024-06-27_15-28-31", "time_this_iter_s": 56.80309820175171, "time_total_s": 197.07413482666016, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 127.76677370071411, "iterations_since_restore": 2}
{"loss": 141.87842869195413, "timestamp": 1719494968, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "c04d8657", "date": "2024-06-27_15-29-28", "time_this_iter_s": 56.76813840866089, "time_total_s": 253.84227323532104, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 184.534912109375, "iterations_since_restore": 3}
{"loss": 132.76247937660517, "timestamp": 1719496213, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "c04d8657", "date": "2024-06-27_15-50-13", "time_this_iter_s": 70.93559050559998, "time_total_s": 324.777863740921, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 70.93559050559998, "iterations_since_restore": 1}
{"loss": 127.65858931053342, "timestamp": 1719496269, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "c04d8657", "date": "2024-06-27_15-51-09", "time_this_iter_s": 56.18658232688904, "time_total_s": 380.96444606781006, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 127.12217283248901, "iterations_since_restore": 2}
{"loss": 128.54880821047806, "timestamp": 1719496325, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "c04d8657", "date": "2024-06-27_15-52-05", "time_this_iter_s": 55.70376706123352, "time_total_s": 436.6682131290436, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 182.82593989372253, "iterations_since_restore": 3}
{"loss": 121.30412758053757, "timestamp": 1719496382, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "c04d8657", "date": "2024-06-27_15-53-02", "time_this_iter_s": 56.52959203720093, "time_total_s": 493.1978051662445, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 239.35553193092346, "iterations_since_restore": 4}
{"loss": 124.07332433865766, "timestamp": 1719496438, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "c04d8657", "date": "2024-06-27_15-53-58", "time_this_iter_s": 56.19808506965637, "time_total_s": 549.3958902359009, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 295.55361700057983, "iterations_since_restore": 5}
{"loss": 115.79139270932656, "timestamp": 1719496495, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "c04d8657", "date": "2024-06-27_15-54-55", "time_this_iter_s": 57.11151361465454, "time_total_s": 606.5074038505554, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 352.6651306152344, "iterations_since_restore": 6}
{"loss": 113.53236323078787, "timestamp": 1719496551, "checkpoint_dir_name": "checkpoint_000010", "should_checkpoint": true, "done": false, "training_iteration": 11, "trial_id": "c04d8657", "date": "2024-06-27_15-55-51", "time_this_iter_s": 56.11752891540527, "time_total_s": 662.6249327659607, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 408.78265953063965, "iterations_since_restore": 7}
{"loss": 112.30559909249854, "timestamp": 1719496607, "checkpoint_dir_name": "checkpoint_000011", "should_checkpoint": true, "done": false, "training_iteration": 12, "trial_id": "c04d8657", "date": "2024-06-27_15-56-47", "time_this_iter_s": 55.55129075050354, "time_total_s": 718.1762235164642, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 464.3339502811432, "iterations_since_restore": 8}
{"loss": 113.81121531809409, "timestamp": 1719496663, "checkpoint_dir_name": "checkpoint_000012", "should_checkpoint": true, "done": false, "training_iteration": 13, "trial_id": "c04d8657", "date": "2024-06-27_15-57-43", "time_this_iter_s": 56.53476905822754, "time_total_s": 774.7109925746918, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 520.8687193393707, "iterations_since_restore": 9}
{"loss": 110.44758017232098, "timestamp": 1719496719, "checkpoint_dir_name": "checkpoint_000013", "should_checkpoint": true, "done": false, "training_iteration": 14, "trial_id": "c04d8657", "date": "2024-06-27_15-58-39", "time_this_iter_s": 56.147799015045166, "time_total_s": 830.8587915897369, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.37340656523341487, "lr": 0.0007457945749126396, "batch_size": 1024}, "time_since_restore": 577.0165183544159, "iterations_since_restore": 10}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.5887703154000944,
"embedding_dim": 1024,
"encoder_ff": 1024,
"encoder_num_layer": 4,
"lr": 0.0008721653331207079,
"n_head": 1
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1987.1915456216166,1719333389,checkpoint_000000,True,False,1,c2c99680,2024-06-25_18-36-29,456.8247263431549,456.8247263431549,2195253,r8i6n2,10.159.28.60,456.8247263431549,1
1982.5428274560163,1719333829,checkpoint_000001,True,False,2,c2c99680,2024-06-25_18-43-49,440.0058114528656,896.8305377960205,2195253,r8i6n2,10.159.28.60,896.8305377960205,2
2012.3732496847317,1719337749,checkpoint_000002,True,False,3,c2c99680,2024-06-25_19-49-10,454.0293221473694,1350.85985994339,2195253,r8i6n2,10.159.28.60,454.0293221473694,1
2023.2190220149482,1719338188,checkpoint_000003,True,False,4,c2c99680,2024-06-25_19-56-29,439.1456036567688,1790.0054636001587,2195253,r8i6n2,10.159.28.60,893.1749258041382,2
{"loss": 1987.1915456216166, "timestamp": 1719333389, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "c2c99680", "date": "2024-06-25_18-36-29", "time_this_iter_s": 456.8247263431549, "time_total_s": 456.8247263431549, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 456.8247263431549, "iterations_since_restore": 1}
{"loss": 1982.5428274560163, "timestamp": 1719333829, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "c2c99680", "date": "2024-06-25_18-43-49", "time_this_iter_s": 440.0058114528656, "time_total_s": 896.8305377960205, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 896.8305377960205, "iterations_since_restore": 2}
{"loss": 2012.3732496847317, "timestamp": 1719337749, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "c2c99680", "date": "2024-06-25_19-49-10", "time_this_iter_s": 454.0293221473694, "time_total_s": 1350.85985994339, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 454.0293221473694, "iterations_since_restore": 1}
{"loss": 2023.2190220149482, "timestamp": 1719338188, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "c2c99680", "date": "2024-06-25_19-56-29", "time_this_iter_s": 439.1456036567688, "time_total_s": 1790.0054636001587, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5887703154000944, "lr": 0.0008721653331207079, "batch_size": 2048}, "time_since_restore": 893.1749258041382, "iterations_since_restore": 2}
{
"batch_size": 2048,
"decoder_int_ff": 2048,
"decoder_int_num_layer": 8,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.4176788223006639,
"embedding_dim": 256,
"encoder_ff": 1024,
"encoder_num_layer": 2,
"lr": 0.00038150746043137153,
"n_head": 2
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
357.444681242695,1719325234,checkpoint_000000,True,False,1,c4172973,2024-06-25_16-20-34,78.41421294212341,78.41421294212341,69318,r3i5n6,10.159.8.159,78.41421294212341,1
261.25574487400803,1719327690,checkpoint_000001,True,False,2,c4172973,2024-06-25_17-01-30,79.34292578697205,157.75713872909546,130020,r3i5n6,10.159.8.159,79.34292578697205,1
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment