Skip to content
Snippets Groups Projects
Commit 915e419e authored by Léo Schneider's avatar Léo Schneider Committed by Schneider Leo
Browse files

res

parent a790c5c2
No related branches found
No related tags found
No related merge requests found
Showing
with 107 additions and 0 deletions
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.9027598279893692,
"embedding_dim": 1024,
"encoder_ff": 512,
"encoder_num_layer": 8,
"lr": 0.00800097877874484,
"n_head": 4
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2406.545863834892,1719501495,checkpoint_000000,True,False,1,e0b92d48,2024-06-27_17-18-15,724.5406517982483,724.5406517982483,242786,r8i6n8,10.159.28.66,724.5406517982483,1
2331.1488584984004,1719502199,checkpoint_000001,True,False,2,e0b92d48,2024-06-27_17-29-59,703.9930710792542,1428.5337228775024,242786,r8i6n8,10.159.28.66,1428.5337228775024,2
{"loss": 2406.545863834892, "timestamp": 1719501495, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "e0b92d48", "date": "2024-06-27_17-18-15", "time_this_iter_s": 724.5406517982483, "time_total_s": 724.5406517982483, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 512, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9027598279893692, "lr": 0.00800097877874484, "batch_size": 2048}, "time_since_restore": 724.5406517982483, "iterations_since_restore": 1}
{"loss": 2331.1488584984004, "timestamp": 1719502199, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "e0b92d48", "date": "2024-06-27_17-29-59", "time_this_iter_s": 703.9930710792542, "time_total_s": 1428.5337228775024, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 1024, "encoder_ff": 512, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.9027598279893692, "lr": 0.00800097877874484, "batch_size": 2048}, "time_since_restore": 1428.5337228775024, "iterations_since_restore": 2}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 1,
"drop_rate": 0.3372755257890534,
"embedding_dim": 16,
"encoder_ff": 512,
"encoder_num_layer": 8,
"lr": 0.00018514260159136858,
"n_head": 16
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1182.49372251015,1719518905,checkpoint_000000,True,False,1,e0cd883e,2024-06-27_22-08-25,83.27375411987305,83.27375411987305,242786,r8i6n8,10.159.28.66,83.27375411987305,1
645.4160598394438,1719518975,checkpoint_000001,True,False,2,e0cd883e,2024-06-27_22-09-35,70.14381790161133,153.41757202148438,242786,r8i6n8,10.159.28.66,153.41757202148438,2
522.639965147484,1719519045,checkpoint_000002,True,False,3,e0cd883e,2024-06-27_22-10-45,70.15310597419739,223.57067799568176,242786,r8i6n8,10.159.28.66,223.57067799568176,3
459.74198444997234,1719519116,checkpoint_000003,True,False,4,e0cd883e,2024-06-27_22-11-56,70.06108522415161,293.6317632198334,242786,r8i6n8,10.159.28.66,293.6317632198334,4
391.3528187669168,1719519186,checkpoint_000004,True,False,5,e0cd883e,2024-06-27_22-13-06,70.20780396461487,363.83956718444824,242786,r8i6n8,10.159.28.66,363.83956718444824,5
335.89961062453864,1719519255,checkpoint_000005,True,False,6,e0cd883e,2024-06-27_22-14-15,69.51625561714172,433.35582280158997,242786,r8i6n8,10.159.28.66,433.35582280158997,6
310.48668424351007,1719519325,checkpoint_000006,True,False,7,e0cd883e,2024-06-27_22-15-25,70.04849791526794,503.4043207168579,242786,r8i6n8,10.159.28.66,503.4043207168579,7
265.2837000569021,1719519395,checkpoint_000007,True,False,8,e0cd883e,2024-06-27_22-16-35,70.00017595291138,573.4044966697693,242786,r8i6n8,10.159.28.66,573.4044966697693,8
242.94229570523962,1719519465,checkpoint_000008,True,False,9,e0cd883e,2024-06-27_22-17-45,69.56129503250122,642.9657917022705,242786,r8i6n8,10.159.28.66,642.9657917022705,9
226.0272181953971,1719519535,checkpoint_000009,True,False,10,e0cd883e,2024-06-27_22-18-55,70.02730536460876,712.9930970668793,242786,r8i6n8,10.159.28.66,712.9930970668793,10
{"loss": 1182.49372251015, "timestamp": 1719518905, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "e0cd883e", "date": "2024-06-27_22-08-25", "time_this_iter_s": 83.27375411987305, "time_total_s": 83.27375411987305, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 83.27375411987305, "iterations_since_restore": 1}
{"loss": 645.4160598394438, "timestamp": 1719518975, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "e0cd883e", "date": "2024-06-27_22-09-35", "time_this_iter_s": 70.14381790161133, "time_total_s": 153.41757202148438, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 153.41757202148438, "iterations_since_restore": 2}
{"loss": 522.639965147484, "timestamp": 1719519045, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "e0cd883e", "date": "2024-06-27_22-10-45", "time_this_iter_s": 70.15310597419739, "time_total_s": 223.57067799568176, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 223.57067799568176, "iterations_since_restore": 3}
{"loss": 459.74198444997234, "timestamp": 1719519116, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "e0cd883e", "date": "2024-06-27_22-11-56", "time_this_iter_s": 70.06108522415161, "time_total_s": 293.6317632198334, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 293.6317632198334, "iterations_since_restore": 4}
{"loss": 391.3528187669168, "timestamp": 1719519186, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "e0cd883e", "date": "2024-06-27_22-13-06", "time_this_iter_s": 70.20780396461487, "time_total_s": 363.83956718444824, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 363.83956718444824, "iterations_since_restore": 5}
{"loss": 335.89961062453864, "timestamp": 1719519255, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "e0cd883e", "date": "2024-06-27_22-14-15", "time_this_iter_s": 69.51625561714172, "time_total_s": 433.35582280158997, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 433.35582280158997, "iterations_since_restore": 6}
{"loss": 310.48668424351007, "timestamp": 1719519325, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "e0cd883e", "date": "2024-06-27_22-15-25", "time_this_iter_s": 70.04849791526794, "time_total_s": 503.4043207168579, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 503.4043207168579, "iterations_since_restore": 7}
{"loss": 265.2837000569021, "timestamp": 1719519395, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "e0cd883e", "date": "2024-06-27_22-16-35", "time_this_iter_s": 70.00017595291138, "time_total_s": 573.4044966697693, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 573.4044966697693, "iterations_since_restore": 8}
{"loss": 242.94229570523962, "timestamp": 1719519465, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "e0cd883e", "date": "2024-06-27_22-17-45", "time_this_iter_s": 69.56129503250122, "time_total_s": 642.9657917022705, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 642.9657917022705, "iterations_since_restore": 9}
{"loss": 226.0272181953971, "timestamp": 1719519535, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "e0cd883e", "date": "2024-06-27_22-18-55", "time_this_iter_s": 70.02730536460876, "time_total_s": 712.9930970668793, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 512, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.3372755257890534, "lr": 0.00018514260159136858, "batch_size": 2048}, "time_since_restore": 712.9930970668793, "iterations_since_restore": 10}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 8,
"drop_rate": 0.03611990882258942,
"embedding_dim": 16,
"encoder_ff": 2048,
"encoder_num_layer": 4,
"lr": 0.00028375287963234745,
"n_head": 8
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1954.021998608206,1719498933,checkpoint_000000,True,False,1,e0cf80c0,2024-06-27_16-35-33,97.99486684799194,97.99486684799194,242786,r8i6n8,10.159.28.66,97.99486684799194,1
1955.7363098625124,1719499017,checkpoint_000001,True,False,2,e0cf80c0,2024-06-27_16-36-57,83.9807825088501,181.97564935684204,242786,r8i6n8,10.159.28.66,181.97564935684204,2
1953.048192782665,1719504822,checkpoint_000002,True,False,3,e0cf80c0,2024-06-27_18-13-42,99.29927706718445,281.2749264240265,242786,r8i6n8,10.159.28.66,99.29927706718445,1
1955.8478513702632,1719504907,checkpoint_000003,True,False,4,e0cf80c0,2024-06-27_18-15-07,84.75202250480652,366.026948928833,242786,r8i6n8,10.159.28.66,184.05129957199097,2
1954.159799650898,1719506222,checkpoint_000004,True,False,5,e0cf80c0,2024-06-27_18-37-02,99.05570006370544,465.08264899253845,242786,r8i6n8,10.159.28.66,99.05570006370544,1
1953.744985505352,1719506307,checkpoint_000005,True,False,6,e0cf80c0,2024-06-27_18-38-27,84.97408151626587,550.0567305088043,242786,r8i6n8,10.159.28.66,184.0297815799713,2
1953.285723348302,1719506392,checkpoint_000006,True,False,7,e0cf80c0,2024-06-27_18-39-52,85.0238299369812,635.0805604457855,242786,r8i6n8,10.159.28.66,269.0536115169525,3
1954.5312970979946,1719506476,checkpoint_000007,True,False,8,e0cf80c0,2024-06-27_18-41-16,84.54337477684021,719.6239352226257,242786,r8i6n8,10.159.28.66,353.5969862937927,4
1954.3730785940577,1719506561,checkpoint_000008,True,False,9,e0cf80c0,2024-06-27_18-42-41,85.04393577575684,804.6678709983826,242786,r8i6n8,10.159.28.66,438.64092206954956,5
1955.718712513841,1719506647,checkpoint_000009,True,False,10,e0cf80c0,2024-06-27_18-44-07,85.06691837310791,889.7347893714905,242786,r8i6n8,10.159.28.66,523.7078404426575,6
1958.7154714028666,1719506732,checkpoint_000010,True,False,11,e0cf80c0,2024-06-27_18-45-32,85.6172399520874,975.3520293235779,242786,r8i6n8,10.159.28.66,609.3250803947449,7
1953.2071273683564,1719506817,checkpoint_000011,True,False,12,e0cf80c0,2024-06-27_18-46-57,84.71766662597656,1060.0696959495544,242786,r8i6n8,10.159.28.66,694.0427470207214,8
1952.5803078478716,1719506902,checkpoint_000012,True,False,13,e0cf80c0,2024-06-27_18-48-22,85.59679841995239,1145.6664943695068,242786,r8i6n8,10.159.28.66,779.6395454406738,9
1954.0447209876354,1719506988,checkpoint_000013,True,False,14,e0cf80c0,2024-06-27_18-49-48,85.16450333595276,1230.8309977054596,242786,r8i6n8,10.159.28.66,864.8040487766266,10
{"loss": 1954.021998608206, "timestamp": 1719498933, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "e0cf80c0", "date": "2024-06-27_16-35-33", "time_this_iter_s": 97.99486684799194, "time_total_s": 97.99486684799194, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 97.99486684799194, "iterations_since_restore": 1}
{"loss": 1955.7363098625124, "timestamp": 1719499017, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "e0cf80c0", "date": "2024-06-27_16-36-57", "time_this_iter_s": 83.9807825088501, "time_total_s": 181.97564935684204, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 181.97564935684204, "iterations_since_restore": 2}
{"loss": 1953.048192782665, "timestamp": 1719504822, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "e0cf80c0", "date": "2024-06-27_18-13-42", "time_this_iter_s": 99.29927706718445, "time_total_s": 281.2749264240265, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 99.29927706718445, "iterations_since_restore": 1}
{"loss": 1955.8478513702632, "timestamp": 1719504907, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "e0cf80c0", "date": "2024-06-27_18-15-07", "time_this_iter_s": 84.75202250480652, "time_total_s": 366.026948928833, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 184.05129957199097, "iterations_since_restore": 2}
{"loss": 1954.159799650898, "timestamp": 1719506222, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "e0cf80c0", "date": "2024-06-27_18-37-02", "time_this_iter_s": 99.05570006370544, "time_total_s": 465.08264899253845, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 99.05570006370544, "iterations_since_restore": 1}
{"loss": 1953.744985505352, "timestamp": 1719506307, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "e0cf80c0", "date": "2024-06-27_18-38-27", "time_this_iter_s": 84.97408151626587, "time_total_s": 550.0567305088043, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 184.0297815799713, "iterations_since_restore": 2}
{"loss": 1953.285723348302, "timestamp": 1719506392, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "e0cf80c0", "date": "2024-06-27_18-39-52", "time_this_iter_s": 85.0238299369812, "time_total_s": 635.0805604457855, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 269.0536115169525, "iterations_since_restore": 3}
{"loss": 1954.5312970979946, "timestamp": 1719506476, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "e0cf80c0", "date": "2024-06-27_18-41-16", "time_this_iter_s": 84.54337477684021, "time_total_s": 719.6239352226257, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 353.5969862937927, "iterations_since_restore": 4}
{"loss": 1954.3730785940577, "timestamp": 1719506561, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "e0cf80c0", "date": "2024-06-27_18-42-41", "time_this_iter_s": 85.04393577575684, "time_total_s": 804.6678709983826, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 438.64092206954956, "iterations_since_restore": 5}
{"loss": 1955.718712513841, "timestamp": 1719506647, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "e0cf80c0", "date": "2024-06-27_18-44-07", "time_this_iter_s": 85.06691837310791, "time_total_s": 889.7347893714905, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 523.7078404426575, "iterations_since_restore": 6}
{"loss": 1958.7154714028666, "timestamp": 1719506732, "checkpoint_dir_name": "checkpoint_000010", "should_checkpoint": true, "done": false, "training_iteration": 11, "trial_id": "e0cf80c0", "date": "2024-06-27_18-45-32", "time_this_iter_s": 85.6172399520874, "time_total_s": 975.3520293235779, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 609.3250803947449, "iterations_since_restore": 7}
{"loss": 1953.2071273683564, "timestamp": 1719506817, "checkpoint_dir_name": "checkpoint_000011", "should_checkpoint": true, "done": false, "training_iteration": 12, "trial_id": "e0cf80c0", "date": "2024-06-27_18-46-57", "time_this_iter_s": 84.71766662597656, "time_total_s": 1060.0696959495544, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 694.0427470207214, "iterations_since_restore": 8}
{"loss": 1952.5803078478716, "timestamp": 1719506902, "checkpoint_dir_name": "checkpoint_000012", "should_checkpoint": true, "done": false, "training_iteration": 13, "trial_id": "e0cf80c0", "date": "2024-06-27_18-48-22", "time_this_iter_s": 85.59679841995239, "time_total_s": 1145.6664943695068, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 779.6395454406738, "iterations_since_restore": 9}
{"loss": 1954.0447209876354, "timestamp": 1719506988, "checkpoint_dir_name": "checkpoint_000013", "should_checkpoint": true, "done": false, "training_iteration": 14, "trial_id": "e0cf80c0", "date": "2024-06-27_18-49-48", "time_this_iter_s": 85.16450333595276, "time_total_s": 1230.8309977054596, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.03611990882258942, "lr": 0.00028375287963234745, "batch_size": 2048}, "time_since_restore": 864.8040487766266, "iterations_since_restore": 10}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.9609532957830483,
"embedding_dim": 64,
"encoder_ff": 512,
"encoder_num_layer": 4,
"lr": 0.0003819692551562951,
"n_head": 4
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment