Skip to content
Snippets Groups Projects
Commit 02f95633 authored by Schneider Leo's avatar Schneider Leo
Browse files

del raysesult

parent b844726e
No related branches found
No related tags found
No related merge requests found
Showing
with 0 additions and 110 deletions
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.9176352757258278,
"embedding_dim": 256,
"encoder_ff": 2048,
"encoder_num_layer": 8,
"lr": 0.014441526763377911,
"n_head": 8
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2470.2349593996064,1719493562,checkpoint_000000,True,False,1,09d4c8af,2024-06-27_15-06-02,230.70093512535095,230.70093512535095,69992,r8i6n8,10.159.28.66,230.70093512535095,1
{"loss": 2470.2349593996064, "timestamp": 1719493562, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "09d4c8af", "date": "2024-06-27_15-06-02", "time_this_iter_s": 230.70093512535095, "time_total_s": 230.70093512535095, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 256, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.9176352757258278, "lr": 0.014441526763377911, "batch_size": 2048}, "time_since_restore": 230.70093512535095, "iterations_since_restore": 1}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.6143131375049876,
"embedding_dim": 64,
"encoder_ff": 2048,
"encoder_num_layer": 4,
"lr": 0.0007003169863053682,
"n_head": 4
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1980.4066219780389,1719514079,checkpoint_000000,True,False,1,0cc69cc0,2024-06-27_20-47-59,78.72657775878906,78.72657775878906,242786,r8i6n8,10.159.28.66,78.72657775878906,1
1974.7192046398252,1719514144,checkpoint_000001,True,False,2,0cc69cc0,2024-06-27_20-49-04,64.93273973464966,143.65931749343872,242786,r8i6n8,10.159.28.66,143.65931749343872,2
1979.3855787862942,1719514209,checkpoint_000002,True,False,3,0cc69cc0,2024-06-27_20-50-09,65.05311489105225,208.71243238449097,242786,r8i6n8,10.159.28.66,208.71243238449097,3
1979.0269044891118,1719514274,checkpoint_000003,True,False,4,0cc69cc0,2024-06-27_20-51-14,65.01725125312805,273.729683637619,242786,r8i6n8,10.159.28.66,273.729683637619,4
1976.4739701879307,1719514339,checkpoint_000004,True,False,5,0cc69cc0,2024-06-27_20-52-19,65.06425142288208,338.7939350605011,242786,r8i6n8,10.159.28.66,338.7939350605011,5
1978.0683257335752,1719514404,checkpoint_000005,True,False,6,0cc69cc0,2024-06-27_20-53-24,65.00006556510925,403.79400062561035,242786,r8i6n8,10.159.28.66,403.79400062561035,6
1451.6436892531988,1719514469,checkpoint_000006,True,False,7,0cc69cc0,2024-06-27_20-54-29,64.97408652305603,468.7680871486664,242786,r8i6n8,10.159.28.66,468.7680871486664,7
1978.8701690914124,1719514535,checkpoint_000007,True,False,8,0cc69cc0,2024-06-27_20-55-35,65.56082820892334,534.3289153575897,242786,r8i6n8,10.159.28.66,534.3289153575897,8
1973.6112147053395,1719514600,checkpoint_000008,True,False,9,0cc69cc0,2024-06-27_20-56-40,64.95659232139587,599.2855076789856,242786,r8i6n8,10.159.28.66,599.2855076789856,9
1973.0043147530143,1719514665,checkpoint_000009,True,False,10,0cc69cc0,2024-06-27_20-57-45,65.37610912322998,664.6616168022156,242786,r8i6n8,10.159.28.66,664.6616168022156,10
1978.763697826956,1719519614,checkpoint_000010,True,False,11,0cc69cc0,2024-06-27_22-20-14,79.15366196632385,743.8152787685394,242786,r8i6n8,10.159.28.66,79.15366196632385,1
1975.8241879921259,1719519680,checkpoint_000011,True,False,12,0cc69cc0,2024-06-27_22-21-20,65.74563002586365,809.5609087944031,242786,r8i6n8,10.159.28.66,144.8992919921875,2
1974.2569397453249,1719519746,checkpoint_000012,True,False,13,0cc69cc0,2024-06-27_22-22-26,65.7228844165802,875.2837932109833,242786,r8i6n8,10.159.28.66,210.6221764087677,3
1976.7626645546259,1719519812,checkpoint_000013,True,False,14,0cc69cc0,2024-06-27_22-23-32,66.2012448310852,941.4850380420685,242786,r8i6n8,10.159.28.66,276.8234212398529,4
1976.9357179656743,1719519878,checkpoint_000014,True,False,15,0cc69cc0,2024-06-27_22-24-38,65.79811668395996,1007.2831547260284,242786,r8i6n8,10.159.28.66,342.62153792381287,5
1976.9357958215428,1719519944,checkpoint_000015,True,False,16,0cc69cc0,2024-06-27_22-25-44,65.78404641151428,1073.0672011375427,242786,r8i6n8,10.159.28.66,408.40558433532715,6
1976.7361752968134,1719520009,checkpoint_000016,True,False,17,0cc69cc0,2024-06-27_22-26-49,65.76862573623657,1138.8358268737793,242786,r8i6n8,10.159.28.66,474.1742100715637,7
1977.8280586783342,1719520075,checkpoint_000017,True,False,18,0cc69cc0,2024-06-27_22-27-55,65.81831574440002,1204.6541426181793,242786,r8i6n8,10.159.28.66,539.9925258159637,8
1975.8057380736343,1719520141,checkpoint_000018,True,False,19,0cc69cc0,2024-06-27_22-29-01,66.07627272605896,1270.7304153442383,242786,r8i6n8,10.159.28.66,606.0687985420227,9
1976.771424781619,1719520207,checkpoint_000019,True,False,20,0cc69cc0,2024-06-27_22-30-07,65.2650773525238,1335.995492696762,242786,r8i6n8,10.159.28.66,671.3338758945465,10
{"loss": 1980.4066219780389, "timestamp": 1719514079, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "0cc69cc0", "date": "2024-06-27_20-47-59", "time_this_iter_s": 78.72657775878906, "time_total_s": 78.72657775878906, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 78.72657775878906, "iterations_since_restore": 1}
{"loss": 1974.7192046398252, "timestamp": 1719514144, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "0cc69cc0", "date": "2024-06-27_20-49-04", "time_this_iter_s": 64.93273973464966, "time_total_s": 143.65931749343872, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 143.65931749343872, "iterations_since_restore": 2}
{"loss": 1979.3855787862942, "timestamp": 1719514209, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "0cc69cc0", "date": "2024-06-27_20-50-09", "time_this_iter_s": 65.05311489105225, "time_total_s": 208.71243238449097, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 208.71243238449097, "iterations_since_restore": 3}
{"loss": 1979.0269044891118, "timestamp": 1719514274, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "0cc69cc0", "date": "2024-06-27_20-51-14", "time_this_iter_s": 65.01725125312805, "time_total_s": 273.729683637619, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 273.729683637619, "iterations_since_restore": 4}
{"loss": 1976.4739701879307, "timestamp": 1719514339, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "0cc69cc0", "date": "2024-06-27_20-52-19", "time_this_iter_s": 65.06425142288208, "time_total_s": 338.7939350605011, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 338.7939350605011, "iterations_since_restore": 5}
{"loss": 1978.0683257335752, "timestamp": 1719514404, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "0cc69cc0", "date": "2024-06-27_20-53-24", "time_this_iter_s": 65.00006556510925, "time_total_s": 403.79400062561035, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 403.79400062561035, "iterations_since_restore": 6}
{"loss": 1451.6436892531988, "timestamp": 1719514469, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "0cc69cc0", "date": "2024-06-27_20-54-29", "time_this_iter_s": 64.97408652305603, "time_total_s": 468.7680871486664, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 468.7680871486664, "iterations_since_restore": 7}
{"loss": 1978.8701690914124, "timestamp": 1719514535, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "0cc69cc0", "date": "2024-06-27_20-55-35", "time_this_iter_s": 65.56082820892334, "time_total_s": 534.3289153575897, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 534.3289153575897, "iterations_since_restore": 8}
{"loss": 1973.6112147053395, "timestamp": 1719514600, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "0cc69cc0", "date": "2024-06-27_20-56-40", "time_this_iter_s": 64.95659232139587, "time_total_s": 599.2855076789856, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 599.2855076789856, "iterations_since_restore": 9}
{"loss": 1973.0043147530143, "timestamp": 1719514665, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "0cc69cc0", "date": "2024-06-27_20-57-45", "time_this_iter_s": 65.37610912322998, "time_total_s": 664.6616168022156, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 664.6616168022156, "iterations_since_restore": 10}
{"loss": 1978.763697826956, "timestamp": 1719519614, "checkpoint_dir_name": "checkpoint_000010", "should_checkpoint": true, "done": false, "training_iteration": 11, "trial_id": "0cc69cc0", "date": "2024-06-27_22-20-14", "time_this_iter_s": 79.15366196632385, "time_total_s": 743.8152787685394, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 79.15366196632385, "iterations_since_restore": 1}
{"loss": 1975.8241879921259, "timestamp": 1719519680, "checkpoint_dir_name": "checkpoint_000011", "should_checkpoint": true, "done": false, "training_iteration": 12, "trial_id": "0cc69cc0", "date": "2024-06-27_22-21-20", "time_this_iter_s": 65.74563002586365, "time_total_s": 809.5609087944031, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 144.8992919921875, "iterations_since_restore": 2}
{"loss": 1974.2569397453249, "timestamp": 1719519746, "checkpoint_dir_name": "checkpoint_000012", "should_checkpoint": true, "done": false, "training_iteration": 13, "trial_id": "0cc69cc0", "date": "2024-06-27_22-22-26", "time_this_iter_s": 65.7228844165802, "time_total_s": 875.2837932109833, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 210.6221764087677, "iterations_since_restore": 3}
{"loss": 1976.7626645546259, "timestamp": 1719519812, "checkpoint_dir_name": "checkpoint_000013", "should_checkpoint": true, "done": false, "training_iteration": 14, "trial_id": "0cc69cc0", "date": "2024-06-27_22-23-32", "time_this_iter_s": 66.2012448310852, "time_total_s": 941.4850380420685, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 276.8234212398529, "iterations_since_restore": 4}
{"loss": 1976.9357179656743, "timestamp": 1719519878, "checkpoint_dir_name": "checkpoint_000014", "should_checkpoint": true, "done": false, "training_iteration": 15, "trial_id": "0cc69cc0", "date": "2024-06-27_22-24-38", "time_this_iter_s": 65.79811668395996, "time_total_s": 1007.2831547260284, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 342.62153792381287, "iterations_since_restore": 5}
{"loss": 1976.9357958215428, "timestamp": 1719519944, "checkpoint_dir_name": "checkpoint_000015", "should_checkpoint": true, "done": false, "training_iteration": 16, "trial_id": "0cc69cc0", "date": "2024-06-27_22-25-44", "time_this_iter_s": 65.78404641151428, "time_total_s": 1073.0672011375427, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 408.40558433532715, "iterations_since_restore": 6}
{"loss": 1976.7361752968134, "timestamp": 1719520009, "checkpoint_dir_name": "checkpoint_000016", "should_checkpoint": true, "done": false, "training_iteration": 17, "trial_id": "0cc69cc0", "date": "2024-06-27_22-26-49", "time_this_iter_s": 65.76862573623657, "time_total_s": 1138.8358268737793, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 474.1742100715637, "iterations_since_restore": 7}
{"loss": 1977.8280586783342, "timestamp": 1719520075, "checkpoint_dir_name": "checkpoint_000017", "should_checkpoint": true, "done": false, "training_iteration": 18, "trial_id": "0cc69cc0", "date": "2024-06-27_22-27-55", "time_this_iter_s": 65.81831574440002, "time_total_s": 1204.6541426181793, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 539.9925258159637, "iterations_since_restore": 8}
{"loss": 1975.8057380736343, "timestamp": 1719520141, "checkpoint_dir_name": "checkpoint_000018", "should_checkpoint": true, "done": false, "training_iteration": 19, "trial_id": "0cc69cc0", "date": "2024-06-27_22-29-01", "time_this_iter_s": 66.07627272605896, "time_total_s": 1270.7304153442383, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 606.0687985420227, "iterations_since_restore": 9}
{"loss": 1976.771424781619, "timestamp": 1719520207, "checkpoint_dir_name": "checkpoint_000019", "should_checkpoint": true, "done": false, "training_iteration": 20, "trial_id": "0cc69cc0", "date": "2024-06-27_22-30-07", "time_this_iter_s": 65.2650773525238, "time_total_s": 1335.995492696762, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 2, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.6143131375049876, "lr": 0.0007003169863053682, "batch_size": 2048}, "time_since_restore": 671.3338758945465, "iterations_since_restore": 10}
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 2048,
"decoder_rt_num_layer": 4,
"drop_rate": 0.5738068254184514,
"embedding_dim": 64,
"encoder_ff": 2048,
"encoder_num_layer": 4,
"lr": 0.009136259111296272,
"n_head": 1
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2003.1058138148992,1719493727,checkpoint_000000,True,True,1,0d034d62,2024-06-27_15-08-47,94.90786528587341,94.90786528587341,69992,r8i6n8,10.159.28.66,94.90786528587341,1
{"loss": 2003.1058138148992, "timestamp": 1719493727, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": true, "training_iteration": 1, "trial_id": "0d034d62", "date": "2024-06-27_15-08-47", "time_this_iter_s": 94.90786528587341, "time_total_s": 94.90786528587341, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.5738068254184514, "lr": 0.009136259111296272, "batch_size": 1024}, "time_since_restore": 94.90786528587341, "iterations_since_restore": 1}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 2,
"drop_rate": 0.023920599186226577,
"embedding_dim": 1024,
"encoder_ff": 1024,
"encoder_num_layer": 2,
"lr": 0.0024687399238039302,
"n_head": 16
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1986.2198524775467,1719348983,checkpoint_000000,True,False,1,0f80a6d7,2024-06-25_22-56-24,363.18635082244873,363.18635082244873,2195253,r8i6n2,10.159.28.60,363.18635082244873,1
1979.5493135226993,1719349334,checkpoint_000001,True,False,2,0f80a6d7,2024-06-25_23-02-14,350.295019865036,713.4813706874847,2195253,r8i6n2,10.159.28.60,713.4813706874847,2
1964.9348182978592,1719349683,checkpoint_000002,True,False,3,0f80a6d7,2024-06-25_23-08-04,349.6246259212494,1063.1059966087341,2195253,r8i6n2,10.159.28.60,1063.1059966087341,3
1955.6751497523992,1719350034,checkpoint_000003,True,False,4,0f80a6d7,2024-06-25_23-13-54,350.46285796165466,1413.5688545703888,2195253,r8i6n2,10.159.28.60,1413.5688545703888,4
1956.1783514548474,1719350384,checkpoint_000004,True,False,5,0f80a6d7,2024-06-25_23-19-44,350.18478202819824,1763.753636598587,2195253,r8i6n2,10.159.28.60,1763.753636598587,5
1971.8988527312993,1719355866,checkpoint_000005,True,False,6,0f80a6d7,2024-06-26_00-51-07,365.2865264415741,2129.040163040161,2850562,r8i6n2,10.159.28.60,365.2865264415741,1
1955.6729476808564,1719356216,checkpoint_000006,True,False,7,0f80a6d7,2024-06-26_00-56-56,349.18421268463135,2478.2243757247925,2850562,r8i6n2,10.159.28.60,714.4707391262054,2
1957.4972913847196,1719356565,checkpoint_000007,True,False,8,0f80a6d7,2024-06-26_01-02-46,349.7124717235565,2827.936847448349,2850562,r8i6n2,10.159.28.60,1064.183210849762,3
1967.2758471871923,1719356915,checkpoint_000008,True,False,9,0f80a6d7,2024-06-26_01-08-35,349.3587329387665,3177.2955803871155,2850562,r8i6n2,10.159.28.60,1413.5419437885284,4
1959.91755063515,1719357265,checkpoint_000009,True,True,10,0f80a6d7,2024-06-26_01-14-25,349.87603521347046,3527.171615600586,2850562,r8i6n2,10.159.28.60,1763.417979001999,5
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment