Skip to content
Snippets Groups Projects
Commit 915e419e authored by Léo Schneider's avatar Léo Schneider Committed by Schneider Leo
Browse files

res

parent a790c5c2
No related branches found
No related tags found
No related merge requests found
Showing
with 98 additions and 0 deletions
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
3133.156076986959,1719499095,checkpoint_000000,True,False,1,849f9246,2024-06-27_16-38-15,78.58129525184631,78.58129525184631,242786,r8i6n8,10.159.28.66,78.58129525184631,1
2193.2057009719488,1719499162,checkpoint_000001,True,False,2,849f9246,2024-06-27_16-39-22,66.90322375297546,145.48451900482178,242786,r8i6n8,10.159.28.66,145.48451900482178,2
{"loss": 3133.156076986959, "timestamp": 1719499095, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "849f9246", "date": "2024-06-27_16-38-15", "time_this_iter_s": 78.58129525184631, "time_total_s": 78.58129525184631, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.6055751532136977, "lr": 0.08464538523322317, "batch_size": 2048}, "time_since_restore": 78.58129525184631, "iterations_since_restore": 1}
{"loss": 2193.2057009719488, "timestamp": 1719499162, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "849f9246", "date": "2024-06-27_16-39-22", "time_this_iter_s": 66.90322375297546, "time_total_s": 145.48451900482178, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.6055751532136977, "lr": 0.08464538523322317, "batch_size": 2048}, "time_since_restore": 145.48451900482178, "iterations_since_restore": 2}
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 2048,
"decoder_rt_num_layer": 4,
"drop_rate": 0.02058782092742384,
"embedding_dim": 16,
"encoder_ff": 2048,
"encoder_num_layer": 8,
"lr": 0.00012206173551085312,
"n_head": 16
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1955.2079112135518,1719549284,checkpoint_000000,True,False,1,88943ec6,2024-06-28_06-34-44,138.29581928253174,138.29581928253174,242786,r8i6n8,10.159.28.66,138.29581928253174,1
1952.9390787440022,1719549409,checkpoint_000001,True,False,2,88943ec6,2024-06-28_06-36-49,125.04476261138916,263.3405818939209,242786,r8i6n8,10.159.28.66,263.3405818939209,2
1953.1876744548167,1719549534,checkpoint_000002,True,False,3,88943ec6,2024-06-28_06-38-54,124.98309111595154,388.32367300987244,242786,r8i6n8,10.159.28.66,388.32367300987244,3
1957.8012575164555,1719549659,checkpoint_000003,True,False,4,88943ec6,2024-06-28_06-40-59,124.89581799507141,513.2194910049438,242786,r8i6n8,10.159.28.66,513.2194910049438,4
1955.3321187177041,1719549784,checkpoint_000004,True,False,5,88943ec6,2024-06-28_06-43-04,124.5345048904419,637.7539958953857,242786,r8i6n8,10.159.28.66,637.7539958953857,5
1955.422944316714,1719549909,checkpoint_000005,True,False,6,88943ec6,2024-06-28_06-45-09,125.16982364654541,762.9238195419312,242786,r8i6n8,10.159.28.66,762.9238195419312,6
1955.47275332954,1719550034,checkpoint_000006,True,False,7,88943ec6,2024-06-28_06-47-14,124.71126890182495,887.6350884437561,242786,r8i6n8,10.159.28.66,887.6350884437561,7
1953.6913279135397,1719550158,checkpoint_000007,True,False,8,88943ec6,2024-06-28_06-49-18,124.53526043891907,1012.1703488826752,242786,r8i6n8,10.159.28.66,1012.1703488826752,8
1952.0587047667016,1719550282,checkpoint_000008,True,False,9,88943ec6,2024-06-28_06-51-22,123.8325846195221,1136.0029335021973,242786,r8i6n8,10.159.28.66,1136.0029335021973,9
1953.125932348056,1719550406,checkpoint_000009,True,False,10,88943ec6,2024-06-28_06-53-26,124.03362774848938,1260.0365612506866,242786,r8i6n8,10.159.28.66,1260.0365612506866,10
{"loss": 1955.2079112135518, "timestamp": 1719549284, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "88943ec6", "date": "2024-06-28_06-34-44", "time_this_iter_s": 138.29581928253174, "time_total_s": 138.29581928253174, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 138.29581928253174, "iterations_since_restore": 1}
{"loss": 1952.9390787440022, "timestamp": 1719549409, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "88943ec6", "date": "2024-06-28_06-36-49", "time_this_iter_s": 125.04476261138916, "time_total_s": 263.3405818939209, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 263.3405818939209, "iterations_since_restore": 2}
{"loss": 1953.1876744548167, "timestamp": 1719549534, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "88943ec6", "date": "2024-06-28_06-38-54", "time_this_iter_s": 124.98309111595154, "time_total_s": 388.32367300987244, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 388.32367300987244, "iterations_since_restore": 3}
{"loss": 1957.8012575164555, "timestamp": 1719549659, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "88943ec6", "date": "2024-06-28_06-40-59", "time_this_iter_s": 124.89581799507141, "time_total_s": 513.2194910049438, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 513.2194910049438, "iterations_since_restore": 4}
{"loss": 1955.3321187177041, "timestamp": 1719549784, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "88943ec6", "date": "2024-06-28_06-43-04", "time_this_iter_s": 124.5345048904419, "time_total_s": 637.7539958953857, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 637.7539958953857, "iterations_since_restore": 5}
{"loss": 1955.422944316714, "timestamp": 1719549909, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "88943ec6", "date": "2024-06-28_06-45-09", "time_this_iter_s": 125.16982364654541, "time_total_s": 762.9238195419312, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 762.9238195419312, "iterations_since_restore": 6}
{"loss": 1955.47275332954, "timestamp": 1719550034, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "88943ec6", "date": "2024-06-28_06-47-14", "time_this_iter_s": 124.71126890182495, "time_total_s": 887.6350884437561, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 887.6350884437561, "iterations_since_restore": 7}
{"loss": 1953.6913279135397, "timestamp": 1719550158, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "88943ec6", "date": "2024-06-28_06-49-18", "time_this_iter_s": 124.53526043891907, "time_total_s": 1012.1703488826752, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 1012.1703488826752, "iterations_since_restore": 8}
{"loss": 1952.0587047667016, "timestamp": 1719550282, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "88943ec6", "date": "2024-06-28_06-51-22", "time_this_iter_s": 123.8325846195221, "time_total_s": 1136.0029335021973, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 1136.0029335021973, "iterations_since_restore": 9}
{"loss": 1953.125932348056, "timestamp": 1719550406, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "88943ec6", "date": "2024-06-28_06-53-26", "time_this_iter_s": 124.03362774848938, "time_total_s": 1260.0365612506866, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.02058782092742384, "lr": 0.00012206173551085312, "batch_size": 1024}, "time_since_restore": 1260.0365612506866, "iterations_since_restore": 10}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 512,
"decoder_rt_num_layer": 1,
"drop_rate": 0.2933049514156799,
"embedding_dim": 64,
"encoder_ff": 2048,
"encoder_num_layer": 4,
"lr": 0.011848091629580768,
"n_head": 4
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
2238.4140029066193,1719509287,checkpoint_000000,True,False,1,8e5e7f52,2024-06-27_19-28-07,76.45697116851807,76.45697116851807,242786,r8i6n8,10.159.28.66,76.45697116851807,1
2216.8567279004674,1719509350,checkpoint_000001,True,False,2,8e5e7f52,2024-06-27_19-29-10,63.10471820831299,139.56168937683105,242786,r8i6n8,10.159.28.66,139.56168937683105,2
2184.21265321266,1719509413,checkpoint_000002,True,False,3,8e5e7f52,2024-06-27_19-30-13,62.492005825042725,202.05369520187378,242786,r8i6n8,10.159.28.66,202.05369520187378,3
2145.5848196435163,1719509475,checkpoint_000003,True,False,4,8e5e7f52,2024-06-27_19-31-15,62.598204612731934,264.6518998146057,242786,r8i6n8,10.159.28.66,264.6518998146057,4
2114.985403466412,1719509537,checkpoint_000004,True,False,5,8e5e7f52,2024-06-27_19-32-17,62.10174918174744,326.75364899635315,242786,r8i6n8,10.159.28.66,326.75364899635315,5
{"loss": 2238.4140029066193, "timestamp": 1719509287, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "8e5e7f52", "date": "2024-06-27_19-28-07", "time_this_iter_s": 76.45697116851807, "time_total_s": 76.45697116851807, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.2933049514156799, "lr": 0.011848091629580768, "batch_size": 2048}, "time_since_restore": 76.45697116851807, "iterations_since_restore": 1}
{"loss": 2216.8567279004674, "timestamp": 1719509350, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "8e5e7f52", "date": "2024-06-27_19-29-10", "time_this_iter_s": 63.10471820831299, "time_total_s": 139.56168937683105, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.2933049514156799, "lr": 0.011848091629580768, "batch_size": 2048}, "time_since_restore": 139.56168937683105, "iterations_since_restore": 2}
{"loss": 2184.21265321266, "timestamp": 1719509413, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "8e5e7f52", "date": "2024-06-27_19-30-13", "time_this_iter_s": 62.492005825042725, "time_total_s": 202.05369520187378, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.2933049514156799, "lr": 0.011848091629580768, "batch_size": 2048}, "time_since_restore": 202.05369520187378, "iterations_since_restore": 3}
{"loss": 2145.5848196435163, "timestamp": 1719509475, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "8e5e7f52", "date": "2024-06-27_19-31-15", "time_this_iter_s": 62.598204612731934, "time_total_s": 264.6518998146057, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.2933049514156799, "lr": 0.011848091629580768, "batch_size": 2048}, "time_since_restore": 264.6518998146057, "iterations_since_restore": 4}
{"loss": 2114.985403466412, "timestamp": 1719509537, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "8e5e7f52", "date": "2024-06-27_19-32-17", "time_this_iter_s": 62.10174918174744, "time_total_s": 326.75364899635315, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 2048, "decoder_rt_ff": 512, "decoder_int_ff": 512, "n_head": 4, "drop_rate": 0.2933049514156799, "lr": 0.011848091629580768, "batch_size": 2048}, "time_since_restore": 326.75364899635315, "iterations_since_restore": 5}
{
"batch_size": 1024,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 8,
"drop_rate": 0.7914041407453669,
"embedding_dim": 16,
"encoder_ff": 1024,
"encoder_num_layer": 1,
"lr": 0.0017184389008014717,
"n_head": 1
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1996.2721538393516,1719502422,checkpoint_000000,True,False,1,93c649bd,2024-06-27_17-33-42,84.1758508682251,84.1758508682251,242786,r8i6n8,10.159.28.66,84.1758508682251,1
1999.4757651982345,1719502493,checkpoint_000001,True,False,2,93c649bd,2024-06-27_17-34-53,70.39586234092712,154.57171320915222,242786,r8i6n8,10.159.28.66,154.57171320915222,2
2008.213741753045,1719502563,checkpoint_000002,True,False,3,93c649bd,2024-06-27_17-36-03,70.20663857460022,224.77835178375244,242786,r8i6n8,10.159.28.66,224.77835178375244,3
1996.1505780557948,1719502633,checkpoint_000003,True,False,4,93c649bd,2024-06-27_17-37-13,70.27228903770447,295.0506408214569,242786,r8i6n8,10.159.28.66,295.0506408214569,4
{"loss": 1996.2721538393516, "timestamp": 1719502422, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "93c649bd", "date": "2024-06-27_17-33-42", "time_this_iter_s": 84.1758508682251, "time_total_s": 84.1758508682251, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7914041407453669, "lr": 0.0017184389008014717, "batch_size": 1024}, "time_since_restore": 84.1758508682251, "iterations_since_restore": 1}
{"loss": 1999.4757651982345, "timestamp": 1719502493, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "93c649bd", "date": "2024-06-27_17-34-53", "time_this_iter_s": 70.39586234092712, "time_total_s": 154.57171320915222, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7914041407453669, "lr": 0.0017184389008014717, "batch_size": 1024}, "time_since_restore": 154.57171320915222, "iterations_since_restore": 2}
{"loss": 2008.213741753045, "timestamp": 1719502563, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "93c649bd", "date": "2024-06-27_17-36-03", "time_this_iter_s": 70.20663857460022, "time_total_s": 224.77835178375244, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7914041407453669, "lr": 0.0017184389008014717, "batch_size": 1024}, "time_since_restore": 224.77835178375244, "iterations_since_restore": 3}
{"loss": 1996.1505780557948, "timestamp": 1719502633, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "93c649bd", "date": "2024-06-27_17-37-13", "time_this_iter_s": 70.27228903770447, "time_total_s": 295.0506408214569, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 8, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7914041407453669, "lr": 0.0017184389008014717, "batch_size": 1024}, "time_since_restore": 295.0506408214569, "iterations_since_restore": 4}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 2048,
"decoder_rt_num_layer": 1,
"drop_rate": 0.7686353033166121,
"embedding_dim": 256,
"encoder_ff": 2048,
"encoder_num_layer": 8,
"lr": 0.00011707230271575167,
"n_head": 16
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment