Skip to content
Snippets Groups Projects
Commit 02f95633 authored by Schneider Leo's avatar Schneider Leo
Browse files

del raysesult

parent b844726e
No related branches found
No related tags found
No related merge requests found
Showing
with 0 additions and 98 deletions
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1987.5899369848057,1719496799,checkpoint_000000,True,False,1,5fd6b12b,2024-06-27_15-59-59,79.29838418960571,79.29838418960571,69992,r8i6n8,10.159.28.66,79.29838418960571,1
1964.0069681002399,1719496864,checkpoint_000001,True,False,2,5fd6b12b,2024-06-27_16-01-04,65.23948526382446,144.53786945343018,69992,r8i6n8,10.159.28.66,144.53786945343018,2
1967.0336683378446,1719502712,checkpoint_000002,True,False,3,5fd6b12b,2024-06-27_17-38-32,78.57935905456543,223.1172285079956,242786,r8i6n8,10.159.28.66,78.57935905456543,1
1958.9930592934916,1719502777,checkpoint_000003,True,False,4,5fd6b12b,2024-06-27_17-39-37,65.23711919784546,288.35434770584106,242786,r8i6n8,10.159.28.66,143.8164782524109,2
1975.2254739596149,1719505928,checkpoint_000004,True,False,5,5fd6b12b,2024-06-27_18-32-08,78.82753491401672,367.1818826198578,242786,r8i6n8,10.159.28.66,78.82753491401672,1
1980.3283037801427,1719505993,checkpoint_000005,True,False,6,5fd6b12b,2024-06-27_18-33-13,64.60036778450012,431.7822504043579,242786,r8i6n8,10.159.28.66,143.42790269851685,2
1965.8961032657173,1719506058,checkpoint_000006,True,False,7,5fd6b12b,2024-06-27_18-34-18,64.92104005813599,496.7032904624939,242786,r8i6n8,10.159.28.66,208.34894275665283,3
1969.885332723302,1719506123,checkpoint_000007,True,False,8,5fd6b12b,2024-06-27_18-35-23,65.11498975753784,561.8182802200317,242786,r8i6n8,10.159.28.66,273.4639325141907,4
{"loss": 1987.5899369848057, "timestamp": 1719496799, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "5fd6b12b", "date": "2024-06-27_15-59-59", "time_this_iter_s": 79.29838418960571, "time_total_s": 79.29838418960571, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 79.29838418960571, "iterations_since_restore": 1}
{"loss": 1964.0069681002399, "timestamp": 1719496864, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "5fd6b12b", "date": "2024-06-27_16-01-04", "time_this_iter_s": 65.23948526382446, "time_total_s": 144.53786945343018, "pid": 69992, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 144.53786945343018, "iterations_since_restore": 2}
{"loss": 1967.0336683378446, "timestamp": 1719502712, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "5fd6b12b", "date": "2024-06-27_17-38-32", "time_this_iter_s": 78.57935905456543, "time_total_s": 223.1172285079956, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 78.57935905456543, "iterations_since_restore": 1}
{"loss": 1958.9930592934916, "timestamp": 1719502777, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "5fd6b12b", "date": "2024-06-27_17-39-37", "time_this_iter_s": 65.23711919784546, "time_total_s": 288.35434770584106, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 143.8164782524109, "iterations_since_restore": 2}
{"loss": 1975.2254739596149, "timestamp": 1719505928, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "5fd6b12b", "date": "2024-06-27_18-32-08", "time_this_iter_s": 78.82753491401672, "time_total_s": 367.1818826198578, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 78.82753491401672, "iterations_since_restore": 1}
{"loss": 1980.3283037801427, "timestamp": 1719505993, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "5fd6b12b", "date": "2024-06-27_18-33-13", "time_this_iter_s": 64.60036778450012, "time_total_s": 431.7822504043579, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 143.42790269851685, "iterations_since_restore": 2}
{"loss": 1965.8961032657173, "timestamp": 1719506058, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "5fd6b12b", "date": "2024-06-27_18-34-18", "time_this_iter_s": 64.92104005813599, "time_total_s": 496.7032904624939, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 208.34894275665283, "iterations_since_restore": 3}
{"loss": 1969.885332723302, "timestamp": 1719506123, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "5fd6b12b", "date": "2024-06-27_18-35-23", "time_this_iter_s": 65.11498975753784, "time_total_s": 561.8182802200317, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 1, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 16, "drop_rate": 0.2066693100484649, "lr": 0.01811726031464282, "batch_size": 1024}, "time_since_restore": 273.4639325141907, "iterations_since_restore": 4}
{
"batch_size": 2048,
"decoder_int_ff": 2048,
"decoder_int_num_layer": 8,
"decoder_rt_ff": 2048,
"decoder_rt_num_layer": 1,
"drop_rate": 0.6683907000004579,
"embedding_dim": 16,
"encoder_ff": 2048,
"encoder_num_layer": 8,
"lr": 0.0001175178193869245,
"n_head": 4
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1981.618032380352,1719326489,checkpoint_000000,True,False,1,651349c4,2024-06-25_16-41-29,86.11733651161194,86.11733651161194,69318,r3i5n6,10.159.8.159,86.11733651161194,1
{"loss": 1981.618032380352, "timestamp": 1719326489, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "651349c4", "date": "2024-06-25_16-41-29", "time_this_iter_s": 86.11733651161194, "time_total_s": 86.11733651161194, "pid": 69318, "hostname": "r3i5n6", "node_ip": "10.159.8.159", "config": {"encoder_num_layer": 8, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 8, "embedding_dim": 16, "encoder_ff": 2048, "decoder_rt_ff": 2048, "decoder_int_ff": 2048, "n_head": 4, "drop_rate": 0.6683907000004579, "lr": 0.0001175178193869245, "batch_size": 2048}, "time_since_restore": 86.11733651161194, "iterations_since_restore": 1}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 2048,
"decoder_rt_num_layer": 4,
"drop_rate": 0.4436137502039823,
"embedding_dim": 256,
"encoder_ff": 512,
"encoder_num_layer": 2,
"lr": 0.07179226263764402,
"n_head": 8
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
3811.964426596334,1719334521,checkpoint_000000,True,False,1,6743cdee,2024-06-25_18-55-21,141.20554637908936,141.20554637908936,2195253,r8i6n2,10.159.28.60,141.20554637908936,1
2680.254179226132,1719334648,checkpoint_000001,True,False,2,6743cdee,2024-06-25_18-57-29,127.1407482624054,268.34629464149475,2195253,r8i6n2,10.159.28.60,268.34629464149475,2
{"loss": 3811.964426596334, "timestamp": 1719334521, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "6743cdee", "date": "2024-06-25_18-55-21", "time_this_iter_s": 141.20554637908936, "time_total_s": 141.20554637908936, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 2, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 256, "encoder_ff": 512, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.4436137502039823, "lr": 0.07179226263764402, "batch_size": 2048}, "time_since_restore": 141.20554637908936, "iterations_since_restore": 1}
{"loss": 2680.254179226132, "timestamp": 1719334648, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "6743cdee", "date": "2024-06-25_18-57-29", "time_this_iter_s": 127.1407482624054, "time_total_s": 268.34629464149475, "pid": 2195253, "hostname": "r8i6n2", "node_ip": "10.159.28.60", "config": {"encoder_num_layer": 2, "decoder_rt_num_layer": 4, "decoder_int_num_layer": 1, "embedding_dim": 256, "encoder_ff": 512, "decoder_rt_ff": 2048, "decoder_int_ff": 512, "n_head": 8, "drop_rate": 0.4436137502039823, "lr": 0.07179226263764402, "batch_size": 2048}, "time_since_restore": 268.34629464149475, "iterations_since_restore": 2}
{
"batch_size": 2048,
"decoder_int_ff": 512,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 1,
"drop_rate": 0.7402505539115447,
"embedding_dim": 64,
"encoder_ff": 1024,
"encoder_num_layer": 4,
"lr": 0.0006126521431696416,
"n_head": 1
}
\ No newline at end of file
loss,timestamp,checkpoint_dir_name,should_checkpoint,done,training_iteration,trial_id,date,time_this_iter_s,time_total_s,pid,hostname,node_ip,time_since_restore,iterations_since_restore
1988.1164252814347,1719511145,checkpoint_000000,True,False,1,694ee9b5,2024-06-27_19-59-05,70.52699637413025,70.52699637413025,242786,r8i6n8,10.159.28.66,70.52699637413025,1
2003.6415064053272,1719511203,checkpoint_000001,True,False,2,694ee9b5,2024-06-27_20-00-03,57.75782370567322,128.28482007980347,242786,r8i6n8,10.159.28.66,128.28482007980347,2
1990.098658764456,1719511261,checkpoint_000002,True,False,3,694ee9b5,2024-06-27_20-01-01,57.42855453491211,185.71337461471558,242786,r8i6n8,10.159.28.66,185.71337461471558,3
1556.502945066437,1719511318,checkpoint_000003,True,False,4,694ee9b5,2024-06-27_20-01-58,57.167978286743164,242.88135290145874,242786,r8i6n8,10.159.28.66,242.88135290145874,4
1371.0674741249384,1719511376,checkpoint_000004,True,False,5,694ee9b5,2024-06-27_20-02-56,58.11665964126587,300.9980125427246,242786,r8i6n8,10.159.28.66,300.9980125427246,5
1413.1876518670028,1719511433,checkpoint_000005,True,False,6,694ee9b5,2024-06-27_20-03-53,57.10992646217346,358.10793900489807,242786,r8i6n8,10.159.28.66,358.10793900489807,6
1547.3413826048843,1719511491,checkpoint_000006,True,False,7,694ee9b5,2024-06-27_20-04-51,57.56092953681946,415.66886854171753,242786,r8i6n8,10.159.28.66,415.66886854171753,7
1366.6497523991143,1719511548,checkpoint_000007,True,False,8,694ee9b5,2024-06-27_20-05-49,57.96260166168213,473.63147020339966,242786,r8i6n8,10.159.28.66,473.63147020339966,8
1566.9438976377953,1719511606,checkpoint_000008,True,False,9,694ee9b5,2024-06-27_20-06-46,57.52634882926941,531.1578190326691,242786,r8i6n8,10.159.28.66,531.1578190326691,9
1427.2011093980684,1719511663,checkpoint_000009,True,False,10,694ee9b5,2024-06-27_20-07-43,57.44098997116089,588.59880900383,242786,r8i6n8,10.159.28.66,588.59880900383,10
{"loss": 1988.1164252814347, "timestamp": 1719511145, "checkpoint_dir_name": "checkpoint_000000", "should_checkpoint": true, "done": false, "training_iteration": 1, "trial_id": "694ee9b5", "date": "2024-06-27_19-59-05", "time_this_iter_s": 70.52699637413025, "time_total_s": 70.52699637413025, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 70.52699637413025, "iterations_since_restore": 1}
{"loss": 2003.6415064053272, "timestamp": 1719511203, "checkpoint_dir_name": "checkpoint_000001", "should_checkpoint": true, "done": false, "training_iteration": 2, "trial_id": "694ee9b5", "date": "2024-06-27_20-00-03", "time_this_iter_s": 57.75782370567322, "time_total_s": 128.28482007980347, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 128.28482007980347, "iterations_since_restore": 2}
{"loss": 1990.098658764456, "timestamp": 1719511261, "checkpoint_dir_name": "checkpoint_000002", "should_checkpoint": true, "done": false, "training_iteration": 3, "trial_id": "694ee9b5", "date": "2024-06-27_20-01-01", "time_this_iter_s": 57.42855453491211, "time_total_s": 185.71337461471558, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 185.71337461471558, "iterations_since_restore": 3}
{"loss": 1556.502945066437, "timestamp": 1719511318, "checkpoint_dir_name": "checkpoint_000003", "should_checkpoint": true, "done": false, "training_iteration": 4, "trial_id": "694ee9b5", "date": "2024-06-27_20-01-58", "time_this_iter_s": 57.167978286743164, "time_total_s": 242.88135290145874, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 242.88135290145874, "iterations_since_restore": 4}
{"loss": 1371.0674741249384, "timestamp": 1719511376, "checkpoint_dir_name": "checkpoint_000004", "should_checkpoint": true, "done": false, "training_iteration": 5, "trial_id": "694ee9b5", "date": "2024-06-27_20-02-56", "time_this_iter_s": 58.11665964126587, "time_total_s": 300.9980125427246, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 300.9980125427246, "iterations_since_restore": 5}
{"loss": 1413.1876518670028, "timestamp": 1719511433, "checkpoint_dir_name": "checkpoint_000005", "should_checkpoint": true, "done": false, "training_iteration": 6, "trial_id": "694ee9b5", "date": "2024-06-27_20-03-53", "time_this_iter_s": 57.10992646217346, "time_total_s": 358.10793900489807, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 358.10793900489807, "iterations_since_restore": 6}
{"loss": 1547.3413826048843, "timestamp": 1719511491, "checkpoint_dir_name": "checkpoint_000006", "should_checkpoint": true, "done": false, "training_iteration": 7, "trial_id": "694ee9b5", "date": "2024-06-27_20-04-51", "time_this_iter_s": 57.56092953681946, "time_total_s": 415.66886854171753, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 415.66886854171753, "iterations_since_restore": 7}
{"loss": 1366.6497523991143, "timestamp": 1719511548, "checkpoint_dir_name": "checkpoint_000007", "should_checkpoint": true, "done": false, "training_iteration": 8, "trial_id": "694ee9b5", "date": "2024-06-27_20-05-49", "time_this_iter_s": 57.96260166168213, "time_total_s": 473.63147020339966, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 473.63147020339966, "iterations_since_restore": 8}
{"loss": 1566.9438976377953, "timestamp": 1719511606, "checkpoint_dir_name": "checkpoint_000008", "should_checkpoint": true, "done": false, "training_iteration": 9, "trial_id": "694ee9b5", "date": "2024-06-27_20-06-46", "time_this_iter_s": 57.52634882926941, "time_total_s": 531.1578190326691, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 531.1578190326691, "iterations_since_restore": 9}
{"loss": 1427.2011093980684, "timestamp": 1719511663, "checkpoint_dir_name": "checkpoint_000009", "should_checkpoint": true, "done": false, "training_iteration": 10, "trial_id": "694ee9b5", "date": "2024-06-27_20-07-43", "time_this_iter_s": 57.44098997116089, "time_total_s": 588.59880900383, "pid": 242786, "hostname": "r8i6n8", "node_ip": "10.159.28.66", "config": {"encoder_num_layer": 4, "decoder_rt_num_layer": 1, "decoder_int_num_layer": 1, "embedding_dim": 64, "encoder_ff": 1024, "decoder_rt_ff": 1024, "decoder_int_ff": 512, "n_head": 1, "drop_rate": 0.7402505539115447, "lr": 0.0006126521431696416, "batch_size": 2048}, "time_since_restore": 588.59880900383, "iterations_since_restore": 10}
{
"batch_size": 2048,
"decoder_int_ff": 1024,
"decoder_int_num_layer": 1,
"decoder_rt_ff": 1024,
"decoder_rt_num_layer": 2,
"drop_rate": 0.06860896590384413,
"embedding_dim": 16,
"encoder_ff": 512,
"encoder_num_layer": 1,
"lr": 0.00016561766448063182,
"n_head": 4
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment