# Note: In this checkpoint, we use total batch size 1536 on 3 nodes instead of default total batch size 2048. {"train_lr": 1.0000000000000165e-06, "train_loss": 6.947688245349269, "epoch": 0, "n_parameters": 19839528} {"train_lr": 1.0000000000000165e-06, "train_loss": 6.906806535214829, "epoch": 1, "n_parameters": 19839528} {"train_lr": 0.00030079999999999566, "train_loss": 6.750862715865591, "epoch": 2, "n_parameters": 19839528} {"train_lr": 0.0006006000000000057, "train_loss": 6.464740750458029, "epoch": 3, "n_parameters": 19839528} {"train_lr": 0.0009004000000000146, "train_loss": 6.189836003201948, "epoch": 4, "n_parameters": 19839528} {"train_lr": 0.00120019999999999, "train_loss": 5.901831143932472, "epoch": 5, "n_parameters": 19839528} {"train_lr": 0.0014989790033921367, "train_loss": 5.634134349562853, "epoch": 6, "n_parameters": 19839528} {"train_lr": 0.001498529912679069, "train_loss": 5.371459696325752, "epoch": 7, "n_parameters": 19839528} {"train_lr": 0.001497999285532199, "train_loss": 5.16688393688888, "epoch": 8, "n_parameters": 19839528} {"train_lr": 0.0014973871801409009, "train_loss": 5.015170075148225, "test_loss": 2.5237968180779076, "test_acc1": 46.514001395874025, "test_acc5": 72.64600218139648, "epoch": 9, "n_parameters": 19839528} {"train_lr": 0.001496693663629296, "train_loss": 4.875404845574777, "epoch": 10, "n_parameters": 19839528} {"train_lr": 0.0014959188120493578, "train_loss": 4.756588101196441, "epoch": 11, "n_parameters": 19839528} {"train_lr": 0.0014950627103722735, "train_loss": 4.66400419322135, "epoch": 12, "n_parameters": 19839528} {"train_lr": 0.001494125452479267, "train_loss": 4.571849648627064, "epoch": 13, "n_parameters": 19839528} {"train_lr": 0.0014931071411512452, "train_loss": 4.496018391885727, "epoch": 14, "n_parameters": 19839528} {"train_lr": 0.0014920078880574345, "train_loss": 4.433957217206105, "epoch": 15, "n_parameters": 19839528} {"train_lr": 0.0014908278137433452, "train_loss": 4.363442792261628, "epoch": 16, "n_parameters": 19839528} {"train_lr": 0.0014895670476175297, "train_loss": 4.320734623870213, "epoch": 17, "n_parameters": 19839528} {"train_lr": 0.0014882257279370923, "train_loss": 4.2681059798033685, "epoch": 18, "n_parameters": 19839528} {"train_lr": 0.0014868040017928692, "train_loss": 4.226282092581074, "test_loss": 1.6585596278166816, "test_acc1": 63.15200188232422, "test_acc5": 85.85600247314453, "epoch": 19, "n_parameters": 19839528} {"train_lr": 0.0014853020250931849, "train_loss": 4.179341602549374, "epoch": 20, "n_parameters": 19839528} {"train_lr": 0.0014837199625466779, "train_loss": 4.144583556875527, "epoch": 21, "n_parameters": 19839528} {"train_lr": 0.0014820579876443744, "train_loss": 4.119000114720883, "epoch": 22, "n_parameters": 19839528} {"train_lr": 0.0014803162826405153, "train_loss": 4.084575508864854, "epoch": 23, "n_parameters": 19839528} {"train_lr": 0.0014784950385326957, "train_loss": 4.065180547505641, "epoch": 24, "n_parameters": 19839528} {"train_lr": 0.0014765944550408027, "train_loss": 4.030295823129723, "epoch": 25, "n_parameters": 19839528} {"train_lr": 0.001474614740585323, "train_loss": 4.008203195224849, "epoch": 26, "n_parameters": 19839528} {"train_lr": 0.001472556112264245, "train_loss": 3.98382104041098, "epoch": 27, "n_parameters": 19839528} {"train_lr": 0.0014704187958293408, "train_loss": 3.95857941282453, "epoch": 28, "n_parameters": 19839528} {"train_lr": 0.0014682030256614013, "train_loss": 3.9418227669003483, "test_loss": 1.4053193943685853, "test_acc1": 68.0720020690918, "test_acc5": 89.12400251220703, "epoch": 29, "n_parameters": 19839528} {"train_lr": 0.0014659090447446384, "train_loss": 3.917877770168223, "epoch": 30, "n_parameters": 19839528} {"train_lr": 0.0014635371046398723, "train_loss": 3.8985606254600316, "epoch": 31, "n_parameters": 19839528} {"train_lr": 0.0014610874654571253, "train_loss": 3.89243519001251, "epoch": 32, "n_parameters": 19839528} {"train_lr": 0.0014585603958269045, "train_loss": 3.8673097123440314, "epoch": 33, "n_parameters": 19839528} {"train_lr": 0.0014559561728708823, "train_loss": 3.8573365786092744, "epoch": 34, "n_parameters": 19839528} {"train_lr": 0.0014532750821714343, "train_loss": 3.8401040153728303, "epoch": 35, "n_parameters": 19839528} {"train_lr": 0.0014505174177404001, "train_loss": 3.8260656106564923, "epoch": 36, "n_parameters": 19839528} {"train_lr": 0.00144768348198676, "train_loss": 3.8082419272235257, "epoch": 37, "n_parameters": 19839528} {"train_lr": 0.0014447735856834417, "train_loss": 3.806362329853429, "epoch": 38, "n_parameters": 19839528} {"train_lr": 0.001441788047933402, "train_loss": 3.7944285382422134, "test_loss": 1.3137738484453103, "test_acc1": 70.0560020703125, "test_acc5": 90.08200244628907, "epoch": 39, "n_parameters": 19839528} {"train_lr": 0.0014387271961345588, "train_loss": 3.7716537043273592, "epoch": 40, "n_parameters": 19839528} {"train_lr": 0.001435591365943752, "train_loss": 3.7691054848982373, "epoch": 41, "n_parameters": 19839528} {"train_lr": 0.0014323809012400694, "train_loss": 3.753198569710497, "epoch": 42, "n_parameters": 19839528} {"train_lr": 0.0014290961540871859, "train_loss": 3.7490347150346928, "epoch": 43, "n_parameters": 19839528} {"train_lr": 0.0014257374846946504, "train_loss": 3.7399942430017665, "epoch": 44, "n_parameters": 19839528} {"train_lr": 0.0014223052613783597, "train_loss": 3.7183216890151933, "epoch": 45, "n_parameters": 19839528} {"train_lr": 0.0014187998605203313, "train_loss": 3.718256932773369, "epoch": 46, "n_parameters": 19839528} {"train_lr": 0.001415221666527278, "train_loss": 3.710923992145023, "epoch": 47, "n_parameters": 19839528} {"train_lr": 0.0014115710717884254, "train_loss": 3.7006157325874036, "epoch": 48, "n_parameters": 19839528} {"train_lr": 0.0014078484766326686, "train_loss": 3.68586700798558, "test_loss": 1.2460817657768612, "test_acc1": 71.38200198974609, "test_acc5": 91.01800245117188, "epoch": 49, "n_parameters": 19839528} {"train_lr": 0.0014040542892845619, "train_loss": 3.688040502446828, "epoch": 50, "n_parameters": 19839528} {"train_lr": 0.0014001889258194106, "train_loss": 3.6761270952667835, "epoch": 51, "n_parameters": 19839528} {"train_lr": 0.0013962528101179224, "train_loss": 3.670613186143571, "epoch": 52, "n_parameters": 19839528} {"train_lr": 0.0013922463738196042, "train_loss": 3.6574560655988186, "epoch": 53, "n_parameters": 19839528} {"train_lr": 0.001388170056275224, "train_loss": 3.6521241424752655, "epoch": 54, "n_parameters": 19839528} {"train_lr": 0.001384024304499001, "train_loss": 3.645007494988916, "epoch": 55, "n_parameters": 19839528} {"train_lr": 0.0013798095731193541, "train_loss": 3.6392382943480133, "epoch": 56, "n_parameters": 19839528} {"train_lr": 0.0013755263243290382, "train_loss": 3.6331012160431664, "epoch": 57, "n_parameters": 19839528} {"train_lr": 0.0013711750278345505, "train_loss": 3.6251249182150422, "epoch": 58, "n_parameters": 19839528} {"train_lr": 0.0013667561608046155, "train_loss": 3.6197832348011287, "test_loss": 1.2162465350470022, "test_acc1": 72.74000217041015, "test_acc5": 91.60400239746093, "epoch": 59, "n_parameters": 19839528} {"train_lr": 0.0013622702078177633, "train_loss": 3.6102118924569835, "epoch": 60, "n_parameters": 19839528} {"train_lr": 0.0013577176608093506, "train_loss": 3.6121580472750536, "epoch": 61, "n_parameters": 19839528} {"train_lr": 0.001353099019017369, "train_loss": 3.595388781502664, "epoch": 62, "n_parameters": 19839528} {"train_lr": 0.0013484147889280046, "train_loss": 3.59794242188132, "epoch": 63, "n_parameters": 19839528} {"train_lr": 0.0013436654842199, "train_loss": 3.596312729783243, "epoch": 64, "n_parameters": 19839528} {"train_lr": 0.0013388516257077697, "train_loss": 3.586064077580242, "epoch": 65, "n_parameters": 19839528} {"train_lr": 0.0013339737412854293, "train_loss": 3.5823862424773947, "epoch": 66, "n_parameters": 19839528} {"train_lr": 0.0013290323658679758, "train_loss": 3.573030476852191, "epoch": 67, "n_parameters": 19839528} {"train_lr": 0.0013240280413328142, "train_loss": 3.5640731681820204, "epoch": 68, "n_parameters": 19839528} {"train_lr": 0.0013189613164605683, "train_loss": 3.5566233732788968, "test_loss": 1.161833205716166, "test_acc1": 73.7740022265625, "test_acc5": 92.13400266601562, "epoch": 69, "n_parameters": 19839528} {"train_lr": 0.0013138327468746884, "train_loss": 3.560873009008374, "epoch": 70, "n_parameters": 19839528} {"train_lr": 0.00130864289498067, "train_loss": 3.5527042015958177, "epoch": 71, "n_parameters": 19839528} {"train_lr": 0.001303392329904193, "train_loss": 3.5542818620133936, "epoch": 72, "n_parameters": 19839528} {"train_lr": 0.001298081627428957, "train_loss": 3.536791101229086, "epoch": 73, "n_parameters": 19839528} {"train_lr": 0.001292711369933259, "train_loss": 3.5413731852714583, "epoch": 74, "n_parameters": 19839528} {"train_lr": 0.0012872821463264423, "train_loss": 3.532636512192986, "epoch": 75, "n_parameters": 19839528} {"train_lr": 0.0012817945519839737, "train_loss": 3.531300665573965, "epoch": 76, "n_parameters": 19839528} {"train_lr": 0.001276249188682435, "train_loss": 3.521723607830483, "epoch": 77, "n_parameters": 19839528} {"train_lr": 0.001270646664533459, "train_loss": 3.520014625968788, "epoch": 78, "n_parameters": 19839528} {"train_lr": 0.001264987593916884, "train_loss": 3.5140520677589873, "test_loss": 1.1525079113450938, "test_acc1": 73.99800217529297, "test_acc5": 92.43400237304688, "epoch": 79, "n_parameters": 19839528} {"train_lr": 0.0012592725974135677, "train_loss": 3.5096971495962923, "epoch": 80, "n_parameters": 19839528} {"train_lr": 0.0012535023017373635, "train_loss": 3.5030885160350493, "epoch": 81, "n_parameters": 19839528} {"train_lr": 0.0012476773396661296, "train_loss": 3.49934267447435, "epoch": 82, "n_parameters": 19839528} {"train_lr": 0.0012417983499726233, "train_loss": 3.5026872634268305, "epoch": 83, "n_parameters": 19839528} {"train_lr": 0.00123586597735436, "train_loss": 3.4976599823883014, "epoch": 84, "n_parameters": 19839528} {"train_lr": 0.0012298808723627598, "train_loss": 3.4856067795833523, "epoch": 85, "n_parameters": 19839528} {"train_lr": 0.0012238436913321116, "train_loss": 3.4813140059927767, "epoch": 86, "n_parameters": 19839528} {"train_lr": 0.0012177550963073647, "train_loss": 3.4857984712953383, "epoch": 87, "n_parameters": 19839528} {"train_lr": 0.0012116157549714461, "train_loss": 3.4796693149349576, "epoch": 88, "n_parameters": 19839528} {"train_lr": 0.001205426340572496, "train_loss": 3.475287120464704, "test_loss": 1.1474317209276723, "test_acc1": 73.97600239379882, "test_acc5": 92.47600232421875, "epoch": 89, "n_parameters": 19839528} {"train_lr": 0.0011991875318493601, "train_loss": 3.4645843457022636, "epoch": 90, "n_parameters": 19839528} {"train_lr": 0.0011929000129579043, "train_loss": 3.4605257517332846, "epoch": 91, "n_parameters": 19839528} {"train_lr": 0.0011865644733952759, "train_loss": 3.4528368092257438, "epoch": 92, "n_parameters": 19839528} {"train_lr": 0.001180181607924886, "train_loss": 3.4550925550236404, "epoch": 93, "n_parameters": 19839528} {"train_lr": 0.0011737521164998377, "train_loss": 3.4465438418810983, "epoch": 94, "n_parameters": 19839528} {"train_lr": 0.0011672767041862814, "train_loss": 3.4482224686004277, "epoch": 95, "n_parameters": 19839528} {"train_lr": 0.0011607560810862106, "train_loss": 3.439574462809056, "epoch": 96, "n_parameters": 19839528} {"train_lr": 0.0011541909622593347, "train_loss": 3.443025219372565, "epoch": 97, "n_parameters": 19839528} {"train_lr": 0.0011475820676450082, "train_loss": 3.4410349249506265, "epoch": 98, "n_parameters": 19839528} {"train_lr": 0.0011409301219829958, "train_loss": 3.4320299951352187, "test_loss": 1.119165081495058, "test_acc1": 74.60600229736328, "test_acc5": 92.80600252441407, "epoch": 99, "n_parameters": 19839528} {"train_lr": 0.001134235854734039, "train_loss": 3.426822557991786, "epoch": 100, "n_parameters": 19839528} {"train_lr": 0.0011274999999999775, "train_loss": 3.4213120434984123, "epoch": 101, "n_parameters": 19839528} {"train_lr": 0.0011207232964432971, "train_loss": 3.4210826341065763, "epoch": 102, "n_parameters": 19839528} {"train_lr": 0.0011139064872057738, "train_loss": 3.420546773198745, "epoch": 103, "n_parameters": 19839528} {"train_lr": 0.0011070503198274664, "train_loss": 3.415572468599351, "epoch": 104, "n_parameters": 19839528} {"train_lr": 0.0011001555461642792, "train_loss": 3.407705580832051, "epoch": 105, "n_parameters": 19839528} {"train_lr": 0.001093222922305959, "train_loss": 3.4061744938806284, "epoch": 106, "n_parameters": 19839528} {"train_lr": 0.001086253208492762, "train_loss": 3.3971709956844554, "epoch": 107, "n_parameters": 19839528} {"train_lr": 0.0010792471690323983, "train_loss": 3.3955467719790176, "epoch": 108, "n_parameters": 19839528} {"train_lr": 0.0010722055722159876, "train_loss": 3.3883266369108673, "test_loss": 1.0889496070524094, "test_acc1": 75.42800229248047, "test_acc5": 92.96600269042969, "epoch": 109, "n_parameters": 19839528} {"train_lr": 0.001065129190234018, "train_loss": 3.3847132010651912, "epoch": 110, "n_parameters": 19839528} {"train_lr": 0.001058018799091484, "train_loss": 3.384699105001468, "epoch": 111, "n_parameters": 19839528} {"train_lr": 0.0010508751785228995, "train_loss": 3.3792246310568923, "epoch": 112, "n_parameters": 19839528} {"train_lr": 0.0010436991119068247, "train_loss": 3.3801923313682125, "epoch": 113, "n_parameters": 19839528} {"train_lr": 0.0010364913861797749, "train_loss": 3.3730486084957967, "epoch": 114, "n_parameters": 19839528} {"train_lr": 0.0010292527917500668, "train_loss": 3.369254187690459, "epoch": 115, "n_parameters": 19839528} {"train_lr": 0.0010219841224112544, "train_loss": 3.3700363271230227, "epoch": 116, "n_parameters": 19839528} {"train_lr": 0.001014686175254767, "train_loss": 3.3550394605413425, "epoch": 117, "n_parameters": 19839528} {"train_lr": 0.0010073597505827476, "train_loss": 3.3584723280464335, "epoch": 118, "n_parameters": 19839528} {"train_lr": 0.0010000056518202367, "train_loss": 3.356769576055302, "test_loss": 1.0667756019363934, "test_acc1": 75.98200227294922, "test_acc5": 93.22000239746093, "epoch": 119, "n_parameters": 19839528} {"train_lr": 0.0009926246854270522, "train_loss": 3.345970925673259, "epoch": 120, "n_parameters": 19839528} {"train_lr": 0.000985217660809356, "train_loss": 3.3426768485543064, "epoch": 121, "n_parameters": 19839528} {"train_lr": 0.0009777853902307732, "train_loss": 3.3353391076437386, "epoch": 122, "n_parameters": 19839528} {"train_lr": 0.0009703286887236246, "train_loss": 3.3345412513930546, "epoch": 123, "n_parameters": 19839528} {"train_lr": 0.0009628483739992136, "train_loss": 3.3293569454376835, "epoch": 124, "n_parameters": 19839528} {"train_lr": 0.0009553452663583553, "train_loss": 3.3319449843965367, "epoch": 125, "n_parameters": 19839528} {"train_lr": 0.0009478201886013921, "train_loss": 3.321284961339524, "epoch": 126, "n_parameters": 19839528} {"train_lr": 0.0009402739659378006, "train_loss": 3.321783634279367, "epoch": 127, "n_parameters": 19839528} {"train_lr": 0.0009327074258960266, "train_loss": 3.3219549272486346, "epoch": 128, "n_parameters": 19839528} {"train_lr": 0.0009251213982324277, "train_loss": 3.3126474231493463, "test_loss": 1.0391252767044385, "test_acc1": 76.62800237792969, "test_acc5": 93.56400246582031, "epoch": 129, "n_parameters": 19839528} {"train_lr": 0.0009175167148404177, "train_loss": 3.3041182362513957, "epoch": 130, "n_parameters": 19839528} {"train_lr": 0.0009098942096592476, "train_loss": 3.3008042172812444, "epoch": 131, "n_parameters": 19839528} {"train_lr": 0.0009022547185824416, "train_loss": 3.296161395409029, "epoch": 132, "n_parameters": 19839528} {"train_lr": 0.0008945990793663697, "train_loss": 3.2938995228932915, "epoch": 133, "n_parameters": 19839528} {"train_lr": 0.0008869281315380942, "train_loss": 3.294586158443174, "epoch": 134, "n_parameters": 19839528} {"train_lr": 0.0008792427163034921, "train_loss": 3.286772222756196, "epoch": 135, "n_parameters": 19839528} {"train_lr": 0.0008715436764549598, "train_loss": 3.2878594259492497, "epoch": 136, "n_parameters": 19839528} {"train_lr": 0.0008638318562789998, "train_loss": 3.2822027327321606, "epoch": 137, "n_parameters": 19839528} {"train_lr": 0.0008561081014635556, "train_loss": 3.280583902044024, "epoch": 138, "n_parameters": 19839528} {"train_lr": 0.0008483732590054104, "train_loss": 3.2728508614081084, "test_loss": 1.0182114099071946, "test_acc1": 76.7760022680664, "test_acc5": 93.87200264160157, "epoch": 139, "n_parameters": 19839528} {"train_lr": 0.0008406281771171736, "train_loss": 3.262690918872968, "epoch": 140, "n_parameters": 19839528} {"train_lr": 0.0008328737051344065, "train_loss": 3.26914616424641, "epoch": 141, "n_parameters": 19839528} {"train_lr": 0.0008251106934222841, "train_loss": 3.2643757565118237, "epoch": 142, "n_parameters": 19839528} {"train_lr": 0.0008173399932825871, "train_loss": 3.2593973223492205, "epoch": 143, "n_parameters": 19839528} {"train_lr": 0.0008095624568600761, "train_loss": 3.2555739046822634, "epoch": 144, "n_parameters": 19839528} {"train_lr": 0.0008017789370493494, "train_loss": 3.2501162530230485, "epoch": 145, "n_parameters": 19839528} {"train_lr": 0.0007939902874010041, "train_loss": 3.240686040279343, "epoch": 146, "n_parameters": 19839528} {"train_lr": 0.0007861973620282396, "train_loss": 3.2396678544586894, "epoch": 147, "n_parameters": 19839528} {"train_lr": 0.0007784010155131946, "train_loss": 3.235818375238507, "epoch": 148, "n_parameters": 19839528} {"train_lr": 0.0007706021028131007, "train_loss": 3.234391509051279, "test_loss": 0.9864389897536865, "test_acc1": 77.16200237548829, "test_acc5": 93.99600243652344, "epoch": 149, "n_parameters": 19839528} {"train_lr": 0.0007628014791666195, "train_loss": 3.2245655351465077, "epoch": 150, "n_parameters": 19839528} {"train_lr": 0.0007549999999999935, "train_loss": 3.2189684424945395, "epoch": 151, "n_parameters": 19839528} {"train_lr": 0.0007471985208333895, "train_loss": 3.2213869986536023, "epoch": 152, "n_parameters": 19839528} {"train_lr": 0.000739397897186908, "train_loss": 3.217819185220271, "epoch": 153, "n_parameters": 19839528} {"train_lr": 0.000731598984486791, "train_loss": 3.2115767053086506, "epoch": 154, "n_parameters": 19839528} {"train_lr": 0.0007238026379717457, "train_loss": 3.213753339180129, "epoch": 155, "n_parameters": 19839528} {"train_lr": 0.0007160097125989996, "train_loss": 3.2085193711921844, "epoch": 156, "n_parameters": 19839528} {"train_lr": 0.0007082210629506558, "train_loss": 3.2027822827621044, "epoch": 157, "n_parameters": 19839528} {"train_lr": 0.0007004375431399113, "train_loss": 3.195620530336309, "epoch": 158, "n_parameters": 19839528} {"train_lr": 0.0006926600067174185, "train_loss": 3.1916717061226505, "test_loss": 0.9700600523465883, "test_acc1": 77.60200218017579, "test_acc5": 94.12800249511719, "epoch": 159, "n_parameters": 19839528} {"train_lr": 0.000684889306577718, "train_loss": 3.187518267269186, "epoch": 160, "n_parameters": 19839528} {"train_lr": 0.0006771262948656035, "train_loss": 3.194343635170675, "epoch": 161, "n_parameters": 19839528} {"train_lr": 0.0006693718228828092, "train_loss": 3.18534828824915, "epoch": 162, "n_parameters": 19839528} {"train_lr": 0.0006616267409945818, "train_loss": 3.1746265178235125, "epoch": 163, "n_parameters": 19839528} {"train_lr": 0.0006538918985364373, "train_loss": 3.1735835823652554, "epoch": 164, "n_parameters": 19839528} {"train_lr": 0.0006461681437209942, "train_loss": 3.163681189904062, "epoch": 165, "n_parameters": 19839528} {"train_lr": 0.0006384563235450294, "train_loss": 3.1619515389942534, "epoch": 166, "n_parameters": 19839528} {"train_lr": 0.0006307572836964984, "train_loss": 3.1544494837415304, "epoch": 167, "n_parameters": 19839528} {"train_lr": 0.0006230718684619011, "train_loss": 3.1604412552728642, "epoch": 168, "n_parameters": 19839528} {"train_lr": 0.0006154009206336259, "train_loss": 3.1446313675490023, "test_loss": 0.9667077475511638, "test_acc1": 78.01200240722656, "test_acc5": 94.33400237304687, "epoch": 169, "n_parameters": 19839528} {"train_lr": 0.0006077452814175498, "train_loss": 3.1411627174841223, "epoch": 170, "n_parameters": 19839528} {"train_lr": 0.0006001057903407651, "train_loss": 3.1467720449066086, "epoch": 171, "n_parameters": 19839528} {"train_lr": 0.000592483285159584, "train_loss": 3.1348611479170985, "epoch": 172, "n_parameters": 19839528} {"train_lr": 0.0005848786017675498, "train_loss": 3.13206957392603, "epoch": 173, "n_parameters": 19839528} {"train_lr": 0.0005772925741039498, "train_loss": 3.130790768076571, "epoch": 174, "n_parameters": 19839528} {"train_lr": 0.0005697260340621892, "train_loss": 3.1211011101254265, "epoch": 175, "n_parameters": 19839528} {"train_lr": 0.0005621798113986145, "train_loss": 3.1191044482741233, "epoch": 176, "n_parameters": 19839528} {"train_lr": 0.0005546547336416323, "train_loss": 3.122323584058683, "epoch": 177, "n_parameters": 19839528} {"train_lr": 0.0005471516260007747, "train_loss": 3.107121829798134, "epoch": 178, "n_parameters": 19839528} {"train_lr": 0.0005396713112763611, "train_loss": 3.105290729859226, "test_loss": 0.9513865592612415, "test_acc1": 78.6240023046875, "test_acc5": 94.54600262207032, "epoch": 179, "n_parameters": 19839528} {"train_lr": 0.0005322146097692113, "train_loss": 3.0949065654838592, "epoch": 180, "n_parameters": 19839528} {"train_lr": 0.0005247823391906731, "train_loss": 3.1007531761444156, "epoch": 181, "n_parameters": 19839528} {"train_lr": 0.0005173753145729493, "train_loss": 3.0905356135287825, "epoch": 182, "n_parameters": 19839528} {"train_lr": 0.0005099943481797611, "train_loss": 3.0899510857381887, "epoch": 183, "n_parameters": 19839528} {"train_lr": 0.0005026402494172624, "train_loss": 3.0854811284015122, "epoch": 184, "n_parameters": 19839528} {"train_lr": 0.0004953138247452536, "train_loss": 3.0826281694521147, "epoch": 185, "n_parameters": 19839528} {"train_lr": 0.000488015877588746, "train_loss": 3.0705661256548216, "epoch": 186, "n_parameters": 19839528} {"train_lr": 0.00048074720824991987, "train_loss": 3.0711349826291214, "epoch": 187, "n_parameters": 19839528} {"train_lr": 0.0004735086138202327, "train_loss": 3.064244340500719, "epoch": 188, "n_parameters": 19839528} {"train_lr": 0.0004663008880931849, "train_loss": 3.061089770524479, "test_loss": 0.9355539579995534, "test_acc1": 79.02800233398438, "test_acc5": 94.7400024609375, "epoch": 189, "n_parameters": 19839528} {"train_lr": 0.0004591248214770861, "train_loss": 3.0555925460384903, "epoch": 190, "n_parameters": 19839528} {"train_lr": 0.0004519812009085206, "train_loss": 3.0528889834749804, "epoch": 191, "n_parameters": 19839528} {"train_lr": 0.0004448708097660038, "train_loss": 3.050381939128625, "epoch": 192, "n_parameters": 19839528} {"train_lr": 0.0004377944277840216, "train_loss": 3.0433583477263353, "epoch": 193, "n_parameters": 19839528} {"train_lr": 0.00043075283096761065, "train_loss": 3.0335270848741636, "epoch": 194, "n_parameters": 19839528} {"train_lr": 0.0004237467915072327, "train_loss": 3.0277370427080768, "epoch": 195, "n_parameters": 19839528} {"train_lr": 0.00041677707769403763, "train_loss": 3.0270061541339763, "epoch": 196, "n_parameters": 19839528} {"train_lr": 0.0004098444538357003, "train_loss": 3.022466329481009, "epoch": 197, "n_parameters": 19839528} {"train_lr": 0.00040294968017255505, "train_loss": 3.0184207006478956, "epoch": 198, "n_parameters": 19839528} {"train_lr": 0.0003960935127942218, "train_loss": 3.00698485773959, "test_loss": 0.8962165900075275, "test_acc1": 79.63600237792969, "test_acc5": 94.90800259277344, "epoch": 199, "n_parameters": 19839528} {"train_lr": 0.00038927670355671216, "train_loss": 3.0094634874475945, "epoch": 200, "n_parameters": 19839528} {"train_lr": 0.0003825000000000037, "train_loss": 3.006327954383729, "epoch": 201, "n_parameters": 19839528} {"train_lr": 0.00037576414526596793, "train_loss": 2.998049161756496, "epoch": 202, "n_parameters": 19839528} {"train_lr": 0.00036906987801701454, "train_loss": 2.994163888660695, "epoch": 203, "n_parameters": 19839528} {"train_lr": 0.0003624179323549749, "train_loss": 2.9868547734823063, "epoch": 204, "n_parameters": 19839528} {"train_lr": 0.00035580903774064737, "train_loss": 2.988940695171162, "epoch": 205, "n_parameters": 19839528} {"train_lr": 0.00034924391891380123, "train_loss": 2.975749797606878, "epoch": 206, "n_parameters": 19839528} {"train_lr": 0.0003427232958137021, "train_loss": 2.97958402243926, "epoch": 207, "n_parameters": 19839528} {"train_lr": 0.0003362478835001678, "train_loss": 2.9698372358719793, "epoch": 208, "n_parameters": 19839528} {"train_lr": 0.00032981839207510015, "train_loss": 2.958401198861458, "test_loss": 0.8916250368054678, "test_acc1": 79.90600252197265, "test_acc5": 94.97400248046876, "epoch": 209, "n_parameters": 19839528} {"train_lr": 0.00032343552660470695, "train_loss": 2.961305334753127, "epoch": 210, "n_parameters": 19839528} {"train_lr": 0.00031709998704210364, "train_loss": 2.9577821805882607, "epoch": 211, "n_parameters": 19839528} {"train_lr": 0.00031081246815062134, "train_loss": 2.958019855782854, "epoch": 212, "n_parameters": 19839528} {"train_lr": 0.00030457365942753627, "train_loss": 2.941526568502926, "epoch": 213, "n_parameters": 19839528} {"train_lr": 0.0002983842450285365, "train_loss": 2.936336069912028, "epoch": 214, "n_parameters": 19839528} {"train_lr": 0.0002922449036926526, "train_loss": 2.9336322738195686, "epoch": 215, "n_parameters": 19839528} {"train_lr": 0.0002861563086678732, "train_loss": 2.930901040740722, "epoch": 216, "n_parameters": 19839528} {"train_lr": 0.00028011912763722897, "train_loss": 2.921262913816076, "epoch": 217, "n_parameters": 19839528} {"train_lr": 0.00027413402264565205, "train_loss": 2.916639976513138, "epoch": 218, "n_parameters": 19839528} {"train_lr": 0.0002682016500273683, "train_loss": 2.916696022716548, "test_loss": 0.8663762587617775, "test_acc1": 80.33800242675781, "test_acc5": 95.18600251953124, "epoch": 219, "n_parameters": 19839528} {"train_lr": 0.0002623226603338801, "train_loss": 2.9102745090218947, "epoch": 220, "n_parameters": 19839528} {"train_lr": 0.00025649769826265625, "train_loss": 2.9026610607521044, "epoch": 221, "n_parameters": 19839528} {"train_lr": 0.0002507274025864154, "train_loss": 2.8995177312303695, "epoch": 222, "n_parameters": 19839528} {"train_lr": 0.00024501240608312813, "train_loss": 2.8968097002183697, "epoch": 223, "n_parameters": 19839528} {"train_lr": 0.00023935333546654323, "train_loss": 2.8909532371744646, "epoch": 224, "n_parameters": 19839528} {"train_lr": 0.0002337508113175451, "train_loss": 2.887213968091922, "epoch": 225, "n_parameters": 19839528} {"train_lr": 0.00022820544801602224, "train_loss": 2.8811725487680935, "epoch": 226, "n_parameters": 19839528} {"train_lr": 0.00022271785367356016, "train_loss": 2.8783173284334818, "epoch": 227, "n_parameters": 19839528} {"train_lr": 0.00021728863006672194, "train_loss": 2.8754133993951823, "epoch": 228, "n_parameters": 19839528} {"train_lr": 0.00021191837257104475, "train_loss": 2.8661468226155886, "test_loss": 0.8672365600568548, "test_acc1": 80.70000245117187, "test_acc5": 95.26600255371093, "epoch": 229, "n_parameters": 19839528} {"train_lr": 0.00020660767009580015, "train_loss": 2.8591344213242724, "epoch": 230, "n_parameters": 19839528} {"train_lr": 0.00020135710501933987, "train_loss": 2.852206010112374, "epoch": 231, "n_parameters": 19839528} {"train_lr": 0.0001961672531253057, "train_loss": 2.8437497442443784, "epoch": 232, "n_parameters": 19839528} {"train_lr": 0.00019103868353944288, "train_loss": 2.8411130388434844, "epoch": 233, "n_parameters": 19839528} {"train_lr": 0.0001859719586671909, "train_loss": 2.836851907928261, "epoch": 234, "n_parameters": 19839528} {"train_lr": 0.00018096763413203755, "train_loss": 2.8378764059748964, "epoch": 235, "n_parameters": 19839528} {"train_lr": 0.00017602625871455664, "train_loss": 2.82573682368159, "epoch": 236, "n_parameters": 19839528} {"train_lr": 0.0001711483742922467, "train_loss": 2.8273773891546075, "epoch": 237, "n_parameters": 19839528} {"train_lr": 0.0001663345157801127, "train_loss": 2.8169023906834405, "epoch": 238, "n_parameters": 19839528} {"train_lr": 0.00016158521107197287, "train_loss": 2.8168323529567076, "test_loss": 0.8494321693900451, "test_acc1": 81.08600236328125, "test_acc5": 95.33000243164062, "epoch": 239, "n_parameters": 19839528} {"train_lr": 0.00015690098098261856, "train_loss": 2.812256221517289, "epoch": 240, "n_parameters": 19839528} {"train_lr": 0.00015228233919066484, "train_loss": 2.8026976934511314, "epoch": 241, "n_parameters": 19839528} {"train_lr": 0.0001477297921822251, "train_loss": 2.8024677177258344, "epoch": 242, "n_parameters": 19839528} {"train_lr": 0.00014324383919539206, "train_loss": 2.790938279403152, "epoch": 243, "n_parameters": 19839528} {"train_lr": 0.00013882497216545216, "train_loss": 2.7947971656156194, "epoch": 244, "n_parameters": 19839528} {"train_lr": 0.00013447367567097436, "train_loss": 2.7819773850919343, "epoch": 245, "n_parameters": 19839528} {"train_lr": 0.00013019042688065826, "train_loss": 2.785810212937476, "epoch": 246, "n_parameters": 19839528} {"train_lr": 0.0001259756955010005, "train_loss": 2.783519161964873, "epoch": 247, "n_parameters": 19839528} {"train_lr": 0.00012182994372478594, "train_loss": 2.770407432346321, "epoch": 248, "n_parameters": 19839528} {"train_lr": 0.00011775362618042428, "train_loss": 2.7679095205714663, "test_loss": 0.8544427973581138, "test_acc1": 81.12400245117188, "test_acc5": 95.47400234375, "epoch": 249, "n_parameters": 19839528} {"train_lr": 0.00011374718988206232, "train_loss": 2.7665055080902854, "epoch": 250, "n_parameters": 19839528} {"train_lr": 0.00010981107418059352, "train_loss": 2.758272399290574, "epoch": 251, "n_parameters": 19839528} {"train_lr": 0.00010594571071545857, "train_loss": 2.7561737152812578, "epoch": 252, "n_parameters": 19839528} {"train_lr": 0.0001021515233673206, "train_loss": 2.7461836018639025, "epoch": 253, "n_parameters": 19839528} {"train_lr": 9.842892821157986e-05, "train_loss": 2.7482390486531787, "epoch": 254, "n_parameters": 19839528} {"train_lr": 9.477833347274443e-05, "train_loss": 2.7414107218765906, "epoch": 255, "n_parameters": 19839528} {"train_lr": 9.12001394796647e-05, "train_loss": 2.7369372587886263, "epoch": 256, "n_parameters": 19839528} {"train_lr": 8.769473862163653e-05, "train_loss": 2.738597976664702, "epoch": 257, "n_parameters": 19839528} {"train_lr": 8.426251530536481e-05, "train_loss": 2.728638687008005, "epoch": 258, "n_parameters": 19839528} {"train_lr": 8.090384591281436e-05, "train_loss": 2.727180750922953, "test_loss": 0.8427176240996069, "test_acc1": 81.50400241943359, "test_acc5": 95.55400247070313, "epoch": 259, "n_parameters": 19839528} {"train_lr": 7.761909875993307e-05, "train_loss": 2.7231130874473797, "epoch": 260, "n_parameters": 19839528} {"train_lr": 7.440863405626342e-05, "train_loss": 2.718082098634266, "epoch": 261, "n_parameters": 19839528} {"train_lr": 7.127280386543524e-05, "train_loss": 2.719369805580992, "epoch": 262, "n_parameters": 19839528} {"train_lr": 6.821195206656816e-05, "train_loss": 2.715197392242799, "epoch": 263, "n_parameters": 19839528} {"train_lr": 6.522641431655447e-05, "train_loss": 2.712659798103938, "epoch": 264, "n_parameters": 19839528} {"train_lr": 6.231651801325206e-05, "train_loss": 2.705489238156832, "epoch": 265, "n_parameters": 19839528} {"train_lr": 5.948258225958532e-05, "train_loss": 2.7076379898295317, "epoch": 266, "n_parameters": 19839528} {"train_lr": 5.6724917828541536e-05, "train_loss": 2.6951540292059777, "epoch": 267, "n_parameters": 19839528} {"train_lr": 5.4043827129102654e-05, "train_loss": 2.693375384921936, "epoch": 268, "n_parameters": 19839528} {"train_lr": 5.1439604173077446e-05, "train_loss": 2.6945020658113688, "test_loss": 0.8374539561955805, "test_acc1": 81.6560024609375, "test_acc5": 95.49000251953125, "epoch": 269, "n_parameters": 19839528} {"train_lr": 4.891253454285937e-05, "train_loss": 2.6824657809343653, "epoch": 270, "n_parameters": 19839528} {"train_lr": 4.646289536011009e-05, "train_loss": 2.6861505738193756, "epoch": 271, "n_parameters": 19839528} {"train_lr": 4.40909552553738e-05, "train_loss": 2.686985709053054, "epoch": 272, "n_parameters": 19839528} {"train_lr": 4.179697433860962e-05, "train_loss": 2.6823135913966847, "epoch": 273, "n_parameters": 19839528} {"train_lr": 3.958120417067725e-05, "train_loss": 2.6780190446691736, "epoch": 274, "n_parameters": 19839528} {"train_lr": 3.744388773574431e-05, "train_loss": 2.6674541361945616, "epoch": 275, "n_parameters": 19839528} {"train_lr": 3.538525941464467e-05, "train_loss": 2.668064514653002, "epoch": 276, "n_parameters": 19839528} {"train_lr": 3.3405544959169265e-05, "train_loss": 2.666533358043713, "epoch": 277, "n_parameters": 19839528} {"train_lr": 3.150496146732081e-05, "train_loss": 2.6688743355891686, "epoch": 278, "n_parameters": 19839528} {"train_lr": 2.9683717359496197e-05, "train_loss": 2.6624297294721044, "test_loss": 0.8292964244415115, "test_acc1": 81.74800256103515, "test_acc5": 95.62000242675781, "epoch": 279, "n_parameters": 19839528} {"train_lr": 2.79420123556334e-05, "train_loss": 2.6633270730336696, "epoch": 280, "n_parameters": 19839528} {"train_lr": 2.6280037453314815e-05, "train_loss": 2.660491506729147, "epoch": 281, "n_parameters": 19839528} {"train_lr": 2.4697974906816928e-05, "train_loss": 2.657245778470493, "epoch": 282, "n_parameters": 19839528} {"train_lr": 2.319599820712709e-05, "train_loss": 2.6555754047491664, "epoch": 283, "n_parameters": 19839528} {"train_lr": 2.177427206291483e-05, "train_loss": 2.649629327241513, "epoch": 284, "n_parameters": 19839528} {"train_lr": 2.0432952382473795e-05, "train_loss": 2.6503654493392705, "epoch": 285, "n_parameters": 19839528} {"train_lr": 1.917218625662254e-05, "train_loss": 2.6527743153542067, "epoch": 286, "n_parameters": 19839528} {"train_lr": 1.799211194257337e-05, "train_loss": 2.6521436361124, "epoch": 287, "n_parameters": 19839528} {"train_lr": 1.689285884877437e-05, "train_loss": 2.6430790753042004, "epoch": 288, "n_parameters": 19839528} {"train_lr": 1.5874547520713972e-05, "train_loss": 2.649511125942262, "test_loss": 0.8268017518600438, "test_acc1": 81.88000236816406, "test_acc5": 95.55800256347656, "epoch": 289, "n_parameters": 19839528} {"train_lr": 1.493728962770468e-05, "train_loss": 2.6444280449744704, "epoch": 290, "n_parameters": 19839528} {"train_lr": 1.408118795063667e-05, "train_loss": 2.637804407855685, "epoch": 291, "n_parameters": 19839528} {"train_lr": 1.3306336370705133e-05, "train_loss": 2.639624316153004, "epoch": 292, "n_parameters": 19839528} {"train_lr": 1.2612819859119116e-05, "train_loss": 2.643122653750112, "epoch": 293, "n_parameters": 19839528} {"train_lr": 1.2000714467778719e-05, "train_loss": 2.6374061775924584, "epoch": 294, "n_parameters": 19839528} {"train_lr": 1.1470087320937667e-05, "train_loss": 2.6381828155425144, "epoch": 295, "n_parameters": 19839528} {"train_lr": 1.1020996607842463e-05, "train_loss": 2.6382754055334985, "epoch": 296, "n_parameters": 19839528} {"train_lr": 1.0653491576350343e-05, "train_loss": 2.6401634517369224, "epoch": 297, "n_parameters": 19839528} {"train_lr": 1.036761252753003e-05, "train_loss": 2.633535975270229, "epoch": 298, "n_parameters": 19839528} {"train_lr": 1.0163390811239968e-05, "train_loss": 2.642274696555593, "test_loss": 0.8300226728598125, "test_acc1": 81.86200229736328, "test_acc5": 95.54600247558594, "epoch": 299, "n_parameters": 19839528}