Skip to content

Instantly share code, notes, and snippets.

@fmassa
Created January 13, 2021 23:48
Show Gist options
  • Save fmassa/0497ed4e382d5de19b98bb7168815610 to your computer and use it in GitHub Desktop.
Save fmassa/0497ed4e382d5de19b98bb7168815610 to your computer and use it in GitHub Desktop.
Training logs for DeiT base
{"train_lr": 9.999999999999955e-07, "train_loss": 6.932190733943149, "test_loss": 6.802212624540713, "test_acc1": 0.6680000299072265, "test_acc5": 2.3260000648498536, "epoch": 0, "n_parameters": 86567656}
{"train_lr": 9.999999999999955e-07, "train_loss": 6.877597264201045, "test_loss": 6.742397216826163, "test_acc1": 0.7480000346374511, "test_acc5": 2.966000115966797, "epoch": 1, "n_parameters": 86567656}
{"train_lr": 0.00020080000000000092, "train_loss": 6.753143510110468, "test_loss": 6.033484591632337, "test_acc1": 3.1680001258850097, "test_acc5": 10.304000309906005, "epoch": 2, "n_parameters": 86567656}
{"train_lr": 0.000400599999999987, "train_loss": 6.5730244404168054, "test_loss": 5.7046810271872666, "test_acc1": 5.416000174255371, "test_acc5": 15.448000488128661, "epoch": 3, "n_parameters": 86567656}
{"train_lr": 0.0006003999999999824, "train_loss": 6.507236412484392, "test_loss": 5.6710031151542735, "test_acc1": 5.638000180206299, "test_acc5": 15.78400046875, "epoch": 4, "n_parameters": 86567656}
{"train_lr": 0.0008002000000000078, "train_loss": 6.601504293753565, "test_loss": 5.9367088077164425, "test_acc1": 4.296000142669678, "test_acc5": 12.706000402069092, "epoch": 5, "n_parameters": 86567656}
{"train_lr": 0.0009993216197035086, "train_loss": 6.613494839575841, "test_loss": 5.951621986854099, "test_acc1": 4.556000160827637, "test_acc5": 12.960000394744872, "epoch": 6, "n_parameters": 86567656}
{"train_lr": 0.000999023230572016, "train_loss": 6.549718008624564, "test_loss": 5.6169251320229385, "test_acc1": 6.376000199432373, "test_acc5": 17.186000518188475, "epoch": 7, "n_parameters": 86567656}
{"train_lr": 0.000998670666226098, "train_loss": 6.459563489702584, "test_loss": 5.482276716982792, "test_acc1": 7.502000239562988, "test_acc5": 19.87800062576294, "epoch": 8, "n_parameters": 86567656}
{"train_lr": 0.0009982639653285214, "train_loss": 6.356104309753262, "test_loss": 5.114031962835857, "test_acc1": 10.296000334625244, "test_acc5": 25.298000780029298, "epoch": 9, "n_parameters": 86567656}
{"train_lr": 0.0009978031724785232, "train_loss": 6.255944427230852, "test_loss": 4.837308585071747, "test_acc1": 13.428000433044433, "test_acc5": 30.488000864868162, "epoch": 10, "n_parameters": 86567656}
{"train_lr": 0.000997288338207296, "train_loss": 6.1531622141337605, "test_loss": 4.6452020161897805, "test_acc1": 15.62600046218872, "test_acc5": 34.19200092941284, "epoch": 11, "n_parameters": 86567656}
{"train_lr": 0.0009967195189721821, "train_loss": 6.054307197328571, "test_loss": 4.380930809050284, "test_acc1": 18.5120005317688, "test_acc5": 38.68000105834961, "epoch": 12, "n_parameters": 86567656}
{"train_lr": 0.0009960967771506664, "train_loss": 5.947286129998361, "test_loss": 4.217004191509364, "test_acc1": 20.750000659484865, "test_acc5": 42.0440012348938, "epoch": 13, "n_parameters": 86567656}
{"train_lr": 0.0009954201810333755, "train_loss": 5.853549897170467, "test_loss": 3.9584940055281552, "test_acc1": 23.8160006880188, "test_acc5": 46.4660013293457, "epoch": 14, "n_parameters": 86567656}
{"train_lr": 0.0009946898048166896, "train_loss": 5.755316680593552, "test_loss": 3.726726113033844, "test_acc1": 26.474000716552734, "test_acc5": 49.988001569213864, "epoch": 15, "n_parameters": 86567656}
{"train_lr": 0.0009939057285945907, "train_loss": 5.669774887801932, "test_loss": 3.556508970466548, "test_acc1": 29.128000845947266, "test_acc5": 53.55800157348633, "epoch": 16, "n_parameters": 86567656}
{"train_lr": 0.0009930680383498827, "train_loss": 5.594056687611851, "test_loss": 3.4515661041246952, "test_acc1": 30.79600092666626, "test_acc5": 55.37000159362793, "epoch": 17, "n_parameters": 86567656}
{"train_lr": 0.0009921768259447904, "train_loss": 5.513628631067886, "test_loss": 3.3184851827296553, "test_acc1": 32.83200098236084, "test_acc5": 57.84200162475586, "epoch": 18, "n_parameters": 86567656}
{"train_lr": 0.0009912321891107068, "train_loss": 5.436586413952372, "test_loss": 3.151255369300806, "test_acc1": 35.34600100845337, "test_acc5": 60.32000177612305, "epoch": 19, "n_parameters": 86567656}
{"train_lr": 0.000990234231437762, "train_loss": 5.363546089398013, "test_loss": 3.024874873845454, "test_acc1": 37.11000106521607, "test_acc5": 62.77000180786133, "epoch": 20, "n_parameters": 86567656}
{"train_lr": 0.000989183062363242, "train_loss": 5.2940646689191615, "test_loss": 2.9705198340818657, "test_acc1": 38.54800114654541, "test_acc5": 63.90800188720703, "epoch": 21, "n_parameters": 86567656}
{"train_lr": 0.0009880787971596754, "train_loss": 5.229582776161407, "test_loss": 2.8990507664126763, "test_acc1": 39.464001149291995, "test_acc5": 65.14600181518554, "epoch": 22, "n_parameters": 86567656}
{"train_lr": 0.0009869215569222386, "train_loss": 5.178942910737271, "test_loss": 2.771049806286872, "test_acc1": 41.88600120727539, "test_acc5": 67.49200201049804, "epoch": 23, "n_parameters": 86567656}
{"train_lr": 0.0009857114685552669, "train_loss": 5.104300311179184, "test_loss": 2.677509635515268, "test_acc1": 43.058001239624026, "test_acc5": 68.80800211791993, "epoch": 24, "n_parameters": 86567656}
{"train_lr": 0.0009844486647586856, "train_loss": 5.050285994720688, "test_loss": 2.580574015223362, "test_acc1": 44.96200129455566, "test_acc5": 70.6500021081543, "epoch": 25, "n_parameters": 86567656}
{"train_lr": 0.00098313328401311, "train_loss": 4.994058527582459, "test_loss": 2.4957606429216272, "test_acc1": 46.77200135009765, "test_acc5": 72.14400233886718, "epoch": 26, "n_parameters": 86567656}
{"train_lr": 0.0009817654705648337, "train_loss": 4.940906394478515, "test_loss": 2.444073199825415, "test_acc1": 47.64600138122559, "test_acc5": 72.7760022253418, "epoch": 27, "n_parameters": 86567656}
{"train_lr": 0.00098034537441009, "train_loss": 4.889425958077208, "test_loss": 2.3804922262331805, "test_acc1": 49.00200140625, "test_acc5": 74.24600227783203, "epoch": 28, "n_parameters": 86567656}
{"train_lr": 0.0009788731512783825, "train_loss": 4.842023833811902, "test_loss": 2.3189165089958688, "test_acc1": 50.05000149963379, "test_acc5": 75.10800221191407, "epoch": 29, "n_parameters": 86567656}
{"train_lr": 0.00097734896261555, "train_loss": 4.796560239841898, "test_loss": 2.2549353332871895, "test_acc1": 51.21600147766113, "test_acc5": 76.00200235595703, "epoch": 30, "n_parameters": 86567656}
{"train_lr": 0.0009757729755660996, "train_loss": 4.763647347057371, "test_loss": 2.1767542242660634, "test_acc1": 52.318001491088864, "test_acc5": 76.89600238769532, "epoch": 31, "n_parameters": 86567656}
{"train_lr": 0.000974145362954742, "train_loss": 4.714707629178926, "test_loss": 2.1793058701646078, "test_acc1": 52.902001481933596, "test_acc5": 77.5260024194336, "epoch": 32, "n_parameters": 86567656}
{"train_lr": 0.000972466303267533, "train_loss": 4.676608896596159, "test_loss": 2.127642944941365, "test_acc1": 53.5500015625, "test_acc5": 78.06200229248047, "epoch": 33, "n_parameters": 86567656}
{"train_lr": 0.0009707359806323523, "train_loss": 4.647378469399697, "test_loss": 2.0980827232926456, "test_acc1": 54.030001530761716, "test_acc5": 78.64000247314453, "epoch": 34, "n_parameters": 86567656}
{"train_lr": 0.0009689545847984843, "train_loss": 4.613072235199759, "test_loss": 2.0406546418817855, "test_acc1": 55.25800164123535, "test_acc5": 79.4480025390625, "epoch": 35, "n_parameters": 86567656}
{"train_lr": 0.000967122311116087, "train_loss": 4.571712880731106, "test_loss": 2.0215139218289657, "test_acc1": 55.778001581420895, "test_acc5": 79.92800240966797, "epoch": 36, "n_parameters": 86567656}
{"train_lr": 0.0009652393605146942, "train_loss": 4.5433167233813005, "test_loss": 1.973966828291796, "test_acc1": 56.58000151855469, "test_acc5": 80.6140024169922, "epoch": 37, "n_parameters": 86567656}
{"train_lr": 0.0009633059394809262, "train_loss": 4.516756863450166, "test_loss": 1.9314669682402985, "test_acc1": 57.11800173217773, "test_acc5": 81.16600243408203, "epoch": 38, "n_parameters": 86567656}
{"train_lr": 0.0009613222600362934, "train_loss": 4.48332382489642, "test_loss": 1.908546046480794, "test_acc1": 57.90800151611328, "test_acc5": 81.55400229248046, "epoch": 39, "n_parameters": 86567656}
{"train_lr": 0.0009592885397135909, "train_loss": 4.451740840963608, "test_loss": 1.8815754514166123, "test_acc1": 58.500001770629886, "test_acc5": 82.27200254394532, "epoch": 40, "n_parameters": 86567656}
{"train_lr": 0.0009572050015330907, "train_loss": 4.43058649552383, "test_loss": 1.8450315956190773, "test_acc1": 58.898001651000975, "test_acc5": 82.56400255859376, "epoch": 41, "n_parameters": 86567656}
{"train_lr": 0.0009550718739782929, "train_loss": 4.4043412564231526, "test_loss": 1.824128090420062, "test_acc1": 59.25000171936035, "test_acc5": 82.6980024951172, "epoch": 42, "n_parameters": 86567656}
{"train_lr": 0.000952889390970695, "train_loss": 4.383354831597121, "test_loss": 1.8227412714953615, "test_acc1": 59.66400174804688, "test_acc5": 83.03600248046875, "epoch": 43, "n_parameters": 86567656}
{"train_lr": 0.0009506577918441058, "train_loss": 4.353979862577242, "test_loss": 1.7664298272178636, "test_acc1": 60.3300017199707, "test_acc5": 83.4380024584961, "epoch": 44, "n_parameters": 86567656}
{"train_lr": 0.0009483773213185082, "train_loss": 4.338856119844172, "test_loss": 1.7432186586385496, "test_acc1": 60.640001849365234, "test_acc5": 83.91000254882813, "epoch": 45, "n_parameters": 86567656}
{"train_lr": 0.0009460482294732177, "train_loss": 4.309616885787482, "test_loss": 1.7599336740323084, "test_acc1": 60.66000182678223, "test_acc5": 83.88000249023438, "epoch": 46, "n_parameters": 86567656}
{"train_lr": 0.000943670771719436, "train_loss": 4.289615833311439, "test_loss": 1.740280530445864, "test_acc1": 60.93600165771485, "test_acc5": 84.1440025756836, "epoch": 47, "n_parameters": 86567656}
{"train_lr": 0.0009412452087721683, "train_loss": 4.274783424836555, "test_loss": 1.7108713173076882, "test_acc1": 61.50800178100586, "test_acc5": 84.46400247802734, "epoch": 48, "n_parameters": 86567656}
{"train_lr": 0.0009387718066217019, "train_loss": 4.248400863650129, "test_loss": 1.6944977272437767, "test_acc1": 62.28200182739258, "test_acc5": 84.74400255371094, "epoch": 49, "n_parameters": 86567656}
{"train_lr": 0.000936250836504503, "train_loss": 4.232622410622622, "test_loss": 1.6617740028307213, "test_acc1": 62.754001751708984, "test_acc5": 84.99800245849609, "epoch": 50, "n_parameters": 86567656}
{"train_lr": 0.0009336825748732897, "train_loss": 4.207277786317203, "test_loss": 1.6491170545571596, "test_acc1": 62.74000178344726, "test_acc5": 84.99600249511718, "epoch": 51, "n_parameters": 86567656}
{"train_lr": 0.0009310673033669664, "train_loss": 4.193666700812743, "test_loss": 1.6320046994141562, "test_acc1": 63.21600186279297, "test_acc5": 85.62200239501954, "epoch": 52, "n_parameters": 86567656}
{"train_lr": 0.0009284053087794627, "train_loss": 4.175293596992962, "test_loss": 1.6034468361775385, "test_acc1": 63.63800183349609, "test_acc5": 85.79000251708985, "epoch": 53, "n_parameters": 86567656}
{"train_lr": 0.0009256968830284788, "train_loss": 4.1499804704428485, "test_loss": 1.5904232438603656, "test_acc1": 63.982001877441405, "test_acc5": 86.16200240966796, "epoch": 54, "n_parameters": 86567656}
{"train_lr": 0.0009229423231234935, "train_loss": 4.140841249450982, "test_loss": 1.5896301768334036, "test_acc1": 64.25600189331055, "test_acc5": 86.25200245605468, "epoch": 55, "n_parameters": 86567656}
{"train_lr": 0.0009201419311329745, "train_loss": 4.126061462860504, "test_loss": 1.5497980556824387, "test_acc1": 64.85200192016602, "test_acc5": 86.77200255859375, "epoch": 56, "n_parameters": 86567656}
{"train_lr": 0.0009172960141514878, "train_loss": 4.0892456480019765, "test_loss": 1.5338336727841115, "test_acc1": 65.22800185058594, "test_acc5": 86.99800257080078, "epoch": 57, "n_parameters": 86567656}
{"train_lr": 0.0009144048842658995, "train_loss": 4.090151033098463, "test_loss": 1.554975264360717, "test_acc1": 64.91400194458008, "test_acc5": 86.90200245605469, "epoch": 58, "n_parameters": 86567656}
{"train_lr": 0.0009114688585212051, "train_loss": 4.071263682308624, "test_loss": 1.5441503058296706, "test_acc1": 65.49600186157227, "test_acc5": 87.0840024609375, "epoch": 59, "n_parameters": 86567656}
{"train_lr": 0.0009084882588856559, "train_loss": 4.048776905158822, "test_loss": 1.5364339729760292, "test_acc1": 65.59200197631836, "test_acc5": 87.2220025, "epoch": 60, "n_parameters": 86567656}
{"train_lr": 0.0009054634122156225, "train_loss": 4.043769789268549, "test_loss": 1.5068948617537512, "test_acc1": 65.9760019946289, "test_acc5": 87.1400023828125, "epoch": 61, "n_parameters": 86567656}
{"train_lr": 0.0009023946502195919, "train_loss": 4.027713757672375, "test_loss": 1.4731654117237811, "test_acc1": 66.45800190551758, "test_acc5": 87.73200256103516, "epoch": 62, "n_parameters": 86567656}
{"train_lr": 0.0008992823094219693, "train_loss": 4.013316664168779, "test_loss": 1.4680036540338037, "test_acc1": 66.89800194824218, "test_acc5": 88.09600258544921, "epoch": 63, "n_parameters": 86567656}
{"train_lr": 0.0008961267311259655, "train_loss": 4.000876142669449, "test_loss": 1.4375451734564813, "test_acc1": 66.46200204589844, "test_acc5": 88.08400269042968, "epoch": 64, "n_parameters": 86567656}
{"train_lr": 0.0008929282613763057, "train_loss": 3.9976798101580684, "test_loss": 1.4658008489521817, "test_acc1": 66.88400192138671, "test_acc5": 87.83600245361328, "epoch": 65, "n_parameters": 86567656}
{"train_lr": 0.0008896872509212006, "train_loss": 3.9786956763143637, "test_loss": 1.463694032860809, "test_acc1": 67.04600197387695, "test_acc5": 88.17200239501953, "epoch": 66, "n_parameters": 86567656}
{"train_lr": 0.0008864040551740224, "train_loss": 3.9684006593805803, "test_loss": 1.4333227765880483, "test_acc1": 67.20000204345703, "test_acc5": 88.24400258544922, "epoch": 67, "n_parameters": 86567656}
{"train_lr": 0.0008830790341741554, "train_loss": 3.9536622501939513, "test_loss": 1.4067328895751436, "test_acc1": 67.82600194458009, "test_acc5": 88.86600270019531, "epoch": 68, "n_parameters": 86567656}
{"train_lr": 0.000879712552547612, "train_loss": 3.9474297726182916, "test_loss": 1.4099018707900037, "test_acc1": 67.73800202148438, "test_acc5": 88.42800237792969, "epoch": 69, "n_parameters": 86567656}
{"train_lr": 0.0008763049794670929, "train_loss": 3.9359117702161854, "test_loss": 1.4090413861620221, "test_acc1": 67.95600211791992, "test_acc5": 88.75200241210938, "epoch": 70, "n_parameters": 86567656}
{"train_lr": 0.0008728566886112912, "train_loss": 3.921899017265184, "test_loss": 1.4206063412201382, "test_acc1": 67.89400209472656, "test_acc5": 88.66600254638672, "epoch": 71, "n_parameters": 86567656}
{"train_lr": 0.000869368058124286, "train_loss": 3.9143798775333676, "test_loss": 1.402022508107083, "test_acc1": 68.36800203369141, "test_acc5": 88.86200243408203, "epoch": 72, "n_parameters": 86567656}
{"train_lr": 0.0008658394705736102, "train_loss": 3.8945145027981485, "test_loss": 1.4016583293047153, "test_acc1": 68.34600194335937, "test_acc5": 88.83400240966797, "epoch": 73, "n_parameters": 86567656}
{"train_lr": 0.0008622713129087039, "train_loss": 3.8866909041965036, "test_loss": 1.4053741517886091, "test_acc1": 68.29800217163086, "test_acc5": 89.1280025024414, "epoch": 74, "n_parameters": 86567656}
{"train_lr": 0.0008586639764182332, "train_loss": 3.886018632734708, "test_loss": 1.3765921392218852, "test_acc1": 68.83600210693359, "test_acc5": 89.3660025, "epoch": 75, "n_parameters": 86567656}
{"train_lr": 0.0008550178566873157, "train_loss": 3.868177431057111, "test_loss": 1.3631657589362816, "test_acc1": 69.08800186523438, "test_acc5": 89.21000241210938, "epoch": 76, "n_parameters": 86567656}
{"train_lr": 0.0008513333535541272, "train_loss": 3.864417827213935, "test_loss": 1.3890389862708075, "test_acc1": 68.7460021484375, "test_acc5": 89.17800246826172, "epoch": 77, "n_parameters": 86567656}
{"train_lr": 0.0008476108710658582, "train_loss": 3.8526818855917995, "test_loss": 1.3439982177371486, "test_acc1": 69.34800200927734, "test_acc5": 89.64000254882812, "epoch": 78, "n_parameters": 86567656}
{"train_lr": 0.00084385081743468, "train_loss": 3.846847207295142, "test_loss": 1.3401660867135492, "test_acc1": 69.38200208251953, "test_acc5": 89.48800264648438, "epoch": 79, "n_parameters": 86567656}
{"train_lr": 0.0008400536049929256, "train_loss": 3.8321303970140996, "test_loss": 1.3650580041410827, "test_acc1": 68.8940020739746, "test_acc5": 89.2540025048828, "epoch": 80, "n_parameters": 86567656}
{"train_lr": 0.0008362196501476587, "train_loss": 3.819716771777204, "test_loss": 1.3609292548643193, "test_acc1": 69.21200206298828, "test_acc5": 89.5340025439453, "epoch": 81, "n_parameters": 86567656}
{"train_lr": 0.0008323493733352106, "train_loss": 3.8125970807793044, "test_loss": 1.317762158853994, "test_acc1": 69.85200207763671, "test_acc5": 89.83200244140625, "epoch": 82, "n_parameters": 86567656}
{"train_lr": 0.0008284431989751196, "train_loss": 3.8104509739019123, "test_loss": 1.3279681993137165, "test_acc1": 69.65400213378906, "test_acc5": 89.88800242431641, "epoch": 83, "n_parameters": 86567656}
{"train_lr": 0.0008245015554233518, "train_loss": 3.8005393500939357, "test_loss": 1.3056690217265698, "test_acc1": 69.88600223388671, "test_acc5": 89.85800252197265, "epoch": 84, "n_parameters": 86567656}
{"train_lr": 0.0008205248749255873, "train_loss": 3.7926494595434646, "test_loss": 1.3300568780606172, "test_acc1": 70.04800222167968, "test_acc5": 89.99200262695312, "epoch": 85, "n_parameters": 86567656}
{"train_lr": 0.0008165135935696841, "train_loss": 3.7806424369914926, "test_loss": 1.3066793919010034, "test_acc1": 70.15600204711915, "test_acc5": 90.07600260742187, "epoch": 86, "n_parameters": 86567656}
{"train_lr": 0.0008124681512377846, "train_loss": 3.7689378549107353, "test_loss": 1.2885048412029665, "test_acc1": 70.56200220458985, "test_acc5": 90.20600251953125, "epoch": 87, "n_parameters": 86567656}
{"train_lr": 0.0008083889915582182, "train_loss": 3.7677804811728848, "test_loss": 1.2747489950135207, "test_acc1": 70.49400211914063, "test_acc5": 90.14200237060547, "epoch": 88, "n_parameters": 86567656}
{"train_lr": 0.0008042765618568846, "train_loss": 3.7601282552515953, "test_loss": 1.2911592898693744, "test_acc1": 70.72600203735351, "test_acc5": 90.24200243896485, "epoch": 89, "n_parameters": 86567656}
{"train_lr": 0.0008001313131079711, "train_loss": 3.7540939442998025, "test_loss": 1.2852089909296804, "test_acc1": 70.5460021484375, "test_acc5": 90.09800256591797, "epoch": 90, "n_parameters": 86567656}
{"train_lr": 0.0007959536998847493, "train_loss": 3.7457242519390004, "test_loss": 1.2600903794484037, "test_acc1": 70.87200221191407, "test_acc5": 90.37400258300781, "epoch": 91, "n_parameters": 86567656}
{"train_lr": 0.0007917441803096098, "train_loss": 3.735124783115469, "test_loss": 1.2626564547619756, "test_acc1": 71.25400228393555, "test_acc5": 90.45200252441406, "epoch": 92, "n_parameters": 86567656}
{"train_lr": 0.0007875032160038205, "train_loss": 3.7294276796287296, "test_loss": 1.287691175279828, "test_acc1": 71.08600213378907, "test_acc5": 90.47800247070313, "epoch": 93, "n_parameters": 86567656}
{"train_lr": 0.0007832312720368117, "train_loss": 3.7214987597031466, "test_loss": 1.2749037786946416, "test_acc1": 71.18400201660157, "test_acc5": 90.78600256347656, "epoch": 94, "n_parameters": 86567656}
{"train_lr": 0.0007789288168754664, "train_loss": 3.714799323444553, "test_loss": 1.2625454982846347, "test_acc1": 71.29800217773438, "test_acc5": 90.7360024609375, "epoch": 95, "n_parameters": 86567656}
{"train_lr": 0.0007745963223324492, "train_loss": 3.705345804599835, "test_loss": 1.2591125583580038, "test_acc1": 71.35200228515625, "test_acc5": 90.59600237304687, "epoch": 96, "n_parameters": 86567656}
{"train_lr": 0.0007702342635146132, "train_loss": 3.7035852444769857, "test_loss": 1.2378938079109119, "test_acc1": 71.69000206787109, "test_acc5": 90.8700026171875, "epoch": 97, "n_parameters": 86567656}
{"train_lr": 0.0007658431187708385, "train_loss": 3.694852126099699, "test_loss": 1.2469493661240287, "test_acc1": 71.8420020703125, "test_acc5": 90.93400253417968, "epoch": 98, "n_parameters": 86567656}
{"train_lr": 0.0007614233696396924, "train_loss": 3.690621215370681, "test_loss": 1.249524564580588, "test_acc1": 71.44000217407226, "test_acc5": 90.91200248535156, "epoch": 99, "n_parameters": 86567656}
{"train_lr": 0.0007569755007964469, "train_loss": 3.6718781237110054, "test_loss": 1.2350448122580542, "test_acc1": 71.7220023022461, "test_acc5": 91.08600243164062, "epoch": 100, "n_parameters": 86567656}
{"train_lr": 0.0007525000000000169, "train_loss": 3.6674151625171554, "test_loss": 1.2218696922063828, "test_acc1": 71.71600217041015, "test_acc5": 90.87400243164062, "epoch": 101, "n_parameters": 86567656}
{"train_lr": 0.0007479973580395145, "train_loss": 3.664181846681592, "test_loss": 1.229475072272222, "test_acc1": 71.74800213256836, "test_acc5": 90.95800254882812, "epoch": 102, "n_parameters": 86567656}
{"train_lr": 0.0007434680686803327, "train_loss": 3.6683847403807417, "test_loss": 1.2287794816631272, "test_acc1": 71.91400230224609, "test_acc5": 91.24000263427735, "epoch": 103, "n_parameters": 86567656}
{"train_lr": 0.0007389126286101684, "train_loss": 3.6535593235759523, "test_loss": 1.2166868554939465, "test_acc1": 72.21200203613282, "test_acc5": 91.212002421875, "epoch": 104, "n_parameters": 86567656}
{"train_lr": 0.0007343315373843357, "train_loss": 3.6413857344564775, "test_loss": 1.2250027885363792, "test_acc1": 72.24600209472656, "test_acc5": 91.03600252685547, "epoch": 105, "n_parameters": 86567656}
{"train_lr": 0.0007297252973710595, "train_loss": 3.6447426636251423, "test_loss": 1.1999774874972748, "test_acc1": 72.28600231933594, "test_acc5": 91.23200234375, "epoch": 106, "n_parameters": 86567656}
{"train_lr": 0.0007250944136965276, "train_loss": 3.638388103009652, "test_loss": 1.2114782737507244, "test_acc1": 72.32600219726562, "test_acc5": 91.33000254882812, "epoch": 107, "n_parameters": 86567656}
{"train_lr": 0.0007204393941893078, "train_loss": 3.6322500522342995, "test_loss": 1.2029579412513869, "test_acc1": 72.71200220947266, "test_acc5": 91.54000237304687, "epoch": 108, "n_parameters": 86567656}
{"train_lr": 0.0007157607493246968, "train_loss": 3.6227213309632598, "test_loss": 1.19367569464754, "test_acc1": 72.62000221679688, "test_acc5": 91.61400251953125, "epoch": 109, "n_parameters": 86567656}
{"train_lr": 0.0007110589921689151, "train_loss": 3.614883722369667, "test_loss": 1.1863410010962476, "test_acc1": 72.50000203857422, "test_acc5": 91.43400251464844, "epoch": 110, "n_parameters": 86567656}
{"train_lr": 0.0007063346383225065, "train_loss": 3.608024074870953, "test_loss": 1.1866816249667111, "test_acc1": 72.82000220336914, "test_acc5": 91.55000237304688, "epoch": 111, "n_parameters": 86567656}
{"train_lr": 0.0007015882058641976, "train_loss": 3.6046528006664853, "test_loss": 1.1883701651773617, "test_acc1": 72.67400215576171, "test_acc5": 91.60200256835938, "epoch": 112, "n_parameters": 86567656}
{"train_lr": 0.0006968202152938009, "train_loss": 3.595116863523027, "test_loss": 1.1900387504164867, "test_acc1": 73.02200213500977, "test_acc5": 91.63400241210938, "epoch": 113, "n_parameters": 86567656}
{"train_lr": 0.0006920311894751397, "train_loss": 3.591501490103541, "test_loss": 1.2069337679191194, "test_acc1": 72.72800232299805, "test_acc5": 91.47400241699219, "epoch": 114, "n_parameters": 86567656}
{"train_lr": 0.0006872216535789267, "train_loss": 3.5831009028650684, "test_loss": 1.1699077605686352, "test_acc1": 73.37200220336914, "test_acc5": 91.868002578125, "epoch": 115, "n_parameters": 86567656}
{"train_lr": 0.0006823921350249367, "train_loss": 3.5842772988285376, "test_loss": 1.1740828102129206, "test_acc1": 72.97600218017578, "test_acc5": 91.75800252441407, "epoch": 116, "n_parameters": 86567656}
{"train_lr": 0.0006775431634242845, "train_loss": 3.5685654405852874, "test_loss": 1.1643850652647567, "test_acc1": 73.31800228149415, "test_acc5": 91.90800249023438, "epoch": 117, "n_parameters": 86567656}
{"train_lr": 0.0006726752705214028, "train_loss": 3.564477817421194, "test_loss": 1.173028209473716, "test_acc1": 73.3140022631836, "test_acc5": 91.8400026171875, "epoch": 118, "n_parameters": 86567656}
{"train_lr": 0.0006677889901356114, "train_loss": 3.5554917009114075, "test_loss": 1.1880661253164917, "test_acc1": 73.01000225585938, "test_acc5": 91.71000260742187, "epoch": 119, "n_parameters": 86567656}
{"train_lr": 0.000662884858102535, "train_loss": 3.5531239350922674, "test_loss": 1.1568047881069201, "test_acc1": 73.620002109375, "test_acc5": 91.98400249023437, "epoch": 120, "n_parameters": 86567656}
{"train_lr": 0.0006579634122155856, "train_loss": 3.5509738077958235, "test_loss": 1.1721605630788143, "test_acc1": 73.50400214111328, "test_acc5": 91.69400240966797, "epoch": 121, "n_parameters": 86567656}
{"train_lr": 0.0006530251921667783, "train_loss": 3.543098789866832, "test_loss": 1.1556392123568768, "test_acc1": 73.70000222412109, "test_acc5": 92.112002578125, "epoch": 122, "n_parameters": 86567656}
{"train_lr": 0.0006480707394875038, "train_loss": 3.543089595939711, "test_loss": 1.1678765612062703, "test_acc1": 73.33200229492188, "test_acc5": 91.83400251464843, "epoch": 123, "n_parameters": 86567656}
{"train_lr": 0.0006431005974894059, "train_loss": 3.525551415372381, "test_loss": 1.1425051378540252, "test_acc1": 73.7240022668457, "test_acc5": 92.16000249023438, "epoch": 124, "n_parameters": 86567656}
{"train_lr": 0.0006381153112045359, "train_loss": 3.5223406369177748, "test_loss": 1.1384239852886053, "test_acc1": 73.70600221191407, "test_acc5": 92.24400254882812, "epoch": 125, "n_parameters": 86567656}
{"train_lr": 0.0006331154273257683, "train_loss": 3.5213875332169775, "test_loss": 1.1328076123619262, "test_acc1": 73.93800219482422, "test_acc5": 92.16800258789063, "epoch": 126, "n_parameters": 86567656}
{"train_lr": 0.0006281014941466044, "train_loss": 3.5152407807471464, "test_loss": 1.1604019130889376, "test_acc1": 74.01200230712891, "test_acc5": 92.08400260253906, "epoch": 127, "n_parameters": 86567656}
{"train_lr": 0.000623074061501409, "train_loss": 3.5077851228028845, "test_loss": 1.1244228157338163, "test_acc1": 73.93000219238282, "test_acc5": 92.37400252929687, "epoch": 128, "n_parameters": 86567656}
{"train_lr": 0.0006180336807047859, "train_loss": 3.4945462813658965, "test_loss": 1.1314636070188313, "test_acc1": 74.19800236083984, "test_acc5": 92.28600247070312, "epoch": 129, "n_parameters": 86567656}
{"train_lr": 0.0006129809044912788, "train_loss": 3.5000349288161616, "test_loss": 1.1298315134364219, "test_acc1": 74.27200221191406, "test_acc5": 92.36000241210938, "epoch": 130, "n_parameters": 86567656}
{"train_lr": 0.0006079162869547816, "train_loss": 3.4891138726132187, "test_loss": 1.1295712536733575, "test_acc1": 74.12200232910156, "test_acc5": 92.36000234863282, "epoch": 131, "n_parameters": 86567656}
{"train_lr": 0.0006028403834876773, "train_loss": 3.4815534904396697, "test_loss": 1.1211089000477672, "test_acc1": 74.4120023461914, "test_acc5": 92.33400254394532, "epoch": 132, "n_parameters": 86567656}
{"train_lr": 0.0005977537507199184, "train_loss": 3.4748228248551216, "test_loss": 1.1177433512661599, "test_acc1": 74.44000232421875, "test_acc5": 92.44600252441407, "epoch": 133, "n_parameters": 86567656}
{"train_lr": 0.0005926569464581886, "train_loss": 3.4736785936674814, "test_loss": 1.0964308133109288, "test_acc1": 74.52800233398438, "test_acc5": 92.60000263183593, "epoch": 134, "n_parameters": 86567656}
{"train_lr": 0.0005875505296244566, "train_loss": 3.4673725597852236, "test_loss": 1.1132738089435619, "test_acc1": 74.31000221191407, "test_acc5": 92.52600253417968, "epoch": 135, "n_parameters": 86567656}
{"train_lr": 0.0005824350601949219, "train_loss": 3.4646664584795537, "test_loss": 1.1175338277546778, "test_acc1": 74.42800239013673, "test_acc5": 92.466002578125, "epoch": 136, "n_parameters": 86567656}
{"train_lr": 0.0005773110991383895, "train_loss": 3.455456799198445, "test_loss": 1.0943328227111337, "test_acc1": 74.81000230834961, "test_acc5": 92.64600267578125, "epoch": 137, "n_parameters": 86567656}
{"train_lr": 0.0005721792083549796, "train_loss": 3.450480998140111, "test_loss": 1.0881213866989352, "test_acc1": 74.9320021887207, "test_acc5": 92.62600249511719, "epoch": 138, "n_parameters": 86567656}
{"train_lr": 0.0005670399506143469, "train_loss": 3.437457082827362, "test_loss": 1.1091633370707452, "test_acc1": 75.02200225830079, "test_acc5": 92.68800235351563, "epoch": 139, "n_parameters": 86567656}
{"train_lr": 0.0005618938894939768, "train_loss": 3.4320671381138497, "test_loss": 1.0865142293374506, "test_acc1": 75.02800225585938, "test_acc5": 92.73800244628906, "epoch": 140, "n_parameters": 86567656}
{"train_lr": 0.0005567415893175016, "train_loss": 3.426269463736186, "test_loss": 1.106057016296945, "test_acc1": 74.81000226318359, "test_acc5": 92.75200245117188, "epoch": 141, "n_parameters": 86567656}
{"train_lr": 0.0005515836150926655, "train_loss": 3.422003237594613, "test_loss": 1.093539923372287, "test_acc1": 75.21000218383789, "test_acc5": 92.86000247070312, "epoch": 142, "n_parameters": 86567656}
{"train_lr": 0.0005464205324494959, "train_loss": 3.419977205256812, "test_loss": 1.081409704147511, "test_acc1": 75.34800225830078, "test_acc5": 92.95200264160157, "epoch": 143, "n_parameters": 86567656}
{"train_lr": 0.0005412529075781865, "train_loss": 3.4079681129919157, "test_loss": 1.0899399144006554, "test_acc1": 75.17400214355469, "test_acc5": 92.94000244140625, "epoch": 144, "n_parameters": 86567656}
{"train_lr": 0.0005360813071670112, "train_loss": 3.405631442805179, "test_loss": 1.05908976177794, "test_acc1": 75.31000237548828, "test_acc5": 92.94000262695313, "epoch": 145, "n_parameters": 86567656}
{"train_lr": 0.0005309062983402612, "train_loss": 3.398518598194031, "test_loss": 1.0823960560525905, "test_acc1": 75.22400239501953, "test_acc5": 92.87600249511719, "epoch": 146, "n_parameters": 86567656}
{"train_lr": 0.0005257284485959572, "train_loss": 3.393898235367452, "test_loss": 1.064496947055586, "test_acc1": 75.58200220703125, "test_acc5": 93.05600246582031, "epoch": 147, "n_parameters": 86567656}
{"train_lr": 0.000520548325743666, "train_loss": 3.393869087117896, "test_loss": 1.0835783130376673, "test_acc1": 75.37200219970703, "test_acc5": 92.92200257324218, "epoch": 148, "n_parameters": 86567656}
{"train_lr": 0.0005153664978422618, "train_loss": 3.3843041309159245, "test_loss": 1.0716892635010025, "test_acc1": 75.68800229492187, "test_acc5": 92.98000239746094, "epoch": 149, "n_parameters": 86567656}
{"train_lr": 0.0005101835331375457, "train_loss": 3.3783737677130863, "test_loss": 1.0637317369057442, "test_acc1": 75.59000237548828, "test_acc5": 93.05400241210937, "epoch": 150, "n_parameters": 86567656}
{"train_lr": 0.0005049999999999881, "train_loss": 3.37658649060628, "test_loss": 1.0613045451336767, "test_acc1": 75.78800233886719, "test_acc5": 93.16600266113281, "epoch": 151, "n_parameters": 86567656}
{"train_lr": 0.0004998164668624689, "train_loss": 3.3716152545800218, "test_loss": 1.0438073943306525, "test_acc1": 75.7880023461914, "test_acc5": 93.11400240234374, "epoch": 152, "n_parameters": 86567656}
{"train_lr": 0.0004946335021577291, "train_loss": 3.356528867342823, "test_loss": 1.0350618531173112, "test_acc1": 76.13400234619141, "test_acc5": 93.27800240234374, "epoch": 153, "n_parameters": 86567656}
{"train_lr": 0.0004894516742563275, "train_loss": 3.3511958251313434, "test_loss": 1.0526964371298189, "test_acc1": 75.79000239257813, "test_acc5": 93.1440025048828, "epoch": 154, "n_parameters": 86567656}
{"train_lr": 0.0004842715514040588, "train_loss": 3.346994234640583, "test_loss": 1.0520886109280265, "test_acc1": 75.92800229492188, "test_acc5": 93.17000251953125, "epoch": 155, "n_parameters": 86567656}
{"train_lr": 0.00047909370165973703, "train_loss": 3.3455612537779396, "test_loss": 1.0418137731799237, "test_acc1": 76.00200229492188, "test_acc5": 93.38400249023438, "epoch": 156, "n_parameters": 86567656}
{"train_lr": 0.00047391869283298406, "train_loss": 3.330031465116641, "test_loss": 1.0450043267572224, "test_acc1": 76.03000229492187, "test_acc5": 93.35600255859374, "epoch": 157, "n_parameters": 86567656}
{"train_lr": 0.0004687470924218306, "train_loss": 3.329861494950015, "test_loss": 1.0565957334929372, "test_acc1": 76.11600232421875, "test_acc5": 93.35400247070312, "epoch": 158, "n_parameters": 86567656}
{"train_lr": 0.0004635794675504931, "train_loss": 3.3228573790259306, "test_loss": 1.03216290845752, "test_acc1": 76.4920023779297, "test_acc5": 93.4380026171875, "epoch": 159, "n_parameters": 86567656}
{"train_lr": 0.0004584163849073357, "train_loss": 3.3102992619279856, "test_loss": 1.040823851059586, "test_acc1": 76.34400228271484, "test_acc5": 93.56600235839844, "epoch": 160, "n_parameters": 86567656}
{"train_lr": 0.0004532584106825094, "train_loss": 3.3138566714503783, "test_loss": 1.0251121477808467, "test_acc1": 76.39800229980469, "test_acc5": 93.48000238769531, "epoch": 161, "n_parameters": 86567656}
{"train_lr": 0.0004481061105060409, "train_loss": 3.2990098250069493, "test_loss": 1.0290264447225033, "test_acc1": 76.35800231201172, "test_acc5": 93.52800250976563, "epoch": 162, "n_parameters": 86567656}
{"train_lr": 0.00044296004938566933, "train_loss": 3.299712732809482, "test_loss": 1.0195860669674663, "test_acc1": 76.48400222167969, "test_acc5": 93.44600270507813, "epoch": 163, "n_parameters": 86567656}
{"train_lr": 0.0004378207916450146, "train_loss": 3.2989827446240505, "test_loss": 1.018364011697943, "test_acc1": 76.43200244384765, "test_acc5": 93.37200237792969, "epoch": 164, "n_parameters": 86567656}
{"train_lr": 0.00043268890086160794, "train_loss": 3.291691841493598, "test_loss": 1.0165801825084064, "test_acc1": 76.92600226318359, "test_acc5": 93.56600246582032, "epoch": 165, "n_parameters": 86567656}
{"train_lr": 0.00042756493980507503, "train_loss": 3.282969684903618, "test_loss": 1.0177554152405421, "test_acc1": 76.5840023388672, "test_acc5": 93.48800239257812, "epoch": 166, "n_parameters": 86567656}
{"train_lr": 0.0004224494703755201, "train_loss": 3.273610697584234, "test_loss": 1.0214411963256445, "test_acc1": 76.68800235839844, "test_acc5": 93.62200255371094, "epoch": 167, "n_parameters": 86567656}
{"train_lr": 0.00041734305354179923, "train_loss": 3.26893277596727, "test_loss": 1.000688601707085, "test_acc1": 76.94200241210937, "test_acc5": 93.774002421875, "epoch": 168, "n_parameters": 86567656}
{"train_lr": 0.0004122462492800569, "train_loss": 3.261983603250971, "test_loss": 1.0103487031187526, "test_acc1": 76.98800224609376, "test_acc5": 93.63800242675781, "epoch": 169, "n_parameters": 86567656}
{"train_lr": 0.0004071596165123325, "train_loss": 3.255067869413385, "test_loss": 1.0064577528073555, "test_acc1": 77.15400231201171, "test_acc5": 93.73200248535156, "epoch": 170, "n_parameters": 86567656}
{"train_lr": 0.0004020837130452182, "train_loss": 3.2519517151667157, "test_loss": 1.0001335621108935, "test_acc1": 77.1740023828125, "test_acc5": 93.60400252929688, "epoch": 171, "n_parameters": 86567656}
{"train_lr": 0.00039701909550871056, "train_loss": 3.240579614649526, "test_loss": 0.9909070881938065, "test_acc1": 77.0720021875, "test_acc5": 93.70200251953125, "epoch": 172, "n_parameters": 86567656}
{"train_lr": 0.0003919663192952229, "train_loss": 3.2413162102790283, "test_loss": 0.9880042900107873, "test_acc1": 77.39600220214844, "test_acc5": 93.96000244628907, "epoch": 173, "n_parameters": 86567656}
{"train_lr": 0.0003869259384985974, "train_loss": 3.2294046959871774, "test_loss": 1.0089962324860458, "test_acc1": 77.08400235107422, "test_acc5": 93.75600252929688, "epoch": 174, "n_parameters": 86567656}
{"train_lr": 0.0003818985058534034, "train_loss": 3.2279050957194144, "test_loss": 0.9944835267460507, "test_acc1": 77.33000229003906, "test_acc5": 93.8860023828125, "epoch": 175, "n_parameters": 86567656}
{"train_lr": 0.0003768845726742596, "train_loss": 3.2245855438444826, "test_loss": 0.98429896500884, "test_acc1": 77.39600244628906, "test_acc5": 94.03200262207031, "epoch": 176, "n_parameters": 86567656}
{"train_lr": 0.0003718846887954506, "train_loss": 3.215076746224023, "test_loss": 0.988809123234877, "test_acc1": 77.6080023046875, "test_acc5": 93.78800251953125, "epoch": 177, "n_parameters": 86567656}
{"train_lr": 0.00036689940251057154, "train_loss": 3.2065876076082818, "test_loss": 0.9868185235305391, "test_acc1": 77.55800219238282, "test_acc5": 94.04800247070312, "epoch": 178, "n_parameters": 86567656}
{"train_lr": 0.0003619292605124837, "train_loss": 3.2050574634918014, "test_loss": 0.9834786712436896, "test_acc1": 77.62800240478515, "test_acc5": 94.01200252441406, "epoch": 179, "n_parameters": 86567656}
{"train_lr": 0.0003569748078332422, "train_loss": 3.1918656357246147, "test_loss": 0.9921081590675347, "test_acc1": 77.36400233886718, "test_acc5": 93.86400274414062, "epoch": 180, "n_parameters": 86567656}
{"train_lr": 0.00035203658778439235, "train_loss": 3.1921141405257103, "test_loss": 0.9749775048123669, "test_acc1": 77.79000235839844, "test_acc5": 94.07200254394532, "epoch": 181, "n_parameters": 86567656}
{"train_lr": 0.0003471151418974503, "train_loss": 3.189818975057819, "test_loss": 0.9579585125659111, "test_acc1": 77.68800219238281, "test_acc5": 94.10400243164062, "epoch": 182, "n_parameters": 86567656}
{"train_lr": 0.0003422110098644085, "train_loss": 3.171989895111556, "test_loss": 0.9698748211885826, "test_acc1": 77.64400220825195, "test_acc5": 94.0220024560547, "epoch": 183, "n_parameters": 86567656}
{"train_lr": 0.0003373247294785742, "train_loss": 3.1703767621938845, "test_loss": 0.9723664212421355, "test_acc1": 78.11200226074219, "test_acc5": 94.210002421875, "epoch": 184, "n_parameters": 86567656}
{"train_lr": 0.0003324568365756945, "train_loss": 3.166205885944416, "test_loss": 0.9651561257306078, "test_acc1": 78.06800224853515, "test_acc5": 94.0820026171875, "epoch": 185, "n_parameters": 86567656}
{"train_lr": 0.00032760786497508304, "train_loss": 3.1597316172792853, "test_loss": 0.9552094892897213, "test_acc1": 78.1340023803711, "test_acc5": 94.19000245605469, "epoch": 186, "n_parameters": 86567656}
{"train_lr": 0.00032277834642108216, "train_loss": 3.156443008850757, "test_loss": 0.9576324989264848, "test_acc1": 77.93000223144531, "test_acc5": 94.16000243164062, "epoch": 187, "n_parameters": 86567656}
{"train_lr": 0.00031796881052486697, "train_loss": 3.1446771065501284, "test_loss": 0.9659298881459374, "test_acc1": 78.1760023876953, "test_acc5": 94.22000250976562, "epoch": 188, "n_parameters": 86567656}
{"train_lr": 0.0003131797847062025, "train_loss": 3.136061396256244, "test_loss": 0.9600868780244564, "test_acc1": 78.04400226806641, "test_acc5": 94.17000249023438, "epoch": 189, "n_parameters": 86567656}
{"train_lr": 0.0003084117941357799, "train_loss": 3.1373875858031397, "test_loss": 0.9573571463464089, "test_acc1": 78.25400211669921, "test_acc5": 94.32600250976563, "epoch": 190, "n_parameters": 86567656}
{"train_lr": 0.0003036653616774752, "train_loss": 3.1306712192644794, "test_loss": 0.9568888733517414, "test_acc1": 78.12200237792969, "test_acc5": 94.31000267089844, "epoch": 191, "n_parameters": 86567656}
{"train_lr": 0.00029894100783110664, "train_loss": 3.1200240212593147, "test_loss": 0.9476718956929937, "test_acc1": 78.48000229003907, "test_acc5": 94.31600235351563, "epoch": 192, "n_parameters": 86567656}
{"train_lr": 0.0002942392506752879, "train_loss": 3.1160478303127057, "test_loss": 0.9543764597795289, "test_acc1": 78.31000234130859, "test_acc5": 94.18800240234376, "epoch": 193, "n_parameters": 86567656}
{"train_lr": 0.0002895606058107011, "train_loss": 3.1012808386322788, "test_loss": 0.9456948308191921, "test_acc1": 78.45200226806641, "test_acc5": 94.33200260253906, "epoch": 194, "n_parameters": 86567656}
{"train_lr": 0.0002849055863034561, "train_loss": 3.098641149717555, "test_loss": 0.9445924288995435, "test_acc1": 78.54800236328126, "test_acc5": 94.37400237304688, "epoch": 195, "n_parameters": 86567656}
{"train_lr": 0.0002802747026289244, "train_loss": 3.0931782620452006, "test_loss": 0.9372673418494424, "test_acc1": 78.40200234130859, "test_acc5": 94.45600252929688, "epoch": 196, "n_parameters": 86567656}
{"train_lr": 0.0002756684626156735, "train_loss": 3.0878213243030435, "test_loss": 0.9348279039827738, "test_acc1": 78.38800235839844, "test_acc5": 94.58000241699219, "epoch": 197, "n_parameters": 86567656}
{"train_lr": 0.00027108737138981483, "train_loss": 3.0864678089388553, "test_loss": 0.9324265690431027, "test_acc1": 78.79600248779298, "test_acc5": 94.47400247070313, "epoch": 198, "n_parameters": 86567656}
{"train_lr": 0.0002665319313196479, "train_loss": 3.073305655363128, "test_loss": 0.9290834515857834, "test_acc1": 78.82000245849609, "test_acc5": 94.5800026171875, "epoch": 199, "n_parameters": 86567656}
{"train_lr": 0.00026200264196050673, "train_loss": 3.064749463957896, "test_loss": 0.9332024799427464, "test_acc1": 78.94600228027343, "test_acc5": 94.50200252929687, "epoch": 200, "n_parameters": 86567656}
{"train_lr": 0.00025750000000000143, "train_loss": 3.0673988985834266, "test_loss": 0.924392034562444, "test_acc1": 78.89000243652343, "test_acc5": 94.60600244140625, "epoch": 201, "n_parameters": 86567656}
{"train_lr": 0.0002530244992035622, "train_loss": 3.0512422359675813, "test_loss": 0.9203511039206254, "test_acc1": 78.90000236572266, "test_acc5": 94.63000267578126, "epoch": 202, "n_parameters": 86567656}
{"train_lr": 0.0002485766303603018, "train_loss": 3.0516018261976665, "test_loss": 0.9277822382161804, "test_acc1": 78.86200229980469, "test_acc5": 94.50000241210938, "epoch": 203, "n_parameters": 86567656}
{"train_lr": 0.00024415688122914167, "train_loss": 3.0430931606107383, "test_loss": 0.923912382429026, "test_acc1": 79.10600245117188, "test_acc5": 94.68600253417969, "epoch": 204, "n_parameters": 86567656}
{"train_lr": 0.00023976573648539732, "train_loss": 3.035738169628796, "test_loss": 0.9126077786574208, "test_acc1": 79.02200230957031, "test_acc5": 94.62000257324219, "epoch": 205, "n_parameters": 86567656}
{"train_lr": 0.0002354036776675575, "train_loss": 3.0249579330380683, "test_loss": 0.9133295737736056, "test_acc1": 79.25800254882813, "test_acc5": 94.49000244140625, "epoch": 206, "n_parameters": 86567656}
{"train_lr": 0.00023107118312454297, "train_loss": 3.0229408154360873, "test_loss": 0.9240840127166082, "test_acc1": 79.08200240234375, "test_acc5": 94.68200243652343, "epoch": 207, "n_parameters": 86567656}
{"train_lr": 0.00022676872796319747, "train_loss": 3.0117405723515365, "test_loss": 0.912925429656501, "test_acc1": 79.11200229980469, "test_acc5": 94.73000250976563, "epoch": 208, "n_parameters": 86567656}
{"train_lr": 0.00022249678399621184, "train_loss": 3.004481432350467, "test_loss": 0.9116701114772606, "test_acc1": 79.2000025, "test_acc5": 94.82600242675781, "epoch": 209, "n_parameters": 86567656}
{"train_lr": 0.00021825581969037202, "train_loss": 3.0031299623761245, "test_loss": 0.9109335530570739, "test_acc1": 79.26600239013672, "test_acc5": 94.77000238769531, "epoch": 210, "n_parameters": 86567656}
{"train_lr": 0.00021404630011522877, "train_loss": 2.9964410694752286, "test_loss": 0.8992272809634053, "test_acc1": 79.41000229003906, "test_acc5": 94.76200254394531, "epoch": 211, "n_parameters": 86567656}
{"train_lr": 0.00020986868689201908, "train_loss": 2.9924510245104963, "test_loss": 0.8947183613642163, "test_acc1": 79.36400234619141, "test_acc5": 94.76400255859375, "epoch": 212, "n_parameters": 86567656}
{"train_lr": 0.00020572343814312388, "train_loss": 2.9823559692961803, "test_loss": 0.8998423185263852, "test_acc1": 79.36400228759766, "test_acc5": 94.88400254394531, "epoch": 213, "n_parameters": 86567656}
{"train_lr": 0.00020161100844177222, "train_loss": 2.975718041249126, "test_loss": 0.9195369655934954, "test_acc1": 79.374002265625, "test_acc5": 94.74000237304688, "epoch": 214, "n_parameters": 86567656}
{"train_lr": 0.0001975318487622333, "train_loss": 2.9736629534098835, "test_loss": 0.899601411367561, "test_acc1": 79.61600233886719, "test_acc5": 94.81000249023438, "epoch": 215, "n_parameters": 86567656}
{"train_lr": 0.0001934864064303279, "train_loss": 2.961540795100345, "test_loss": 0.8973594622511324, "test_acc1": 79.63800220947266, "test_acc5": 94.86200252441407, "epoch": 216, "n_parameters": 86567656}
{"train_lr": 0.00018947512507439562, "train_loss": 2.954377043983347, "test_loss": 0.8870117384046602, "test_acc1": 79.77400250732421, "test_acc5": 94.84400250976563, "epoch": 217, "n_parameters": 86567656}
{"train_lr": 0.00018549844457663907, "train_loss": 2.9490734525888467, "test_loss": 0.8899080330602496, "test_acc1": 79.6060023828125, "test_acc5": 94.86600220703124, "epoch": 218, "n_parameters": 86567656}
{"train_lr": 0.00018155680102489234, "train_loss": 2.9474317169577766, "test_loss": 0.900220085500298, "test_acc1": 79.81000245117187, "test_acc5": 94.83800240722657, "epoch": 219, "n_parameters": 86567656}
{"train_lr": 0.00017765062666479713, "train_loss": 2.9385974038299993, "test_loss": 0.8831283893157333, "test_acc1": 79.61600232910156, "test_acc5": 94.990002421875, "epoch": 220, "n_parameters": 86567656}
{"train_lr": 0.00017378034985236136, "train_loss": 2.928655767368136, "test_loss": 0.9019939714681622, "test_acc1": 79.62400236328125, "test_acc5": 94.89200250488281, "epoch": 221, "n_parameters": 86567656}
{"train_lr": 0.0001699463950070852, "train_loss": 2.924485314134166, "test_loss": 0.8827514088142399, "test_acc1": 79.84600239990235, "test_acc5": 94.97000248535156, "epoch": 222, "n_parameters": 86567656}
{"train_lr": 0.00016614918256530037, "train_loss": 2.9118585276791897, "test_loss": 0.8866927613452391, "test_acc1": 79.83400236572265, "test_acc5": 94.86000253417969, "epoch": 223, "n_parameters": 86567656}
{"train_lr": 0.0001623891289341519, "train_loss": 2.9064688433012327, "test_loss": 0.8908811007374308, "test_acc1": 79.81400236328125, "test_acc5": 94.9820025, "epoch": 224, "n_parameters": 86567656}
{"train_lr": 0.00015866664644587948, "train_loss": 2.9025012384906566, "test_loss": 0.891094551119603, "test_acc1": 79.91800235839844, "test_acc5": 94.98000241210937, "epoch": 225, "n_parameters": 86567656}
{"train_lr": 0.00015498214331266302, "train_loss": 2.8967916879067412, "test_loss": 0.8961087554521615, "test_acc1": 79.81600222167968, "test_acc5": 94.91200256835937, "epoch": 226, "n_parameters": 86567656}
{"train_lr": 0.00015133602358175863, "train_loss": 2.8904558579734476, "test_loss": 0.8928148392981164, "test_acc1": 79.97800249023437, "test_acc5": 94.93800234375, "epoch": 227, "n_parameters": 86567656}
{"train_lr": 0.00014772868709131358, "train_loss": 2.887752041917482, "test_loss": 0.8901664490548754, "test_acc1": 79.86800240478516, "test_acc5": 94.89000237792969, "epoch": 228, "n_parameters": 86567656}
{"train_lr": 0.00014416052942639815, "train_loss": 2.879063463795909, "test_loss": 0.8927803474573165, "test_acc1": 80.03400234375, "test_acc5": 95.01600249511719, "epoch": 229, "n_parameters": 86567656}
{"train_lr": 0.0001406319418757283, "train_loss": 2.865383940212113, "test_loss": 0.877749084482495, "test_acc1": 80.06200251708984, "test_acc5": 94.98000239257813, "epoch": 230, "n_parameters": 86567656}
{"train_lr": 0.00013714331138869076, "train_loss": 2.86347589897309, "test_loss": 0.8827237793442841, "test_acc1": 79.96400236328125, "test_acc5": 95.01600229492188, "epoch": 231, "n_parameters": 86567656}
{"train_lr": 0.00013369502053292505, "train_loss": 2.8560005076807276, "test_loss": 0.8829581342823446, "test_acc1": 80.02400239257813, "test_acc5": 94.99400246582032, "epoch": 232, "n_parameters": 86567656}
{"train_lr": 0.00013028744745238475, "train_loss": 2.856597069356081, "test_loss": 0.870715930128395, "test_acc1": 80.33200252441407, "test_acc5": 95.07400244628906, "epoch": 233, "n_parameters": 86567656}
{"train_lr": 0.0001269209658258495, "train_loss": 2.8468394889641435, "test_loss": 0.8724553899378328, "test_acc1": 80.34000236083985, "test_acc5": 95.09600241699219, "epoch": 234, "n_parameters": 86567656}
{"train_lr": 0.0001235959448259827, "train_loss": 2.835719402709739, "test_loss": 0.8760520423728536, "test_acc1": 80.25000238525391, "test_acc5": 95.14600248535156, "epoch": 235, "n_parameters": 86567656}
{"train_lr": 0.00012031274907879946, "train_loss": 2.8332032141008443, "test_loss": 0.8641697278464366, "test_acc1": 80.41800242919922, "test_acc5": 95.12000228027344, "epoch": 236, "n_parameters": 86567656}
{"train_lr": 0.00011707173862371172, "train_loss": 2.8218578875041027, "test_loss": 0.8682519170578977, "test_acc1": 80.55200255371093, "test_acc5": 95.02800225097656, "epoch": 237, "n_parameters": 86567656}
{"train_lr": 0.00011387326887403272, "train_loss": 2.821014185663131, "test_loss": 0.8590295232131705, "test_acc1": 80.50600235595704, "test_acc5": 95.18200252929688, "epoch": 238, "n_parameters": 86567656}
{"train_lr": 0.00011071769057802179, "train_loss": 2.8118154635782435, "test_loss": 0.8719377509691894, "test_acc1": 80.59000229248046, "test_acc5": 95.08000247558594, "epoch": 239, "n_parameters": 86567656}
{"train_lr": 0.00010760534978039747, "train_loss": 2.806045424630888, "test_loss": 0.8622480818783711, "test_acc1": 80.72000256835938, "test_acc5": 95.22200249511718, "epoch": 240, "n_parameters": 86567656}
{"train_lr": 0.00010453658778440302, "train_loss": 2.7914802947228283, "test_loss": 0.8640052004361565, "test_acc1": 80.51800227783203, "test_acc5": 95.12400244628907, "epoch": 241, "n_parameters": 86567656}
{"train_lr": 0.0001015117411143637, "train_loss": 2.791099696219873, "test_loss": 0.8726189613285082, "test_acc1": 80.79800226806641, "test_acc5": 95.21200250488282, "epoch": 242, "n_parameters": 86567656}
{"train_lr": 9.853114147881454e-05, "train_loss": 2.780526550488173, "test_loss": 0.8579040051593433, "test_acc1": 80.75200235595703, "test_acc5": 95.09400246582031, "epoch": 243, "n_parameters": 86567656}
{"train_lr": 9.559511573409267e-05, "train_loss": 2.7794591542080247, "test_loss": 0.8566054748138859, "test_acc1": 80.67400241943359, "test_acc5": 95.13400247558594, "epoch": 244, "n_parameters": 86567656}
{"train_lr": 9.270398584849976e-05, "train_loss": 2.7720949506278423, "test_loss": 0.8602037597983904, "test_acc1": 80.70000248046875, "test_acc5": 95.19200245605468, "epoch": 245, "n_parameters": 86567656}
{"train_lr": 8.985806886701763e-05, "train_loss": 2.766673109025883, "test_loss": 0.8576798720174468, "test_acc1": 80.74600235107422, "test_acc5": 95.228002421875, "epoch": 246, "n_parameters": 86567656}
{"train_lr": 8.705767687650155e-05, "train_loss": 2.7568419143247853, "test_loss": 0.8546478330459796, "test_acc1": 80.8980023413086, "test_acc5": 95.33600237304688, "epoch": 247, "n_parameters": 86567656}
{"train_lr": 8.430311697149993e-05, "train_loss": 2.7621957105603054, "test_loss": 0.8610858470773514, "test_acc1": 80.98000253173828, "test_acc5": 95.28200248535157, "epoch": 248, "n_parameters": 86567656}
{"train_lr": 8.159469122054745e-05, "train_loss": 2.7462982253657637, "test_loss": 0.8558791913592655, "test_acc1": 80.88800244384765, "test_acc5": 95.22800236816406, "epoch": 249, "n_parameters": 86567656}
{"train_lr": 7.893269663304691e-05, "train_loss": 2.739886419378596, "test_loss": 0.8510716419073533, "test_acc1": 80.95000244873047, "test_acc5": 95.24600241210938, "epoch": 250, "n_parameters": 86567656}
{"train_lr": 7.631742512670381e-05, "train_loss": 2.7357003887553963, "test_loss": 0.8525940635582994, "test_acc1": 80.824002421875, "test_acc5": 95.24600252441407, "epoch": 251, "n_parameters": 86567656}
{"train_lr": 7.37491634955067e-05, "train_loss": 2.7310378534688082, "test_loss": 0.8533202671444119, "test_acc1": 80.93200256347656, "test_acc5": 95.32400232421875, "epoch": 252, "n_parameters": 86567656}
{"train_lr": 7.122819337828824e-05, "train_loss": 2.723337799834786, "test_loss": 0.8517538225010123, "test_acc1": 80.89000220947266, "test_acc5": 95.30000233886719, "epoch": 253, "n_parameters": 86567656}
{"train_lr": 6.87547912278283e-05, "train_loss": 2.709741816037803, "test_loss": 0.8510411470384835, "test_acc1": 81.06000245361328, "test_acc5": 95.3380026220703, "epoch": 254, "n_parameters": 86567656}
{"train_lr": 6.632922828055003e-05, "train_loss": 2.716105786307777, "test_loss": 0.8552826739375742, "test_acc1": 81.088002421875, "test_acc5": 95.30400244140625, "epoch": 255, "n_parameters": 86567656}
{"train_lr": 6.395177052675899e-05, "train_loss": 2.710197583764053, "test_loss": 0.8535275982117241, "test_acc1": 81.19000259033203, "test_acc5": 95.32200235351563, "epoch": 256, "n_parameters": 86567656}
{"train_lr": 6.162267868149164e-05, "train_loss": 2.702078429527944, "test_loss": 0.8525201122271122, "test_acc1": 81.02200240234374, "test_acc5": 95.2960024951172, "epoch": 257, "n_parameters": 86567656}
{"train_lr": 5.934220815591336e-05, "train_loss": 2.6945799249741764, "test_loss": 0.8499247298188035, "test_acc1": 81.14200240234375, "test_acc5": 95.3260024609375, "epoch": 258, "n_parameters": 86567656}
{"train_lr": 5.711060902932033e-05, "train_loss": 2.6904077286616883, "test_loss": 0.8517582393939573, "test_acc1": 81.16200248291015, "test_acc5": 95.31200239257812, "epoch": 259, "n_parameters": 86567656}
{"train_lr": 5.492812602170232e-05, "train_loss": 2.687441740009329, "test_loss": 0.8490255698990684, "test_acc1": 81.14200229980469, "test_acc5": 95.38000251464844, "epoch": 260, "n_parameters": 86567656}
{"train_lr": 5.2794998466913834e-05, "train_loss": 2.6867280198003556, "test_loss": 0.8477142209512487, "test_acc1": 81.23400244140625, "test_acc5": 95.34400248046875, "epoch": 261, "n_parameters": 86567656}
{"train_lr": 5.0711460286429e-05, "train_loss": 2.6715660277459263, "test_loss": 0.8417479030344628, "test_acc1": 81.35000235595703, "test_acc5": 95.42600248046875, "epoch": 262, "n_parameters": 86567656}
{"train_lr": 4.8677739963691566e-05, "train_loss": 2.6730031927200337, "test_loss": 0.8474233212546515, "test_acc1": 81.22800254394531, "test_acc5": 95.40000239257813, "epoch": 263, "n_parameters": 86567656}
{"train_lr": 4.669406051905346e-05, "train_loss": 2.6695463993876194, "test_loss": 0.8435185357156046, "test_acc1": 81.2340022241211, "test_acc5": 95.44800235839844, "epoch": 264, "n_parameters": 86567656}
{"train_lr": 4.476063948531632e-05, "train_loss": 2.6627261445617125, "test_loss": 0.8407083097380549, "test_acc1": 81.3220025366211, "test_acc5": 95.418002421875, "epoch": 265, "n_parameters": 86567656}
{"train_lr": 4.287768888388454e-05, "train_loss": 2.6590220925273846, "test_loss": 0.8428784298519255, "test_acc1": 81.2840023461914, "test_acc5": 95.30600247070312, "epoch": 266, "n_parameters": 86567656}
{"train_lr": 4.1045415201513915e-05, "train_loss": 2.6509330914163, "test_loss": 0.840783360852161, "test_acc1": 81.21800251953125, "test_acc5": 95.4700023828125, "epoch": 267, "n_parameters": 86567656}
{"train_lr": 3.926401936765786e-05, "train_loss": 2.648916074096394, "test_loss": 0.8382869310491144, "test_acc1": 81.40200246826171, "test_acc5": 95.41600236328125, "epoch": 268, "n_parameters": 86567656}
{"train_lr": 3.753369673244709e-05, "train_loss": 2.64328251418164, "test_loss": 0.8442193738501269, "test_acc1": 81.43600237060546, "test_acc5": 95.41200244628907, "epoch": 269, "n_parameters": 86567656}
{"train_lr": 3.585463704525412e-05, "train_loss": 2.640485584533377, "test_loss": 0.8385991968943839, "test_acc1": 81.38600242675781, "test_acc5": 95.4860024609375, "epoch": 270, "n_parameters": 86567656}
{"train_lr": 3.4227024433899046e-05, "train_loss": 2.6329833099203146, "test_loss": 0.8402550630628949, "test_acc1": 81.41600228027343, "test_acc5": 95.36400253417969, "epoch": 271, "n_parameters": 86567656}
{"train_lr": 3.2651037384443736e-05, "train_loss": 2.6347867263068587, "test_loss": 0.835176540256233, "test_acc1": 81.49200240234374, "test_acc5": 95.40600232910157, "epoch": 272, "n_parameters": 86567656}
{"train_lr": 3.112684872162703e-05, "train_loss": 2.6294872568641825, "test_loss": 0.840626989239237, "test_acc1": 81.41400234130859, "test_acc5": 95.38200243164063, "epoch": 273, "n_parameters": 86567656}
{"train_lr": 2.9654625589913e-05, "train_loss": 2.6263693506650023, "test_loss": 0.8450270975848764, "test_acc1": 81.46600243896485, "test_acc5": 95.3420024609375, "epoch": 274, "n_parameters": 86567656}
{"train_lr": 2.8234529435159726e-05, "train_loss": 2.6190262686887045, "test_loss": 0.8413780319885191, "test_acc1": 81.54000249511719, "test_acc5": 95.38200239257813, "epoch": 275, "n_parameters": 86567656}
{"train_lr": 2.6866715986911513e-05, "train_loss": 2.6181365711857185, "test_loss": 0.8359859471929737, "test_acc1": 81.47000244628906, "test_acc5": 95.44200222167969, "epoch": 276, "n_parameters": 86567656}
{"train_lr": 2.55513352413271e-05, "train_loss": 2.612261126945011, "test_loss": 0.8389055236401805, "test_acc1": 81.57600252929687, "test_acc5": 95.42000248535156, "epoch": 277, "n_parameters": 86567656}
{"train_lr": 2.4288531444729954e-05, "train_loss": 2.612850309389053, "test_loss": 0.8398726727105605, "test_acc1": 81.53000241455078, "test_acc5": 95.42000233886719, "epoch": 278, "n_parameters": 86567656}
{"train_lr": 2.3078443077785567e-05, "train_loss": 2.6091023498921277, "test_loss": 0.8374149336581496, "test_acc1": 81.58200235839844, "test_acc5": 95.40200241210937, "epoch": 279, "n_parameters": 86567656}
{"train_lr": 2.192120284031953e-05, "train_loss": 2.5997269399505822, "test_loss": 0.8397330811493914, "test_acc1": 81.55000237304688, "test_acc5": 95.44600233886719, "epoch": 280, "n_parameters": 86567656}
{"train_lr": 2.0816937636766537e-05, "train_loss": 2.6013922716954725, "test_loss": 0.8388328586567386, "test_acc1": 81.60600229003906, "test_acc5": 95.45000256835938, "epoch": 281, "n_parameters": 86567656}
{"train_lr": 1.976576856224742e-05, "train_loss": 2.5963034313693227, "test_loss": 0.8399712192234289, "test_acc1": 81.46800229980468, "test_acc5": 95.40800250976562, "epoch": 282, "n_parameters": 86567656}
{"train_lr": 1.8767810889299472e-05, "train_loss": 2.5964147593263243, "test_loss": 0.8392346777350798, "test_acc1": 81.55000247558594, "test_acc5": 95.45800252441406, "epoch": 283, "n_parameters": 86567656}
{"train_lr": 1.7823174055225238e-05, "train_loss": 2.5886976396103654, "test_loss": 0.8379598187565117, "test_acc1": 81.59200237060547, "test_acc5": 95.46000245117187, "epoch": 284, "n_parameters": 86567656}
{"train_lr": 1.6931961650100128e-05, "train_loss": 2.5943218352232904, "test_loss": 0.8366602797940688, "test_acc1": 81.65200252929688, "test_acc5": 95.4660025341797, "epoch": 285, "n_parameters": 86567656}
{"train_lr": 1.609427140540658e-05, "train_loss": 2.586010974385946, "test_loss": 0.8361005031158737, "test_acc1": 81.7300023828125, "test_acc5": 95.48000244140626, "epoch": 286, "n_parameters": 86567656}
{"train_lr": 1.5310195183320784e-05, "train_loss": 2.587221210642303, "test_loss": 0.8389281437744792, "test_acc1": 81.62800233886719, "test_acc5": 95.4780023828125, "epoch": 287, "n_parameters": 86567656}
{"train_lr": 1.4579818966635116e-05, "train_loss": 2.583657564090596, "test_loss": 0.8379138405229217, "test_acc1": 81.60200234130859, "test_acc5": 95.45400228515625, "epoch": 288, "n_parameters": 86567656}
{"train_lr": 1.3903222849333426e-05, "train_loss": 2.5751478614793313, "test_loss": 0.8347588189217957, "test_acc1": 81.6420024243164, "test_acc5": 95.47200242675781, "epoch": 289, "n_parameters": 86567656}
{"train_lr": 1.3280481027803718e-05, "train_loss": 2.5794426158761428, "test_loss": 0.8377101036671714, "test_acc1": 81.7240025, "test_acc5": 95.51000231933594, "epoch": 290, "n_parameters": 86567656}
{"train_lr": 1.2711661792704427e-05, "train_loss": 2.5743517098154762, "test_loss": 0.8410206067870994, "test_acc1": 81.6880025366211, "test_acc5": 95.47200223632812, "epoch": 291, "n_parameters": 86567656}
{"train_lr": 1.2196827521475628e-05, "train_loss": 2.5715944095254897, "test_loss": 0.8385688908498256, "test_acc1": 81.66600239013673, "test_acc5": 95.49000254394531, "epoch": 292, "n_parameters": 86567656}
{"train_lr": 1.1736034671495227e-05, "train_loss": 2.5710425417688634, "test_loss": 0.8383938503700117, "test_acc1": 81.65200235351563, "test_acc5": 95.45400233886718, "epoch": 293, "n_parameters": 86567656}
{"train_lr": 1.1329333773893123e-05, "train_loss": 2.5672798307477045, "test_loss": 0.8378399063666814, "test_acc1": 81.66000251220703, "test_acc5": 95.49200240234374, "epoch": 294, "n_parameters": 86567656}
{"train_lr": 1.0976769428005425e-05, "train_loss": 2.5717379520241495, "test_loss": 0.8335310324254283, "test_acc1": 81.70000238525391, "test_acc5": 95.53200232910156, "epoch": 295, "n_parameters": 86567656}
{"train_lr": 1.067838029648576e-05, "train_loss": 2.5691555647386446, "test_loss": 0.8382410909873281, "test_acc1": 81.67800233642578, "test_acc5": 95.52000247070312, "epoch": 296, "n_parameters": 86567656}
{"train_lr": 1.0434199101065238e-05, "train_loss": 2.5718514431866524, "test_loss": 0.838546558499565, "test_acc1": 81.5360024633789, "test_acc5": 95.47600235839843, "epoch": 297, "n_parameters": 86567656}
{"train_lr": 1.0244252618963046e-05, "train_loss": 2.5662289233051903, "test_loss": 0.8406346994604121, "test_acc1": 81.62000234619141, "test_acc5": 95.48200241699219, "epoch": 298, "n_parameters": 86567656}
{"train_lr": 1.0108561679951307e-05, "train_loss": 2.566221835688769, "test_loss": 0.8378001146318816, "test_acc1": 81.66000240966797, "test_acc5": 95.51200231445313, "epoch": 299, "n_parameters": 86567656}
@zhihou7
Copy link

zhihou7 commented Dec 29, 2021

Hi, May I ask the total batch size of this log? is it 64 * 16?

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment