Skip to content

Instantly share code, notes, and snippets.

@Yuxin-CV
Created June 1, 2021 15:01
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
Star You must be signed in to star a gist
Save Yuxin-CV/98168420dbcc5a0d1e656da83c6bf416 to your computer and use it in GitHub Desktop.
DeiT-Small @ ImageNet-1k (Pre-train 200 Epochs)
{"train_lr": 9.999999999999953e-07, "train_loss": 6.934438605865033, "epoch": 0, "n_parameters": 22050664}
{"train_lr": 9.999999999999953e-07, "train_loss": 6.901241369241719, "epoch": 1, "n_parameters": 22050664}
{"train_lr": 0.00020080000000000092, "train_loss": 6.75567844217058, "epoch": 2, "n_parameters": 22050664}
{"train_lr": 0.000400599999999987, "train_loss": 6.563156393744486, "epoch": 3, "n_parameters": 22050664}
{"train_lr": 0.0006003999999999824, "train_loss": 6.442344095543039, "epoch": 4, "n_parameters": 22050664}
{"train_lr": 0.0008002000000000078, "train_loss": 6.351373942064153, "epoch": 5, "n_parameters": 22050664}
{"train_lr": 0.0009984740801978918, "train_loss": 6.261527323656136, "epoch": 6, "n_parameters": 22050664}
{"train_lr": 0.0009978031724785232, "train_loss": 6.121864894787661, "epoch": 7, "n_parameters": 22050664}
{"train_lr": 0.0009970106729503033, "train_loss": 5.994587432947472, "epoch": 8, "n_parameters": 22050664}
{"train_lr": 0.0009960967771506664, "train_loss": 5.878069390734132, "epoch": 9, "n_parameters": 22050664}
{"train_lr": 0.000995061710569694, "train_loss": 5.765940131615106, "epoch": 10, "n_parameters": 22050664}
{"train_lr": 0.000993905728594591, "train_loss": 5.650089027832071, "epoch": 11, "n_parameters": 22050664}
{"train_lr": 0.0009926291164466016, "train_loss": 5.56765893032606, "epoch": 12, "n_parameters": 22050664}
{"train_lr": 0.0009912321891107068, "train_loss": 5.469603928111249, "epoch": 13, "n_parameters": 22050664}
{"train_lr": 0.0009897152912577711, "train_loss": 5.403764398859368, "epoch": 14, "n_parameters": 22050664}
{"train_lr": 0.0009880787971596754, "train_loss": 5.334179552196027, "epoch": 15, "n_parameters": 22050664}
{"train_lr": 0.0009863231105968705, "train_loss": 5.270896238102901, "epoch": 16, "n_parameters": 22050664}
{"train_lr": 0.0009844486647586856, "train_loss": 5.226490205283359, "epoch": 17, "n_parameters": 22050664}
{"train_lr": 0.0009824559221366003, "train_loss": 5.167045326089021, "epoch": 18, "n_parameters": 22050664}
{"train_lr": 0.0009803453744100898, "train_loss": 5.114678869192168, "epoch": 19, "n_parameters": 22050664}
{"train_lr": 0.000978117542325151, "train_loss": 5.067171387940193, "epoch": 20, "n_parameters": 22050664}
{"train_lr": 0.0009757729755660996, "train_loss": 5.017920854327967, "epoch": 21, "n_parameters": 22050664}
{"train_lr": 0.0009733122526196471, "train_loss": 4.973697706663923, "epoch": 22, "n_parameters": 22050664}
{"train_lr": 0.000970735980632352, "train_loss": 4.9348408005458655, "epoch": 23, "n_parameters": 22050664}
{"train_lr": 0.000968044795260779, "train_loss": 4.905667897703932, "test_loss": 2.378918208381682, "test_acc1": 48.67400140625, "test_acc5": 74.31000232421874, "epoch": 24, "n_parameters": 22050664}
{"train_lr": 0.000965239360514694, "train_loss": 4.868394846062389, "epoch": 25, "n_parameters": 22050664}
{"train_lr": 0.0009623203685930996, "train_loss": 4.8292380654983385, "epoch": 26, "n_parameters": 22050664}
{"train_lr": 0.0009592885397135909, "train_loss": 4.793001462372659, "epoch": 27, "n_parameters": 22050664}
{"train_lr": 0.0009561446219345371, "train_loss": 4.764862982131881, "epoch": 28, "n_parameters": 22050664}
{"train_lr": 0.0009528893909706948, "train_loss": 4.729272379696988, "epoch": 29, "n_parameters": 22050664}
{"train_lr": 0.0009495236500014729, "train_loss": 4.695496585300501, "epoch": 30, "n_parameters": 22050664}
{"train_lr": 0.0009460482294732177, "train_loss": 4.682567354252965, "epoch": 31, "n_parameters": 22050664}
{"train_lr": 0.0009424639868938875, "train_loss": 4.651861028777038, "epoch": 32, "n_parameters": 22050664}
{"train_lr": 0.0009387718066217019, "train_loss": 4.619058724192025, "epoch": 33, "n_parameters": 22050664}
{"train_lr": 0.0009349725996469011, "train_loss": 4.603423546758487, "epoch": 34, "n_parameters": 22050664}
{"train_lr": 0.0009310673033669664, "train_loss": 4.581711596626934, "epoch": 35, "n_parameters": 22050664}
{"train_lr": 0.0009270568813552856, "train_loss": 4.555999542740609, "epoch": 36, "n_parameters": 22050664}
{"train_lr": 0.0009229423231234935, "train_loss": 4.534499420750913, "epoch": 37, "n_parameters": 22050664}
{"train_lr": 0.0009187246438773041, "train_loss": 4.518962263798923, "epoch": 38, "n_parameters": 22050664}
{"train_lr": 0.0009144048842658995, "train_loss": 4.493459974666484, "epoch": 39, "n_parameters": 22050664}
{"train_lr": 0.0009099841101254148, "train_loss": 4.472153503951028, "epoch": 40, "n_parameters": 22050664}
{"train_lr": 0.0009054634122156225, "train_loss": 4.46853403026442, "epoch": 41, "n_parameters": 22050664}
{"train_lr": 0.0009008439059511137, "train_loss": 4.434036824557421, "epoch": 42, "n_parameters": 22050664}
{"train_lr": 0.0008961267311259657, "train_loss": 4.422930070369555, "epoch": 43, "n_parameters": 22050664}
{"train_lr": 0.0008913130516324681, "train_loss": 4.400826388959595, "epoch": 44, "n_parameters": 22050664}
{"train_lr": 0.0008864040551740224, "train_loss": 4.384913919521845, "epoch": 45, "n_parameters": 22050664}
{"train_lr": 0.000881400952972042, "train_loss": 4.375954539965478, "epoch": 46, "n_parameters": 22050664}
{"train_lr": 0.0008763049794670927, "train_loss": 4.350782034422854, "epoch": 47, "n_parameters": 22050664}
{"train_lr": 0.0008711173920144025, "train_loss": 4.333344814588698, "epoch": 48, "n_parameters": 22050664}
{"train_lr": 0.0008658394705736102, "train_loss": 4.315457099514137, "test_loss": 1.7112128868185241, "test_acc1": 61.67000193359375, "test_acc5": 84.31800241210938, "epoch": 49, "n_parameters": 22050664}
{"train_lr": 0.0008604725173927694, "train_loss": 4.303641652389111, "epoch": 50, "n_parameters": 22050664}
{"train_lr": 0.0008550178566873157, "train_loss": 4.275390069047324, "epoch": 51, "n_parameters": 22050664}
{"train_lr": 0.0008494768343132194, "train_loss": 4.260202005517473, "epoch": 52, "n_parameters": 22050664}
{"train_lr": 0.00084385081743468, "train_loss": 4.242446700517508, "epoch": 53, "n_parameters": 22050664}
{"train_lr": 0.0008381411941873461, "train_loss": 4.238289606418731, "epoch": 54, "n_parameters": 22050664}
{"train_lr": 0.0008323493733352106, "train_loss": 4.233631628761284, "epoch": 55, "n_parameters": 22050664}
{"train_lr": 0.000826476783923446, "train_loss": 4.2231202625589885, "epoch": 56, "n_parameters": 22050664}
{"train_lr": 0.0008205248749255873, "train_loss": 4.186821224854337, "epoch": 57, "n_parameters": 22050664}
{"train_lr": 0.0008144951148861791, "train_loss": 4.192926019311047, "epoch": 58, "n_parameters": 22050664}
{"train_lr": 0.0008083889915582182, "train_loss": 4.185811056245527, "epoch": 59, "n_parameters": 22050664}
{"train_lr": 0.000802208011536304, "train_loss": 4.158665855749429, "epoch": 60, "n_parameters": 22050664}
{"train_lr": 0.0007959536998847494, "train_loss": 4.153939531885272, "epoch": 61, "n_parameters": 22050664}
{"train_lr": 0.0007896275997614222, "train_loss": 4.143303760950514, "epoch": 62, "n_parameters": 22050664}
{"train_lr": 0.0007832312720368117, "train_loss": 4.1317306310534, "epoch": 63, "n_parameters": 22050664}
{"train_lr": 0.0007767662949090809, "train_loss": 4.123738460070033, "epoch": 64, "n_parameters": 22050664}
{"train_lr": 0.0007702342635146132, "train_loss": 4.111527248466615, "epoch": 65, "n_parameters": 22050664}
{"train_lr": 0.0007636367895343943, "train_loss": 4.101290073516748, "epoch": 66, "n_parameters": 22050664}
{"train_lr": 0.0007569755007964469, "train_loss": 4.092988407726196, "epoch": 67, "n_parameters": 22050664}
{"train_lr": 0.0007502520408740605, "train_loss": 4.080424974433524, "epoch": 68, "n_parameters": 22050664}
{"train_lr": 0.0007434680686803327, "train_loss": 4.080858544122687, "epoch": 69, "n_parameters": 22050664}
{"train_lr": 0.0007366252580589767, "train_loss": 4.058361858439198, "epoch": 70, "n_parameters": 22050664}
{"train_lr": 0.0007297252973710595, "train_loss": 4.045745422871565, "epoch": 71, "n_parameters": 22050664}
{"train_lr": 0.000722769889078688, "train_loss": 4.0453878210174095, "epoch": 72, "n_parameters": 22050664}
{"train_lr": 0.0007157607493246968, "train_loss": 4.022558767947076, "epoch": 73, "n_parameters": 22050664}
{"train_lr": 0.0007086996075095225, "train_loss": 4.018317679278285, "test_loss": 1.474770495261269, "test_acc1": 66.69200206542969, "test_acc5": 87.7820024609375, "epoch": 74, "n_parameters": 22050664}
{"train_lr": 0.0007015882058641976, "train_loss": 4.01164030342651, "epoch": 75, "n_parameters": 22050664}
{"train_lr": 0.0006944282990206983, "train_loss": 3.9990942917472356, "epoch": 76, "n_parameters": 22050664}
{"train_lr": 0.0006872216535789267, "train_loss": 3.999647147959466, "epoch": 77, "n_parameters": 22050664}
{"train_lr": 0.0006799700476707307, "train_loss": 3.98122750316783, "epoch": 78, "n_parameters": 22050664}
{"train_lr": 0.0006726752705214028, "train_loss": 3.9758978984672293, "epoch": 79, "n_parameters": 22050664}
{"train_lr": 0.0006653391220080658, "train_loss": 3.957459979253612, "epoch": 80, "n_parameters": 22050664}
{"train_lr": 0.0006579634122155856, "train_loss": 3.9460486585049512, "epoch": 81, "n_parameters": 22050664}
{"train_lr": 0.0006505499609900032, "train_loss": 3.9455526720562712, "epoch": 82, "n_parameters": 22050664}
{"train_lr": 0.0006431005974894059, "train_loss": 3.940910641857379, "epoch": 83, "n_parameters": 22050664}
{"train_lr": 0.0006356171597328481, "train_loss": 3.9315769086829384, "epoch": 84, "n_parameters": 22050664}
{"train_lr": 0.0006281014941466044, "train_loss": 3.918982666935757, "epoch": 85, "n_parameters": 22050664}
{"train_lr": 0.0006205554551086674, "train_loss": 3.908034684989664, "epoch": 86, "n_parameters": 22050664}
{"train_lr": 0.0006129809044912789, "train_loss": 3.9023384381350663, "epoch": 87, "n_parameters": 22050664}
{"train_lr": 0.0006053797112014571, "train_loss": 3.894737351617272, "epoch": 88, "n_parameters": 22050664}
{"train_lr": 0.0005977537507199184, "train_loss": 3.8878711060368474, "epoch": 89, "n_parameters": 22050664}
{"train_lr": 0.0005901049046382965, "train_loss": 3.8870922263196523, "epoch": 90, "n_parameters": 22050664}
{"train_lr": 0.0005824350601949218, "train_loss": 3.8796465897636354, "epoch": 91, "n_parameters": 22050664}
{"train_lr": 0.0005747461098091134, "train_loss": 3.8673873389367577, "epoch": 92, "n_parameters": 22050664}
{"train_lr": 0.0005670399506143469, "train_loss": 3.85865579325137, "epoch": 93, "n_parameters": 22050664}
{"train_lr": 0.0005593184839900548, "train_loss": 3.8404861695284276, "epoch": 94, "n_parameters": 22050664}
{"train_lr": 0.0005515836150926655, "train_loss": 3.840278819477339, "epoch": 95, "n_parameters": 22050664}
{"train_lr": 0.0005438372523852734, "train_loss": 3.8347245656329094, "epoch": 96, "n_parameters": 22050664}
{"train_lr": 0.0005360813071670112, "train_loss": 3.8239090633001642, "epoch": 97, "n_parameters": 22050664}
{"train_lr": 0.000528317693101275, "train_loss": 3.8111618225761266, "epoch": 98, "n_parameters": 22050664}
{"train_lr": 0.0005205483257436661, "train_loss": 3.8126060650360096, "test_loss": 1.2973820929097946, "test_acc1": 70.07800200683593, "test_acc5": 90.3000024609375, "epoch": 99, "n_parameters": 22050664}
{"train_lr": 0.0005127751220693652, "train_loss": 3.7977484707876172, "epoch": 100, "n_parameters": 22050664}
{"train_lr": 0.0005049999999999881, "train_loss": 3.7892301880674872, "epoch": 101, "n_parameters": 22050664}
{"train_lr": 0.0004972248779306491, "train_loss": 3.7788950559094276, "epoch": 102, "n_parameters": 22050664}
{"train_lr": 0.0004894516742563275, "train_loss": 3.7842627887864957, "epoch": 103, "n_parameters": 22050664}
{"train_lr": 0.00048168230689872056, "train_loss": 3.7703248498727566, "epoch": 104, "n_parameters": 22050664}
{"train_lr": 0.00047391869283298395, "train_loss": 3.7551315068055113, "epoch": 105, "n_parameters": 22050664}
{"train_lr": 0.00046616274761472094, "train_loss": 3.765370129490737, "epoch": 106, "n_parameters": 22050664}
{"train_lr": 0.0004584163849073357, "train_loss": 3.7499642115798024, "epoch": 107, "n_parameters": 22050664}
{"train_lr": 0.0004506815160099214, "train_loss": 3.7343447823747455, "epoch": 108, "n_parameters": 22050664}
{"train_lr": 0.00044296004938566933, "train_loss": 3.727317790047442, "epoch": 109, "n_parameters": 22050664}
{"train_lr": 0.00043525389019089515, "train_loss": 3.719071038382993, "epoch": 110, "n_parameters": 22050664}
{"train_lr": 0.00042756493980507503, "train_loss": 3.711673707794324, "epoch": 111, "n_parameters": 22050664}
{"train_lr": 0.00041989509536167954, "train_loss": 3.710834577024507, "epoch": 112, "n_parameters": 22050664}
{"train_lr": 0.0004122462492800569, "train_loss": 3.6983115132287634, "epoch": 113, "n_parameters": 22050664}
{"train_lr": 0.0004046202887985183, "train_loss": 3.6898308734146714, "epoch": 114, "n_parameters": 22050664}
{"train_lr": 0.00039701909550871056, "train_loss": 3.6795111723559843, "epoch": 115, "n_parameters": 22050664}
{"train_lr": 0.0003894445448913186, "train_loss": 3.675327813501457, "epoch": 116, "n_parameters": 22050664}
{"train_lr": 0.0003818985058534034, "train_loss": 3.6653446586821956, "epoch": 117, "n_parameters": 22050664}
{"train_lr": 0.0003743828402671402, "train_loss": 3.6584957596495284, "epoch": 118, "n_parameters": 22050664}
{"train_lr": 0.00036689940251057154, "train_loss": 3.6554025984067713, "epoch": 119, "n_parameters": 22050664}
{"train_lr": 0.00035945003901000387, "train_loss": 3.635240924777649, "epoch": 120, "n_parameters": 22050664}
{"train_lr": 0.00035203658778439235, "train_loss": 3.6355248386863703, "epoch": 121, "n_parameters": 22050664}
{"train_lr": 0.00034466087799191083, "train_loss": 3.622979417431364, "epoch": 122, "n_parameters": 22050664}
{"train_lr": 0.0003373247294785742, "train_loss": 3.6262091487574635, "epoch": 123, "n_parameters": 22050664}
{"train_lr": 0.0003300299523292763, "train_loss": 3.609837022592886, "test_loss": 1.1700371950293866, "test_acc1": 73.41200212890625, "test_acc5": 91.7280025390625, "epoch": 124, "n_parameters": 22050664}
{"train_lr": 0.00032277834642108216, "train_loss": 3.596687549166828, "epoch": 125, "n_parameters": 22050664}
{"train_lr": 0.00031557170097928574, "train_loss": 3.5902157211713464, "epoch": 126, "n_parameters": 22050664}
{"train_lr": 0.0003084117941357799, "train_loss": 3.5801557226480245, "epoch": 127, "n_parameters": 22050664}
{"train_lr": 0.00030130039249047426, "train_loss": 3.580977399572194, "epoch": 128, "n_parameters": 22050664}
{"train_lr": 0.0002942392506752879, "train_loss": 3.568922481162371, "epoch": 129, "n_parameters": 22050664}
{"train_lr": 0.00028723011092131773, "train_loss": 3.5671421859761794, "epoch": 130, "n_parameters": 22050664}
{"train_lr": 0.0002802747026289244, "train_loss": 3.548819579487796, "epoch": 131, "n_parameters": 22050664}
{"train_lr": 0.00027337474194101676, "train_loss": 3.5468957390097215, "epoch": 132, "n_parameters": 22050664}
{"train_lr": 0.00026653193131964784, "train_loss": 3.5327837272084874, "epoch": 133, "n_parameters": 22050664}
{"train_lr": 0.00025974795912596046, "train_loss": 3.5275949300002516, "epoch": 134, "n_parameters": 22050664}
{"train_lr": 0.0002530244992035622, "train_loss": 3.519673021696359, "epoch": 135, "n_parameters": 22050664}
{"train_lr": 0.0002463632104656113, "train_loss": 3.5111626882633145, "epoch": 136, "n_parameters": 22050664}
{"train_lr": 0.00023976573648539732, "train_loss": 3.509913947656572, "epoch": 137, "n_parameters": 22050664}
{"train_lr": 0.0002332337050909282, "train_loss": 3.498194780078628, "epoch": 138, "n_parameters": 22050664}
{"train_lr": 0.00022676872796319677, "train_loss": 3.4841540919886316, "epoch": 139, "n_parameters": 22050664}
{"train_lr": 0.00022037240023858274, "train_loss": 3.4780334418745253, "epoch": 140, "n_parameters": 22050664}
{"train_lr": 0.0002140463001152288, "train_loss": 3.477724570831616, "epoch": 141, "n_parameters": 22050664}
{"train_lr": 0.00020779198846368618, "train_loss": 3.4678721043060152, "epoch": 142, "n_parameters": 22050664}
{"train_lr": 0.00020161100844177222, "train_loss": 3.4549207411033453, "epoch": 143, "n_parameters": 22050664}
{"train_lr": 0.00019550488511382814, "train_loss": 3.4348790068134702, "epoch": 144, "n_parameters": 22050664}
{"train_lr": 0.00018947512507439562, "train_loss": 3.4291364775239517, "epoch": 145, "n_parameters": 22050664}
{"train_lr": 0.00018352321607656278, "train_loss": 3.428964727776323, "epoch": 146, "n_parameters": 22050664}
{"train_lr": 0.00017765062666479713, "train_loss": 3.4251757884959426, "epoch": 147, "n_parameters": 22050664}
{"train_lr": 0.00017185880581266342, "train_loss": 3.4216424423775416, "epoch": 148, "n_parameters": 22050664}
{"train_lr": 0.00016614918256530037, "train_loss": 3.4057335008343728, "test_loss": 1.0441676331434213, "test_acc1": 75.92000228515624, "test_acc5": 93.12000247070313, "epoch": 149, "n_parameters": 22050664}
{"train_lr": 0.0001605231656868015, "train_loss": 3.4018312994477085, "epoch": 150, "n_parameters": 22050664}
{"train_lr": 0.00015498214331266302, "train_loss": 3.3968590074758547, "epoch": 151, "n_parameters": 22050664}
{"train_lr": 0.0001495274826072216, "train_loss": 3.384095481152443, "epoch": 152, "n_parameters": 22050664}
{"train_lr": 0.00014416052942639815, "train_loss": 3.367812543607158, "epoch": 153, "n_parameters": 22050664}
{"train_lr": 0.000138882607985586, "train_loss": 3.365708000404086, "epoch": 154, "n_parameters": 22050664}
{"train_lr": 0.00013369502053292505, "train_loss": 3.354487799792934, "epoch": 155, "n_parameters": 22050664}
{"train_lr": 0.00012859904702798252, "train_loss": 3.352311377223733, "epoch": 156, "n_parameters": 22050664}
{"train_lr": 0.0001235959448259827, "train_loss": 3.3401191960231102, "epoch": 157, "n_parameters": 22050664}
{"train_lr": 0.0001186869483675294, "train_loss": 3.338969543028316, "epoch": 158, "n_parameters": 22050664}
{"train_lr": 0.00011387326887403272, "train_loss": 3.3288807266121574, "epoch": 159, "n_parameters": 22050664}
{"train_lr": 0.00010915609404889089, "train_loss": 3.3180156576333286, "epoch": 160, "n_parameters": 22050664}
{"train_lr": 0.00010453658778440302, "train_loss": 3.321174738897408, "epoch": 161, "n_parameters": 22050664}
{"train_lr": 0.00010001588987461343, "train_loss": 3.2937839920286365, "epoch": 162, "n_parameters": 22050664}
{"train_lr": 9.559511573409267e-05, "train_loss": 3.2993596947545725, "epoch": 163, "n_parameters": 22050664}
{"train_lr": 9.12753561227054e-05, "train_loss": 3.2995029770903925, "epoch": 164, "n_parameters": 22050664}
{"train_lr": 8.705767687650155e-05, "train_loss": 3.284530080074696, "epoch": 165, "n_parameters": 22050664}
{"train_lr": 8.29431186447221e-05, "train_loss": 3.2844199677356047, "epoch": 166, "n_parameters": 22050664}
{"train_lr": 7.893269663304691e-05, "train_loss": 3.2665358206017507, "epoch": 167, "n_parameters": 22050664}
{"train_lr": 7.50274003530937e-05, "train_loss": 3.261560802575019, "epoch": 168, "n_parameters": 22050664}
{"train_lr": 7.122819337828824e-05, "train_loss": 3.2592836789828508, "epoch": 169, "n_parameters": 22050664}
{"train_lr": 6.75360131060965e-05, "train_loss": 3.251781676908572, "epoch": 170, "n_parameters": 22050664}
{"train_lr": 6.395177052675899e-05, "train_loss": 3.254208669685822, "epoch": 171, "n_parameters": 22050664}
{"train_lr": 6.047634999849368e-05, "train_loss": 3.2304268911135474, "epoch": 172, "n_parameters": 22050664}
{"train_lr": 5.7110609029320316e-05, "train_loss": 3.239149059644706, "epoch": 173, "n_parameters": 22050664}
{"train_lr": 5.385537806545422e-05, "train_loss": 3.2260327472699157, "test_loss": 0.9626575089505806, "test_acc1": 77.9320023486328, "test_acc5": 94.0360026171875, "epoch": 174, "n_parameters": 22050664}
{"train_lr": 5.0711460286429e-05, "train_loss": 3.2263898661168073, "epoch": 175, "n_parameters": 22050664}
{"train_lr": 4.767963140691428e-05, "train_loss": 3.2220385019108355, "epoch": 176, "n_parameters": 22050664}
{"train_lr": 4.476063948531632e-05, "train_loss": 3.211318061124983, "epoch": 177, "n_parameters": 22050664}
{"train_lr": 4.195520473921506e-05, "train_loss": 3.210434863035627, "epoch": 178, "n_parameters": 22050664}
{"train_lr": 3.926401936765786e-05, "train_loss": 3.2052426848361057, "epoch": 179, "n_parameters": 22050664}
{"train_lr": 3.66877473803659e-05, "train_loss": 3.194936732772729, "epoch": 180, "n_parameters": 22050664}
{"train_lr": 3.4227024433899046e-05, "train_loss": 3.1995563340796935, "epoch": 181, "n_parameters": 22050664}
{"train_lr": 3.188245767482609e-05, "train_loss": 3.1951332394953824, "epoch": 182, "n_parameters": 22050664}
{"train_lr": 2.9654625589913007e-05, "train_loss": 3.1808865092855565, "epoch": 183, "n_parameters": 22050664}
{"train_lr": 2.7544077863389885e-05, "train_loss": 3.181196793163423, "epoch": 184, "n_parameters": 22050664}
{"train_lr": 2.55513352413271e-05, "train_loss": 3.175809731491083, "epoch": 185, "n_parameters": 22050664}
{"train_lr": 2.367688940314948e-05, "train_loss": 3.172979227287306, "epoch": 186, "n_parameters": 22050664}
{"train_lr": 2.192120284031953e-05, "train_loss": 3.1778069079565485, "epoch": 187, "n_parameters": 22050664}
{"train_lr": 2.028470874222617e-05, "train_loss": 3.165040424413723, "epoch": 188, "n_parameters": 22050664}
{"train_lr": 1.876781088929933e-05, "train_loss": 3.1578869402623004, "epoch": 189, "n_parameters": 22050664}
{"train_lr": 1.7370883553386852e-05, "train_loss": 3.1697809523243983, "epoch": 190, "n_parameters": 22050664}
{"train_lr": 1.609427140540658e-05, "train_loss": 3.1606179392761846, "epoch": 191, "n_parameters": 22050664}
{"train_lr": 1.4938289430304017e-05, "train_loss": 3.159473898456537, "epoch": 192, "n_parameters": 22050664}
{"train_lr": 1.3903222849333426e-05, "train_loss": 3.1616512115219897, "epoch": 193, "n_parameters": 22050664}
{"train_lr": 1.2989327049686034e-05, "train_loss": 3.143136017661777, "epoch": 194, "n_parameters": 22050664}
{"train_lr": 1.2196827521475628e-05, "train_loss": 3.1501416968141527, "epoch": 195, "n_parameters": 22050664}
{"train_lr": 1.1525919802101344e-05, "train_loss": 3.150686197477184, "epoch": 196, "n_parameters": 22050664}
{"train_lr": 1.0976769428005425e-05, "train_loss": 3.149354827239645, "epoch": 197, "n_parameters": 22050664}
{"train_lr": 1.0549511893824651e-05, "train_loss": 3.1480970263695545, "epoch": 198, "n_parameters": 22050664}
{"train_lr": 1.0244252618963044e-05, "train_loss": 3.1423607404283485, "test_loss": 0.9316812765666809, "test_acc1": 78.47200244628907, "test_acc5": 94.39400260742188, "epoch": 199, "n_parameters": 22050664}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment