Created
December 21, 2017 16:03
-
-
Save kedarbellare/764b16e813d5e643a1b14c52f53d08ee to your computer and use it in GitHub Desktop.
Output of training a BiLSTM model on movie-review sentiment data using GloVe vectors
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
$ lein with-profile main-sentclass run --model-type bilstm --num-data 8000 --embed-file data/glove.6B.300d.txt --emb-size 300
Reflection warning, /private/var/folders/cg/mm4fc_4j3_96tm1fpqkm4v5w0000gn/T/form-init2811519414259970652.clj:1:1201 - call to static method invokeStaticMethod on clojure.lang.Reflector can't be resolved (argument types: unknown, java.lang.String, unknown). | |
WARNING: any? already refers to: #'clojure.core/any? in namespace: vertigo.core, being replaced by: #'vertigo.core/any? | |
{:train-file data/sentiment-train10k.txt, :test-file data/sentiment-test10k.txt, :embed-file data/glove.6B.300d.txt, :num-classes 2, :emb-size 300, :model-type :bilstm, :lstm-size 25, :num-data 8000} | |
Params ([lstm/input->gates/b [200]] [hidden->logits/W [2 50]] [lstm/input->gates/W [200 650]] [hidden->logits/b [2]]) | |
Total # params 130302 | |
Optimizing with flare.optimize.Adadelta | |
SLF4J: Failed to load class "org.slf4j.impl.StaticLoggerBinder". | |
SLF4J: Defaulting to no-operation (NOP) logger implementation | |
SLF4J: See http://www.slf4j.org/codes.html#StaticLoggerBinder for further details. | |
Iteration 0 | |
{:train-accuracy {:acc 0.79275, :n 8000}} | |
{:test-accuracy {:acc 0.79275, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.2338297386565726, :backward 0.35450095916002544}] | |
[:hadamard | |
{:forward 0.038903537076641716, :backward 0.05569571719368588}] | |
[:split | |
{:forward 0.043522367487013214, :backward 0.041129014182646605}] | |
[:concat | |
{:forward 0.03796264965882638, :backward 0.021459814103749756}] | |
[:tanh | |
{:forward 0.017553832732651688, :backward 0.04130011203848467}] | |
[:sigmoid | |
{:forward 0.028152573241789713, :backward 0.02706570012084407}] | |
[:+ {:forward 0.03294608470531097, :backward 0.019342458756390693}] | |
[:cross-entropy-loss | |
{:forward 0.002285743536311088, :backward 9.358835909925495E-4}] | |
[:dropout | |
{:forward 0.0016734355489546595, :backward 0.0011785801346759772}] | |
[:arg-max {:forward 5.617980744323131E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 0: 4633.645 (110781 ms) | |
Iteration 1 | |
{:train-accuracy {:acc 0.837, :n 8000}} | |
{:test-accuracy {:acc 0.835, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.23397435842799078, :backward 0.35743539676972624}] | |
[:hadamard | |
{:forward 0.03970264272679637, :backward 0.05517143628430263}] | |
[:split | |
{:forward 0.043675474412805025, :backward 0.0408602788732126}] | |
[:tanh | |
{:forward 0.017562911889311212, :backward 0.041219599219211936}] | |
[:concat | |
{:forward 0.03658253637173119, :backward 0.021233171018168906}] | |
[:sigmoid | |
{:forward 0.027950294158732375, :backward 0.027157313580783753}] | |
[:+ {:forward 0.033151837717871904, :backward 0.01919665029798812}] | |
[:dropout | |
{:forward 0.0014283139874683905, :backward 0.0010078108779877977}] | |
[:cross-entropy-loss | |
{:forward 0.001547920071658735, :backward 7.772454679784459E-4}] | |
[:arg-max {:forward 3.6480784627360467E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 1: 3742.246 (108119 ms) | |
Iteration 2 | |
{:train-accuracy {:acc 0.880875, :n 8000}} | |
{:test-accuracy {:acc 0.8735, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.23748740058577844, :backward 0.3543250545613171}] | |
[:hadamard | |
{:forward 0.04042535250858017, :backward 0.05450115532605749}] | |
[:split | |
{:forward 0.044192012562525654, :backward 0.04053169280920947}] | |
[:tanh | |
{:forward 0.01778042960678652, :backward 0.04105267995389415}] | |
[:concat | |
{:forward 0.03651740153582167, :backward 0.02103278213740871}] | |
[:sigmoid | |
{:forward 0.028268076926051086, :backward 0.026857190017891656}] | |
[:+ {:forward 0.03354363118434993, :backward 0.018911585455762298}] | |
[:dropout | |
{:forward 0.001326881737948029, :backward 9.385521297065816E-4}] | |
[:cross-entropy-loss | |
{:forward 0.0012912405403130785, :backward 7.126095573202046E-4}] | |
[:arg-max {:forward 3.042708632778079E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 2: 3161.178 (105517 ms) | |
Iteration 3 | |
{:train-accuracy {:acc 0.92275, :n 8000}} | |
{:test-accuracy {:acc 0.913625, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.23909638946038364, :backward 0.35251191962285683}] | |
[:hadamard | |
{:forward 0.040787953621720135, :backward 0.05428406327110418}] | |
[:split | |
{:forward 0.044485220567761254, :backward 0.040355291584530634}] | |
[:tanh | |
{:forward 0.01791225313066358, :backward 0.04099722864222819}] | |
[:concat | |
{:forward 0.03647886406166629, :backward 0.0209491030373981}] | |
[:sigmoid | |
{:forward 0.02843953248507187, :backward 0.026761526484133626}] | |
[:+ {:forward 0.033796693292296696, :backward 0.018839511941191194}] | |
[:dropout | |
{:forward 0.0012828470574794146, :backward 9.05020014236773E-4}] | |
[:cross-entropy-loss | |
{:forward 0.001163410976056937, :backward 6.815012969134234E-4}] | |
[:arg-max {:forward 2.716694523072207E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 3: 2550.035 (106487 ms) | |
Iteration 4 | |
{:train-accuracy {:acc 0.9515, :n 8000}} | |
{:test-accuracy {:acc 0.937625, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.24025745309774435, :backward 0.3506348041103015}] | |
[:hadamard | |
{:forward 0.040999637525030025, :backward 0.054263302261812876}] | |
[:split | |
{:forward 0.044692949157001415, :backward 0.04029944905893549}] | |
[:tanh | |
{:forward 0.018012453517090125, :backward 0.0410428561191693}] | |
[:concat | |
{:forward 0.036536498655600186, :backward 0.020925821740629288}] | |
[:sigmoid | |
{:forward 0.0285790768318796, :backward 0.026764909688467134}] | |
[:+ {:forward 0.0339522901701443, :backward 0.01885316695401001}] | |
[:dropout | |
{:forward 0.0012903811583394307, :backward 8.880260983102017E-4}] | |
[:cross-entropy-loss | |
{:forward 0.0010879343190806432, :backward 6.660566864062999E-4}] | |
[:arg-max {:forward 2.529328500478E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 4: 1954.412 (106830 ms) | |
Iteration 5 | |
{:train-accuracy {:acc 0.965125, :n 8000}} | |
{:test-accuracy {:acc 0.94925, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.24136594428032793, :backward 0.3495985656744447}] | |
[:hadamard | |
{:forward 0.04116828750170531, :backward 0.05413565570527926}] | |
[:split | |
{:forward 0.04481422531051453, :backward 0.04015554849125716}] | |
[:tanh | |
{:forward 0.018117053156046396, :backward 0.04095726380352636}] | |
[:concat | |
{:forward 0.03653916719754411, :backward 0.020904646698269178}] | |
[:sigmoid | |
{:forward 0.0286519347465072, :backward 0.026682669458032864}] | |
[:+ {:forward 0.03407359499055657, :backward 0.018772632457257087}] | |
[:dropout | |
{:forward 0.0012631910995071131, :backward 8.730873942764248E-4}] | |
[:cross-entropy-loss | |
{:forward 0.001033060499938447, :backward 6.512209057943381E-4}] | |
[:arg-max {:forward 2.4225062921501457E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 5: 1351.601 (107573 ms) | |
Iteration 6 | |
{:train-accuracy {:acc 0.979375, :n 8000}} | |
{:test-accuracy {:acc 0.96425, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.24238432571041604, :backward 0.3480591912069894}] | |
[:hadamard | |
{:forward 0.041269457423607124, :backward 0.054181870681758316}] | |
[:split | |
{:forward 0.04489303967014931, :backward 0.040167914127695714}] | |
[:tanh | |
{:forward 0.018162276335750027, :backward 0.040991061789679935}] | |
[:concat | |
{:forward 0.036529854167468526, :backward 0.020890684016220584}] | |
[:sigmoid | |
{:forward 0.02873359029928581, :backward 0.026825456141668095}] | |
[:+ {:forward 0.034135733364118064, :backward 0.018785246589378517}] | |
[:dropout | |
{:forward 0.0012495665785474896, :backward 8.675115846664764E-4}] | |
[:cross-entropy-loss | |
{:forward 9.961935334161457E-4, :backward 6.444308271595969E-4}] | |
[:arg-max {:forward 2.3259595202479785E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 6: 934.039 (109306 ms) | |
Iteration 7 | |
{:train-accuracy {:acc 0.9785, :n 8000}} | |
{:test-accuracy {:acc 0.961875, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.24247088104244685, :backward 0.3484212347693487}] | |
[:hadamard | |
{:forward 0.04128891006201954, :backward 0.05406804529362814}] | |
[:split | |
{:forward 0.04490076013249798, :backward 0.04011549593275201}] | |
[:tanh | |
{:forward 0.018168782617389558, :backward 0.04092220849556201}] | |
[:concat | |
{:forward 0.03646313521630789, :backward 0.020880354619546}] | |
[:sigmoid | |
{:forward 0.028710055895463795, :backward 0.026794953245637996}] | |
[:+ {:forward 0.03413165938709586, :backward 0.018742052888751807}] | |
[:dropout | |
{:forward 0.0012350972451970553, :backward 8.58587619119022E-4}] | |
[:cross-entropy-loss | |
{:forward 9.66152634372875E-4, :backward 6.367036689489209E-4}] | |
[:arg-max {:forward 2.2492923391396688E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 7: 727.560 (106857 ms) | |
Iteration 8 | |
{:train-accuracy {:acc 0.99225, :n 8000}} | |
{:test-accuracy {:acc 0.972625, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.2427920937665831, :backward 0.3485124195892605}] | |
[:hadamard | |
{:forward 0.04129396058884055, :backward 0.053967769827668724}] | |
[:split | |
{:forward 0.04492732887536577, :backward 0.040044051258747125}] | |
[:tanh | |
{:forward 0.018175402874258294, :backward 0.04086448199387627}] | |
[:concat | |
{:forward 0.036396567781483945, :backward 0.02087765285964186}] | |
[:sigmoid | |
{:forward 0.02871313240028372, :backward 0.026747622821622703}] | |
[:+ {:forward 0.03411235543241738, :backward 0.018703588724487897}] | |
[:dropout | |
{:forward 0.0012245028454994106, :backward 8.533725900835347E-4}] | |
[:cross-entropy-loss | |
{:forward 9.433877175581861E-4, :backward 6.315251193155914E-4}] | |
[:arg-max {:forward 2.1878293300550434E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 8: 496.482 (108328 ms) | |
Iteration 9 | |
{:train-accuracy {:acc 0.993125, :n 8000}} | |
{:test-accuracy {:acc 0.97375, :n 8000}} | |
{:debug | |
{:perf | |
([:* {:forward 0.2430087402503307, :backward 0.3482022223967197}] | |
[:hadamard | |
{:forward 0.04138163898775469, :backward 0.05389910879308368}] | |
[:split | |
{:forward 0.044976606829269454, :backward 0.04003487956085481}] | |
[:tanh | |
{:forward 0.018194989854637265, :backward 0.04085962070348915}] | |
[:concat | |
{:forward 0.036408509865430976, :backward 0.02086718648098555}] | |
[:sigmoid | |
{:forward 0.0287191342318726, :backward 0.026749580517026136}] | |
[:+ {:forward 0.034176155717576276, :backward 0.01868977920727521}] | |
[:dropout | |
{:forward 0.0012154442270910777, :backward 8.479320952876777E-4}] | |
[:cross-entropy-loss | |
{:forward 9.271056478826494E-4, :backward 6.27326508187013E-4}] | |
[:arg-max {:forward 2.140381252453742E-4, :backward 0.0}] | |
[:scale {:forward 0.0, :backward 0.0}] | |
[:exp {:forward 0.0, :backward 0.0}] | |
[:strech {:forward 0.0, :backward 0.0}] | |
[:max {:forward 0.0, :backward 0.0}] | |
[:squeeze {:forward 0.0, :backward 0.0}] | |
[:sum-elems {:forward 0.0, :backward 0.0}])}} | |
End of iteration 9: 367.994 (105766 ms) |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment