import os

# each output is (batch size, feature dim, spatial dim)

[('data', (1000, 1, 36, 60)),
 ('label', (1000, 6)),
 ('gaze', (1000, 3)),
 ('headpose', (1000, 3)),
 ('conv1', (1000, 20, 32, 56)),
 ('pool1', (1000, 20, 16, 28)),
 ('conv2', (1000, 50, 12, 24)),
 ('pool2', (1000, 50, 6, 12)),
 ('ip1', (1000, 500)),
 ('cat', (1000, 503)),
 ('ip2', (1000, 3)),
 ('loss', ())]

# just print the weight sizes (not biases)

[('conv1', (20, 1, 5, 5)),
 ('conv2', (50, 20, 5, 5)),
 ('ip1', (500, 3600)),
 ('ip2', (3, 503))]

solver.net.forward()  # train net

{'loss': array(0.5101643800735474, dtype=float32)}

# we use a little trick to tile the first eight images

[[ -2.44513273e-01   5.20949736e-02  -9.68245506e-01  -5.07045567e-01
   -1.12138920e-01  -2.90884897e-02]
 [ -7.41908699e-02   2.27922529e-01  -9.70848620e-01  -1.28387764e-01
    1.65355857e-02   1.06296828e-03]
 [ -1.74087971e-01   3.04691344e-02  -9.84258592e-01  -9.52000245e-02
   -3.14195365e-01  -1.50917871e-02]
 [ -2.49744281e-02   1.77879885e-01  -9.83735263e-01  -7.38587156e-02
   -1.21144764e-02  -4.47588827e-04]
 [ -1.61419377e-01   5.79187945e-02  -9.85184848e-01  -1.06810793e-01
    1.42905980e-01   7.65229668e-03]
 [ -1.52415037e-01   2.09456533e-01  -9.65866268e-01  -5.29863574e-02
   -1.14266567e-01  -3.03129526e-03]
 [ -1.76816806e-02   6.62708879e-02  -9.97644961e-01  -6.35477304e-02
   -2.95568883e-01  -9.46362782e-03]
 [  1.79661021e-01   2.34958977e-01  -9.55257118e-01  -8.40480402e-02
    1.60711512e-01   6.77234307e-03]]

solver.step(1)

imshow(solver.net.params['conv1'][0].diff[:, 0].reshape(4, 5, 5, 5)

<matplotlib.image.AxesImage at 0x7f3cbc4fc290>

Show the conv1 weights pics.

%%time

Iteration 0
Iteration 25
Iteration 50
Iteration 75
Iteration 100
Iteration 125
Iteration 150
Iteration 175
Iteration 200
Iteration 225
Iteration 250
Iteration 275
Iteration 300
Iteration 325
Iteration 350
Iteration 375
Iteration 400
Iteration 425
Iteration 450
Iteration 475
CPU times: user 32.3 s, sys: 4.66 s, total: 36.9 s
Wall time: 36.9 s

_, ax1 = subplots()

<matplotlib.text.Text at 0x7f3cbeb36d90>

**show you the train loss curve.

num_test = 20

[-0.05740207  0.26108676 -0.96360713] label<->ip2 [-0.10422539  0.16509452 -0.93686533]
[-0.05108735  0.33534154 -0.94071043] label<->ip2 [-0.25041708  0.18521631 -0.9361276 ]
[ 0.14314307  0.08807883 -0.98577493] label<->ip2 [ 0.00178884  0.09841065 -0.96245277]
[ 0.14494585  0.10631151 -0.9837116 ] label<->ip2 [-0.10024959  0.11104928 -0.93721461]
[ 0.07297696  0.09071066 -0.99319983] label<->ip2 [-0.0581101   0.09164033 -0.95781732]
[-0.22788107  0.33246592 -0.91517025] label<->ip2 [-0.31594035  0.19744298 -0.93812776]
[ 0.11161654  0.03402296 -0.99316877] label<->ip2 [-0.0754093   0.0890121  -0.95794833]
[ 0.16556081  0.14849275 -0.97495615] label<->ip2 [ 0.01194712  0.11699522 -0.95868605]
[ 0.22707051  0.11209575 -0.96740556] label<->ip2 [ 0.06209523  0.04362224 -0.94721079]
[-0.26985002  0.27037239 -0.92416435] label<->ip2 [-0.2470575   0.12694712 -0.91398209]
[ 0.186772    0.03520598 -0.98177224] label<->ip2 [ 0.10427623  0.06089177 -0.95213568]
[ 0.25852728 -0.02351192 -0.96571779] label<->ip2 [-0.05272117  0.14147422 -0.92849791]
[ 0.04857407  0.20633523 -0.97727495] label<->ip2 [-0.0877868   0.18057725 -0.94327462]
[ 0.22813955  0.2115647  -0.95036453] label<->ip2 [ 0.04242265  0.13245447 -0.95119071]
[ 0.22677779  0.18486373 -0.95624119] label<->ip2 [-0.00176571  0.0784395  -0.94786465]
[ 0.16038546  0.30930048 -0.93734181] label<->ip2 [ 0.07084656  0.213103   -0.93380082]
[-0.25437474  0.04642556 -0.96599078] label<->ip2 [-0.31199673  0.06233154 -0.94071221]
[-0.01042224  0.20404638 -0.97890574] label<->ip2 [-0.11482257  0.12694134 -0.95108247]
[-0.268558    0.2635223  -0.92651635] label<->ip2 [-0.20304951  0.16384324 -0.95930922]
[-0.22500102  0.28130114 -0.93286884] label<->ip2 [-0.2839283   0.0932559  -0.94048727]
0.0121220568454 0.0622909313362 0.0206316891713 0.0623052168533 0.0184366047861 0.0265126769845 0.0392429523873 0.0248539803716 0.0323132961798 0.0211939856687 0.00834363794539 0.125481342432 0.0204137831727 0.0407498777752 0.0636284110556 0.0172837099069 0.0042122994471 0.0176187526438 0.0153026472347 0.0388914749171

<matplotlib.text.Text at 0x7f3cbcaac310>

imshow(solver.net.params['conv1'][0].diff[:, 0].reshape(4, 5, 5, 5)

<matplotlib.image.AxesImage at 0x7f3cbc64f810>

x

<matplotlib.image.AxesImage at 0x7f3cbc56cfd0>

figure(figsize=(20, 10))

<matplotlib.image.AxesImage at 0x7f3cbc456710>

figure(figsize=(50, 25))

<matplotlib.image.AxesImage at 0x7f3cbc2c8b10>

​