# FUNCTION GENERATOR using Policy Gradient

Useful links:
Policy Gradient Explanation: http://karpathy.github.io/2016/05/31/rl/ <br>
Example of Policy Gradient: https://github.com/keon/policy-gradient

In [1]:
import numpy as np
from keras.models import Sequential, Model
from keras.layers import TimeDistributed, Dense, Reshape, Flatten, GRU, Input, Embedding
from keras.optimizers import Adam
from keras.layers.convolutional import Convolution2D
from PolicyGradientModel import PolicyGradientModel
from RewardCalculator import RewardCalculator

Using TensorFlow backend.


In [2]:
ALLOWED_PARAMETERS = list('XY')
ALLOWED_SYMBOLS = ALLOWED_PARAMETERS + list('0123456789+-*/#')
NUM_SYMBOLS = len(ALLOWED_SYMBOLS)
MAX_LENGTH = 10 # Max length of the output expression
CORRECT_EXPRESSION = "3*X+2*Y"

### DEFINE MODEL

In [3]:
def getModel():
    # Trying to neglect input
    input1 = Input(shape=(1,1))
    # TODO: Add noise layer to make output vary
    x = GRU(128)(input1)
    x = Dense(100, activation='relu')(x)
    x = Dense(100, activation='relu')(x)
    out = Dense(NUM_SYMBOLS, activation='sigmoid')(x)
    model = Model(inputs=input1, outputs=out)
    model.compile(optimizer=Adam(lr=0.00001),
                loss='categorical_crossentropy')
    return model

In [None]:
setting = []
setting.append([0.0,0.6,-0.0,0.05,-0.7]) # Converge to Number + Math Symbol

In [None]:
rewardCalculator = RewardCalculator(correctExpression=CORRECT_EXPRESSION,
                                    parameters=ALLOWED_PARAMETERS,
                                    functionDifferenceRewardWeight=0.0,
                                    compilableRewardWeight=1, 
                                    lengthRewardWeight=-0.00,
                                    foundMathSymbolWeight=0.00,
                                    foundVariableWeight=0.0,
                                    rewardOffset=0.0,
                                    usingFile=False)

In [None]:
model = getModel()
pgModel = PolicyGradientModel(model=model,
                              allowedSymbol=ALLOWED_SYMBOLS,
                              numSymbol=NUM_SYMBOLS,
                              maxLength=MAX_LENGTH,
                              rewardCalculator=rewardCalculator,
                              learningRate=0.00001,
                              fileName="Number.hdf5")

In [None]:
pgModel.train(input=np.ones((1,1,1)))

In [4]:
rewardCalculator = RewardCalculator(correctExpression=CORRECT_EXPRESSION,
                                    parameters=ALLOWED_PARAMETERS,
                                    functionDifferenceRewardWeight=0.0,
                                    compilableRewardWeight=0.60, 
                                    lengthRewardWeight=-0.01,
                                    foundMathSymbolWeight=0.1,
                                    foundVariableWeight=0.5,
                                    rewardOffset=-0.7,
                                    usingFile=False)

In [5]:
model = getModel()
pgModel = PolicyGradientModel(model=model,
                              allowedSymbol=ALLOWED_SYMBOLS,
                              numSymbol=NUM_SYMBOLS,
                              maxLength=MAX_LENGTH,
                              rewardCalculator=rewardCalculator,
                              learningRate=0.000001,
                              fileName="Number_FoundSymbol.hdf5")

In [None]:
pgModel.loadWeight("Number_FoundSymbol.hdf5")

In [6]:
pgModel.train(input=np.ones((1,1,1)))

Epoch: 0	Loss: 24.109960556	Example Output: X526	Example Reward:  -0.3
[[ 0.4982734   0.50277507  0.49818498  0.51301628  0.50358164  0.49870691
   0.49689391  0.50190926  0.4942376   0.50579143  0.49995667  0.50182897
   0.50406724  0.49372408  0.50085878  0.49927068  0.49681947]]
Saving Weight
Epoch: 1	Loss: 24.1100381851	Example Output: 847X2	Example Reward:  -0.3
[[ 0.49827743  0.50277013  0.49818841  0.51302427  0.50359291  0.49870399
   0.49689081  0.50190431  0.49423778  0.50580525  0.49995059  0.50182444
   0.50407195  0.49372739  0.50085354  0.49926662  0.49681771]]
Epoch: 2	Loss: 24.1101678848	Example Output: -1Y-2X923/	Example Reward:  -0.3
[[ 0.4982824   0.50277144  0.49819538  0.51303768  0.50360817  0.4987008
   0.49688911  0.5019061   0.49423209  0.50582629  0.4999516   0.50182039
   0.5040831   0.49373111  0.50085425  0.49926734  0.49682382]]
Epoch: 3	Loss: 24.1102794647	Example Output: +*53+X70	Example Reward:  -0.3
[[ 0.49828103  0.50276953  0.49819526  0.51304543  0.

Epoch: 29	Loss: 24.1049396515	Example Output: 2/8YY599/5	Example Reward:  -0.3
[[ 0.49799463  0.50242591  0.49806121  0.51359349  0.50405633  0.49853861
   0.49632153  0.50132328  0.4940353   0.5064972   0.49937642  0.50137591
   0.50448728  0.49366021  0.50043827  0.49898076  0.49704584]]
Epoch: 30	Loss: 24.1052757263	Example Output: -9Y965*94-	Example Reward:  -0.3
[[ 0.49799925  0.50241822  0.49806359  0.51361936  0.50408667  0.49853477
   0.49631247  0.50131792  0.49401665  0.50652528  0.49937102  0.50135326
   0.50450462  0.49365917  0.50041991  0.49897629  0.4970631 ]]
Saving Weight
Epoch: 31	Loss: 24.1051912308	Example Output: 9-02	Example Reward:  -0.3
[[ 0.49799344  0.5024007   0.49806684  0.51363158  0.50410926  0.49852723
   0.4963018   0.50129801  0.49400708  0.50655371  0.49935365  0.50133491
   0.50452721  0.49366224  0.50039071  0.49895683  0.4970628 ]]
Epoch: 32	Loss: 24.1049442291	Example Output: -/7+X959*X	Example Reward:  -0.3
[[ 0.49797559  0.50238532  0.49806228  0

Epoch: 58	Loss: 24.1054759979	Example Output: 0//9	Example Reward:  0.06
[[ 0.49798459  0.50215983  0.49800101  0.51449126  0.50503403  0.49837631
   0.4957962   0.500669    0.49368054  0.50754207  0.49878952  0.5006507
   0.50518793  0.49375802  0.50003952  0.49873233  0.49744776]]
Epoch: 59	Loss: 24.105437088	Example Output: Y572/26Y37	Example Reward:  -0.3
[[ 0.49796543  0.50213599  0.49800149  0.51452053  0.50506353  0.49836776
   0.49576879  0.50063914  0.49366987  0.50756991  0.49876601  0.50063324
   0.50520873  0.49375889  0.50002581  0.49872148  0.49747118]]
Epoch: 60	Loss: 24.1051271439	Example Output: 94*	Example Reward:  -0.3
[[ 0.49795738  0.50211221  0.49799344  0.51453954  0.50509691  0.4983564
   0.4957498   0.50061047  0.49366125  0.50759745  0.49873453  0.50060302
   0.50522298  0.49375552  0.49999225  0.49870706  0.4974764 ]]
Saving Weight
Epoch: 61	Loss: 24.1050138474	Example Output: 1987+	Example Reward:  -0.3
[[ 0.49795243  0.50209677  0.49798399  0.5145607   0.50

Epoch: 88	Loss: 24.1029409409	Example Output: 	Example Reward:  -0.3
[[ 0.49784094  0.50157177  0.49796188  0.51545042  0.50605786  0.49811387
   0.49513555  0.49991393  0.49325323  0.508587    0.49793893  0.49998671
   0.50591522  0.49364656  0.49994725  0.49837169  0.49777576]]
Epoch: 89	Loss: 24.1032341003	Example Output: ++/-*97933	Example Reward:  -0.3
[[ 0.49785218  0.50155938  0.49796686  0.5154916   0.50609875  0.49811611
   0.49513313  0.49991727  0.49323341  0.50862014  0.4979316   0.49998403
   0.50594735  0.49364853  0.49994612  0.4983674   0.4978101 ]]
Epoch: 90	Loss: 24.103645134	Example Output: 9/+6	Example Reward:  0.06
[[ 0.49788231  0.50154024  0.49797499  0.51553667  0.50615054  0.49811825
   0.49512219  0.4999187   0.49321699  0.50865287  0.49791542  0.49998575
   0.50598097  0.49365604  0.49995446  0.49837387  0.49783096]]
Saving Weight
Epoch: 91	Loss: 24.1044019699	Example Output: 785/6-4/54	Example Reward:  0.10000000000000009
[[ 0.49791896  0.50153655  0.4979842

Epoch: 117	Loss: 24.100761795	Example Output: 9X*9*823Y1	Example Reward:  -0.3
[[ 0.49764898  0.50092536  0.49768215  0.51659322  0.50707853  0.49778718
   0.49438709  0.49959621  0.49297348  0.50938767  0.49724114  0.49966958
   0.50676441  0.49326938  0.49982566  0.4979941   0.49791345]]
Epoch: 118	Loss: 24.1008619308	Example Output: X1Y	Example Reward:  -0.3
[[ 0.49765122  0.50090873  0.49766728  0.51664537  0.50711066  0.49777868
   0.49436945  0.49959865  0.49295178  0.50943041  0.49722126  0.49965459
   0.5068146   0.49325725  0.49983442  0.49796921  0.4979341 ]]
Epoch: 119	Loss: 24.1009065628	Example Output: 98067Y/+-9	Example Reward:  -0.3
[[ 0.49766621  0.50089318  0.49763352  0.51669896  0.50714374  0.49777496
   0.49435353  0.49958822  0.49293211  0.50946146  0.49719119  0.49963108
   0.50684595  0.49323434  0.49983203  0.49794355  0.49794218]]
Epoch: 120	Loss: 24.1008117676	Example Output: 9-6+393/29	Example Reward:  0.10000000000000009
[[ 0.49766946  0.50088727  0.49761885

Epoch: 146	Loss: 24.0974691391	Example Output: 7404639	Example Reward:  -0.17
[[ 0.4974274   0.50029224  0.49744818  0.51767731  0.5080387   0.49752915
   0.49353775  0.49919567  0.49257493  0.51018959  0.496326    0.4992696
   0.50751185  0.4930445   0.49980724  0.49751958  0.49836493]]
Epoch: 147	Loss: 24.0981330872	Example Output: 	Example Reward:  -0.3
[[ 0.49741608  0.5002749   0.49745321  0.51773089  0.50808662  0.49751839
   0.49350449  0.49919248  0.49257991  0.51022238  0.49629721  0.49926591
   0.50753802  0.49304625  0.49983782  0.49751556  0.49838981]]
Epoch: 148	Loss: 24.098184967	Example Output: 43+6YX7	Example Reward:  -0.3
[[ 0.49740481  0.50025129  0.4974325   0.51777279  0.50811774  0.49750718
   0.49345994  0.49918273  0.49257094  0.51024878  0.49624154  0.49924386
   0.50755841  0.49303901  0.49984032  0.4975026   0.49843991]]
Epoch: 149	Loss: 24.0977733612	Example Output: 557Y0XXX6	Example Reward:  -0.3
[[ 0.4973959   0.50022691  0.49742058  0.51778883  0.50815439 

Epoch: 175	Loss: 24.0949523926	Example Output: 1	Example Reward:  -0.10999999999999999
[[ 0.4972952   0.49989828  0.49710777  0.51857394  0.5091489   0.49700892
   0.49257979  0.49888787  0.49206793  0.51124823  0.4954516   0.49879792
   0.50828511  0.49269724  0.49973801  0.49703753  0.49882805]]
Epoch: 176	Loss: 24.0942340851	Example Output: /11Y571349	Example Reward:  -0.3
[[ 0.49728751  0.49988803  0.49708137  0.51861393  0.50917149  0.4969942
   0.49253097  0.49886259  0.49204463  0.51123345  0.49540421  0.49878073
   0.50828248  0.49265662  0.49973515  0.4970085   0.49883887]]
Epoch: 177	Loss: 24.0938621521	Example Output: 9+X07Y16Y7	Example Reward:  -0.3
[[ 0.49727032  0.49987367  0.49706712  0.51867509  0.50919771  0.49697801
   0.49249798  0.49883163  0.49202943  0.51123774  0.49537131  0.49878749
   0.50828302  0.49263579  0.49973467  0.49701279  0.49885631]]
Epoch: 178	Loss: 24.0934972763	Example Output: 	Example Reward:  -0.3
[[ 0.49725747  0.49986222  0.49704343  0.5187072

Epoch: 204	Loss: 24.0938711166	Example Output: /9	Example Reward:  -0.3
[[ 0.4970693   0.49977657  0.49679109  0.51974577  0.51002997  0.4965665
   0.49176061  0.49857298  0.49155959  0.51214939  0.49474317  0.49856007
   0.50881535  0.49221599  0.49992543  0.49688423  0.49928612]]
Epoch: 205	Loss: 24.0934652328	Example Output: X/0846Y897	Example Reward:  -0.3
[[ 0.49705216  0.49975526  0.4967491   0.51974618  0.51003432  0.49654728
   0.49171981  0.49855164  0.49154013  0.51216376  0.49468085  0.49853411
   0.50881833  0.49218464  0.49988797  0.49686009  0.49931455]]
Epoch: 206	Loss: 24.0928501129	Example Output: *58YY-/71	Example Reward:  -0.3
[[ 0.49705723  0.49974346  0.49673074  0.51975626  0.51005298  0.49654597
   0.49169582  0.49853837  0.49151886  0.51218396  0.49464849  0.49851692
   0.50883245  0.4921709   0.4998683   0.49685171  0.49932131]]
Epoch: 207	Loss: 24.0923303604	Example Output: +2*6896928	Example Reward:  5.55111512313e-17
[[ 0.49704409  0.4997392   0.49670532  0.

Epoch: 232	Loss: 24.0875644684	Example Output: YY9X1154Y*	Example Reward:  -0.3
[[ 0.49680147  0.49956551  0.49635246  0.52065182  0.51085931  0.49611712
   0.49080446  0.49810085  0.49101752  0.51295614  0.49392891  0.49800491
   0.50948685  0.4917537   0.49983007  0.49629563  0.4997206 ]]
Epoch: 233	Loss: 24.0876634598	Example Output: 35	Example Reward:  -0.12
[[ 0.49682581  0.49957174  0.49635571  0.52071631  0.51092088  0.49608883
   0.4907707   0.49808192  0.49098101  0.5130102   0.49390814  0.49798977
   0.50952899  0.49174795  0.49984103  0.49628359  0.49974114]]
Epoch: 234	Loss: 24.0882329941	Example Output: -0-433**7*	Example Reward:  -0.3
[[ 0.49684337  0.49957108  0.49636418  0.52077609  0.51097894  0.49606746
   0.49074578  0.49807942  0.49095476  0.51306236  0.49389842  0.49797913
   0.50957972  0.49173754  0.4998568   0.49627978  0.49975514]]
Epoch: 235	Loss: 24.0882822037	Example Output: /66Y--/74	Example Reward:  -0.3
[[ 0.49684843  0.49954849  0.49635506  0.52081352  0

Epoch: 261	Loss: 24.0822048187	Example Output: 8*98770012	Example Reward:  -0.1
[[ 0.4966715   0.49927175  0.49637333  0.52191907  0.51223212  0.49547964
   0.4894405   0.49753067  0.49026394  0.51383972  0.49271679  0.49746329
   0.51028216  0.49134532  0.49981785  0.49556881  0.50012285]]
Epoch: 262	Loss: 24.0820142746	Example Output: 	Example Reward:  -0.3
[[ 0.49667522  0.49926561  0.49640706  0.52195621  0.51228428  0.49544457
   0.48941606  0.49751851  0.49024096  0.51388884  0.49270383  0.49744996
   0.51032007  0.49133813  0.49981672  0.49555403  0.50014913]]
Epoch: 263	Loss: 24.0823062897	Example Output: 4YY7-94*YY	Example Reward:  -0.3
[[ 0.49665946  0.49925154  0.49643454  0.52200109  0.512335    0.49540403
   0.48938301  0.49750605  0.49021414  0.5139485   0.49267489  0.49742836
   0.51036549  0.49131522  0.49982309  0.49553618  0.50020146]]
Epoch: 264	Loss: 24.0822608948	Example Output: 015832/722	Example Reward:  -0.3
[[ 0.49663687  0.49924952  0.49643397  0.52205372  0.5

Epoch: 291	Loss: 24.0769376755	Example Output: 08612*00	Example Reward:  -0.3
[[ 0.49646327  0.49892923  0.49644589  0.52308476  0.5135591   0.4947077
   0.48823696  0.4969587   0.48972869  0.5150066   0.4917371   0.49693778
   0.51110369  0.49082837  0.49972406  0.4948841   0.50035006]]
Epoch: 292	Loss: 24.0772628784	Example Output: 7765987X2*	Example Reward:  -0.3
[[ 0.4964543   0.4989121   0.4964591   0.5231207   0.51360178  0.49469334
   0.48821199  0.49694574  0.48971292  0.51504797  0.49173456  0.49694121
   0.51113313  0.49081662  0.49972203  0.49487847  0.50037545]]
Epoch: 293	Loss: 24.0773899078	Example Output: 4875	Example Reward:  -0.14
[[ 0.49644524  0.49890882  0.49646944  0.5231598   0.51366067  0.49467373
   0.48817116  0.4969272   0.48969668  0.51510584  0.49171796  0.49694344
   0.51117706  0.49082118  0.49974132  0.49486727  0.50039929]]
Epoch: 294	Loss: 24.0776874542	Example Output: 9/13	Example Reward:  -0.04000000000000001
[[ 0.49643829  0.498889    0.49648592  0.5

Epoch: 319	Loss: 24.0776151657	Example Output: 0Y0-	Example Reward:  -0.3
[[ 0.49634138  0.49866319  0.49656609  0.52434498  0.51498258  0.49406692
   0.48711774  0.49643749  0.48921239  0.5163157   0.49097499  0.49660218
   0.51194906  0.4904592   0.49975705  0.49443612  0.50063086]]
Epoch: 320	Loss: 24.0770498276	Example Output: 180803638*	Example Reward:  -0.3
[[ 0.49632376  0.49864346  0.49659052  0.52436209  0.5150311   0.49401519
   0.4870967   0.49640375  0.48922339  0.5163542   0.4909389   0.49658948
   0.51197261  0.49045718  0.49974716  0.49441776  0.50061554]]
Saving Weight
Epoch: 321	Loss: 24.0770290375	Example Output: 6*1005/+75	Example Reward:  0.10000000000000009
[[ 0.49631342  0.49862349  0.49663222  0.5243969   0.51507831  0.49396044
   0.48707867  0.49636897  0.4892132   0.5164023   0.49091044  0.49658936
   0.51201367  0.49045008  0.49974394  0.49439806  0.50060338]]
Epoch: 322	Loss: 24.0770553589	Example Output: 18-604645Y	Example Reward:  -0.3
[[ 0.49630979  0.4986

Epoch: 348	Loss: 24.0709482193	Example Output: *79/-/1812	Example Reward:  -0.3
[[ 0.4961144   0.49816155  0.49663028  0.52557439  0.51629668  0.49334127
   0.4859173   0.4956584   0.48857927  0.51732266  0.48992342  0.49613482
   0.51284683  0.48996639  0.4996593   0.49369204  0.50086761]]
Epoch: 349	Loss: 24.0708631516	Example Output: X	Example Reward:  0.39
[[ 0.49611712  0.49815118  0.49663523  0.52561557  0.51633322  0.49332222
   0.48588666  0.49563614  0.48855919  0.51735127  0.48991302  0.49613717
   0.51288503  0.48995879  0.49965549  0.49367467  0.50084245]]
Epoch: 350	Loss: 24.0703111649	Example Output: 	Example Reward:  -0.3
[[ 0.4961265   0.49813041  0.49658561  0.52562344  0.51633722  0.49330297
   0.48585385  0.4955999   0.4885174   0.51733351  0.48987317  0.49610642
   0.51289445  0.48993081  0.49960899  0.49361572  0.5008328 ]]
Saving Weight
Epoch: 351	Loss: 24.0692890167	Example Output: +9719-2683	Example Reward:  5.551115123125783e-17
[[ 0.49612367  0.49812728  0.496

Epoch: 378	Loss: 24.0697853088	Example Output: 	Example Reward:  -0.3
[[ 0.49606976  0.49771595  0.49669915  0.52694678  0.51772243  0.49282598
   0.48480153  0.49514687  0.48815238  0.51831508  0.48897001  0.49575728
   0.51359791  0.48957723  0.49967566  0.49316996  0.50116432]]
Epoch: 379	Loss: 24.0691724777	Example Output: 917+X84X/Y	Example Reward:  -0.3
[[ 0.49606031  0.49769694  0.49668321  0.52697754  0.51775622  0.49280387
   0.48474959  0.49511263  0.48811057  0.51835799  0.488911    0.49571031
   0.51362777  0.48955163  0.49966186  0.49312985  0.50116974]]
Epoch: 380	Loss: 24.0688297272	Example Output: -9165+/2*2	Example Reward:  -0.3
[[ 0.49605051  0.49769562  0.49668029  0.52702254  0.51779866  0.49278501
   0.48473832  0.49510095  0.48808843  0.51839775  0.48888537  0.4956795
   0.51366562  0.48953304  0.49966618  0.49310583  0.50120813]]
Saving Weight
Epoch: 381	Loss: 24.0694419861	Example Output: 4-0Y/6977Y	Example Reward:  -0.3
[[ 0.49604851  0.49770543  0.49671185  0.

Epoch: 407	Loss: 24.0601486206	Example Output: /Y029Y9+92	Example Reward:  -0.3
[[ 0.49581626  0.49750045  0.49639165  0.52808654  0.51884317  0.4921526
   0.48375502  0.49429515  0.48741522  0.51916885  0.48795739  0.49508154
   0.51432729  0.48910987  0.49945658  0.49231151  0.50144738]]
Epoch: 408	Loss: 24.0601039886	Example Output: 03	Example Reward:  -0.3
[[ 0.49580571  0.49748594  0.49639553  0.52811909  0.51889658  0.4921225
   0.48371363  0.494275    0.48738912  0.51919562  0.48792383  0.49507114
   0.51436073  0.48908648  0.49944445  0.49229661  0.50148171]]
Epoch: 409	Loss: 24.0601131439	Example Output: 8YX4**698Y	Example Reward:  -0.3
[[ 0.49579632  0.49748316  0.49640164  0.52815574  0.51895821  0.49208993
   0.48369277  0.49425396  0.4873676   0.51923883  0.48789334  0.49505594
   0.5143981   0.48906732  0.49943522  0.49227881  0.50150281]]
Epoch: 410	Loss: 24.0601772308	Example Output: 777660	Example Reward:  -0.16
[[ 0.49579778  0.49749297  0.49640718  0.52822155  0.5190

Epoch: 436	Loss: 24.0531269073	Example Output: 48X/253*46	Example Reward:  -0.3
[[ 0.49561179  0.49733305  0.49608999  0.52952945  0.52007288  0.49163607
   0.48261943  0.49348527  0.48664668  0.5201115   0.48696148  0.49455592
   0.51508528  0.48852715  0.49938321  0.49157873  0.50159252]]
Epoch: 437	Loss: 24.0533086777	Example Output: 	Example Reward:  -0.3
[[ 0.49561214  0.49732313  0.49607903  0.52955127  0.5201056   0.49160764
   0.48260826  0.49347389  0.48662052  0.52012551  0.48693973  0.49453387
   0.51509333  0.48850206  0.49937505  0.49154311  0.50160021]]
Epoch: 438	Loss: 24.0522735596	Example Output: 4127+6--41	Example Reward:  0.10000000000000009
[[ 0.49559632  0.49729082  0.49605596  0.52956396  0.520127    0.49157554
   0.48255891  0.49343869  0.48657739  0.5201214   0.4868741   0.49449486
   0.51509243  0.48845494  0.49933866  0.49147221  0.50160086]]
Epoch: 439	Loss: 24.0513137817	Example Output: -*0*+-22	Example Reward:  -0.3
[[ 0.49558121  0.49728152  0.4960359   0.

Epoch: 465	Loss: 24.0435352325	Example Output: 392+43996-	Example Reward:  -0.3
[[ 0.4953424   0.49702069  0.49589345  0.5308851   0.5215022   0.49085179
   0.48123935  0.49282077  0.48588058  0.52099955  0.48569882  0.49384075
   0.51576251  0.48795852  0.49920031  0.49062556  0.50195807]]
Epoch: 466	Loss: 24.0434965134	Example Output: 84/28++55+	Example Reward:  -0.3
[[ 0.4953396   0.49701032  0.49589473  0.53095728  0.52154666  0.49083558
   0.48118055  0.4927952   0.48585528  0.5210278   0.48565698  0.49383819
   0.51580006  0.48793131  0.49920541  0.49061054  0.50195283]]
Epoch: 467	Loss: 24.0432552338	Example Output: 22X/43X5X+	Example Reward:  -0.3
[[ 0.49533972  0.4970009   0.49590325  0.53101689  0.52159923  0.49079517
   0.48113126  0.49276567  0.48581892  0.52107006  0.48561141  0.49381435
   0.51583546  0.48790866  0.49920252  0.49059066  0.50195593]]
Epoch: 468	Loss: 24.0428571701	Example Output: -/Y/386YX6	Example Reward:  -0.3
[[ 0.49535167  0.49697089  0.49589774  0.531

Epoch: 494	Loss: 24.0408973694	Example Output: Y1-X	Example Reward:  -0.3
[[ 0.49522084  0.49685055  0.49583688  0.53227431  0.52302194  0.49024227
   0.48004368  0.49221253  0.48513153  0.52199608  0.48476958  0.49341327
   0.51674092  0.48743725  0.49915564  0.48989469  0.5022825 ]]
Epoch: 495	Loss: 24.0399032593	Example Output: /+27X41*	Example Reward:  -0.3
[[ 0.49518755  0.49684137  0.49581403  0.53233647  0.52308404  0.49019843
   0.47996283  0.49216032  0.48508763  0.52203012  0.4847168   0.49338827
   0.5167653   0.48739552  0.49913117  0.48981598  0.50229084]]
Epoch: 496	Loss: 24.0394018173	Example Output: 	Example Reward:  -0.3
[[ 0.49516523  0.4968349   0.49580312  0.53242171  0.52315569  0.49015427
   0.47991094  0.49211714  0.48504686  0.52206963  0.48468086  0.49336547
   0.51680142  0.48736817  0.49913201  0.48978016  0.50232315]]
Epoch: 497	Loss: 24.0392091751	Example Output: -X	Example Reward:  0.48
[[ 0.49513951  0.49684185  0.49579889  0.53249854  0.52321452  0.49011

Epoch: 523	Loss: 24.0330688477	Example Output: 7	Example Reward:  -0.10999999999999999
[[ 0.49493608  0.49662453  0.49561816  0.53392547  0.52468032  0.4894841
   0.47855407  0.49135879  0.48428285  0.52313471  0.48349956  0.49273786
   0.51757485  0.48684347  0.49913082  0.48891476  0.5027625 ]]
Epoch: 524	Loss: 24.03301754	Example Output: 6*1-160287	Example Reward:  5.55111512313e-17
[[ 0.49492747  0.49663228  0.4956252   0.53398257  0.52473217  0.48945495
   0.4784877   0.49132937  0.48425573  0.52320111  0.48345894  0.49271241
   0.51761973  0.48684984  0.49913681  0.48888743  0.5027681 ]]
Epoch: 525	Loss: 24.03282547	Example Output: 4+-+/53828	Example Reward:  -0.3
[[ 0.49492112  0.49664292  0.49564585  0.53403294  0.52478623  0.48943257
   0.47842515  0.49128318  0.4842152   0.52325702  0.4834075   0.49268925
   0.51765621  0.48684737  0.49912974  0.48885253  0.50277257]]
Epoch: 526	Loss: 24.0328178406	Example Output: -7-//811X1	Example Reward:  -0.3
[[ 0.49493173  0.49666393  0.

Epoch: 551	Loss: 24.0374900818	Example Output: 74616438	Example Reward:  -0.18
[[ 0.49500528  0.4967078   0.49585998  0.53555775  0.52657628  0.48883507
   0.47731149  0.49083012  0.48371869  0.52446157  0.48246902  0.49232918
   0.518498    0.48677391  0.4993023   0.4882856   0.50321954]]
Epoch: 552	Loss: 24.0371797562	Example Output: 3-Y-41	Example Reward:  0.54
[[ 0.49500048  0.49668923  0.49584931  0.53560549  0.52662081  0.48881188
   0.47726938  0.49079838  0.48369801  0.52449292  0.48243573  0.49231255
   0.51851177  0.48675561  0.49930549  0.48825163  0.5032227 ]]
Epoch: 553	Loss: 24.0363010406	Example Output: 4/504XY4*5	Example Reward:  -0.3
[[ 0.49496749  0.49665317  0.49581262  0.53563845  0.52665448  0.48878384
   0.47719374  0.49075139  0.48366365  0.52449745  0.48236671  0.49227661
   0.51851398  0.48671207  0.49927294  0.48818627  0.50324088]]
Epoch: 554	Loss: 24.0352376938	Example Output: 7/28186*9X	Example Reward:  -0.3
[[ 0.49494833  0.49662477  0.49581209  0.53567457

Epoch: 580	Loss: 24.0248575211	Example Output: 0*--X1*33Y	Example Reward:  -0.3
[[ 0.49443662  0.49624389  0.49561355  0.53715086  0.52814341  0.48798934
   0.47549075  0.49006119  0.48288864  0.52543104  0.48089957  0.49168637
   0.51907182  0.48579291  0.49921843  0.48716721  0.50423586]]
Saving Weight
Epoch: 581	Loss: 24.024707222	Example Output: ++1596	Example Reward:  0.04000000000000009
[[ 0.49441281  0.49622381  0.49561101  0.53721094  0.52819437  0.48795703
   0.47542694  0.49005738  0.48285773  0.52545696  0.4808484   0.49166441
   0.51910084  0.48577076  0.49922723  0.48712748  0.50427502]]
Epoch: 582	Loss: 24.0243350983	Example Output: -41001+9X6	Example Reward:  -0.3
[[ 0.49439329  0.49621126  0.49559936  0.53725022  0.52825332  0.48792332
   0.47536391  0.49005827  0.48283193  0.52549553  0.48079801  0.49163622
   0.51914054  0.4857533   0.49923554  0.48708335  0.50430816]]
Epoch: 583	Loss: 24.0243190765	Example Output: 5706*-Y6X7	Example Reward:  -0.3
[[ 0.49438909  0.496

Epoch: 608	Loss: 24.0282407761	Example Output: 4	Example Reward:  -0.10999999999999999
[[ 0.49416086  0.49612129  0.49564904  0.53893864  0.52998698  0.48714292
   0.4741298   0.48978239  0.48213673  0.52687001  0.47988325  0.49112818
   0.52015704  0.4851864   0.49969095  0.48635516  0.50560361]]
Epoch: 609	Loss: 24.0281152725	Example Output: 520Y*70+61	Example Reward:  -0.3
[[ 0.4941377   0.49611586  0.49564421  0.53899032  0.53003752  0.48710948
   0.47409078  0.48976234  0.48211548  0.52689523  0.47986218  0.49110961
   0.52017158  0.48513663  0.49969429  0.48631945  0.5056417 ]]
Epoch: 610	Loss: 24.0276351929	Example Output: 10995+**-Y	Example Reward:  -0.3
[[ 0.49410015  0.49610054  0.49565244  0.53903639  0.53009647  0.4870539
   0.4740282   0.48973763  0.4820998   0.52693141  0.47980997  0.4910841
   0.52019626  0.48509365  0.49967691  0.48627639  0.50567102]]
Saving Weight
Epoch: 611	Loss: 24.0269041061	Example Output: 40/**/*-5	Example Reward:  -0.3
[[ 0.4940601   0.4960697  

Epoch: 637	Loss: 24.0183004379	Example Output: 55-8-781-/	Example Reward:  -0.3
[[ 0.49346402  0.49574393  0.49546483  0.54049301  0.53175712  0.48604062
   0.47251543  0.48908535  0.48142079  0.52807111  0.4783763   0.4904561
   0.52084821  0.48430264  0.49964085  0.48517692  0.5069384 ]]
Epoch: 638	Loss: 24.018970108	Example Output: -0/+-95	Example Reward:  0.2300000000000001
[[ 0.49345461  0.49575189  0.49546441  0.54057419  0.53183693  0.48600525
   0.47244474  0.48907435  0.48138204  0.52815247  0.47832775  0.49043131
   0.52090448  0.48429102  0.49968132  0.48515525  0.50700438]]
Epoch: 639	Loss: 24.0189775467	Example Output: 4-7Y-*Y98Y	Example Reward:  -0.3
[[ 0.49342656  0.49574634  0.49545729  0.54062551  0.53188884  0.48597339
   0.47238559  0.48906779  0.48136279  0.52820498  0.47827807  0.49041548
   0.52093655  0.48427257  0.49969095  0.48511699  0.5070529 ]]
Epoch: 640	Loss: 24.0189222336	Example Output: 0/33Y-	Example Reward:  -0.3
[[ 0.49340671  0.4957341   0.49547794  

Epoch: 666	Loss: 24.016119957	Example Output: 7Y+8*7/61X	Example Reward:  -0.3
[[ 0.49295071  0.49546951  0.4953196   0.54217488  0.53356159  0.48499906
   0.47093973  0.48861039  0.48059142  0.52957654  0.47706524  0.48981518
   0.52175122  0.48363799  0.499919    0.48429748  0.5083642 ]]
Epoch: 667	Loss: 24.015852356	Example Output: 511*857096	Example Reward:  -0.1
[[ 0.49295527  0.49547455  0.49531212  0.54223198  0.53363496  0.4849841
   0.47088209  0.48860949  0.4805401   0.52961749  0.4770371   0.48977548
   0.52179086  0.48359537  0.49992347  0.48425931  0.50840873]]
Epoch: 668	Loss: 24.0160573959	Example Output: 60*-7127+Y	Example Reward:  0.6
[[ 0.49296767  0.49547899  0.49532241  0.54228282  0.53371078  0.48495364
   0.47084069  0.48863021  0.48051885  0.52967972  0.47701228  0.48974735
   0.52183974  0.48357415  0.49994802  0.48422754  0.50848496]]
Epoch: 669	Loss: 24.0164360046	Example Output: 3452X4*	Example Reward:  -0.3
[[ 0.49294558  0.49548286  0.49532393  0.54233134  

Epoch: 695	Loss: 24.0118967056	Example Output: 2+/Y78	Example Reward:  -0.3
[[ 0.49239624  0.4952651   0.49504465  0.54403329  0.5352475   0.48420417
   0.46933612  0.48811978  0.47978073  0.53079563  0.47567448  0.48911536
   0.52275062  0.48282871  0.49999642  0.48329654  0.50994307]]
Epoch: 696	Loss: 24.0114704132	Example Output: 1+/-777+4-	Example Reward:  -0.3
[[ 0.4923715   0.49525118  0.49503678  0.54408586  0.53528494  0.48417529
   0.46928188  0.48809984  0.47976828  0.53083736  0.47562233  0.48909813
   0.52277827  0.48279747  0.49999738  0.48327962  0.50997412]]
Epoch: 697	Loss: 24.0112340927	Example Output: 	Example Reward:  -0.3
[[ 0.49234617  0.4952445   0.49502018  0.54412967  0.53532338  0.48414811
   0.46923184  0.4880555   0.47974181  0.53088462  0.47556657  0.48906985
   0.52281153  0.48277628  0.50000131  0.48325205  0.50999916]]
Epoch: 698	Loss: 24.0108829498	Example Output: 86*9-99+7-	Example Reward:  -0.3
[[ 0.49232155  0.4952251   0.49501392  0.54418862  0.53537

Epoch: 724	Loss: 24.0040111542	Example Output: +046-154	Example Reward:  -0.3
[[ 0.49187249  0.49502632  0.49469846  0.54580641  0.53684521  0.48320073
   0.46756583  0.48743889  0.47894514  0.53212035  0.47409958  0.48845074
   0.52368039  0.48191381  0.49988273  0.48227796  0.51142555]]
Epoch: 725	Loss: 24.0032974243	Example Output: 1X450	Example Reward:  -0.3
[[ 0.49183345  0.49501744  0.49467444  0.54586112  0.53687143  0.48315236
   0.46751058  0.48740384  0.47890243  0.53213632  0.47403955  0.48842025
   0.52373576  0.48188058  0.49986461  0.48223284  0.51146859]]
Epoch: 726	Loss: 24.0024095535	Example Output: 57*-22+056	Example Reward:  -0.3
[[ 0.49180385  0.49501202  0.4946633   0.54593068  0.53691477  0.48310956
   0.46744505  0.48737666  0.47886211  0.53216618  0.47395813  0.48838305
   0.52377266  0.48183772  0.49985388  0.4821845   0.51151389]]
Epoch: 727	Loss: 24.0019851685	Example Output: 9+6Y6087/1	Example Reward:  -0.3
[[ 0.49177948  0.49500224  0.49464801  0.54598546  

Epoch: 752	Loss: 23.9934209824	Example Output: 27422/41X2	Example Reward:  -0.3
[[ 0.49130809  0.49457482  0.4942553   0.54772365  0.53851718  0.48232657
   0.46582463  0.48667088  0.47804624  0.53314596  0.47247943  0.48785329
   0.52453667  0.48095116  0.49994576  0.48110113  0.51264322]]
Epoch: 753	Loss: 23.9932434082	Example Output: +2//Y77Y80	Example Reward:  -0.3
[[ 0.49128598  0.49456018  0.49424577  0.54781604  0.53860563  0.48229384
   0.46576601  0.48664889  0.478021    0.53319967  0.47242028  0.48782423
   0.52456099  0.48091653  0.49994445  0.48107186  0.51270133]]
Epoch: 754	Loss: 23.9931783676	Example Output: 7+867/2848	Example Reward:  5.551115123125783e-17
[[ 0.49126413  0.49455038  0.49424133  0.54788303  0.53867066  0.48227009
   0.46572605  0.48662618  0.4779985   0.53325564  0.4723728   0.48780972
   0.52459198  0.48089701  0.49993807  0.48105499  0.51274407]]
Epoch: 755	Loss: 23.993378067	Example Output: 8+1	Example Reward:  -0.03
[[ 0.49124628  0.49453861  0.49422

Epoch: 781	Loss: 23.9889146805	Example Output: 35+	Example Reward:  -0.3
[[ 0.4907425   0.4944379   0.49397182  0.54956913  0.5402016   0.48147368
   0.46426329  0.48596194  0.47715005  0.53457278  0.47116989  0.48723736
   0.52558017  0.48019636  0.49990264  0.48017648  0.51406723]]
Epoch: 782	Loss: 23.9889801025	Example Output: X0Y3-0	Example Reward:  -0.3
[[ 0.49073347  0.49445418  0.49396479  0.54963481  0.54026824  0.48143455
   0.46420291  0.4859553   0.47711158  0.53464353  0.47112593  0.4872084
   0.52563286  0.48017338  0.4999212   0.48013768  0.5141266 ]]
Epoch: 783	Loss: 23.9892946243	Example Output: 000815+*++	Example Reward:  -0.3
[[ 0.49072647  0.49444842  0.49397835  0.54970938  0.5403372   0.48139775
   0.4641481   0.48594904  0.47708324  0.53469598  0.4710767   0.48718971
   0.52566671  0.48014805  0.49993086  0.48012859  0.51418871]]
Epoch: 784	Loss: 23.9892181396	Example Output: 0	Example Reward:  -0.10999999999999999
[[ 0.49071953  0.49444038  0.49397713  0.54978216

Epoch: 810	Loss: 23.9824876785	Example Output: 1/34Y1580-	Example Reward:  -0.3
[[ 0.49023557  0.4942835   0.49355832  0.55137396  0.54179835  0.48060322
   0.46264485  0.48516643  0.47610435  0.53582674  0.46981531  0.48658395
   0.52650559  0.47931704  0.49997514  0.47918874  0.51558554]]
Saving Weight
Epoch: 811	Loss: 23.9819236755	Example Output: 5XX+Y9060-	Example Reward:  -0.3
[[ 0.49020848  0.49427408  0.49356413  0.55146337  0.54186249  0.48056379
   0.46259648  0.48513079  0.47606868  0.53586984  0.46976006  0.48656893
   0.52653491  0.47927499  0.49999189  0.47916141  0.51566523]]
Epoch: 812	Loss: 23.9821674347	Example Output: /566-+40//	Example Reward:  -0.3
[[ 0.49017981  0.49425584  0.49358311  0.55156201  0.54193902  0.48051831
   0.46254262  0.48509601  0.47603786  0.53592521  0.46970519  0.48656747
   0.52657866  0.47923845  0.50001204  0.47914663  0.51573265]]
Epoch: 813	Loss: 23.9819887161	Example Output: 489/4X--0X	Example Reward:  -0.3
[[ 0.49015954  0.49423611  0.4

Epoch: 839	Loss: 23.9776329041	Example Output: Y4+03	Example Reward:  -0.3
[[ 0.48973933  0.49385121  0.49335235  0.55383801  0.5438987   0.47960654
   0.46072075  0.48436406  0.47494933  0.53713071  0.46824598  0.4861317
   0.52768785  0.47828728  0.50003392  0.47823358  0.51740295]]
Epoch: 840	Loss: 23.9779075623	Example Output: -Y	Example Reward:  0.48
[[ 0.48974615  0.49385262  0.49335489  0.55392128  0.54399347  0.4795666
   0.4606837   0.48432779  0.47491878  0.53717089  0.46818775  0.48610595
   0.52773124  0.47826508  0.50002718  0.47818804  0.51744729]]
Saving Weight
Epoch: 841	Loss: 23.9777038574	Example Output: 301Y1XY-/	Example Reward:  -0.3
[[ 0.48973709  0.49386919  0.49334949  0.55398506  0.54406065  0.47952592
   0.46063918  0.48428196  0.47489187  0.5372082   0.46812913  0.48605761
   0.52776623  0.47825828  0.50001174  0.47814134  0.51750422]]
Epoch: 842	Loss: 23.9776172638	Example Output: 4-7	Example Reward:  -0.03
[[ 0.48972082  0.49387097  0.49334562  0.55407459  0

Epoch: 867	Loss: 23.9697937012	Example Output: 42	Example Reward:  -0.12
[[ 0.48921794  0.49357876  0.49304381  0.55587989  0.54548031  0.47857609
   0.45899674  0.48358032  0.47387955  0.5383215   0.46676692  0.48551854
   0.52865875  0.47730941  0.49989942  0.4773218   0.51892668]]
Epoch: 868	Loss: 23.9694419861	Example Output: */4+*2Y155	Example Reward:  -0.3
[[ 0.48918375  0.49356017  0.49302885  0.55595195  0.54553241  0.47853437
   0.45894843  0.4835501   0.47384897  0.53836614  0.46671727  0.48550075
   0.52868116  0.47727227  0.49989465  0.47729224  0.51897049]]
Epoch: 869	Loss: 23.9695676804	Example Output: 271/62X*00	Example Reward:  -0.3
[[ 0.48915663  0.49355564  0.4930408   0.55605525  0.54561448  0.47849691
   0.45889851  0.4835296   0.47382516  0.53843361  0.46665999  0.48548648
   0.52872187  0.47724837  0.49993205  0.47727334  0.51902443]]
Epoch: 870	Loss: 23.9699308395	Example Output: 0Y*031*7XY	Example Reward:  -0.3
[[ 0.48915732  0.49355099  0.49306074  0.55615896  

Epoch: 896	Loss: 23.9583023071	Example Output: 4-/08856/+	Example Reward:  -0.3
[[ 0.48852172  0.49309343  0.49255145  0.55816126  0.54732776  0.47757307
   0.4568896   0.48259616  0.4726395   0.53953302  0.46513653  0.48490745
   0.52965319  0.47606617  0.49995464  0.47630775  0.52042031]]
Epoch: 897	Loss: 23.9586019516	Example Output: 8/	Example Reward:  -0.3
[[ 0.48849842  0.49309447  0.49256486  0.55824077  0.54740238  0.47753945
   0.45686206  0.48259154  0.47261745  0.53960288  0.46513912  0.48488829
   0.52970088  0.4760488   0.49999559  0.47630161  0.52048618]]
Epoch: 898	Loss: 23.9591337204	Example Output: 3767X/	Example Reward:  -0.3
[[ 0.48846519  0.493094    0.49255836  0.55834097  0.54748964  0.47749591
   0.4568238   0.48257685  0.47259167  0.53967094  0.46511421  0.48487282
   0.52974325  0.47601366  0.50002402  0.4762927   0.52058971]]
Epoch: 899	Loss: 23.9597434998	Example Output: 6	Example Reward:  -0.10999999999999999
[[ 0.48845983  0.49310178  0.49256253  0.55844122

Epoch: 924	Loss: 23.9568164825	Example Output: 853/-+X	Example Reward:  0.63
[[ 0.48794422  0.49289426  0.49229857  0.56058902  0.54927075  0.47668698
   0.45516011  0.48183873  0.47165868  0.54115242  0.46373034  0.48428094
   0.5309037   0.47504151  0.50000852  0.47553593  0.52222729]]
Epoch: 925	Loss: 23.9568067551	Example Output: 856Y*8	Example Reward:  -0.3
[[ 0.48793501  0.49289027  0.49230111  0.56067151  0.54933012  0.47667736
   0.45510963  0.48181239  0.47162706  0.5412277   0.46368712  0.48424521
   0.53096795  0.47500929  0.50000423  0.47550973  0.5223186 ]]
Epoch: 926	Loss: 23.9569213867	Example Output: 	Example Reward:  -0.3
[[ 0.48791924  0.49289712  0.49230006  0.56076324  0.54939938  0.47665006
   0.45504096  0.48179004  0.47158343  0.54129213  0.46362042  0.48419631
   0.53102297  0.4749563   0.50001013  0.47546288  0.5224191 ]]
Epoch: 927	Loss: 23.9569107056	Example Output: 	Example Reward:  -0.3
[[ 0.48790827  0.49289897  0.49228886  0.5608446   0.54946625  0.476621

Epoch: 952	Loss: 23.9499322891	Example Output: 8/85*1*X52	Example Reward:  -0.3
[[ 0.48745137  0.49262178  0.49183449  0.56305474  0.55123156  0.47561359
   0.45289743  0.48104286  0.47066471  0.54293108  0.46194616  0.48337737
   0.53223765  0.47383842  0.50001657  0.47437477  0.5241521 ]]
Epoch: 953	Loss: 23.9496213913	Example Output: +5074373+3	Example Reward:  5.55111512313e-17
[[ 0.48742825  0.49262324  0.49181354  0.56313467  0.55129534  0.47558424
   0.452806    0.48101357  0.4706243   0.54299319  0.46188837  0.48334259
   0.53229493  0.47380579  0.50001484  0.47434098  0.52420866]]
Epoch: 954	Loss: 23.949679184	Example Output: 9-	Example Reward:  -0.3
[[ 0.487407    0.49263579  0.49179307  0.56322247  0.55137432  0.47556677
   0.45273581  0.48100799  0.4706113   0.54306376  0.46183321  0.48332232
   0.53235132  0.47378811  0.50003022  0.47431469  0.52426773]]
Epoch: 955	Loss: 23.950030899	Example Output: ++52	Example Reward:  0.06
[[ 0.48737228  0.49263394  0.49179676  0.563320

Epoch: 980	Loss: 23.94680233	Example Output: 2Y4/18*+Y/	Example Reward:  -0.3
[[ 0.48707646  0.49251077  0.49140352  0.5655219   0.55354548  0.4747467
   0.44994718  0.48032379  0.46964219  0.54495019  0.46019244  0.48257238
   0.5339011   0.47286037  0.50000733  0.47341403  0.5262596 ]]
Saving Weight
Epoch: 981	Loss: 23.9468015671	Example Output: /*-1+X+*	Example Reward:  -0.3
[[ 0.48704398  0.49251974  0.49135688  0.56563485  0.55363828  0.47470903
   0.44984385  0.48028907  0.4696148   0.54501033  0.46012425  0.48252386
   0.53396541  0.47280642  0.50001776  0.47336033  0.52634907]]
Epoch: 982	Loss: 23.9466480255	Example Output: YY28	Example Reward:  -0.3
[[ 0.48703459  0.4925434   0.49132621  0.56576467  0.55373704  0.4746753
   0.44971979  0.48026335  0.46957868  0.54510856  0.46004289  0.48245931
   0.53405672  0.47276446  0.50003946  0.47329539  0.52644044]]
Epoch: 983	Loss: 23.9467973709	Example Output: 3/7474Y*9	Example Reward:  -0.3
[[ 0.48704061  0.49258366  0.49130222  0.56

Epoch: 1008	Loss: 23.9430246353	Example Output: Y30Y1*9X-8	Example Reward:  -0.3
[[ 0.48672128  0.49249926  0.49092969  0.56823701  0.5559082   0.47382784
   0.44698593  0.47957671  0.46862867  0.54708952  0.45839512  0.48151767
   0.53565919  0.4718205   0.50003219  0.47231483  0.52801901]]
Epoch: 1009	Loss: 23.9429800034	Example Output: 72688/Y-Y3	Example Reward:  -0.3
[[ 0.48669207  0.49248695  0.49090883  0.56834483  0.55597937  0.4737871
   0.44687229  0.47951409  0.46858925  0.54715413  0.45833346  0.48149899
   0.53570509  0.47179481  0.50003201  0.472271    0.5280782 ]]
Epoch: 1010	Loss: 23.9422212601	Example Output: 	Example Reward:  -0.3
[[ 0.48665634  0.49245363  0.49088845  0.5684455   0.55605203  0.47373796
   0.44672754  0.47945839  0.46853828  0.54721451  0.45825124  0.4814707
   0.53575355  0.47174388  0.5000059   0.4722183   0.52813911]]
Saving Weight
Epoch: 1011	Loss: 23.9412343979	Example Output: *	Example Reward:  -0.3
[[ 0.48661563  0.49244034  0.49083742  0.568531

Epoch: 1036	Loss: 23.9352460861	Example Output: 8	Example Reward:  -0.10999999999999999
[[ 0.48600569  0.49205875  0.49047592  0.57114041  0.55847275  0.4726876
   0.44352451  0.47869462  0.46735588  0.54930258  0.45616621  0.48055631
   0.53735965  0.47045827  0.5002417   0.47114646  0.53026998]]
Epoch: 1037	Loss: 23.9340246201	Example Output: 68+9Y4*10*	Example Reward:  -0.3
[[ 0.48595914  0.49203601  0.49044129  0.57123297  0.55855024  0.47262895
   0.44336587  0.47865435  0.46730432  0.5493657   0.45606253  0.48050624
   0.5374012   0.47038758  0.50023514  0.47109646  0.5303697 ]]
Epoch: 1038	Loss: 23.9336194992	Example Output: Y43-11*Y3X	Example Reward:  -0.3
[[ 0.48595762  0.49202955  0.49044284  0.57132941  0.55864501  0.47259253
   0.44324115  0.47861683  0.46726298  0.54945832  0.4559831   0.48045346
   0.53746253  0.47034839  0.50025159  0.47106773  0.53045696]]
Epoch: 1039	Loss: 23.9337701797	Example Output: 25*/19YY*9	Example Reward:  -0.3
[[ 0.48597339  0.49203503  0.49044

Epoch: 1065	Loss: 23.925810051	Example Output: 71304*Y/20	Example Reward:  0.5
[[ 0.48538074  0.49181637  0.49008796  0.57413644  0.56106532  0.47140169
   0.44035295  0.47764587  0.46628734  0.55138397  0.45386019  0.47961137
   0.53879601  0.46926546  0.50023103  0.46995309  0.53228247]]
Epoch: 1066	Loss: 23.9259195328	Example Output: 5	Example Reward:  -0.10999999999999999
[[ 0.48536089  0.49181253  0.4900851   0.57424295  0.56118041  0.47136715
   0.44025749  0.47759622  0.46622732  0.5514732   0.45379356  0.47957167
   0.53884923  0.46922082  0.50023872  0.46991408  0.53236425]]
Epoch: 1067	Loss: 23.9254161835	Example Output: 1/262	Example Reward:  -0.05000000000000002
[[ 0.48533019  0.49181125  0.49006721  0.57431114  0.56124175  0.47133386
   0.44017264  0.47755858  0.46616518  0.55154616  0.45372683  0.47952637
   0.5388974   0.46919069  0.50021321  0.46985596  0.53243065]]
Epoch: 1068	Loss: 23.9252901077	Example Output: 3X7+-2157Y	Example Reward:  -0.3
[[ 0.48531458  0.4918182

Epoch: 1093	Loss: 23.9189985275	Example Output: 	Example Reward:  -0.3
[[ 0.484907    0.4916065   0.48978493  0.57700968  0.56387073  0.47029385
   0.43698561  0.47677043  0.46514669  0.55390441  0.45100906  0.47845829
   0.54052716  0.46820334  0.50024283  0.46881008  0.53439403]]
Epoch: 1094	Loss: 23.9187166214	Example Output: 224Y	Example Reward:  -0.3
[[ 0.48488301  0.49159533  0.48977     0.57712829  0.56398124  0.47024566
   0.43683851  0.47675124  0.46510512  0.5539937   0.45088941  0.4784264
   0.54058594  0.46814585  0.50024694  0.4687517   0.53450322]]
Epoch: 1095	Loss: 23.9183019638	Example Output: Y1-93-26-Y	Example Reward:  -0.3
[[ 0.48484725  0.49157041  0.48975581  0.57725376  0.56412625  0.47018921
   0.43668786  0.47671333  0.46507138  0.55407524  0.4507519   0.47838941
   0.54063743  0.46807823  0.50026613  0.46868297  0.53460425]]
Epoch: 1096	Loss: 23.9175064087	Example Output: *030726/2-	Example Reward:  -0.3
[[ 0.48481631  0.4915317   0.48973534  0.57734603  0.5642

Epoch: 1122	Loss: 23.910027504	Example Output: 19YX70	Example Reward:  -0.3
[[ 0.48435184  0.4911471   0.48968866  0.58060724  0.56720769  0.46896592
   0.43286121  0.47589225  0.46381813  0.55654162  0.44744083  0.47753483
   0.54237801  0.46685347  0.50035971  0.46743166  0.53666407]]
Epoch: 1123	Loss: 23.9096399307	Example Output: /70019/01*	Example Reward:  -0.3
[[ 0.48434716  0.4911302   0.48968101  0.58072418  0.5673123   0.46892872
   0.43273476  0.47588232  0.46378073  0.55664164  0.44731975  0.4775109
   0.54244512  0.46682623  0.50036913  0.46740258  0.53672934]]
Epoch: 1124	Loss: 23.9101593018	Example Output: 59167-4/82	Example Reward:  5.55111512313e-17
[[ 0.4843547   0.49112409  0.48970777  0.58086294  0.56744146  0.46888083
   0.43263444  0.47586784  0.46374193  0.55675793  0.44721961  0.47749144
   0.54253286  0.46682218  0.50039762  0.46739051  0.53681183]]
Epoch: 1125	Loss: 23.9107154846	Example Output: 2+46753/46	Example Reward:  5.551115123125783e-17
[[ 0.48435909  0

Epoch: 1151	Loss: 23.8997053146	Example Output: 3100987155	Example Reward:  -0.2
[[ 0.48372981  0.49072567  0.48949036  0.58398432  0.5703696   0.46754333
   0.42884851  0.47492522  0.46268395  0.55938178  0.44402748  0.4764981
   0.54420692  0.4656693   0.50031412  0.46617207  0.53867817]]
Epoch: 1152	Loss: 23.8999534607	Example Output: X4*//8709Y	Example Reward:  -0.3
[[ 0.48372343  0.49072945  0.48951373  0.58412164  0.57051772  0.4674961
   0.42872232  0.47492728  0.46267313  0.55950016  0.44391653  0.47648224
   0.54426771  0.46565577  0.50034332  0.46614212  0.53874779]]
Epoch: 1153	Loss: 23.900097847	Example Output: /XY8697253	Example Reward:  -0.3
[[ 0.48369712  0.49071845  0.48952973  0.58423048  0.57063961  0.4674342
   0.42857739  0.47487319  0.46263224  0.55960029  0.44377661  0.47644114
   0.54433662  0.46561617  0.50033402  0.46609801  0.53882021]]
Epoch: 1154	Loss: 23.8990652084	Example Output: +-212X4+X6	Example Reward:  -0.3
[[ 0.48363554  0.49068451  0.48953003  0.584

Epoch: 1180	Loss: 23.8827838898	Example Output: 7	Example Reward:  -0.10999999999999999
[[ 0.48292109  0.49007002  0.48935878  0.58758408  0.57389992  0.46566951
   0.4243162   0.47371966  0.46142188  0.56225961  0.44005296  0.47551772
   0.54614943  0.46417344  0.50000107  0.4646374   0.54072946]]
Saving Weight
Epoch: 1181	Loss: 23.8825878143	Example Output: -29XY6**68	Example Reward:  -0.3
[[ 0.48289707  0.49003333  0.48936817  0.58772784  0.57401961  0.46562505
   0.42415199  0.47368121  0.46138725  0.56235725  0.43991283  0.47547394
   0.54622895  0.46412057  0.50000137  0.46458685  0.54082435]]
Epoch: 1182	Loss: 23.8816982269	Example Output: Y9X-3Y9+13	Example Reward:  -0.3
[[ 0.48286733  0.49001393  0.48934394  0.58785629  0.57413536  0.46556926
   0.42395845  0.47363123  0.46134564  0.56243896  0.43975547  0.47542027
   0.54630023  0.4640567   0.49999219  0.46451861  0.54089195]]
Epoch: 1183	Loss: 23.8811452866	Example Output: 0+351/4	Example Reward:  0.030000000000000082
[[ 0.4

Epoch: 1209	Loss: 23.8761451721	Example Output: 857335+7-/	Example Reward:  -0.3
[[ 0.48232955  0.48959881  0.48950237  0.59176993  0.57796609  0.46386603
   0.419687    0.47278014  0.46034566  0.56556034  0.43598539  0.47444877
   0.54844141  0.46285567  0.50018203  0.46312234  0.54308194]]
Epoch: 1210	Loss: 23.8762569427	Example Output: 3641	Example Reward:  -0.14
[[ 0.4823148   0.48961195  0.48950294  0.59189683  0.57807624  0.46381807
   0.41956776  0.47276574  0.46033069  0.56568003  0.43588254  0.47438073
   0.5485363   0.46283644  0.50019556  0.46307519  0.5431819 ]]
Saving Weight
Epoch: 1211	Loss: 23.8765769958	Example Output: 00+	Example Reward:  -0.3
[[ 0.48229939  0.48962957  0.48950934  0.59204763  0.57819617  0.46374848
   0.41943899  0.47274157  0.46033636  0.56578201  0.43577877  0.47433442
   0.54861325  0.46282578  0.50020933  0.46303004  0.54328567]]
Epoch: 1212	Loss: 23.876474762	Example Output: +8/+6X8137	Example Reward:  -0.3
[[ 0.48227909  0.48961207  0.48950616  

Epoch: 1237	Loss: 23.8650001526	Example Output: 94+*5X-Y50	Example Reward:  -0.3
[[ 0.48192677  0.48912013  0.48938176  0.5956111   0.58176297  0.46229422
   0.41499433  0.47161475  0.45916569  0.56849551  0.43222886  0.47314569
   0.5505566   0.46164283  0.500009    0.46164173  0.54522157]]
Epoch: 1238	Loss: 23.8637714386	Example Output: *3+-72*35-	Example Reward:  -0.3
[[ 0.48187572  0.48910427  0.48935309  0.59572506  0.58189583  0.46222988
   0.41479138  0.47155702  0.45913109  0.56859034  0.43205506  0.47308281
   0.55064076  0.46159324  0.50001067  0.46155953  0.5452944 ]]
Epoch: 1239	Loss: 23.8630580902	Example Output: 04X3X4	Example Reward:  -0.3
[[ 0.48182279  0.48907515  0.48933384  0.59586608  0.58204198  0.46218002
   0.41459593  0.47151041  0.45909372  0.56867868  0.43190956  0.47305924
   0.55070293  0.46154094  0.50001311  0.46150479  0.54536009]]
Epoch: 1240	Loss: 23.8621574402	Example Output: 7182	Example Reward:  -0.14
[[ 0.48180595  0.48904371  0.48933694  0.59601271

Epoch: 1266	Loss: 23.8544755936	Example Output: 3+1289	Example Reward:  -0.059999999999999915
[[ 0.48130196  0.48889706  0.48933983  0.59995025  0.58624232  0.46046856
   0.40980962  0.47050756  0.4577978   0.57225436  0.42773855  0.47174287
   0.55307108  0.46011859  0.50008386  0.45974174  0.54796958]]
Epoch: 1267	Loss: 23.8546585083	Example Output: X/*5/4/YY6	Example Reward:  -0.3
[[ 0.48132858  0.4889012   0.48935252  0.60007191  0.58635277  0.4604457
   0.40967634  0.47048858  0.45776448  0.57234317  0.42763233  0.47169569
   0.55314314  0.46008322  0.50010568  0.45968935  0.54806107]]
Epoch: 1268	Loss: 23.8551538467	Example Output: 75*83	Example Reward:  -0.05000000000000002
[[ 0.48132735  0.48892581  0.48936769  0.60022682  0.58648556  0.46041569
   0.40955561  0.47048524  0.45774314  0.57246202  0.42753649  0.47165209
   0.55321687  0.46005088  0.50016785  0.4596673   0.54815996]]
Epoch: 1269	Loss: 23.8555671692	Example Output: 2*06-75182	Example Reward:  -0.3
[[ 0.48131776  0.

Epoch: 1294	Loss: 23.8485544205	Example Output: 1*X--+7*11	Example Reward:  0.8
[[ 0.4805716   0.48848537  0.48943469  0.60422945  0.59045017  0.45884737
   0.40484613  0.46953201  0.45684564  0.57559806  0.42357919  0.47058818
   0.55560863  0.4588446   0.5003863   0.45833126  0.55048925]]
Epoch: 1295	Loss: 23.8490114212	Example Output: 	Example Reward:  -0.3
[[ 0.48056036  0.48849544  0.48945713  0.60438722  0.59057885  0.45877364
   0.40469775  0.46950001  0.45682779  0.57574219  0.4234409   0.47054452
   0.55571055  0.45883259  0.50041038  0.45827088  0.55056697]]
Epoch: 1296	Loss: 23.8486461639	Example Output: 	Example Reward:  -0.3
[[ 0.48051122  0.48847559  0.48945788  0.6045289   0.59070826  0.45870611
   0.40451801  0.46947703  0.4567908   0.5758577   0.42326784  0.47050864
   0.55578834  0.45876241  0.5004378   0.4582161   0.5506615 ]]
Epoch: 1297	Loss: 23.8482694626	Example Output: 0*/62*35	Example Reward:  -0.3
[[ 0.48047808  0.48845556  0.48944765  0.60467261  0.59084517  

Epoch: 1324	Loss: 23.841334343	Example Output: ++36*02X+3	Example Reward:  -0.3
[[ 0.47986367  0.48829368  0.48934337  0.6089921   0.59515506  0.45686716
   0.3992866   0.46846879  0.45566639  0.57956475  0.41887471  0.46938372
   0.5584318   0.45750836  0.50052017  0.45650479  0.55321002]]
Epoch: 1325	Loss: 23.8406202316	Example Output: +-X	Example Reward:  0.57
[[ 0.47982821  0.48827162  0.48934337  0.60916132  0.59532964  0.45678639
   0.39905983  0.46840703  0.45560765  0.57969618  0.4186869   0.46932858
   0.55853152  0.45743591  0.50051808  0.45641291  0.55331922]]
Epoch: 1326	Loss: 23.8398637772	Example Output: +761348869	Example Reward:  -0.1
[[ 0.47982058  0.48824808  0.48933783  0.60930651  0.59546715  0.45669961
   0.39888117  0.46834522  0.45552483  0.57980996  0.41852266  0.46927145
   0.55864704  0.45737121  0.50051033  0.45636663  0.55341339]]
Epoch: 1327	Loss: 23.838833046	Example Output: 3+57*-08/*	Example Reward:  -0.3
[[ 0.47978407  0.48822239  0.48930588  0.60945052

Epoch: 1353	Loss: 23.819698143	Example Output: 13-9+1Y274	Example Reward:  -0.3
[[ 0.47902384  0.48777148  0.48887351  0.61350137  0.59940141  0.45497081
   0.39339814  0.46690798  0.45407599  0.58297223  0.41397268  0.46796709
   0.56109697  0.45574096  0.50013572  0.45467478  0.555843  ]]
Epoch: 1354	Loss: 23.8188014984	Example Output: 5X7-727*47	Example Reward:  -0.3
[[ 0.47895557  0.48775479  0.48884207  0.61364442  0.59954995  0.45489639
   0.39318016  0.46685284  0.45402437  0.58308637  0.41377753  0.46791115
   0.56116813  0.45565543  0.50013173  0.4545916   0.55597222]]
Epoch: 1355	Loss: 23.817423439	Example Output: /5*4749Y70	Example Reward:  -0.3
[[ 0.4788869   0.48773688  0.48882127  0.61381316  0.59973025  0.4548223
   0.39296314  0.466809    0.45395651  0.58324128  0.41356081  0.46784914
   0.56125516  0.45557776  0.50014722  0.4544993   0.55607581]]
Epoch: 1356	Loss: 23.816988945	Example Output: 14928*01Y7	Example Reward:  -0.3
[[ 0.47884446  0.48773462  0.4888269   0.613

Epoch: 1382	Loss: 23.8021873474	Example Output: X0Y+Y38Y/+	Example Reward:  -0.3
[[ 0.47822446  0.48748365  0.48884982  0.61883247  0.6047287   0.45225662
   0.38720775  0.46539369  0.4519017   0.58724141  0.40863517  0.46648559
   0.56411636  0.45388505  0.50037307  0.45193666  0.55901903]]
Epoch: 1383	Loss: 23.8007631302	Example Output: 745*+X5079	Example Reward:  -0.3
[[ 0.47818193  0.48745459  0.48884046  0.61902249  0.60492498  0.45212764
   0.38694763  0.46532354  0.45181242  0.58740979  0.40842268  0.46642697
   0.56423748  0.4538185   0.50035214  0.45180964  0.55912924]]
Epoch: 1384	Loss: 23.7999656677	Example Output: -30186/-41	Example Reward:  0.10000000000000009
[[ 0.47815523  0.48746508  0.48885465  0.61922938  0.60514104  0.45199043
   0.38672656  0.46526113  0.45174235  0.58759105  0.4082199   0.46638969
   0.56436342  0.45375913  0.50035459  0.45167693  0.55924511]]
Epoch: 1385	Loss: 23.7998773575	Example Output: 4X2/147113	Example Reward:  -0.3
[[ 0.47816232  0.48749346

Epoch: 1411	Loss: 23.7860395432	Example Output: XX08343720	Example Reward:  -0.3
[[ 0.4774901   0.48732251  0.48932636  0.62530923  0.61108857  0.44854587
   0.38059661  0.46393305  0.44923556  0.5925613   0.40277445  0.46495369
   0.56794107  0.45085663  0.50094855  0.44813871  0.56313568]]
Epoch: 1412	Loss: 23.7852994919	Example Output: 79/3375875	Example Reward:  -0.09999999999999995
[[ 0.47747895  0.48732433  0.48936656  0.62552488  0.61131299  0.44842926
   0.38039002  0.46387327  0.44913858  0.59274918  0.40256834  0.46489593
   0.56806618  0.45075539  0.50098139  0.44799945  0.56326663]]
Epoch: 1413	Loss: 23.7852636337	Example Output: 2-948YX	Example Reward:  -0.3
[[ 0.47747162  0.48731595  0.48941305  0.62574428  0.61154485  0.44832394
   0.38018128  0.46384037  0.44905737  0.59292203  0.40237075  0.46485311
   0.56819052  0.45064864  0.5010156   0.44789857  0.56343484]]
Epoch: 1414	Loss: 23.7847496033	Example Output: 06Y004Y8*2	Example Reward:  -0.3
[[ 0.47742394  0.48731613  

Epoch: 1440	Loss: 23.7739295959	Example Output: 0*X712-X+8	Example Reward:  -0.3
[[ 0.47665486  0.48731646  0.48999828  0.6324442   0.61785239  0.44483861
   0.37380609  0.46261483  0.44630724  0.59848946  0.39646563  0.46306419
   0.5718298   0.44768018  0.5016582   0.44464889  0.56778556]]
Saving Weight
Epoch: 1441	Loss: 23.772823143	Example Output: 8	Example Reward:  -0.10999999999999999
[[ 0.47662014  0.48731267  0.49000823  0.63269979  0.61810654  0.44467628
   0.37352815  0.46253964  0.44618356  0.59870923  0.39623383  0.46299678
   0.57196814  0.4475556   0.50165987  0.44447035  0.56792426]]
Epoch: 1442	Loss: 23.7719575882	Example Output: 637	Example Reward:  -0.13
[[ 0.4765988   0.48730475  0.49003172  0.63292843  0.61832422  0.44453883
   0.37327841  0.46248764  0.44608229  0.59890157  0.39602569  0.46295166
   0.57210028  0.4474605   0.50168282  0.44432899  0.56804955]]
Epoch: 1443	Loss: 23.7712636948	Example Output: X/23Y*-X7X	Example Reward:  -0.3
[[ 0.47657713  0.48729771 

Epoch: 1468	Loss: 23.7499908447	Example Output: *9214894Y1	Example Reward:  -0.3
[[ 0.47589189  0.48719001  0.49051839  0.63914049  0.62442744  0.44086874
   0.36661234  0.46106869  0.44340119  0.60393161  0.39006588  0.46126252
   0.57529789  0.44415513  0.50238341  0.4407399   0.57200491]]
Epoch: 1469	Loss: 23.7498826981	Example Output: +	Example Reward:  -0.3
[[ 0.47585323  0.48717937  0.49052951  0.63937485  0.62465304  0.44075349
   0.36640301  0.46105033  0.44329357  0.60411334  0.38987783  0.46122247
   0.57541406  0.44402987  0.50243223  0.44063503  0.57217419]]
Epoch: 1470	Loss: 23.7492479324	Example Output: 1X14844	Example Reward:  -0.3
[[ 0.47578546  0.48715261  0.49053147  0.63964128  0.6248976   0.44058415
   0.36613819  0.46100259  0.44316956  0.60431629  0.3896434   0.46116105
   0.57557046  0.4438884   0.50247055  0.44049171  0.57234299]]
Saving Weight
Epoch: 1471	Loss: 23.7476980209	Example Output: 1411773-7	Example Reward:  -0.09
[[ 0.47570363  0.48712522  0.49051115 

Epoch: 1496	Loss: 23.7261493683	Example Output: 488362-+*0	Example Reward:  -0.3
[[ 0.47521666  0.48737553  0.49088636  0.64619774  0.63151145  0.43677312
   0.35887584  0.45936307  0.44013819  0.60980117  0.3831971   0.45930144
   0.57933718  0.44092417  0.50287253  0.43670061  0.57615554]]
Epoch: 1497	Loss: 23.7252239227	Example Output: X989-710X8	Example Reward:  -0.3
[[ 0.47517413  0.48740894  0.49093199  0.64645314  0.63177913  0.43661195
   0.35856581  0.45930892  0.44002524  0.61003703  0.38293061  0.45922872
   0.57949984  0.44078925  0.5029158   0.43652549  0.57631099]]
Epoch: 1498	Loss: 23.7243600845	Example Output: 380Y7	Example Reward:  -0.3
[[ 0.47511867  0.48744792  0.49096373  0.6467548   0.63208848  0.43643323
   0.3582173   0.45924184  0.43989447  0.61031157  0.38265115  0.45914096
   0.57967395  0.44063443  0.50296307  0.43635496  0.5765062 ]]
Epoch: 1499	Loss: 23.723077774	Example Output: 2	Example Reward:  -0.10999999999999999
[[ 0.47503743  0.48744497  0.49098137  

Epoch: 1524	Loss: 23.6981874466	Example Output: 46*2+/25X0	Example Reward:  -0.3
[[ 0.47400549  0.48686668  0.49150649  0.6536721   0.63960493  0.43234786
   0.34946415  0.45785987  0.43641624  0.61670035  0.37551183  0.45701286
   0.58394712  0.43656406  0.50527078  0.43209779  0.58121091]]
Epoch: 1525	Loss: 23.6974401474	Example Output: 72*	Example Reward:  -0.3
[[ 0.47401643  0.48683968  0.4915255   0.65395957  0.63992298  0.43218419
   0.34906489  0.45784113  0.43628123  0.61697161  0.37519163  0.4569177
   0.5841338   0.43639395  0.50541514  0.43190703  0.58141333]]
Epoch: 1526	Loss: 23.6964422226	Example Output: 14Y2	Example Reward:  -0.3
[[ 0.47397292  0.48678476  0.49152988  0.65421361  0.64023048  0.43204641
   0.34870645  0.45782697  0.43613678  0.61723     0.37486804  0.456826
   0.58429277  0.43620819  0.50557292  0.43172804  0.58163291]]
Epoch: 1527	Loss: 23.6954847336	Example Output: X292110+2+	Example Reward:  -0.3
[[ 0.47392195  0.48676771  0.4915368   0.65446258  0.640

Epoch: 1553	Loss: 23.6569545746	Example Output: *X+3*	Example Reward:  -0.3
[[ 0.47258666  0.48595548  0.49159268  0.6622315   0.64904583  0.42738819
   0.33743525  0.45671883  0.4317835   0.62459797  0.36574468  0.45452043
   0.58894593  0.43073708  0.50925064  0.42633829  0.58711994]]
Epoch: 1554	Loss: 23.6545654297	Example Output: 5-931/*X37	Example Reward:  -0.3
[[ 0.47250873  0.48587519  0.49155325  0.66248381  0.64933687  0.42720583
   0.3370136   0.45664874  0.43161711  0.62483436  0.36539036  0.4544214
   0.58910483  0.43054262  0.5093776   0.4261528   0.58730131]]
Epoch: 1555	Loss: 23.6523378372	Example Output: *Y6-Y133+X	Example Reward:  -0.3
[[ 0.47244176  0.48580924  0.49155903  0.6628077   0.64972681  0.42698792
   0.33653459  0.45659027  0.4314515   0.62514538  0.36498207  0.45430636
   0.58930242  0.43033478  0.50955975  0.42593601  0.58752549]]
Epoch: 1556	Loss: 23.6507307053	Example Output: 24*+33	Example Reward:  0.04000000000000009
[[ 0.4723973   0.48576659  0.491566

Epoch: 1582	Loss: 23.6101823807	Example Output: 23*6Y*70*+	Example Reward:  -0.3
[[ 0.47112951  0.48495141  0.49187681  0.67101026  0.65867931  0.42193699
   0.32488093  0.45539746  0.42665747  0.63338161  0.35537058  0.45054483
   0.59492004  0.42511466  0.51350081  0.42034709  0.59376997]]
Epoch: 1583	Loss: 23.6090988159	Example Output: 7X7/-6-6*3	Example Reward:  -0.3
[[ 0.47112173  0.48492864  0.49189627  0.67135364  0.65903503  0.4217726
   0.32442155  0.45536053  0.42648056  0.63373619  0.35498488  0.45036569
   0.59515977  0.42489272  0.51369083  0.4201428   0.59401566]]
Epoch: 1584	Loss: 23.6083345413	Example Output: 9Y33/Y7X25	Example Reward:  -0.3
[[ 0.47111395  0.48495185  0.4919228   0.67164576  0.65935391  0.42161232
   0.3240447   0.45533201  0.42638317  0.63404614  0.35466006  0.45018372
   0.59537387  0.42474592  0.51385254  0.41996953  0.59423161]]
Epoch: 1585	Loss: 23.6076906204	Example Output: X00*Y294X5	Example Reward:  -0.3
[[ 0.47109169  0.48496604  0.49194881  0.

Epoch: 1611	Loss: 23.554312706	Example Output: 43	Example Reward:  -0.12
[[ 0.46958667  0.48424739  0.49255687  0.6812194   0.67005944  0.41576126
   0.31064859  0.45350349  0.42136514  0.64321619  0.34247419  0.44573572
   0.60128331  0.41877994  0.518646    0.4134196   0.60091329]]
Epoch: 1612	Loss: 23.5533287048	Example Output: 79/89	Example Reward:  -0.05000000000000002
[[ 0.46957469  0.48426026  0.49263978  0.68159801  0.67047501  0.41557646
   0.31016731  0.45340475  0.42118695  0.64356929  0.34202069  0.4455885
   0.60152042  0.41860083  0.51884198  0.41317567  0.60117841]]
Epoch: 1613	Loss: 23.5523241043	Example Output: *371+/30*2	Example Reward:  -0.3
[[ 0.4695645   0.48426473  0.49267703  0.68185753  0.67078459  0.41543818
   0.30986112  0.45332262  0.42103463  0.64385444  0.34170383  0.44544798
   0.60168946  0.41846457  0.51897591  0.41299298  0.60138106]]
Epoch: 1614	Loss: 23.5513132095	Example Output: -*	Example Reward:  -0.3
[[ 0.46952033  0.4842681   0.4926874   0.68216

Epoch: 1639	Loss: 23.4991765976	Example Output: 	Example Reward:  -0.3
[[ 0.46847138  0.48370269  0.49383184  0.69175839  0.68194079  0.40954468
   0.29617143  0.44981214  0.41579679  0.65350187  0.3292098   0.44115359
   0.60790181  0.41262767  0.52418745  0.40662771  0.60826528]]
Epoch: 1640	Loss: 23.4962087631	Example Output: 6517+Y69Y1	Example Reward:  -0.3
[[ 0.46835348  0.48364389  0.49387214  0.69216162  0.68240029  0.40925437
   0.29557621  0.44963017  0.41555643  0.65389222  0.32866624  0.44096604
   0.60819679  0.41235244  0.52437407  0.40631595  0.608522  ]]
Saving Weight
Epoch: 1641	Loss: 23.4935604095	Example Output: 7192	Example Reward:  -0.14
[[ 0.46828988  0.48360932  0.49396124  0.69262642  0.68289834  0.40898845
   0.29497397  0.44947308  0.41533101  0.65433854  0.32811972  0.44076556
   0.60851324  0.41211307  0.52464586  0.40603203  0.6088115 ]]
Epoch: 1642	Loss: 23.4912889481	Example Output: 8898	Example Reward:  -0.14
[[ 0.46823019  0.48355323  0.49403864  0.69302

Epoch: 1667	Loss: 23.4209173203	Example Output: 7*+36*4	Example Reward:  0.13000000000000012
[[ 0.46652529  0.48294413  0.49485806  0.70362484  0.69447708  0.40246165
   0.27986827  0.4454135   0.40925542  0.66440612  0.31454989  0.43583271
   0.61545777  0.40537158  0.52967393  0.39852819  0.6164304 ]]
Epoch: 1668	Loss: 23.4174455643	Example Output: 	Example Reward:  -0.3
[[ 0.46643481  0.48291048  0.49486721  0.70406491  0.69490272  0.40218282
   0.27931353  0.44523308  0.40901268  0.66474092  0.31405845  0.43564075
   0.61569715  0.40512183  0.52983111  0.39826116  0.61672151]]
Epoch: 1669	Loss: 23.4142534256	Example Output: 2+*797X0*Y	Example Reward:  -0.3
[[ 0.46633565  0.48285016  0.49491078  0.70455456  0.69538516  0.40189445
   0.27871916  0.44506809  0.40873852  0.66513962  0.31351623  0.4354277
   0.61595166  0.40481839  0.53005034  0.39796066  0.61709136]]
Epoch: 1670	Loss: 23.4112043381	Example Output: *7-0	Example Reward:  -0.3
[[ 0.46627524  0.48278436  0.49494132  0.7050

Epoch: 1695	Loss: 23.3257631302	Example Output: 59	Example Reward:  -0.12
[[ 0.46467897  0.48190606  0.49566433  0.71784836  0.70915407  0.39405864
   0.26211205  0.44004834  0.40190738  0.67589074  0.29830664  0.42975104
   0.62357306  0.39700404  0.53558457  0.3891384   0.62529892]]
Epoch: 1696	Loss: 23.3213037491	Example Output: +2Y92*4*1+	Example Reward:  -0.3
[[ 0.46458972  0.48180553  0.49568084  0.71832675  0.70967078  0.39374596
   0.26145032  0.43980175  0.40163752  0.67628205  0.29768288  0.42955154
   0.62384677  0.39668548  0.53578013  0.3887834   0.6256246 ]]
Epoch: 1697	Loss: 23.3175979614	Example Output: 662721+065	Example Reward:  -0.3
[[ 0.46452242  0.48180303  0.49574685  0.71889174  0.7102775   0.39339185
   0.2607629   0.43960455  0.40140226  0.67677832  0.29704544  0.42933023
   0.62419808  0.39637557  0.53604519  0.38841522  0.62599921]]
Epoch: 1698	Loss: 23.3150655746	Example Output: 8306506XY/	Example Reward:  -0.3
[[ 0.46445987  0.48178658  0.49579832  0.719435

Epoch: 1725	Loss: 23.1975269318	Example Output: Y420-	Example Reward:  -0.3
[[ 0.46224013  0.48072031  0.49668017  0.73455834  0.72734755  0.38347217
   0.2403449   0.43258294  0.39290184  0.68988037  0.2782104   0.42214718
   0.63355887  0.38696575  0.54287046  0.37739667  0.63607723]]
Epoch: 1726	Loss: 23.1912952423	Example Output: Y0129Y2	Example Reward:  -0.3
[[ 0.4621346   0.4806453   0.49665451  0.73512483  0.72795451  0.38305804
   0.23950021  0.43231922  0.392492    0.6903953   0.27743897  0.42180017
   0.63390326  0.38651928  0.54309833  0.37693021  0.63646871]]
Epoch: 1727	Loss: 23.184504509	Example Output: 961/9768Y1	Example Reward:  -0.3
[[ 0.46204987  0.48054561  0.49664018  0.7357232   0.72861302  0.38261348
   0.23863752  0.43203405  0.39206442  0.69092804  0.27663675  0.42146409
   0.63426572  0.38604468  0.54333973  0.37644532  0.63686663]]
Epoch: 1728	Loss: 23.1785772324	Example Output: 601/02Y927	Example Reward:  -0.3
[[ 0.46199134  0.48046911  0.49672762  0.73630255

Epoch: 1753	Loss: 23.0476495743	Example Output: 25	Example Reward:  -0.12
[[ 0.46019331  0.47899768  0.49816746  0.75205231  0.74625993  0.3717998
   0.21676712  0.4251498   0.38244742  0.70529073  0.25663239  0.41365594
   0.64494497  0.37561688  0.55058706  0.36428097  0.64793956]]
Epoch: 1754	Loss: 23.0415224075	Example Output: X64/928	Example Reward:  -0.3
[[ 0.46008211  0.47893599  0.49819592  0.75270563  0.74696523  0.37136769
   0.21588591  0.4248645   0.38203144  0.70592034  0.2558341   0.41331646
   0.6453777   0.37518471  0.55087447  0.36374801  0.64840645]]
Epoch: 1755	Loss: 23.0360239029	Example Output: 7X2004+9Y*	Example Reward:  -0.3
[[ 0.45997837  0.4788906   0.49822593  0.75341469  0.74770349  0.37091148
   0.21496409  0.42456284  0.38162103  0.70658416  0.25499201  0.4130013
   0.64582133  0.37470976  0.55124724  0.36321095  0.64889306]]
Epoch: 1756	Loss: 23.029722023	Example Output: 62*2+X*052	Example Reward:  -0.3
[[ 0.45984367  0.47882041  0.49823564  0.75410229  0.

Epoch: 1781	Loss: 22.8613142014	Example Output: +1	Example Reward:  -0.01999999999999999
[[ 0.45683819  0.47760665  0.49893251  0.76947534  0.76580012  0.35886043
   0.1924051   0.41637421  0.37080988  0.72295302  0.2334139   0.40379614
   0.65678227  0.36271653  0.55911058  0.34891373  0.66070855]]
Epoch: 1782	Loss: 22.8546318054	Example Output: 90	Example Reward:  -0.12
[[ 0.45672998  0.47753602  0.4990226   0.77010906  0.76651657  0.35840458
   0.19154644  0.41611111  0.3704097   0.72359681  0.23258023  0.4034268
   0.657224    0.36224428  0.55949444  0.34830639  0.66116172]]
Epoch: 1783	Loss: 22.8481313705	Example Output: 	Example Reward:  -0.3
[[ 0.45661223  0.47743732  0.4991408   0.77071857  0.76719362  0.35789001
   0.19070296  0.41579637  0.37001267  0.72419858  0.23178016  0.4031136
   0.65764213  0.36178645  0.55979449  0.34768406  0.66157407]]
Epoch: 1784	Loss: 22.8401968002	Example Output: 	Example Reward:  -0.3
[[ 0.45648712  0.47731182  0.49926111  0.77133137  0.76789135

Epoch: 1810	Loss: 22.6184688568	Example Output: X12737+759	Example Reward:  -0.3
[[ 0.45313835  0.47575051  0.50037295  0.7899884   0.78852707  0.34124026
   0.16509636  0.40565619  0.35602131  0.74387944  0.20607862  0.39177045
   0.67172557  0.34630883  0.57022321  0.32866824  0.67597181]]
Saving Weight
Epoch: 1811	Loss: 22.609192276	Example Output: 5X132Y2	Example Reward:  -0.3
[[ 0.45292464  0.47568175  0.50038511  0.79078686  0.78935707  0.34058747
   0.16411255  0.40529031  0.35551298  0.74465221  0.2050869   0.39135808
   0.67228466  0.34564236  0.57063138  0.32789406  0.67650586]]
Epoch: 1812	Loss: 22.5988721848	Example Output: 1*Y+X71	Example Reward:  -0.3
[[ 0.45266819  0.47562641  0.50040019  0.79166818  0.79027146  0.33978608
   0.16302291  0.40486395  0.35492322  0.7455011   0.20397425  0.39086083
   0.6729371   0.34490812  0.57111228  0.32700875  0.67710477]]
Epoch: 1813	Loss: 22.588561058	Example Output: 10*+6Y9-98	Example Reward:  -0.3
[[ 0.45248756  0.47555351  0.50049

Epoch: 1840	Loss: 22.2844875336	Example Output: +6+	Example Reward:  -0.3
[[ 0.44569999  0.47311035  0.50008696  0.81380969  0.81428564  0.31921852
   0.13496171  0.39194271  0.33560795  0.7683838   0.17507334  0.37743264
   0.6907596   0.32444194  0.58408207  0.30389476  0.69408965]]
Saving Weight
Epoch: 1841	Loss: 22.2718069077	Example Output: Y2927*+216	Example Reward:  -0.3
[[ 0.44540054  0.47304162  0.50005263  0.81465954  0.81519908  0.31839094
   0.13393679  0.39141226  0.33485895  0.76925886  0.1739895   0.3768861
   0.69148779  0.32369041  0.58461326  0.30297524  0.69474334]]
Epoch: 1842	Loss: 22.2600263596	Example Output: 3791-3+15-	Example Reward:  -0.3
[[ 0.44512668  0.47305518  0.50003654  0.81548995  0.81610996  0.31756541
   0.13293605  0.39089695  0.3341296   0.77015436  0.17290676  0.37632406
   0.69221336  0.32292107  0.58518702  0.30207777  0.69542247]]
Epoch: 1843	Loss: 22.2475711823	Example Output: +	Example Reward:  -0.3
[[ 0.44480771  0.4730922   0.49995971  0.81

Epoch: 1869	Loss: 21.8969379425	Example Output: *76X07X2	Example Reward:  -0.3
[[ 0.43664896  0.47073442  0.499982    0.83735448  0.83973664  0.29487005
   0.10661515  0.3752104   0.31263983  0.79305136  0.1444252   0.36028379
   0.71195406  0.30007041  0.59920925  0.27680552  0.71487492]]
Epoch: 1870	Loss: 21.8823663712	Example Output: *Y/*5-Y1	Example Reward:  -0.3
[[ 0.43636855  0.47060862  0.49984169  0.83802509  0.84049016  0.29410201
   0.10577036  0.37456715  0.3118349   0.79379576  0.1435      0.35962403
   0.71262342  0.29919702  0.59965026  0.27595517  0.71551049]]
Saving Weight
Epoch: 1871	Loss: 21.8683404922	Example Output: 5/7X199X*2	Example Reward:  -0.3
[[ 0.43609279  0.47058296  0.49989286  0.83875841  0.84127247  0.29327425
   0.10492007  0.37397137  0.31103742  0.7946167   0.14255662  0.3590081
   0.71333438  0.29836798  0.60014552  0.27505249  0.71618783]]
Epoch: 1872	Loss: 21.8553079605	Example Output: X7/53+077X	Example Reward:  -0.3
[[ 0.43578389  0.47050884  0.49

Epoch: 1898	Loss: 21.4644983292	Example Output: /73Y-6XY1	Example Reward:  -0.3
[[ 0.42696404  0.46859816  0.50070637  0.86087102  0.86506695  0.26787564
   0.08063608  0.35582352  0.28701174  0.81912667  0.11487359  0.33824682
   0.73649365  0.273359    0.61789024  0.24704425  0.73817611]]
Epoch: 1899	Loss: 21.4490915298	Example Output: 12X60*3623	Example Reward:  -0.3
[[ 0.42671388  0.46854591  0.50073576  0.86175805  0.86600739  0.26680809
   0.07970861  0.35509199  0.28598812  0.8201077   0.11378612  0.33725026
   0.73749638  0.27233225  0.61866236  0.24588518  0.73907566]]
Epoch: 1900	Loss: 21.431668663	Example Output: 65+*+13+63	Example Reward:  -0.3
[[ 0.42639977  0.46848097  0.50073904  0.86263198  0.86695319  0.26575547
   0.07877546  0.35427177  0.28494704  0.82110167  0.11268187  0.33622909
   0.73850548  0.27127048  0.61940634  0.24466729  0.73999268]]
Saving Weight
Epoch: 1901	Loss: 21.4137081146	Example Output: 1+0235	Example Reward:  -0.3
[[ 0.42603531  0.46846104  0.500

Epoch: 1927	Loss: 20.9502439499	Example Output: 95/77+*2*1	Example Reward:  -0.3
[[ 0.41580442  0.4692024   0.50292987  0.88531363  0.89106756  0.23539242
   0.05688563  0.32891542  0.25701284  0.84695411  0.08587875  0.31119877
   0.76503581  0.24263471  0.64077163  0.21187013  0.7652536 ]]
Epoch: 1928	Loss: 20.9324369431	Example Output: +X2010+/X	Example Reward:  -0.3
[[ 0.41525146  0.46912095  0.50293642  0.88607413  0.89186323  0.2342851
   0.05620239  0.32806396  0.25600788  0.84784806  0.08500914  0.31029439
   0.76597518  0.2415629   0.64171052  0.21072499  0.766141  ]]
Epoch: 1929	Loss: 20.9137794495	Example Output: 1	Example Reward:  -0.10999999999999999
[[ 0.41476199  0.46924219  0.50301242  0.88691396  0.89273077  0.23315139
   0.0554652   0.32713139  0.25495484  0.84880942  0.08407471  0.30927998
   0.76698762  0.2404435   0.64263308  0.20942725  0.767079  ]]
Epoch: 1930	Loss: 20.8958057404	Example Output: XY*77+	Example Reward:  -0.3
[[ 0.41430658  0.46934754  0.50319403  

Epoch: 1955	Loss: 20.388768959	Example Output: 51Y170	Example Reward:  -0.3
[[ 0.40288466  0.46945339  0.51290756  0.90828121  0.91519862  0.20028037
   0.03812321  0.29812631  0.2230607   0.87348753  0.06107202  0.28082836
   0.79439574  0.209271    0.66617239  0.17495976  0.79307896]]
Epoch: 1956	Loss: 20.3645627975	Example Output: 27	Example Reward:  -0.12
[[ 0.40221092  0.46951422  0.51336253  0.9091289   0.91607392  0.19894578
   0.03749638  0.29681757  0.22166754  0.87448031  0.06021126  0.27952692
   0.79553109  0.20794415  0.66722548  0.17349239  0.79413193]]
Epoch: 1957	Loss: 20.340836525	Example Output: +++	Example Reward:  -0.3
[[ 0.40164685  0.46947739  0.51378828  0.90996188  0.9169383   0.19762528
   0.03687824  0.29549029  0.2202417   0.87545317  0.05936656  0.27823865
   0.79668409  0.20657504  0.66818798  0.17205529  0.79515475]]
Epoch: 1958	Loss: 20.3167032242	Example Output: *+2*+2	Example Reward:  -0.3
[[ 0.40115345  0.46950331  0.51434231  0.9108761   0.91787398  0

Epoch: 1984	Loss: 19.6826627731	Example Output: +23+X	Example Reward:  0.5499999999999999
[[ 0.38491562  0.47064728  0.52799869  0.93167698  0.93885976  0.15948679
   0.02261984  0.25760391  0.18204249  0.90130889  0.038912    0.24144448
   0.82804471  0.16896673  0.69758791  0.1335379   0.82502359]]
Epoch: 1985	Loss: 19.6562835693	Example Output: +2*	Example Reward:  -0.3
[[ 0.38420567  0.47069016  0.52847123  0.93246406  0.93963432  0.1579926
   0.02215756  0.25605953  0.18055281  0.90227485  0.03821743  0.23991708
   0.82926661  0.16748513  0.69873405  0.13206056  0.82620329]]
Epoch: 1986	Loss: 19.6276540756	Example Output: 	Example Reward:  -0.3
[[ 0.38335532  0.47073624  0.52894902  0.93330771  0.94046241  0.15640686
   0.02167138  0.2544083   0.17893274  0.90332741  0.03748368  0.23823999
   0.83056414  0.16589355  0.70002782  0.1305142   0.82748669]]
Epoch: 1987	Loss: 19.5984449387	Example Output: *3	Example Reward:  -0.3
[[ 0.38273147  0.47075573  0.52949381  0.9341045   0.9412

Epoch: 2013	Loss: 18.9509679794	Example Output: +-267*76+0	Example Reward:  0.20000000000000007
[[ 0.3638331   0.47630417  0.54555839  0.95099509  0.95796478  0.12058815
   0.01249671  0.21220243  0.1413444   0.92626339  0.02307374  0.1975989
   0.86018372  0.12956958  0.73473483  0.09582551  0.85648435]]
Epoch: 2014	Loss: 18.9310745239	Example Output: Y11XYY/	Example Reward:  -0.3
[[ 0.36315024  0.47644207  0.54600734  0.95145226  0.95840997  0.11958297
   0.01228922  0.21097484  0.14030685  0.92687696  0.022734    0.19644068
   0.86099333  0.1285397   0.73573941  0.09489766  0.85730195]]
Epoch: 2015	Loss: 18.9085668564	Example Output: 	Example Reward:  -0.3
[[ 0.36240444  0.47666132  0.54652673  0.95200962  0.95895034  0.11833878
   0.01203908  0.20945272  0.13902421  0.92763358  0.0223229   0.19497311
   0.86198157  0.12724036  0.73703527  0.09377187  0.85827112]]
Epoch: 2016	Loss: 18.8832263947	Example Output: 52X0	Example Reward:  -0.3
[[ 0.36167973  0.47685587  0.54707223  0.9525

Epoch: 2042	Loss: 18.1996793747	Example Output: 6+210	Example Reward:  -0.05000000000000002
[[ 0.33277652  0.48597676  0.57081825  0.96692663  0.97303504  0.08400283
   0.00618634  0.16336554  0.10177139  0.94799447  0.01233297  0.15193431
   0.89121175  0.09155466  0.77592415  0.06335075  0.88780439]]
Epoch: 2043	Loss: 18.1731388092	Example Output: 52271*179Y	Example Reward:  -0.3
[[ 0.33154112  0.4865801   0.5718109   0.96740127  0.97346717  0.08286593
   0.00602977  0.16164719  0.10052825  0.94864792  0.0120523   0.15044945
   0.89219952  0.0903608   0.77739441  0.06236355  0.88880545]]
Epoch: 2044	Loss: 18.1482469559	Example Output: 29*	Example Reward:  -0.3
[[ 0.33025604  0.48727152  0.57286119  0.96788108  0.97390568  0.08171489
   0.00587252  0.15991695  0.09924479  0.94931167  0.01177055  0.14891042
   0.89322633  0.08914908  0.77890575  0.06136525  0.8898381 ]]
Epoch: 2045	Loss: 18.1233983994	Example Output: +Y*+*+	Example Reward:  -0.3
[[ 0.32898557  0.48779252  0.57392168  0

Epoch: 2072	Loss: 17.4748695374	Example Output: *Y+/X0+22Y	Example Reward:  -0.3
[[ 0.2899341   0.50713164  0.60566437  0.97943032  0.98407656  0.05276572
   0.00266021  0.11388624  0.06601525  0.96584743  0.0057833   0.10665944
   0.9205541   0.05853852  0.82014126  0.03728852  0.91800487]]
Epoch: 2073	Loss: 17.4498594284	Example Output: 22+277	Example Reward:  -0.059999999999999915
[[ 0.28822601  0.50799984  0.60694927  0.97979891  0.98439264  0.05180381
   0.00257478  0.11221699  0.06486564  0.96639431  0.00561649  0.1051092
   0.92152834  0.05749992  0.82161862  0.03651417  0.91900158]]
Epoch: 2074	Loss: 17.4252487183	Example Output: 	Example Reward:  -0.3
[[ 0.28646952  0.50907052  0.60813886  0.98015243  0.98469353  0.05088393
   0.00249458  0.11063575  0.06377379  0.96692097  0.00545927  0.10360136
   0.92247373  0.05650958  0.82310104  0.03577363  0.91994929]]
Epoch: 2075	Loss: 17.4026041031	Example Output: 	Example Reward:  -0.3
[[ 0.28462029  0.51020187  0.60933703  0.9804858

Epoch: 2101	Loss: 16.8697277069	Example Output: *27170*2-Y	Example Reward:  -0.3
[[  2.35771537e-01   5.46728373e-01   6.47190452e-01   9.88141835e-01
    9.91300523e-01   2.95435470e-02   9.88155254e-04   7.16782808e-02
    3.83311547e-02   9.79107916e-01   2.37383437e-03   6.74766079e-02
    9.45387125e-01   3.35481465e-02   8.63012612e-01   1.94296837e-02
    9.43483710e-01]]
Epoch: 2102	Loss: 16.8515010834	Example Output: 	Example Reward:  -0.3
[[  2.33737737e-01   5.48037171e-01   6.48914337e-01   9.88377392e-01
    9.91489649e-01   2.89057419e-02   9.52820701e-04   7.04423264e-02
    3.75557207e-02   9.79478776e-01   2.29729526e-03   6.63248226e-02
    9.46138322e-01   3.28513905e-02   8.64425480e-01   1.89622138e-02
    9.44244444e-01]]
Epoch: 2103	Loss: 16.8339906693	Example Output: 777X0Y7220	Example Reward:  -0.3
[[  2.31676698e-01   5.49568236e-01   6.50505424e-01   9.88608241e-01
    9.91674244e-01   2.82810517e-02   9.18685342e-04   6.92072809e-02
    3.67914177e-02   9.79

Epoch: 2123	Loss: 16.5309118271	Example Output: 27	Example Reward:  -0.12
[[  1.91196442e-01   5.81133842e-01   6.82279110e-01   9.92367327e-01
    9.94628489e-01   1.80806853e-02   4.41606593e-04   4.79980595e-02
    2.42162682e-02   9.85933125e-01   1.14959560e-03   4.54170294e-02
    9.59744215e-01   2.09453702e-02   8.91200840e-01   1.12814931e-02
    9.58286583e-01]]
Epoch: 2124	Loss: 16.5164550781	Example Output: 2+2	Example Reward:  -0.03
[[  1.89217776e-01   5.82549691e-01   6.83625579e-01   9.92513716e-01
    9.94741201e-01   1.76831614e-02   4.26029932e-04   4.71254438e-02
    2.37177424e-02   9.86176193e-01   1.11306272e-03   4.46054079e-02
    9.60283041e-01   2.05030628e-02   8.92320335e-01   1.10096186e-02
    9.58855510e-01]]
Epoch: 2125	Loss: 16.5041151047	Example Output: +*22*1+122	Example Reward:  -0.3
[[  1.87379912e-01   5.83967328e-01   6.85157359e-01   9.92650092e-01
    9.94846225e-01   1.73142478e-02   4.11766785e-04   4.63084541e-02
    2.32539698e-02   9.86402

Epoch: 2146	Loss: 16.2823764801	Example Output: 	Example Reward:  -0.3
[[  1.43088624e-01   6.23548269e-01   7.28299081e-01   9.95453835e-01
    9.96957064e-01   9.94256139e-03   1.68660481e-04   2.92804781e-02
    1.38817634e-02   9.91097808e-01   4.85012046e-04   2.79938746e-02
    9.71885502e-01   1.17961159e-02   9.18098986e-01   5.85653121e-03
    9.70790565e-01]]
Epoch: 2147	Loss: 16.2740236282	Example Output: 70Y01	Example Reward:  -0.3
[[  1.41166672e-01   6.25503182e-01   7.30279565e-01   9.95557129e-01
    9.97032762e-01   9.67772678e-03   1.61545031e-04   2.86400300e-02
    1.35395154e-02   9.91275668e-01   4.66683676e-04   2.73905676e-02
    9.72329676e-01   1.14948777e-02   9.19130504e-01   5.68658672e-03
    9.71243203e-01]]
Epoch: 2148	Loss: 16.2664909363	Example Output: 022	Example Reward:  -0.3
[[  1.39175937e-01   6.27630293e-01   7.32417047e-01   9.95663941e-01
    9.97110844e-01   9.40484833e-03   1.54339097e-04   2.79728491e-02
    1.31857544e-02   9.91459370e-01  

Epoch: 2169	Loss: 16.1411157608	Example Output: 022Y7707*1	Example Reward:  -0.3
[[  1.00598857e-01   6.69781864e-01   7.75969505e-01   9.97423649e-01
    9.98368800e-01   5.03876200e-03   5.74881597e-05   1.66637581e-02
    7.40057928e-03   9.94584024e-01   1.85372381e-04   1.61379967e-02
    9.81060088e-01   6.13519549e-03   9.40204620e-01   2.79724016e-03
    9.80149686e-01]]
Epoch: 2170	Loss: 16.1371227264	Example Output: +	Example Reward:  -0.3
[[  9.88844261e-02   6.72080398e-01   7.77966857e-01   9.97489333e-01
    9.98416901e-01   4.87561896e-03   5.46419869e-05   1.62121020e-02
    7.18020601e-03   9.94712710e-01   1.76920323e-04   1.57284271e-02
    9.81398880e-01   5.94395632e-03   9.41103280e-01   2.69822450e-03
    9.80502188e-01]]
Saving Weight
Epoch: 2171	Loss: 16.1334608078	Example Output: 11710+Y07*	Example Reward:  -0.3
[[  9.72047821e-02   6.74336791e-01   7.79897571e-01   9.97550189e-01
    9.98462200e-01   4.72275354e-03   5.20423637e-05   1.57871172e-02
    6.9736

Epoch: 2191	Loss: 16.1027046204	Example Output: *+	Example Reward:  -0.3
[[  6.63217530e-02   7.27153182e-01   8.17408264e-01   9.98563588e-01
    9.99173939e-01   2.35597487e-03   1.79855942e-05   8.83074105e-03
    3.68305203e-03   9.96865571e-01   6.35419419e-05   8.90672300e-03
    9.87455726e-01   2.95259454e-03   9.57624197e-01   1.21828623e-03
    9.86734271e-01]]
Epoch: 2192	Loss: 16.1029371262	Example Output: +Y+0X70102	Example Reward:  1.0
[[  6.49991110e-02   7.29829967e-01   8.19164574e-01   9.98602331e-01
    9.99199688e-01   2.27281940e-03   1.70279309e-05   8.56926572e-03
    3.56344483e-03   9.96943891e-01   6.04317829e-05   8.65719467e-03
    9.87695217e-01   2.85247713e-03   9.58304524e-01   1.17152289e-03
    9.86981332e-01]]
Epoch: 2193	Loss: 16.1038440704	Example Output: 	Example Reward:  -0.3
[[  6.38736784e-02   7.32497454e-01   8.20909321e-01   9.98636663e-01
    9.99222279e-01   2.19969871e-03   1.62025626e-05   8.33857339e-03
    3.45806219e-03   9.97013569e-0

Epoch: 2213	Loss: 16.1408401489	Example Output: Y	Example Reward:  0.39
[[  4.08080928e-02   7.87490010e-01   8.56321812e-01   9.99241948e-01
    9.99604642e-01   1.00502127e-03   4.94984988e-06   4.32846788e-03
    1.68381922e-03   9.98260677e-01   1.94732784e-05   4.52815229e-03
    9.91993546e-01   1.30219723e-03   9.70969021e-01   4.82936506e-04
    9.91452336e-01]]
Epoch: 2214	Loss: 16.1427881241	Example Output: 2+Y11++*1Y	Example Reward:  -0.3
[[  4.00177799e-02   7.89541483e-01   8.57658267e-01   9.99260604e-01
    9.99615788e-01   9.71737667e-04   4.70494615e-06   4.20812843e-03
    1.63250149e-03   9.98299897e-01   1.85887257e-05   4.40818956e-03
    9.92131770e-01   1.26070064e-03   9.71391976e-01   4.65632329e-04
    9.91597474e-01]]
Epoch: 2215	Loss: 16.1450426102	Example Output: 117*	Example Reward:  -0.3
[[  3.90831530e-02   7.92051971e-01   8.59249175e-01   9.99282539e-01
    9.99628901e-01   9.32931958e-04   4.42489136e-06   4.06681467e-03
    1.57248252e-03   9.9834621

Epoch: 2235	Loss: 16.20481987	Example Output: Y*22*0+Y	Example Reward:  1
[[  2.42366474e-02   8.36776912e-01   8.88370514e-01   9.99602377e-01
    9.99812186e-01   4.13961214e-04   1.30947728e-06   2.05758796e-03
    7.45054916e-04   9.99037623e-01   5.75491458e-06   2.22922093e-03
    9.94904041e-01   5.55013423e-04   9.80170369e-01   1.84979886e-04
    9.94497120e-01]]
Epoch: 2236	Loss: 16.2078119278	Example Output: 0	Example Reward:  -0.10999999999999999
[[  2.35991906e-02   8.38829935e-01   8.89750123e-01   9.99614835e-01
    9.99818981e-01   3.95867566e-04   1.22500421e-06   1.98180275e-03
    7.15055561e-04   9.99065340e-01   5.41355394e-06   2.15084571e-03
    9.95016634e-01   5.31650556e-04   9.80544388e-01   1.76262620e-04
    9.94614899e-01]]
Epoch: 2237	Loss: 16.2111885071	Example Output: Y++2	Example Reward:  0.5599999999999999
[[  2.30018012e-02   8.40884864e-01   8.91120732e-01   9.99626517e-01
    9.99825299e-01   3.79181729e-04   1.14884085e-06   1.91141374e-03
    6.8

Epoch: 2257	Loss: 16.290391922	Example Output: +700*11*0+	Example Reward:  -0.3
[[  1.29107041e-02   8.81065607e-01   9.18724895e-01   9.99815881e-01
    9.99922633e-01   1.43449055e-04   2.38589337e-07   8.39440327e-04
    2.79502565e-04   9.99520421e-01   1.32460718e-06   9.48110304e-04
    9.97018576e-01   1.98922367e-04   9.87299740e-01   5.85980233e-05
    9.96727705e-01]]
Epoch: 2258	Loss: 16.2937784195	Example Output: 1Y0221+1*	Example Reward:  -0.3
[[  1.25850793e-02   8.82601261e-01   9.19788659e-01   9.99821246e-01
    9.99925137e-01   1.37521070e-04   2.24164282e-07   8.10173457e-04
    2.68859381e-04   9.99533176e-01   1.25080430e-06   9.16429388e-04
    9.97078776e-01   1.91008119e-04   9.87516522e-01   5.59925174e-05
    9.96791780e-01]]
Epoch: 2259	Loss: 16.2973796844	Example Output: 2X1101+711	Example Reward:  -0.3
[[  1.22384625e-02   8.84216607e-01   9.20952559e-01   9.99826849e-01
    9.99927878e-01   1.31333014e-04   2.09939586e-07   7.79494585e-04
    2.57735490e-0

Epoch: 2279	Loss: 16.3733264923	Example Output: +**020Y	Example Reward:  -0.3
[[  6.66466821e-03   9.15232658e-01   9.42312598e-01   9.99911904e-01
    9.99967933e-01   4.72705105e-05   5.54922934e-08   3.34223121e-04
    1.02005186e-04   9.99761522e-01   2.66286975e-07   3.91823589e-04
    9.98212218e-01   6.96019706e-05   9.91886675e-01   1.79324670e-05
    9.98026431e-01]]
Epoch: 2280	Loss: 16.3763114929	Example Output: 7070+7	Example Reward:  -0.059999999999999915
[[  6.48644380e-03   9.16392863e-01   9.43069696e-01   9.99914408e-01
    9.99969006e-01   4.52302884e-05   5.26003063e-08   3.22188513e-04
    9.79921679e-05   9.99767721e-01   2.51044924e-07   3.78216529e-04
    9.98247027e-01   6.67464337e-05   9.92024302e-01   1.71094180e-05
    9.98064220e-01]]
Saving Weight
Epoch: 2281	Loss: 16.3791070938	Example Output: Y1Y2*+0*20	Example Reward:  -0.3
[[  6.30602846e-03   9.17507410e-01   9.43829894e-01   9.99916911e-01
    9.99969959e-01   4.32151464e-05   4.98083779e-08   3.1019

Epoch: 2301	Loss: 16.4329828262	Example Output: *Y*	Example Reward:  -0.3
[[  3.35545558e-03   9.38804090e-01   9.56947565e-01   9.99954820e-01
    9.99985099e-01   1.61497883e-05   1.64852576e-08   1.35851355e-04
    3.80565871e-05   9.99871254e-01   7.71394326e-08   1.63933903e-04
    9.98878181e-01   2.47926491e-05   9.94514346e-01   5.70263592e-06
    9.98740971e-01]]
Epoch: 2302	Loss: 16.4353693008	Example Output: 0**Y*	Example Reward:  -0.3
[[  3.24994628e-03   9.39718544e-01   9.57508683e-01   9.99956131e-01
    9.99985576e-01   1.53748842e-05   1.56267266e-08   1.30332977e-04
    3.63678737e-05   9.99874711e-01   7.32285912e-08   1.57476359e-04
    9.98901486e-01   2.36402884e-05   9.94608760e-01   5.41088048e-06
    9.98765945e-01]]
Epoch: 2303	Loss: 16.4376264572	Example Output: 2	Example Reward:  -0.10999999999999999
[[  3.15760798e-03   9.40524638e-01   9.58006561e-01   9.99957323e-01
    9.99986053e-01   1.47069686e-05   1.48869423e-08   1.25542181e-04
    3.49072798e-05  

Epoch: 2324	Loss: 16.482116127	Example Output: 11*	Example Reward:  -0.3
[[  1.59671472e-03   9.56390023e-01   9.67828035e-01   9.99977231e-01
    9.99993205e-01   5.17549279e-06   4.85635931e-09   5.18473389e-05
    1.32758159e-05   9.99931216e-01   2.40724400e-08   6.44873289e-05
    9.99306798e-01   8.21406138e-06   9.96299207e-01   1.69036150e-06
    9.99203384e-01]]
Epoch: 2325	Loss: 16.483956337	Example Output: Y0*+122	Example Reward:  -0.3
[[  1.54429034e-03   9.57006931e-01   9.68242466e-01   9.99977946e-01
    9.99993443e-01   4.91795254e-06   4.59961003e-09   4.96469765e-05
    1.26623599e-05   9.99933124e-01   2.28779573e-08   6.18373087e-05
    9.99321580e-01   7.81658127e-06   9.96362746e-01   1.60066168e-06
    9.99219298e-01]]
Epoch: 2326	Loss: 16.4857345581	Example Output: 1Y1Y7+YY7*	Example Reward:  -0.3
[[  1.49649871e-03   9.57575321e-01   9.68622148e-01   9.99978542e-01
    9.99993682e-01   4.68692542e-06   4.36995906e-09   4.76582354e-05
    1.21099947e-05   9.9993

Epoch: 2346	Loss: 16.5231880188	Example Output: +020*+27Y	Example Reward:  -0.3
[[  7.22468307e-04   9.69719946e-01   9.76303339e-01   9.99989152e-01
    9.99997139e-01   1.50284973e-06   1.27561262e-09   1.80875595e-05
    4.25871804e-06   9.99965429e-01   6.92748303e-09   2.33817736e-05
    9.99592483e-01   2.49120535e-06   9.97578442e-01   3.88927162e-07
    9.99513865e-01]]
Epoch: 2347	Loss: 16.5247419357	Example Output: 00Y0Y22+Y+	Example Reward:  -0.3
[[  6.97252166e-04   9.70216691e-01   9.76621032e-01   9.99989510e-01
    9.99997258e-01   1.42114743e-06   1.20031507e-09   1.72444288e-05
    4.04610319e-06   9.99966502e-01   6.54722232e-09   2.23338884e-05
    9.99602258e-01   2.36075493e-06   9.97624457e-01   3.63182636e-07
    9.99524593e-01]]
Epoch: 2348	Loss: 16.5264011383	Example Output: Y017+7Y*10	Example Reward:  -0.3
[[  6.70049048e-04   9.70743716e-01   9.76973593e-01   9.99989867e-01
    9.99997377e-01   1.33589663e-06   1.12322762e-09   1.63571167e-05
    3.82185226e-

Epoch: 2369	Loss: 16.55832901	Example Output: 7710*Y	Example Reward:  0.44
[[  2.80553417e-04   9.79845583e-01   9.83784795e-01   9.99995589e-01
    9.99998927e-01   2.90181703e-07   2.68709638e-10   5.19362902e-06
    1.08535278e-06   9.99984503e-01   1.63524383e-09   7.11869234e-06
    9.99777377e-01   5.49575702e-07   9.98549640e-01   9.20287988e-08
    9.99728262e-01]]
Epoch: 2370	Loss: 16.5595901489	Example Output: *Y01Y+*+22	Example Reward:  -0.3
[[  2.68906297e-04   9.80164468e-01   9.84074235e-01   9.99995708e-01
    9.99999046e-01   2.71182671e-07   2.50219484e-10   4.91688797e-06
    1.01573005e-06   9.99985099e-01   1.53219559e-09   6.73841168e-06
    9.99783337e-01   5.03231320e-07   9.98580813e-01   8.68351364e-08
    9.99736130e-01]]
Saving Weight
Epoch: 2371	Loss: 16.5608148575	Example Output: +*17*+0	Example Reward:  -0.3
[[  2.57718784e-04   9.80477631e-01   9.84349549e-01   9.99995947e-01
    9.99999046e-01   2.54014793e-07   2.33369934e-10   4.65496851e-06
    9.5128

Epoch: 2391	Loss: 16.5798461914	Example Output: 7	Example Reward:  -0.10999999999999999
[[  1.16904062e-04   9.85410213e-01   9.88577008e-01   9.99997854e-01
    9.99999523e-01   8.86299247e-08   6.90876523e-11   1.63202651e-06
    2.37895435e-07   9.99992490e-01   4.79389584e-10   2.31071112e-06
    9.99870539e-01   1.38183736e-07   9.99034882e-01   3.16397895e-08
    9.99837518e-01]]
Epoch: 2392	Loss: 16.5804710388	Example Output: 7**17Y7	Example Reward:  -0.3
[[  1.12758877e-04   9.85579967e-01   9.88705337e-01   9.99997973e-01
    9.99999523e-01   8.51858033e-08   6.58409577e-11   1.55888802e-06
    2.26796075e-07   9.99992609e-01   4.59173671e-10   2.21169853e-06
    9.99872923e-01   1.32483549e-07   9.99049008e-01   3.04716501e-08
    9.99840260e-01]]
Epoch: 2393	Loss: 16.5810810089	Example Output: 11YY7127+*	Example Reward:  -0.3
[[  1.08685279e-04   9.85747159e-01   9.88828957e-01   9.99997973e-01
    9.99999642e-01   8.18937949e-08   6.27399036e-11   1.48811023e-06
    2.16407

Epoch: 2413	Loss: 16.5922136307	Example Output: 71+	Example Reward:  -0.3
[[  5.14111198e-05   9.88898456e-01   9.91038859e-01   9.99998808e-01
    9.99999762e-01   3.86273449e-08   2.40738263e-11   5.08230812e-07
    9.55538155e-08   9.99995470e-01   1.89148863e-10   8.90389174e-07
    9.99913573e-01   6.06632611e-08   9.99300957e-01   1.39670471e-08
    9.99885201e-01]]
Epoch: 2414	Loss: 16.5928611755	Example Output: 2+7	Example Reward:  -0.03
[[  4.91786886e-05   9.89077687e-01   9.91158664e-01   9.99998808e-01
    9.99999762e-01   3.70768376e-08   2.27679195e-11   4.73189544e-07
    9.17060348e-08   9.99995589e-01   1.80305756e-10   8.48633022e-07
    9.99915481e-01   5.84523363e-08   9.99312162e-01   1.33778002e-08
    9.99886990e-01]]
Epoch: 2415	Loss: 16.5934537888	Example Output: ++YY	Example Reward:  -0.3
[[  4.71322783e-05   9.89239812e-01   9.91268516e-01   9.99998927e-01
    9.99999762e-01   3.56535210e-08   2.15887776e-11   4.42535850e-07
    8.81689530e-08   9.99995708e-0

Epoch: 2435	Loss: 16.6018198013	Example Output: Y	Example Reward:  0.39
[[  2.17032539e-05   9.91565347e-01   9.92795646e-01   9.99999404e-01
    9.99999881e-01   1.73317201e-08   7.83380565e-12   1.70483503e-07
    4.32171099e-08   9.99997377e-01   6.97439537e-11   2.47928085e-07
    9.99943972e-01   2.80728738e-08   9.99506712e-01   5.90954352e-09
    9.99922276e-01]]
Epoch: 2436	Loss: 16.6020702362	Example Output: 1Y2*20*717	Example Reward:  -0.3
[[  2.10113903e-05   9.91636693e-01   9.92844284e-01   9.99999404e-01
    9.99999881e-01   1.68928782e-08   7.55923189e-12   1.64942918e-07
    4.21392379e-08   9.99997377e-01   6.75753412e-11   2.38789426e-07
    9.99944687e-01   2.73764211e-08   9.99512196e-01   5.75039572e-09
    9.99923229e-01]]
Epoch: 2437	Loss: 16.6023132324	Example Output: 2Y	Example Reward:  -0.3
[[  2.02813590e-05   9.91703629e-01   9.92890954e-01   9.99999404e-01
    9.99999881e-01   1.64615361e-08   7.29277923e-12   1.59610394e-07
    4.10837089e-08   9.99997497e

Epoch: 2457	Loss: 16.6062093735	Example Output: 772*17+Y*	Example Reward:  -0.3
[[  1.04865312e-05   9.92704272e-01   9.93694365e-01   9.99999523e-01
    9.99999881e-01   1.05874554e-08   4.00463603e-12   9.27971229e-08
    2.64318505e-08   9.99998093e-01   3.86269176e-11   1.27903192e-07
    9.99956608e-01   1.69219323e-08   9.99599278e-01   3.54508867e-09
    9.99939203e-01]]
Epoch: 2458	Loss: 16.6063617706	Example Output: 11*Y2+Y	Example Reward:  -0.3
[[  1.01174592e-05   9.92743373e-01   9.93726730e-01   9.99999523e-01
    9.99999881e-01   1.03733919e-08   3.89565203e-12   9.05951154e-08
    2.59108255e-08   9.99998093e-01   3.77061507e-11   1.24780627e-07
    9.99957085e-01   1.65632326e-08   9.99602735e-01   3.47203444e-09
    9.99939919e-01]]
Epoch: 2459	Loss: 16.6065139771	Example Output: +0Y77+2077	Example Reward:  -0.3
[[  9.76192496e-06   9.92781341e-01   9.93758321e-01   9.99999523e-01
    9.99999881e-01   1.01653237e-08   3.79053689e-12   8.84688021e-08
    2.54051074e-08 

Epoch: 2480	Loss: 16.6091827393	Example Output: 	Example Reward:  -0.3
[[  4.88833530e-06   9.93441463e-01   9.94322300e-01   9.99999642e-01
    1.00000000e+00   6.93400048e-09   2.26583466e-12   5.69615572e-08
    1.75546262e-08   9.99998569e-01   2.34909644e-11   7.81044207e-08
    9.99964833e-01   1.08352225e-08   9.99666095e-01   2.30896813e-09
    9.99950886e-01]]
Saving Weight
Epoch: 2481	Loss: 16.6092878342	Example Output: +Y2Y027+*2	Example Reward:  -0.3
[[  4.72317197e-06   9.93469357e-01   9.94345725e-01   9.99999642e-01
    1.00000000e+00   6.81277523e-09   2.21281912e-12   5.58555620e-08
    1.72636554e-08   9.99998569e-01   2.30117089e-11   7.66198980e-08
    9.99965072e-01   1.06340039e-08   9.99668598e-01   2.26842833e-09
    9.99951363e-01]]
Epoch: 2482	Loss: 16.6094045639	Example Output: +122+	Example Reward:  -0.3
[[  4.56882753e-06   9.93496537e-01   9.94369328e-01   9.99999642e-01
    1.00000000e+00   6.69630129e-09   2.16220661e-12   5.47923591e-08
    1.69831100e-

Epoch: 2502	Loss: 16.6113769531	Example Output: *	Example Reward:  -0.3
[[  2.34623553e-06   9.93972957e-01   9.94796813e-01   9.99999762e-01
    1.00000000e+00   4.79309348e-09   1.38161780e-12   3.80814669e-08
    1.24091937e-08   9.99998927e-01   1.52710292e-11   5.29445430e-08
    9.99970555e-01   7.30965422e-09   9.99716341e-01   1.59605384e-09
    9.99959230e-01]]
Epoch: 2503	Loss: 16.6114711761	Example Output: Y*	Example Reward:  -0.3
[[  2.26277007e-06   9.93995607e-01   9.94817436e-01   9.99999762e-01
    1.00000000e+00   4.71138240e-09   1.35019209e-12   3.73993672e-08
    1.22144304e-08   9.99998927e-01   1.49685212e-11   5.20549648e-08
    9.99970794e-01   7.17605664e-09   9.99718606e-01   1.56904822e-09
    9.99959588e-01]]
Epoch: 2504	Loss: 16.6115732193	Example Output: 1	Example Reward:  -0.10999999999999999
[[  2.18838636e-06   9.94017124e-01   9.94837940e-01   9.99999762e-01
    1.00000000e+00   4.63524330e-09   1.32109016e-12   3.67584931e-08
    1.20314407e-08   9.99

Epoch: 2524	Loss: 16.613293457	Example Output: *7177207Y7	Example Reward:  -0.3
[[  1.09235475e-06   9.94421422e-01   9.95225906e-01   9.99999762e-01
    1.00000000e+00   3.34701244e-09   8.52008676e-13   2.61152415e-08
    8.91580410e-09   9.99999046e-01   1.00407105e-11   3.74057123e-08
    9.99975085e-01   4.96900299e-09   9.99758780e-01   1.11376408e-09
    9.99966025e-01]]
Epoch: 2525	Loss: 16.6134096146	Example Output: +++*Y+*Y17	Example Reward:  -0.3
[[  1.05392212e-06   9.94448304e-01   9.95249033e-01   9.99999762e-01
    1.00000000e+00   3.29748562e-09   8.33879949e-13   2.56653347e-08
    8.78851658e-09   9.99999166e-01   9.86214322e-12   3.68856838e-08
    9.99975324e-01   4.88844965e-09   9.99760330e-01   1.09545573e-09
    9.99966264e-01]]
Epoch: 2526	Loss: 16.6135046005	Example Output: 0Y2Y**	Example Reward:  -0.3
[[  1.01764010e-06   9.94476616e-01   9.95272100e-01   9.99999762e-01
    1.00000000e+00   3.24942295e-09   8.16424998e-13   2.52301096e-08
    8.66481464e-09  

Epoch: 2546	Loss: 16.6162309647	Example Output: +*	Example Reward:  -0.3
[[  3.25695197e-07   9.95118380e-01   9.95884478e-01   9.99999881e-01
    1.00000000e+00   2.06782813e-09   4.27709002e-13   1.56249964e-08
    5.73197712e-09   9.99999285e-01   5.62019094e-12   2.52643453e-08
    9.99980688e-01   2.92186164e-09   9.99805510e-01   6.59890920e-10
    9.99973178e-01]]
Epoch: 2547	Loss: 16.6163286209	Example Output: Y++0++Y+	Example Reward:  -0.3
[[  3.11132226e-07   9.95142817e-01   9.95908499e-01   9.99999881e-01
    1.00000000e+00   2.02761985e-09   4.16031006e-13   1.53121764e-08
    5.63031710e-09   9.99999404e-01   5.48876396e-12   2.48563445e-08
    9.99980927e-01   2.85990409e-09   9.99807179e-01   6.46232012e-10
    9.99973416e-01]]
Epoch: 2548	Loss: 16.6164352417	Example Output: *Y	Example Reward:  -0.3
[[  2.97777660e-07   9.95166659e-01   9.95932162e-01   9.99999881e-01
    1.00000000e+00   1.98950234e-09   4.05058772e-13   1.50155550e-08
    5.53361534e-09   9.99999404e-

Epoch: 2569	Loss: 16.6179838181	Example Output: 7Y1+712770	Example Reward:  -0.3
[[  1.52780927e-07   9.95527446e-01   9.96274710e-01   9.99999881e-01
    1.00000000e+00   1.46670676e-09   2.64326890e-13   1.09352527e-08
    4.17350376e-09   9.99999523e-01   3.71634928e-12   1.86705922e-08
    9.99983788e-01   2.01376804e-09   9.99833465e-01   4.58352023e-10
    9.99977350e-01]]
Epoch: 2570	Loss: 16.6180368423	Example Output: 07111*	Example Reward:  -0.3
[[  1.49115010e-07   9.95539486e-01   9.96286988e-01   9.99999881e-01
    1.00000000e+00   1.44973811e-09   2.60074568e-13   1.08023510e-08
    4.12823420e-09   9.99999523e-01   3.66469008e-12   1.84683913e-08
    9.99983907e-01   1.98870564e-09   9.99834299e-01   4.52746007e-10
    9.99977589e-01]]
Saving Weight
Epoch: 2571	Loss: 16.618091774	Example Output: **22+01	Example Reward:  -0.3
[[  1.45600907e-07   9.95552242e-01   9.96299446e-01   9.99999881e-01
    1.00000000e+00   1.43321166e-09   2.55954600e-13   1.06728750e-08
    4.084

Epoch: 2591	Loss: 16.6190258026	Example Output: YY1	Example Reward:  -0.3
[[  9.69986118e-08   9.95777011e-01   9.96502042e-01   9.99999881e-01
    1.00000000e+00   1.17265508e-09   1.93722019e-13   8.62940386e-09
    3.37753825e-09   9.99999523e-01   2.84006976e-12   1.50416106e-08
    9.99985576e-01   1.58399271e-09   9.99849319e-01   3.61936814e-10
    9.99979734e-01]]
Epoch: 2592	Loss: 16.6190736771	Example Output: 7000*7YYY*	Example Reward:  -0.3
[[  9.53086357e-08   9.95789826e-01   9.96511638e-01   9.99999881e-01
    1.00000000e+00   1.16224519e-09   1.91346423e-13   8.54764526e-09
    3.34891515e-09   9.99999523e-01   2.80983158e-12   1.49081956e-08
    9.99985576e-01   1.56898838e-09   9.99849916e-01   3.58550745e-10
    9.99979854e-01]]
Epoch: 2593	Loss: 16.6191225052	Example Output: 	Example Reward:  -0.3
[[  9.36666780e-08   9.95802343e-01   9.96520996e-01   9.99999881e-01
    1.00000000e+00   1.15201770e-09   1.89022328e-13   8.46740367e-09
    3.32079475e-09   9.99999523e

Epoch: 2614	Loss: 16.6199008942	Example Output: 	Example Reward:  -0.3
[[  6.75994158e-08   9.95999694e-01   9.96683419e-01   9.99999881e-01
    1.00000000e+00   9.72947944e-10   1.49707043e-13   7.06166325e-09
    2.82264145e-09   9.99999642e-01   2.27048090e-12   1.24268151e-08
    9.99986887e-01   1.29801325e-09   9.99861360e-01   2.97376013e-10
    9.99981523e-01]]
Epoch: 2615	Loss: 16.6199390411	Example Output: +27201*222	Example Reward:  5.55111512313e-17
[[  6.66589841e-08   9.96006668e-01   9.96689558e-01   9.99999881e-01
    1.00000000e+00   9.65789004e-10   1.48190271e-13   7.00546687e-09
    2.80250312e-09   9.99999642e-01   2.25047997e-12   1.23308848e-08
    9.99986887e-01   1.28784083e-09   9.99861717e-01   2.95075880e-10
    9.99981642e-01]]
Epoch: 2616	Loss: 16.6199689865	Example Output: 	Example Reward:  -0.3
[[  6.57394139e-08   9.96012926e-01   9.96695518e-01   9.99999881e-01
    1.00000000e+00   9.58737534e-10   1.46701160e-13   6.95011426e-09
    2.78263568e-09   9

Epoch: 2636	Loss: 16.6205106735	Example Output: 02*21Y012Y	Example Reward:  -0.3
[[  5.08425231e-08   9.96149659e-01   9.96813953e-01   9.99999881e-01
    1.00000000e+00   8.35449376e-10   1.21416955e-13   5.98346972e-09
    2.43309750e-09   9.99999642e-01   1.89207114e-12   1.05613163e-08
    9.99987841e-01   1.10381382e-09   9.99870420e-01   2.53412485e-10
    9.99982834e-01]]
Epoch: 2637	Loss: 16.6205354691	Example Output: 0*1*Y2007*	Example Reward:  -0.3
[[  5.02389774e-08   9.96156752e-01   9.96819019e-01   9.99999881e-01
    1.00000000e+00   8.30041036e-10   1.20341183e-13   5.94118843e-09
    2.41766496e-09   9.99999642e-01   1.87746498e-12   1.04871258e-08
    9.99987841e-01   1.09624587e-09   9.99870777e-01   2.51695192e-10
    9.99982953e-01]]
Epoch: 2638	Loss: 16.6205598831	Example Output: 1Y1	Example Reward:  -0.3
[[  4.96466654e-08   9.96162415e-01   9.96822357e-01   9.99999881e-01
    1.00000000e+00   8.24715018e-10   1.19282676e-13   5.89947557e-09
    2.40243581e-09   9

KeyboardInterrupt: 