ray/rllib/tests/data/cartpole/large.json

21 lines
1.2 MiB

{"type": "SampleBatch", "eps_id": [199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 199910694, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1662335932, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1930047199, 1127856969, 1127856969, 1127856969, 1127856969, 1127856969, 1127856969, 1127856969, 1127856969, 1127856969, 1127856969, 836223419, 836223419, 836223419, 836223419, 836223419, 836223419, 836223419, 836223419, 836223419, 836223419, 836223419, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 659841359, 151725540, 151725540, 151725540, 151725540, 151725540, 151725540, 151725540, 151725540, 151725540, 151725540, 151725540, 151725540, 1157656163, 1157656163, 1157656163, 1157656163, 1157656163, 1157656163, 1157656163, 1157656163, 1157656163, 1157656163, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 190681968, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1049471566, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 1333369052, 726689153, 726689153, 726689153, 726689153, 726689153, 726689153, 726689153, 726689153, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470, 224279470], "obs": [[-0.0232973862439394, 0.03324240818619728, 0.01929166354238987, -0.049009691923856735], [-0.0226325374096632, -0.1621507853269577, 0.01831146888434887, 0.24969695508480072], [-0.025875553488731384, 0.032704953104257584, 0.023305408656597137, -0.03715437278151512], [-0.025221453979611397, -0.16274331510066986, 0.02256232127547264, 0.2627895772457123], [-0.028476320207118988, -0.3581799268722534, 0.027818111702799797, 0.5625026822090149], [-0.035639919340610504, -0.1634591668844223, 0.03906816616654396, 0.2787119746208191], [-0.038909103721380234, 0.031084304675459862, 0.04464240372180939, -0.0013974315952509642], [-0.038287416100502014, 0.22553853690624237, 0.044614456593990326, -0.2796676456928253], [-0.03377664461731911, 0.41999658942222595, 0.03902110457420349, -0.5579522252082825], [-0.025376712903380394, 0.2243492305278778, 0.027862058952450752, -0.25323525071144104], [-0.020889729261398315, 0.4190624952316284, 0.0227973535656929, -0.5370014309883118], [-0.012508478946983814, 0.6138566136360168, 0.012057325802743435, -0.8224148154258728], [-0.00023134703224059194, 0.418571799993515, -0.004390971269458532, -0.5259641408920288], [0.008140088990330696, 0.22351190447807312, -0.014910253696143627, -0.2346680462360382], [0.012610326521098614, 0.028606122359633446, -0.019603613764047623, 0.053274668753147125], [0.013182449154555798, -0.16622933745384216, -0.01853812113404274, 0.3397085964679718], [0.009857862256467342, -0.36108267307281494, -0.011743948794901371, 0.6264885067939758], [0.002636209363117814, -0.5560387372970581, 0.0007858205353841186, 0.9154497981071472], [-0.008484565652906895, -0.7511712908744812, 0.019094815477728844, 1.2083796262741089], [-0.023507991805672646, -0.9465346336364746, 0.043262407183647156, 1.5069847106933594], [-0.04243868589401245, -0.7519631385803223, 0.07340209931135178, 1.2281156778335571], [-0.05747794732451439, -0.5578585863113403, 0.09796441346406937, 0.9593037366867065], [-0.06863512098789215, -0.36418038606643677, 0.11715049296617508, 0.6989348530769348], [-0.07591872662305832, -0.5607149600982666, 0.131129190325737, 1.026079535484314], [-0.087133027613163, -0.7573157548904419, 0.1516507863998413, 1.3568905591964722], [-0.10227934271097183, -0.9539796113967896, 0.17878858745098114, 1.692915439605713], [-0.04606005176901817, -0.0012466305634006858, 0.0029205239843577147, -0.017267948016524315], [-0.04608498141169548, -0.19641034305095673, 0.002575164893642068, 0.2763350009918213], [-0.050013188272714615, -0.0013252266217023134, 0.008101864717900753, -0.015534601174294949], [-0.05003969371318817, -0.19656242430210114, 0.007791173178702593, 0.27969351410865784], [-0.05397094413638115, -0.0015524782938882709, 0.013385043479502201, -0.010521952994167805], [-0.05400199070572853, -0.1968638002872467, 0.013174604624509811, 0.2863538861274719], [-0.05793926864862442, -0.0019321977160871029, 0.018901681527495384, -0.0021449350751936436], [-0.057977911084890366, 0.19291365146636963, 0.018858782947063446, -0.2888047397136688], [-0.05411963909864426, 0.387761652469635, 0.013082688674330711, -0.5754806399345398], [-0.04636440798640251, 0.5826978087425232, 0.001573075889609754, -0.8640136122703552], [-0.03471045196056366, 0.38755446672439575, -0.015707196667790413, -0.5708364844322205], [-0.026959361508488655, 0.5828931331634521, -0.02712392620742321, -0.8684260845184326], [-0.015301498584449291, 0.7783734202384949, -0.0444924458861351, -1.1695120334625244], [0.000265969691099599, 0.974044919013977, -0.06788268685340881, -1.475805401802063], [0.019746867939829826, 1.1699273586273193, -0.0973987951874733, -1.7888944149017334], [0.04314541444182396, 0.9760239720344543, -0.13317668437957764, -1.528007984161377], [0.0626658946275711, 1.1724774837493896, -0.16373685002326965, -1.8591171503067017], [0.08611544221639633, 1.368974208831787, -0.20091918110847473, -2.1978437900543213], [0.01938316412270069, -0.034108467400074005, -0.014867947436869144, -0.04402117803692818], [0.018700994551181793, 0.16122350096702576, -0.015748370438814163, -0.3413577377796173], [0.021925466135144234, -0.03367089480161667, -0.02257552556693554, -0.053682249039411545], [0.021252047270536423, 0.1617673635482788, -0.023649170994758606, -0.3534015715122223], [0.024487394839525223, 0.3572174608707428, -0.03071720153093338, -0.6534469723701477], [0.031631745398044586, 0.1625364124774933, -0.04378614202141762, -0.37059256434440613], [0.03488247096538544, 0.35825222730636597, -0.051197994500398636, -0.6767539381980896], [0.042047515511512756, 0.5540467500686646, -0.06473307311534882, -0.9851065278053284], [0.053128451108932495, 0.3598487973213196, -0.08443520218133926, -0.7134379148483276], [0.06032542884349823, 0.16599103808403015, -0.09870395809412003, -0.4484816789627075], [0.06364525109529495, -0.027606314048171043, -0.10767359286546707, -0.1884709745645523], [0.06309312582015991, -0.22103624045848846, -0.11144301295280457, 0.06839873641729355], [0.05867239832878113, -0.02450760081410408, -0.11007504165172577, -0.2572619915008545], [0.0581822469830513, -0.21789996325969696, -0.11522027850151062, -0.001225856482051313], [0.05382424592971802, -0.021330274641513824, -0.1152447983622551, -0.3279252052307129], [0.05339764058589935, 0.17522762715816498, -0.12180329859256744, -0.6546133160591125], [0.056902192533016205, 0.3718160390853882, -0.13489556312561035, -0.9830328822135925], [0.06433851271867752, 0.5684621930122375, -0.15455622971057892, -1.314861536026001], [0.07570775598287582, 0.7651647925376892, -0.1808534562587738, -1.651657223701477], [-0.04752064496278763, -0.02107728272676468, 0.02262268401682377, -0.03299928829073906], [-0.04794218763709068, -0.21651622653007507, 0.02196269854903221, 0.26673460006713867], [-0.05227251350879669, -0.4119446277618408, 0.02729739062488079, 0.5662630200386047], [-0.060511406511068344, -0.6074386835098267, 0.0386226512491703, 0.8674193024635315], [-0.0726601779460907, -0.8030642867088318, 0.05597103759646416, 1.1719911098480225], [-0.08872146904468536, -0.9988674521446228, 0.0794108584523201, 1.4816828966140747], [-0.10869881510734558, -0.8047990798950195, 0.10904451459646225, 1.2148199081420898], [-0.12479479610919952, -0.6112396717071533, 0.13334091007709503, 0.9582008123397827], [-0.1370195895433426, -0.8078779578208923, 0.15250493586063385, 1.289626121520996], [-0.1531771421432495, -1.0045746564865112, 0.17829746007919312, 1.625909686088562], [-0.033046234399080276, -0.026037782430648804, 0.01944105513393879, 0.028076769784092903], [-0.03356698900461197, -0.22143305838108063, 0.020002590492367744, 0.32682961225509644], [-0.03799565136432648, -0.02660151571035385, 0.026539182290434837, 0.04052112624049187], [-0.038527682423591614, -0.22209379076957703, 0.027349604293704033, 0.34145787358283997], [-0.042969558387994766, -0.41759395599365234, 0.03417876362800598, 0.6426382660865784], [-0.05132143571972847, -0.6131752133369446, 0.047031525522470474, 0.945885419845581], [-0.06358493864536285, -0.8088979721069336, 0.06594923883676529, 1.252967119216919], [-0.07976289838552475, -1.0047998428344727, 0.09100857377052307, 1.5655560493469238], [-0.09985889494419098, -1.2008839845657349, 0.12231969833374023, 1.885184645652771], [-0.12387657910585403, -1.3971059322357178, 0.16002339124679565, 2.213190793991089], [-0.15181869268417358, -1.593357801437378, 0.20428720116615295, 2.5506539344787598], [0.009257699362933636, 0.04725342243909836, 0.04538232460618019, 0.03693678602576256], [0.010202767327427864, 0.24169619381427765, 0.046121060848236084, -0.24108925461769104], [0.015036690980196, 0.04594679921865463, 0.04129927605390549, 0.06577739119529724], [0.015955626964569092, -0.14974218606948853, 0.04261482134461403, 0.3711991012096405], [0.012960783205926418, -0.34544283151626587, 0.05003880336880684, 0.6770085692405701], [0.006051926873624325, -0.15105053782463074, 0.06357897818088531, 0.40049034357070923], [0.003030915977433324, 0.043114639818668365, 0.07158878445625305, 0.12851065397262573], [0.0038932086899876595, 0.2371419221162796, 0.07415899634361267, -0.14075566828250885], [0.008636047132313251, 0.43112772703170776, 0.07134388387203217, -0.4091518521308899], [0.017258601263165474, 0.6251694560050964, 0.06316084414720535, -0.6785167455673218], [0.029761990532279015, 0.42922958731651306, 0.04959050938487053, -0.3666359782218933], [0.038346581161022186, 0.23343929648399353, 0.04225778952240944, -0.05873797833919525], [0.04301536828279495, 0.42793068289756775, 0.04108303040266037, -0.3377945125102997], [0.0515739805996418, 0.232248917222023, 0.03432714194059372, -0.032444536685943604], [0.056218959391117096, 0.4268622100353241, 0.03367825224995613, -0.31410232186317444], [0.06475620716810226, 0.621488630771637, 0.027396203950047493, -0.5959768295288086], [0.0771859809756279, 0.8162167072296143, 0.015476667322218418, -0.8799058198928833], [0.09351031482219696, 0.6208879351615906, -0.0021214494481682777, -0.5823978185653687], [0.10592807084321976, 0.816039502620697, -0.013769405893981457, -0.8757482767105103], [0.12224885821342468, 1.0113458633422852, -0.03128437325358391, -1.172728180885315], [0.14247578382492065, 0.8166443109512329, -0.054738935083150864, -0.8900147676467896], [0.1588086634874344, 0.6223061084747314, -0.07253923267126083, -0.6150293350219727], [0.17125478386878967, 0.4282686710357666, -0.08483981341123581, -0.3460463881492615], [0.17982016503810883, 0.23444955050945282, -0.09176074713468552, -0.08127638697624207], [0.18450915813446045, 0.040754612535238266, -0.09338627010583878, 0.1811038702726364], [0.18532423675060272, 0.2370801866054535, -0.08976419270038605, -0.13951699435710907], [0.19006584584712982, 0.04335089027881622, -0.09255453199148178, 0.12355174869298935], [0.19093286991119385, 0.2396685630083084, -0.09008350223302841, -0.19683656096458435], [0.19572623074054718, 0.04594288393855095, -0.09402023255825043, 0.06612493842840195], [0.1966450959444046, 0.24227827787399292, -0.09269773215055466, -0.2546786665916443], [0.20149065554141998, 0.4385930895805359, -0.09779130667448044, -0.5751007795333862], [0.21026252210140228, 0.6349401473999023, -0.10929331928491592, -0.8969190120697021], [0.22296132147312164, 0.8313604593276978, -0.12723170220851898, -1.2218598127365112], [0.23958852887153625, 0.6380864381790161, -0.15166890621185303, -0.9715974926948547], [0.2523502707481384, 0.8348824977874756, -0.17110085487365723, -1.3078227043151855], [0.26904791593551636, 1.03170907497406, -0.19725731015205383, -1.6488099098205566], [-0.037853602319955826, -0.026145925745368004, -0.013264045119285583, -0.030621331185102463], [-0.038376521319150925, -0.221075177192688, -0.013876471668481827, 0.25784730911254883], [-0.04279802367091179, -0.025757893919944763, -0.00871952623128891, -0.0391799621284008], [-0.04331318289041519, -0.2207537293434143, -0.009503125213086605, 0.2507391571998596], [-0.04772825539112091, -0.41573870182037354, -0.004488341975957155, 0.540409505367279], [-0.05604303255677223, -0.6107972860336304, 0.006319848820567131, 0.8316748738288879], [-0.06825897842645645, -0.8060050010681152, 0.022953346371650696, 1.1263387203216553], [-0.08437907695770264, -1.0014201402664185, 0.04548012092709541, 1.4261317253112793], [-0.10440748184919357, -1.1970735788345337, 0.07400275766849518, 1.7326750755310059], [-0.1283489465713501, -1.0028702020645142, 0.10865625739097595, 1.4639042615890503], [-0.14840635657310486, -1.199142575263977, 0.1379343420267105, 1.7884587049484253], [-0.1723892092704773, -1.3955169916152954, 0.17370352149009705, 2.1206469535827637], [0.0035095978528261185, -0.03964754939079285, 0.019583238288760185, -0.005700720939785242], [0.002716646995395422, -0.23504479229450226, 0.01946922391653061, 0.29309606552124023], [-0.0019842488691210747, -0.4304388463497162, 0.025331145152449608, 0.5918551683425903], [-0.01059302594512701, -0.6259061098098755, 0.03716824948787689, 0.892408549785614], [-0.023111147806048393, -0.82151198387146, 0.0550164170563221, 1.1965396404266357], [-0.03954138606786728, -1.0173012018203735, 0.07894720882177353, 1.5059458017349243], [-0.05988741293549538, -0.8232206106185913, 0.10906612873077393, 1.2389180660247803], [-0.0763518214225769, -1.0195611715316772, 0.1338444948196411, 1.56368088722229], [-0.09674304723739624, -0.8262693881988525, 0.16511811316013336, 1.315569281578064], [-0.11326843500137329, -1.02305006980896, 0.1914294958114624, 1.6550500392913818], [-0.022257449105381966, 0.03445248678326607, 0.04831656813621521, 0.03162458539009094], [-0.02156839892268181, 0.22884945571422577, 0.04894905909895897, -0.24543102085590363], [-0.01699141040444374, 0.033063795417547226, 0.044040437787771225, 0.062280986458063126], [-0.016330134123563766, -0.16266101598739624, 0.04528605937957764, 0.36852723360061646], [-0.019583353772759438, -0.3583962023258209, 0.05265660211443901, 0.675138533115387], [-0.026751277968287468, -0.16404402256011963, 0.06615937501192093, 0.399488240480423], [-0.03003215789794922, -0.3600390553474426, 0.07414913922548294, 0.7122742533683777], [-0.03723293915390968, -0.16601786017417908, 0.08839462697505951, 0.44382205605506897], [-0.040553297847509384, -0.3622720539569855, 0.09727106243371964, 0.763008177280426], [-0.04779873788356781, -0.16861480474472046, 0.11253122985363007, 0.5024480819702148], [-0.05117103457450867, -0.3651280701160431, 0.12258019298315048, 0.8283679485321045], [-0.05847359448671341, -0.17187608778476715, 0.13914754986763, 0.5766134858131409], [-0.061911117285490036, 0.0210493765771389, 0.1506798267364502, 0.3307998776435852], [-0.06149012967944145, 0.2137412428855896, 0.157295823097229, 0.08916951715946198], [-0.05721530318260193, 0.4062998294830322, 0.15907920897006989, -0.15004803240299225], [-0.04908930882811546, 0.2092999517917633, 0.1560782492160797, 0.1882929801940918], [-0.044903308153152466, 0.4018845558166504, 0.15984411537647247, -0.05137157067656517], [-0.03686561807990074, 0.2048746645450592, 0.15881668031215668, 0.28717041015625], [-0.0327681228518486, 0.00788638461381197, 0.16456007957458496, 0.6254302859306335], [-0.032610394060611725, -0.1891038864850998, 0.17706869542598724, 0.9650864005088806], [-0.03639247268438339, 0.003254740033298731, 0.1963704228401184, 0.7328465580940247], [-0.03470996022224426, 0.04528489708900452, 0.015921862795948982, 0.002742467215284705], [-0.033804260194301605, -0.1500617414712906, 0.015976712107658386, 0.3004060983657837], [-0.036805495619773865, 0.04482889175415039, 0.021984834223985672, 0.01280442625284195], [-0.03590891882777214, 0.23962876200675964, 0.02224092371761799, -0.2728617489337921], [-0.031116342172026634, 0.04419663920998573, 0.016783688217401505, 0.026752227917313576], [-0.03023240901529789, 0.23907393217086792, 0.017318733036518097, -0.2605883479118347], [-0.02545093186199665, 0.04370908439159393, 0.01210696529597044, 0.037506408989429474], [-0.02457674965262413, -0.15158437192440033, 0.01285709347575903, 0.33398449420928955], [-0.027608437463641167, -0.34688693284988403, 0.019536782056093216, 0.6306939721107483], [-0.034546174108982086, -0.5422759652137756, 0.03215066343545914, 0.9294650554656982], [-0.04539169371128082, -0.7378168106079102, 0.05073996260762215, 1.2320754528045654], [-0.060148030519485474, -0.9335532188415527, 0.07538147270679474, 1.5402133464813232], [-0.07881909608840942, -0.7394145131111145, 0.10618574172258377, 1.2719734907150269], [-0.09360738843679428, -0.9357193112373352, 0.1316252052783966, 1.5959320068359375], [-0.11232177168130875, -0.7423808574676514, 0.16354385018348694, 1.3470191955566406], [-0.1271693855524063, -0.939136803150177, 0.19048422574996948, 1.6860828399658203], [0.035648275166749954, 0.019629720598459244, -0.041184622794389725, -0.01570443995296955], [0.03604086861014366, -0.17487813532352448, -0.041498709470033646, 0.2637050747871399], [0.032543305307626724, -0.36938393115997314, -0.0362246073782444, 0.5430154800415039], [0.025155628100037575, -0.5639785528182983, -0.02536430023610592, 0.8240682482719421], [0.013876056298613548, -0.7587445378303528, -0.008882935158908367, 1.1086668968200684], [-0.0012988351518288255, -0.9537486433982849, 0.01329040341079235, 1.3985499143600464], [-0.020373808220028877, -1.1490333080291748, 0.04126140475273132, 1.6953582763671875], [-0.043354474008083344, -1.3446062803268433, 0.07516857236623764, 2.0005955696105957], [-0.07024659961462021, -1.1503452062606812, 0.11518047749996185, 1.7321056127548218], [-0.09325350821018219, -0.9567113518714905, 0.14982259273529053, 1.4773674011230469], [-0.11238773167133331, -0.7637028694152832, 0.1793699413537979, 1.2349811792373657], [-0.127661794424057, -0.5712811946868896, 0.2040695697069168, 1.0034319162368774], [-0.036039337515830994, -0.03723224997520447, -0.04315886273980141, 0.02597273513674736], [-0.03678398206830025, 0.15848121047019958, -0.04263940826058388, -0.28000885248184204], [-0.03361435607075691, 0.35418465733528137, -0.048239585012197495, -0.5858293771743774], [-0.026530664414167404, 0.5499479174613953, -0.05995617434382439, -0.8933095932006836], [-0.015531706623733044, 0.7458295226097107, -0.07782236486673355, -1.2042206525802612], [-0.0006151155102998018, 0.941866397857666, -0.10190677642822266, -1.5202425718307495], [0.01822221279144287, 1.138061761856079, -0.1323116272687912, -1.8429176807403564], [0.040983449667692184, 1.3343720436096191, -0.16916997730731964, -2.173595666885376], [0.022204197943210602, 0.025709448382258415, 0.024002883583307266, 0.0008003154653124511], [0.022718386724591255, -0.16974836587905884, 0.024018889293074608, 0.3009587526321411], [0.01932341977953911, -0.3652042746543884, 0.03003806434571743, 0.6011189222335815], [0.012019334360957146, -0.5607332587242126, 0.04206044226884842, 0.9031099677085876], [0.0008046688162721694, -0.36620551347732544, 0.060122642666101456, 0.6239385604858398], [-0.006519441492855549, -0.17197223007678986, 0.07260141521692276, 0.3507804274559021], [-0.009958886541426182, 0.022046171128749847, 0.07961702346801758, 0.08184555917978287], [-0.009517963044345379, -0.17412146925926208, 0.08125393092632294, 0.39854758977890015], [-0.013000392355024815, -0.370296448469162, 0.08922488242387772, 0.7157015800476074], [-0.020406322553753853, -0.5665327310562134, 0.10353891551494598, 1.0350823402404785], [-0.03173697739839554, -0.7628675103187561, 0.12424056231975555, 1.3583934307098389], [-0.046994324773550034, -0.5695032477378845, 0.15140843391418457, 1.107015609741211], [-0.05838438868522644, -0.7662557363510132, 0.17354874312877655, 1.4431121349334717], [-0.07370950281620026, -0.9630367755889893, 0.2024109810590744, 1.7846171855926514]], "actions": [0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.0226325374096632, -0.1621507853269577, 0.01831146888434887, 0.24969695508480072], [-0.025875553488731384, 0.032704953104257584, 0.023305408656597137, -0.03715437278151512], [-0.025221453979611397, -0.16274331510066986, 0.02256232127547264, 0.2627895772457123], [-0.028476320207118988, -0.3581799268722534, 0.027818111702799797, 0.5625026822090149], [-0.035639919340610504, -0.1634591668844223, 0.03906816616654396, 0.2787119746208191], [-0.038909103721380234, 0.031084304675459862, 0.04464240372180939, -0.0013974315952509642], [-0.038287416100502014, 0.22553853690624237, 0.044614456593990326, -0.2796676456928253], [-0.03377664461731911, 0.41999658942222595, 0.03902110457420349, -0.5579522252082825], [-0.025376712903380394, 0.2243492305278778, 0.027862058952450752, -0.25323525071144104], [-0.020889729261398315, 0.4190624952316284, 0.0227973535656929, -0.5370014309883118], [-0.012508478946983814, 0.6138566136360168, 0.012057325802743435, -0.8224148154258728], [-0.00023134703224059194, 0.418571799993515, -0.004390971269458532, -0.5259641408920288], [0.008140088990330696, 0.22351190447807312, -0.014910253696143627, -0.2346680462360382], [0.012610326521098614, 0.028606122359633446, -0.019603613764047623, 0.053274668753147125], [0.013182449154555798, -0.16622933745384216, -0.01853812113404274, 0.3397085964679718], [0.009857862256467342, -0.36108267307281494, -0.011743948794901371, 0.6264885067939758], [0.002636209363117814, -0.5560387372970581, 0.0007858205353841186, 0.9154497981071472], [-0.008484565652906895, -0.7511712908744812, 0.019094815477728844, 1.2083796262741089], [-0.023507991805672646, -0.9465346336364746, 0.043262407183647156, 1.5069847106933594], [-0.04243868589401245, -0.7519631385803223, 0.07340209931135178, 1.2281156778335571], [-0.05747794732451439, -0.5578585863113403, 0.09796441346406937, 0.9593037366867065], [-0.06863512098789215, -0.36418038606643677, 0.11715049296617508, 0.6989348530769348], [-0.07591872662305832, -0.5607149600982666, 0.131129190325737, 1.026079535484314], [-0.087133027613163, -0.7573157548904419, 0.1516507863998413, 1.3568905591964722], [-0.10227934271097183, -0.9539796113967896, 0.17878858745098114, 1.692915439605713], [-0.12135893106460571, -1.1506589651107788, 0.21264690160751343, 2.0355160236358643], [-0.04608498141169548, -0.19641034305095673, 0.002575164893642068, 0.2763350009918213], [-0.050013188272714615, -0.0013252266217023134, 0.008101864717900753, -0.015534601174294949], [-0.05003969371318817, -0.19656242430210114, 0.007791173178702593, 0.27969351410865784], [-0.05397094413638115, -0.0015524782938882709, 0.013385043479502201, -0.010521952994167805], [-0.05400199070572853, -0.1968638002872467, 0.013174604624509811, 0.2863538861274719], [-0.05793926864862442, -0.0019321977160871029, 0.018901681527495384, -0.0021449350751936436], [-0.057977911084890366, 0.19291365146636963, 0.018858782947063446, -0.2888047397136688], [-0.05411963909864426, 0.387761652469635, 0.013082688674330711, -0.5754806399345398], [-0.04636440798640251, 0.5826978087425232, 0.001573075889609754, -0.8640136122703552], [-0.03471045196056366, 0.38755446672439575, -0.015707196667790413, -0.5708364844322205], [-0.026959361508488655, 0.5828931331634521, -0.02712392620742321, -0.8684260845184326], [-0.015301498584449291, 0.7783734202384949, -0.0444924458861351, -1.1695120334625244], [0.000265969691099599, 0.974044919013977, -0.06788268685340881, -1.475805401802063], [0.019746867939829826, 1.1699273586273193, -0.0973987951874733, -1.7888944149017334], [0.04314541444182396, 0.9760239720344543, -0.13317668437957764, -1.528007984161377], [0.0626658946275711, 1.1724774837493896, -0.16373685002326965, -1.8591171503067017], [0.08611544221639633, 1.368974208831787, -0.20091918110847473, -2.1978437900543213], [0.11349493265151978, 1.1762778759002686, -0.24487605690956116, -1.9732874631881714], [0.018700994551181793, 0.16122350096702576, -0.015748370438814163, -0.3413577377796173], [0.021925466135144234, -0.03367089480161667, -0.02257552556693554, -0.053682249039411545], [0.021252047270536423, 0.1617673635482788, -0.023649170994758606, -0.3534015715122223], [0.024487394839525223, 0.3572174608707428, -0.03071720153093338, -0.6534469723701477], [0.031631745398044586, 0.1625364124774933, -0.04378614202141762, -0.37059256434440613], [0.03488247096538544, 0.35825222730636597, -0.051197994500398636, -0.6767539381980896], [0.042047515511512756, 0.5540467500686646, -0.06473307311534882, -0.9851065278053284], [0.053128451108932495, 0.3598487973213196, -0.08443520218133926, -0.7134379148483276], [0.06032542884349823, 0.16599103808403015, -0.09870395809412003, -0.4484816789627075], [0.06364525109529495, -0.027606314048171043, -0.10767359286546707, -0.1884709745645523], [0.06309312582015991, -0.22103624045848846, -0.11144301295280457, 0.06839873641729355], [0.05867239832878113, -0.02450760081410408, -0.11007504165172577, -0.2572619915008545], [0.0581822469830513, -0.21789996325969696, -0.11522027850151062, -0.001225856482051313], [0.05382424592971802, -0.021330274641513824, -0.1152447983622551, -0.3279252052307129], [0.05339764058589935, 0.17522762715816498, -0.12180329859256744, -0.6546133160591125], [0.056902192533016205, 0.3718160390853882, -0.13489556312561035, -0.9830328822135925], [0.06433851271867752, 0.5684621930122375, -0.15455622971057892, -1.314861536026001], [0.07570775598287582, 0.7651647925376892, -0.1808534562587738, -1.651657223701477], [0.09101105481386185, 0.9618799090385437, -0.21388660371303558, -1.9947988986968994], [-0.04794218763709068, -0.21651622653007507, 0.02196269854903221, 0.26673460006713867], [-0.05227251350879669, -0.4119446277618408, 0.02729739062488079, 0.5662630200386047], [-0.060511406511068344, -0.6074386835098267, 0.0386226512491703, 0.8674193024635315], [-0.0726601779460907, -0.8030642867088318, 0.05597103759646416, 1.1719911098480225], [-0.08872146904468536, -0.9988674521446228, 0.0794108584523201, 1.4816828966140747], [-0.10869881510734558, -0.8047990798950195, 0.10904451459646225, 1.2148199081420898], [-0.12479479610919952, -0.6112396717071533, 0.13334091007709503, 0.9582008123397827], [-0.1370195895433426, -0.8078779578208923, 0.15250493586063385, 1.289626121520996], [-0.1531771421432495, -1.0045746564865112, 0.17829746007919312, 1.625909686088562], [-0.1732686460018158, -1.2012896537780762, 0.2108156383037567, 1.9684464931488037], [-0.03356698900461197, -0.22143305838108063, 0.020002590492367744, 0.32682961225509644], [-0.03799565136432648, -0.02660151571035385, 0.026539182290434837, 0.04052112624049187], [-0.038527682423591614, -0.22209379076957703, 0.027349604293704033, 0.34145787358283997], [-0.042969558387994766, -0.41759395599365234, 0.03417876362800598, 0.6426382660865784], [-0.05132143571972847, -0.6131752133369446, 0.047031525522470474, 0.945885419845581], [-0.06358493864536285, -0.8088979721069336, 0.06594923883676529, 1.252967119216919], [-0.07976289838552475, -1.0047998428344727, 0.09100857377052307, 1.5655560493469238], [-0.09985889494419098, -1.2008839845657349, 0.12231969833374023, 1.885184645652771], [-0.12387657910585403, -1.3971059322357178, 0.16002339124679565, 2.213190793991089], [-0.15181869268417358, -1.593357801437378, 0.20428720116615295, 2.5506539344787598], [-0.18368585407733917, -1.4003782272338867, 0.25530028343200684, 2.3268473148345947], [0.010202767327427864, 0.24169619381427765, 0.046121060848236084, -0.24108925461769104], [0.015036690980196, 0.04594679921865463, 0.04129927605390549, 0.06577739119529724], [0.015955626964569092, -0.14974218606948853, 0.04261482134461403, 0.3711991012096405], [0.012960783205926418, -0.34544283151626587, 0.05003880336880684, 0.6770085692405701], [0.006051926873624325, -0.15105053782463074, 0.06357897818088531, 0.40049034357070923], [0.003030915977433324, 0.043114639818668365, 0.07158878445625305, 0.12851065397262573], [0.0038932086899876595, 0.2371419221162796, 0.07415899634361267, -0.14075566828250885], [0.008636047132313251, 0.43112772703170776, 0.07134388387203217, -0.4091518521308899], [0.017258601263165474, 0.6251694560050964, 0.06316084414720535, -0.6785167455673218], [0.029761990532279015, 0.42922958731651306, 0.04959050938487053, -0.3666359782218933], [0.038346581161022186, 0.23343929648399353, 0.04225778952240944, -0.05873797833919525], [0.04301536828279495, 0.42793068289756775, 0.04108303040266037, -0.3377945125102997], [0.0515739805996418, 0.232248917222023, 0.03432714194059372, -0.032444536685943604], [0.056218959391117096, 0.4268622100353241, 0.03367825224995613, -0.31410232186317444], [0.06475620716810226, 0.621488630771637, 0.027396203950047493, -0.5959768295288086], [0.0771859809756279, 0.8162167072296143, 0.015476667322218418, -0.8799058198928833], [0.09351031482219696, 0.6208879351615906, -0.0021214494481682777, -0.5823978185653687], [0.10592807084321976, 0.816039502620697, -0.013769405893981457, -0.8757482767105103], [0.12224885821342468, 1.0113458633422852, -0.03128437325358391, -1.172728180885315], [0.14247578382492065, 0.8166443109512329, -0.054738935083150864, -0.8900147676467896], [0.1588086634874344, 0.6223061084747314, -0.07253923267126083, -0.6150293350219727], [0.17125478386878967, 0.4282686710357666, -0.08483981341123581, -0.3460463881492615], [0.17982016503810883, 0.23444955050945282, -0.09176074713468552, -0.08127638697624207], [0.18450915813446045, 0.040754612535238266, -0.09338627010583878, 0.1811038702726364], [0.18532423675060272, 0.2370801866054535, -0.08976419270038605, -0.13951699435710907], [0.19006584584712982, 0.04335089027881622, -0.09255453199148178, 0.12355174869298935], [0.19093286991119385, 0.2396685630083084, -0.09008350223302841, -0.19683656096458435], [0.19572623074054718, 0.04594288393855095, -0.09402023255825043, 0.06612493842840195], [0.1966450959444046, 0.24227827787399292, -0.09269773215055466, -0.2546786665916443], [0.20149065554141998, 0.4385930895805359, -0.09779130667448044, -0.5751007795333862], [0.21026252210140228, 0.6349401473999023, -0.10929331928491592, -0.8969190120697021], [0.22296132147312164, 0.8313604593276978, -0.12723170220851898, -1.2218598127365112], [0.23958852887153625, 0.6380864381790161, -0.15166890621185303, -0.9715974926948547], [0.2523502707481384, 0.8348824977874756, -0.17110085487365723, -1.3078227043151855], [0.26904791593551636, 1.03170907497406, -0.19725731015205383, -1.6488099098205566], [0.2896820902824402, 0.8393639922142029, -0.23023350536823273, -1.4235056638717651], [-0.038376521319150925, -0.221075177192688, -0.013876471668481827, 0.25784730911254883], [-0.04279802367091179, -0.025757893919944763, -0.00871952623128891, -0.0391799621284008], [-0.04331318289041519, -0.2207537293434143, -0.009503125213086605, 0.2507391571998596], [-0.04772825539112091, -0.41573870182037354, -0.004488341975957155, 0.540409505367279], [-0.05604303255677223, -0.6107972860336304, 0.006319848820567131, 0.8316748738288879], [-0.06825897842645645, -0.8060050010681152, 0.022953346371650696, 1.1263387203216553], [-0.08437907695770264, -1.0014201402664185, 0.04548012092709541, 1.4261317253112793], [-0.10440748184919357, -1.1970735788345337, 0.07400275766849518, 1.7326750755310059], [-0.1283489465713501, -1.0028702020645142, 0.10865625739097595, 1.4639042615890503], [-0.14840635657310486, -1.199142575263977, 0.1379343420267105, 1.7884587049484253], [-0.1723892092704773, -1.3955169916152954, 0.17370352149009705, 2.1206469535827637], [-0.20029954612255096, -1.2024999856948853, 0.21611645817756653, 1.8862906694412231], [0.002716646995395422, -0.23504479229450226, 0.01946922391653061, 0.29309606552124023], [-0.0019842488691210747, -0.4304388463497162, 0.025331145152449608, 0.5918551683425903], [-0.01059302594512701, -0.6259061098098755, 0.03716824948787689, 0.892408549785614], [-0.023111147806048393, -0.82151198387146, 0.0550164170563221, 1.1965396404266357], [-0.03954138606786728, -1.0173012018203735, 0.07894720882177353, 1.5059458017349243], [-0.05988741293549538, -0.8232206106185913, 0.10906612873077393, 1.2389180660247803], [-0.0763518214225769, -1.0195611715316772, 0.1338444948196411, 1.56368088722229], [-0.09674304723739624, -0.8262693881988525, 0.16511811316013336, 1.315569281578064], [-0.11326843500137329, -1.02305006980896, 0.1914294958114624, 1.6550500392913818], [-0.13372944295406342, -1.2198210954666138, 0.22453048825263977, 2.0007522106170654], [-0.02156839892268181, 0.22884945571422577, 0.04894905909895897, -0.24543102085590363], [-0.01699141040444374, 0.033063795417547226, 0.044040437787771225, 0.062280986458063126], [-0.016330134123563766, -0.16266101598739624, 0.04528605937957764, 0.36852723360061646], [-0.019583353772759438, -0.3583962023258209, 0.05265660211443901, 0.675138533115387], [-0.026751277968287468, -0.16404402256011963, 0.06615937501192093, 0.399488240480423], [-0.03003215789794922, -0.3600390553474426, 0.07414913922548294, 0.7122742533683777], [-0.03723293915390968, -0.16601786017417908, 0.08839462697505951, 0.44382205605506897], [-0.040553297847509384, -0.3622720539569855, 0.09727106243371964, 0.763008177280426], [-0.04779873788356781, -0.16861480474472046, 0.11253122985363007, 0.5024480819702148], [-0.05117103457450867, -0.3651280701160431, 0.12258019298315048, 0.8283679485321045], [-0.05847359448671341, -0.17187608778476715, 0.13914754986763, 0.5766134858131409], [-0.061911117285490036, 0.0210493765771389, 0.1506798267364502, 0.3307998776435852], [-0.06149012967944145, 0.2137412428855896, 0.157295823097229, 0.08916951715946198], [-0.05721530318260193, 0.4062998294830322, 0.15907920897006989, -0.15004803240299225], [-0.04908930882811546, 0.2092999517917633, 0.1560782492160797, 0.1882929801940918], [-0.044903308153152466, 0.4018845558166504, 0.15984411537647247, -0.05137157067656517], [-0.03686561807990074, 0.2048746645450592, 0.15881668031215668, 0.28717041015625], [-0.0327681228518486, 0.00788638461381197, 0.16456007957458496, 0.6254302859306335], [-0.032610394060611725, -0.1891038864850998, 0.17706869542598724, 0.9650864005088806], [-0.03639247268438339, 0.003254740033298731, 0.1963704228401184, 0.7328465580940247], [-0.03632737696170807, -0.193960040807724, 0.2110273540019989, 1.0803459882736206], [-0.033804260194301605, -0.1500617414712906, 0.015976712107658386, 0.3004060983657837], [-0.036805495619773865, 0.04482889175415039, 0.021984834223985672, 0.01280442625284195], [-0.03590891882777214, 0.23962876200675964, 0.02224092371761799, -0.2728617489337921], [-0.031116342172026634, 0.04419663920998573, 0.016783688217401505, 0.026752227917313576], [-0.03023240901529789, 0.23907393217086792, 0.017318733036518097, -0.2605883479118347], [-0.02545093186199665, 0.04370908439159393, 0.01210696529597044, 0.037506408989429474], [-0.02457674965262413, -0.15158437192440033, 0.01285709347575903, 0.33398449420928955], [-0.027608437463641167, -0.34688693284988403, 0.019536782056093216, 0.6306939721107483], [-0.034546174108982086, -0.5422759652137756, 0.03215066343545914, 0.9294650554656982], [-0.04539169371128082, -0.7378168106079102, 0.05073996260762215, 1.2320754528045654], [-0.060148030519485474, -0.9335532188415527, 0.07538147270679474, 1.5402133464813232], [-0.07881909608840942, -0.7394145131111145, 0.10618574172258377, 1.2719734907150269], [-0.09360738843679428, -0.9357193112373352, 0.1316252052783966, 1.5959320068359375], [-0.11232177168130875, -0.7423808574676514, 0.16354385018348694, 1.3470191955566406], [-0.1271693855524063, -0.939136803150177, 0.19048422574996948, 1.6860828399658203], [-0.14595212042331696, -1.1358838081359863, 0.224205881357193, 2.031529664993286], [0.03604086861014366, -0.17487813532352448, -0.041498709470033646, 0.2637050747871399], [0.032543305307626724, -0.36938393115997314, -0.0362246073782444, 0.5430154800415039], [0.025155628100037575, -0.5639785528182983, -0.02536430023610592, 0.8240682482719421], [0.013876056298613548, -0.7587445378303528, -0.008882935158908367, 1.1086668968200684], [-0.0012988351518288255, -0.9537486433982849, 0.01329040341079235, 1.3985499143600464], [-0.020373808220028877, -1.1490333080291748, 0.04126140475273132, 1.6953582763671875], [-0.043354474008083344, -1.3446062803268433, 0.07516857236623764, 2.0005955696105957], [-0.07024659961462021, -1.1503452062606812, 0.11518047749996185, 1.7321056127548218], [-0.09325350821018219, -0.9567113518714905, 0.14982259273529053, 1.4773674011230469], [-0.11238773167133331, -0.7637028694152832, 0.1793699413537979, 1.2349811792373657], [-0.127661794424057, -0.5712811946868896, 0.2040695697069168, 1.0034319162368774], [-0.13908740878105164, -0.3793829083442688, 0.22413820028305054, 0.7811382412910461], [-0.03678398206830025, 0.15848121047019958, -0.04263940826058388, -0.28000885248184204], [-0.03361435607075691, 0.35418465733528137, -0.048239585012197495, -0.5858293771743774], [-0.026530664414167404, 0.5499479174613953, -0.05995617434382439, -0.8933095932006836], [-0.015531706623733044, 0.7458295226097107, -0.07782236486673355, -1.2042206525802612], [-0.0006151155102998018, 0.941866397857666, -0.10190677642822266, -1.5202425718307495], [0.01822221279144287, 1.138061761856079, -0.1323116272687912, -1.8429176807403564], [0.040983449667692184, 1.3343720436096191, -0.16916997730731964, -2.173595666885376], [0.06767088919878006, 1.1412547826766968, -0.2126418948173523, -1.937553882598877], [0.022718386724591255, -0.16974836587905884, 0.024018889293074608, 0.3009587526321411], [0.01932341977953911, -0.3652042746543884, 0.03003806434571743, 0.6011189222335815], [0.012019334360957146, -0.5607332587242126, 0.04206044226884842, 0.9031099677085876], [0.0008046688162721694, -0.36620551347732544, 0.060122642666101456, 0.6239385604858398], [-0.006519441492855549, -0.17197223007678986, 0.07260141521692276, 0.3507804274559021], [-0.009958886541426182, 0.022046171128749847, 0.07961702346801758, 0.08184555917978287], [-0.009517963044345379, -0.17412146925926208, 0.08125393092632294, 0.39854758977890015], [-0.013000392355024815, -0.370296448469162, 0.08922488242387772, 0.7157015800476074], [-0.020406322553753853, -0.5665327310562134, 0.10353891551494598, 1.0350823402404785], [-0.03173697739839554, -0.7628675103187561, 0.12424056231975555, 1.3583934307098389], [-0.046994324773550034, -0.5695032477378845, 0.15140843391418457, 1.107015609741211], [-0.05838438868522644, -0.7662557363510132, 0.17354874312877655, 1.4431121349334717], [-0.07370950281620026, -0.9630367755889893, 0.2024109810590744, 1.7846171855926514], [-0.09297023713588715, -0.7706831693649292, 0.23810333013534546, 1.5610805749893188]], "action_prob": [0.5000608563423157, 0.5006152987480164, 0.500034749507904, 0.4993596076965332, 0.5011224150657654, 0.5006982088088989, 0.5000666379928589, 0.49943485856056213, 0.5010063648223877, 0.4994203448295593, 0.4989668130874634, 0.5012794137001038, 0.501090943813324, 0.500669002532959, 0.5000292658805847, 0.499386191368103, 0.498940110206604, 0.4986981749534607, 0.49857714772224426, 0.501491904258728, 0.5015208721160889, 0.501501202583313, 0.4986251890659332, 0.4984268248081207, 0.49833980202674866, 0.4982913136482239, 0.49997714161872864, 0.5006805062294006, 0.4999612271785736, 0.5006972551345825, 0.4999407231807709, 0.50071781873703, 0.5000848770141602, 0.4994383752346039, 0.49898436665534973, 0.5012637972831726, 0.49892088770866394, 0.4986760914325714, 0.4985574781894684, 0.4984913170337677, 0.5015592575073242, 0.4983862340450287, 0.49834486842155457, 0.5016953945159912, 0.4999557435512543, 0.5006999373435974, 0.49992528557777405, 0.499270498752594, 0.501170814037323, 0.4992066025733948, 0.49877452850341797, 0.5014443397521973, 0.5013121366500854, 0.5009911060333252, 0.5004525780677795, 0.5001809000968933, 0.5005382299423218, 0.5000917911529541, 0.49937310814857483, 0.498818576335907, 0.4985113739967346, 0.4983616769313812, 0.4982808232307434, 0.4999234080314636, 0.49926263093948364, 0.4988122582435608, 0.49858328700065613, 0.4984802305698395, 0.5015733242034912, 0.5016141533851624, 0.4983852207660675, 0.49831125140190125, 0.4982750415802002, 0.499855101108551, 0.5007871389389038, 0.49982014298439026, 0.4991806447505951, 0.4987682104110718, 0.49856358766555786, 0.49846935272216797, 0.4984166920185089, 0.4983743727207184, 0.4983326494693756, 0.5017091035842896, 0.5000511407852173, 0.5005860328674316, 0.4999227523803711, 0.49926406145095825, 0.5011752247810364, 0.5008124113082886, 0.5002304911613464, 0.4995861351490021, 0.499090313911438, 0.5011990070343018, 0.5009352564811707, 0.4995953142642975, 0.5009397268295288, 0.49960190057754517, 0.49905475974082947, 0.49873101711273193, 0.5014244914054871, 0.49866676330566406, 0.49851492047309875, 0.5015504956245422, 0.5015665292739868, 0.5014997720718384, 0.5012648105621338, 0.5007980465888977, 0.49982741475105286, 0.5008665919303894, 0.4997484087944031, 0.500935435295105, 0.49966445565223694, 0.4989943504333496, 0.4985586404800415, 0.49836286902427673, 0.5017066597938538, 0.49827659130096436, 0.4982224702835083, 0.5017983913421631, 0.4999914765357971, 0.5006585121154785, 0.49998998641967773, 0.49933692812919617, 0.498880535364151, 0.49864035844802856, 0.49852871894836426, 0.49847057461738586, 0.5015723705291748, 0.49836966395378113, 0.498336523771286, 0.5016968846321106, 0.4999043941497803, 0.4992574155330658, 0.49882909655570984, 0.4986118674278259, 0.4985103905200958, 0.5015462636947632, 0.4984143376350403, 0.5016320943832397, 0.49831876158714294, 0.49828165769577026, 0.5000969767570496, 0.5005408525466919, 0.499874472618103, 0.49921783804893494, 0.5012150406837463, 0.49914002418518066, 0.5012767314910889, 0.4990496337413788, 0.5013444423675537, 0.4989478886127472, 0.5014174580574036, 0.5011631846427917, 0.5007032752037048, 0.5001010894775391, 0.5004695653915405, 0.5002113580703735, 0.5003808736801147, 0.4996751546859741, 0.49901774525642395, 0.5014039278030396, 0.4988881051540375, 0.5000126957893372, 0.5006555914878845, 0.5000146627426147, 0.5006222724914551, 0.5000184774398804, 0.5006235241889954, 0.4999808967113495, 0.49932152032852173, 0.4988655149936676, 0.4986245036125183, 0.49850863218307495, 0.5015551447868347, 0.4984096884727478, 0.5016450881958008, 0.498309850692749, 0.4982631802558899, 0.5001639723777771, 0.49951502680778503, 0.4990406930446625, 0.49877336621284485, 0.49863776564598083, 0.498562216758728, 0.4985067844390869, 0.5015445947647095, 0.5016043782234192, 0.5016613006591797, 0.5017051696777344, 0.5017110109329224, 0.5000380873680115, 0.4993598759174347, 0.4988841414451599, 0.49863380193710327, 0.4985145628452301, 0.49844890832901, 0.4983990490436554, 0.5016478300094604, 0.5000118017196655, 0.4993464946746826, 0.4988860487937927, 0.5013565421104431, 0.5011929273605347, 0.500821590423584, 0.4997659921646118, 0.49911344051361084, 0.4987034201622009, 0.4985034763813019, 0.5015905499458313, 0.49840638041496277, 0.4983244240283966, 0.5017257928848267], "advantages": [22.995222091674805, 22.220266342163086, 21.431838989257812, 20.64109230041504, 19.84178352355957, 19.029897689819336, 18.209327697753906, 17.380531311035156, 16.54392433166504, 15.703266143798828, 14.849627494812012, 13.988059997558594, 13.120848655700684, 12.245572090148926, 11.361936569213867, 10.469265937805176, 9.5669584274292, 8.654827117919922, 7.7329277992248535, 6.801340579986572, 5.85953426361084, 4.907903671264648, 3.9462273120880127, 2.9773120880126953, 1.9979807138442993, 1.0083611011505127, 16.54841423034668, 15.708266258239746, 14.854037284851074, 13.996788024902344, 13.125288009643555, 12.250585556030273, 11.361469268798828, 10.463432312011719, 9.55692195892334, 8.641968727111816, 7.720638275146484, 6.787089824676514, 5.844709873199463, 4.893215179443359, 3.9323623180389404, 2.962120532989502, 1.981783151626587, 0.991695761680603, 17.38275718688965, 16.545469284057617, 15.705193519592285, 14.850954055786133, 13.988761901855469, 13.121973991394043, 12.24232292175293, 11.354568481445312, 10.460332870483398, 9.55764389038086, 8.646395683288574, 7.726169586181641, 6.790973663330078, 5.8519816398620605, 4.897893905639648, 3.9348373413085938, 2.9629714488983154, 1.982005000114441, 0.9915837049484253, 9.561509132385254, 8.650840759277344, 7.730387210845947, 6.799881458282471, 5.8593645095825195, 4.908926010131836, 3.948002815246582, 2.9770829677581787, 1.9978786706924438, 1.008346438407898, 10.466465950012207, 9.564865112304688, 8.648694038391113, 7.728734016418457, 6.79880428314209, 5.858728408813477, 4.908579349517822, 3.9484474658966064, 2.978376865386963, 1.9983649253845215, 1.008374571800232, 30.359098434448242, 29.652992248535156, 28.945358276367188, 28.230422973632812, 27.50754165649414, 26.773405075073242, 26.03127670288086, 25.281484603881836, 24.52448081970215, 23.760433197021484, 22.99237823486328, 22.21725082397461, 21.429092407226562, 20.63819122314453, 19.834028244018555, 19.022335052490234, 18.203062057495117, 17.378293991088867, 16.542341232299805, 15.698469161987305, 14.847797393798828, 13.98900032043457, 13.122082710266113, 12.24691104888916, 11.363078117370605, 10.46467399597168, 9.562853813171387, 8.646269798278809, 7.72607421875, 6.790954113006592, 5.846964359283447, 4.894257068634033, 3.932609796524048, 2.9629464149475098, 1.9818856716156006, 0.9913784861564636, 11.361175537109375, 10.468588829040527, 9.561382293701172, 8.650634765625, 7.7301530838012695, 6.79966402053833, 5.859184265136719, 4.908787727355957, 3.9485180377960205, 2.978093147277832, 1.998308777809143, 1.008446216583252, 9.561837196350098, 8.651116371154785, 7.730556011199951, 6.799947261810303, 5.85935115814209, 4.908858299255371, 3.9479753971099854, 2.9781548976898193, 1.9978634119033813, 1.0082863569259644, 19.027565002441406, 18.20701026916504, 17.383766174316406, 16.55206871032715, 15.711249351501465, 14.857948303222656, 13.999977111816406, 13.129521369934082, 12.254016876220703, 11.366084098815918, 10.47265338897705, 9.566914558410645, 8.651481628417969, 7.726431369781494, 6.792069435119629, 5.853769779205322, 4.900453090667725, 3.943037748336792, 2.9754414558410645, 1.9971039295196533, 1.0060029029846191, 14.85419750213623, 13.996964454650879, 13.12549877166748, 12.245285987854004, 11.361715316772461, 10.463658332824707, 9.562088966369629, 8.651351928710938, 7.730776309967041, 6.800149917602539, 5.859533786773682, 4.909021854400635, 3.9481518268585205, 2.9783101081848145, 1.9980297088623047, 1.0084301233291626, 11.361287117004395, 10.468618392944336, 9.566401481628418, 8.654387474060059, 7.732593536376953, 6.801091194152832, 5.859920024871826, 4.909080505371094, 3.948512315750122, 2.9781277179718018, 1.9977740049362183, 1.0072861909866333, 7.72564697265625, 6.7906928062438965, 5.846938133239746, 4.8944525718688965, 3.9329757690429688, 2.9622020721435547, 1.9818757772445679, 0.9917917251586914, 13.12549114227295, 12.250791549682617, 11.366613388061523, 10.472732543945312, 9.567083358764648, 8.65165901184082, 7.726450443267822, 6.797236442565918, 5.857839107513428, 4.908137321472168, 3.9482569694519043, 2.9775540828704834, 1.9980956315994263, 1.0083919763565063], "value_targets": [22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [589830065, 589830065, 589830065, 589830065, 589830065, 589830065, 589830065, 589830065, 589830065, 589830065, 691935141, 691935141, 691935141, 691935141, 691935141, 691935141, 691935141, 691935141, 691935141, 691935141, 691935141, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 8696792, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 1908216693, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 853010846, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 236504457, 1092921004, 1092921004, 1092921004, 1092921004, 1092921004, 1092921004, 1092921004, 1092921004, 1092921004, 1092921004, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 364237636, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1771447307, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544, 1407963544], "obs": [[-0.005344755481928587, 0.0027487240731716156, 0.014686955139040947, 0.012807734310626984], [-0.005289780907332897, -0.19258074462413788, 0.014943109825253487, 0.3100881576538086], [-0.009141395799815655, -0.3879123628139496, 0.021144872531294823, 0.607446014881134], [-0.01689964346587658, -0.5833234786987305, 0.033293794840574265, 0.9067132472991943], [-0.028566112741827965, -0.7788800001144409, 0.05142805725336075, 1.2096720933914185], [-0.044143714010715485, -0.9746269583702087, 0.07562150061130524, 1.5180175304412842], [-0.06363625079393387, -0.7804966568946838, 0.10598184913396835, 1.2498657703399658], [-0.07924618571996689, -0.5868805646896362, 0.13097916543483734, 0.9921715259552002], [-0.0909838005900383, -0.7834887504577637, 0.15082259476184845, 1.32295560836792], [-0.10665357112884521, -0.9801596403121948, 0.1772817075252533, 1.6587868928909302], [-0.020260225981473923, -0.028288500383496284, 0.009921964257955551, -0.03404702991247177], [-0.02082599699497223, -0.22355131804943085, 0.009241024032235146, 0.261749804019928], [-0.025297023355960846, -0.41880396008491516, 0.014476019889116287, 0.5573330521583557], [-0.03367310017347336, -0.6141260862350464, 0.02562268078327179, 0.8545413613319397], [-0.04595562443137169, -0.8095877170562744, 0.042713508009910583, 1.1551698446273804], [-0.06214737892150879, -1.0052398443222046, 0.06581690162420273, 1.4609342813491821], [-0.08225217461585999, -0.8109835982322693, 0.09503559023141861, 1.1895170211791992], [-0.09847184270620346, -1.007200002670288, 0.11882592737674713, 1.5104118585586548], [-0.11861584335565567, -0.813701331615448, 0.14903417229652405, 1.2570632696151733], [-0.1348898708820343, -1.010382890701294, 0.174175426363945, 1.592469334602356], [-0.15509752929210663, -0.817703366279602, 0.20602482557296753, 1.3587719202041626], [0.03006465919315815, 0.031160185113549232, 0.014074956998229027, 0.02264290116727352], [0.030687863007187843, 0.22607748210430145, 0.014527814462780952, -0.2655662000179291], [0.03520941361784935, 0.03075123205780983, 0.009216491132974625, 0.03166329860687256], [0.03582443669438362, 0.22573980689048767, 0.009849756956100464, -0.2580975294113159], [0.04033923149108887, 0.03047863580286503, 0.004687806125730276, 0.037675801664590836], [0.04094880446791649, -0.16471022367477417, 0.005441321991384029, 0.331834077835083], [0.03765460103750229, 0.030333854258060455, 0.012078003957867622, 0.040872037410736084], [0.038261279463768005, -0.16495919227600098, 0.01289544440805912, 0.3373410999774933], [0.03496209532022476, -0.3602622449398041, 0.019642265513539314, 0.6340624690055847], [0.02775684930384159, -0.16541972756385803, 0.03232351690530777, 0.34762951731681824], [0.0244484543800354, -0.3609861731529236, 0.039276108145713806, 0.6503273844718933], [0.017228731885552406, -0.16643266379833221, 0.052282653748989105, 0.3702664077281952], [0.01390007883310318, 0.02790900319814682, 0.059687983244657516, 0.09451635181903839], [0.014458258636295795, 0.22212691605091095, 0.061578311026096344, -0.17875388264656067], [0.0189007967710495, 0.026180295273661613, 0.05800323188304901, 0.1327015608549118], [0.019424403086304665, 0.22042548656463623, 0.06065726280212402, -0.14113284647464752], [0.023832913488149643, 0.41462862491607666, 0.05783460661768913, -0.4140795171260834], [0.03212548419833183, 0.6088851690292358, 0.04955301433801651, -0.6879832744598389], [0.04430318996310234, 0.8032855987548828, 0.035793352872133255, -0.9646633267402649], [0.06036889925599098, 0.6077015399932861, 0.016500083729624748, -0.6609541773796082], [0.07252293080091476, 0.4123539328575134, 0.003281000768765807, -0.3631218373775482], [0.08077000826597214, 0.6074290871620178, -0.003981436137109995, -0.6547684073448181], [0.09291858971118927, 0.8026062846183777, -0.017076803371310234, -0.948702335357666], [0.10897071659564972, 0.9979538917541504, -0.03605085238814354, -1.2467014789581299], [0.12892979383468628, 0.803312361240387, -0.06098487973213196, -0.9655255079269409], [0.1449960470199585, 0.6090602278709412, -0.0802953913807869, -0.6926074028015137], [0.15717725455760956, 0.4151386618614197, -0.09414754062891006, -0.42624372243881226], [0.16548001766204834, 0.221467524766922, -0.10267241299152374, -0.16466207802295685], [0.16990937292575836, 0.027953753247857094, -0.10596565157175064, 0.09394728392362595], [0.17046844959259033, 0.22442232072353363, -0.10408671200275421, -0.2301981896162033], [0.17495688796043396, 0.030929837375879288, -0.10869067162275314, 0.027923472225666046], [0.17557549476623535, 0.22742904722690582, -0.10813220590353012, -0.2969782054424286], [0.18012407422065735, 0.03400137275457382, -0.11407176405191422, -0.04026024043560028], [0.18080410361289978, 0.2305586040019989, -0.11487697064876556, -0.36664432287216187], [0.18541526794433594, 0.42710962891578674, -0.12220986187458038, -0.693227231502533], [0.19395746290683746, 0.23387590050697327, -0.13607440888881683, -0.44137877225875854], [0.19863498210906982, 0.43063464760780334, -0.14490197598934174, -0.7736712098121643], [0.20724767446517944, 0.23777173459529877, -0.16037540137767792, -0.5298608541488647], [0.21200311183929443, 0.434743195772171, -0.17097261548042297, -0.868475079536438], [0.22069796919822693, 0.24230815470218658, -0.1883421242237091, -0.634052574634552], [0.22554413974285126, 0.05024309083819389, -0.2010231763124466, -0.4060955047607422], [0.22654899954795837, 0.2475632131099701, -0.20914508402347565, -0.7548190355300903], [0.015349479392170906, 0.003206053748726845, -0.03599541634321213, -0.0037300419062376022], [0.015413600020110607, -0.19138167798519135, -0.036070019006729126, 0.27738210558891296], [0.011585966683924198, 0.004235801286995411, -0.03052237629890442, -0.026455527171492577], [0.011670682579278946, 0.1997818648815155, -0.03105148673057556, -0.3286101818084717], [0.01566632091999054, 0.005115414969623089, -0.03762368857860565, -0.04587894305586815], [0.0157686285674572, -0.18944740295410156, -0.038541268557310104, 0.23469999432563782], [0.011979680508375168, 0.006203415337949991, -0.03384726867079735, -0.06988661736249924], [0.012103748507797718, 0.2017938643693924, -0.03524500131607056, -0.3730534613132477], [0.016139626502990723, 0.39739829301834106, -0.042706072330474854, -0.6766377687454224], [0.02408759295940399, 0.593086838722229, -0.05623882636427879, -0.9824546575546265], [0.03594932705163956, 0.39876168966293335, -0.07588791847229004, -0.7079533338546753], [0.04392456263303757, 0.5948482751846313, -0.09004698693752289, -1.0235263109207153], [0.05582152679562569, 0.791046679019928, -0.11051751673221588, -1.3430695533752441], [0.07164245843887329, 0.9873718619346619, -0.13737890124320984, -1.668186902999878], [0.09138990193605423, 1.1837979555130005, -0.17074264585971832, -2.000312566757202], [-0.0003364181611686945, 0.015084303915500641, -0.001488917856477201, 0.03409072756767273], [-3.473207834758796e-05, 0.2102275788784027, -0.0008071033516898751, -0.2590616047382355], [0.004169819410890341, 0.015117155387997627, -0.005988335236907005, 0.033366650342941284], [0.004472162574529648, -0.17991840839385986, -0.005321002099663019, 0.32415419816970825], [0.0008737943135201931, -0.3749642074108124, 0.0011620816076174378, 0.6151543855667114], [-0.006625489331781864, -0.1798585057258606, 0.01346516888588667, 0.3228376507759094], [-0.010222659446299076, 0.015069148503243923, 0.0199219211935997, 0.034431342035532], [-0.009921276941895485, -0.1803327351808548, 0.020610548555850983, 0.3333326578140259], [-0.013527931645512581, -0.3757418990135193, 0.027277201414108276, 0.6324431896209717], [-0.02104276977479458, -0.5712335705757141, 0.03992606699466705, 0.9335901141166687], [-0.03246743977069855, -0.37667232751846313, 0.0585978701710701, 0.6537160277366638], [-0.04000088572502136, -0.18241317570209503, 0.07167218625545502, 0.3800453245639801], [-0.04364915192127228, 0.011621693149209023, 0.07927309721708298, 0.11079384386539459], [-0.043416716158390045, 0.20552349090576172, 0.08148897439241409, -0.15586353838443756], [-0.03930624574422836, 0.009335072711110115, 0.07837170362472534, 0.1613737940788269], [-0.03911954537034035, -0.1868162900209427, 0.0815991759300232, 0.477715402841568], [-0.042855869978666306, 0.007064502220600843, 0.09115348756313324, 0.211825430393219], [-0.04271458089351654, -0.18923449516296387, 0.09538999199867249, 0.5318135023117065], [-0.04649927094578743, 0.004425440914928913, 0.10602626204490662, 0.2706463932991028], [-0.04641076177358627, -0.19203715026378632, 0.11143919080495834, 0.594798743724823], [-0.05025150626897812, -0.38852789998054504, 0.12333516776561737, 0.9204020500183105], [-0.058022063225507736, -0.5850814580917358, 0.14174321293830872, 1.2491614818572998], [-0.0697236955165863, -0.39203202724456787, 0.16672644019126892, 1.0040245056152344], [-0.07756433635950089, -0.19948191940784454, 0.18680693209171295, 0.7679951786994934], [-0.08155397325754166, -0.007355192676186562, 0.2021668255329132, 0.5394212603569031], [-0.04135406017303467, 0.025279272347688675, -0.03320702910423279, -0.03924328833818436], [-0.04084847494959831, 0.2208612859249115, -0.033991895616054535, -0.3422156572341919], [-0.03643124923110008, 0.02623901702463627, -0.04083620756864548, -0.06044257804751396], [-0.03590647131204605, -0.16827435791492462, -0.04204506054520607, 0.21908172965049744], [-0.03927195817232132, -0.36277085542678833, -0.037663426250219345, 0.4982110559940338], [-0.046527374535799026, -0.16713868081569672, -0.02769920416176319, 0.193900465965271], [-0.04987014830112457, 0.028368324041366577, -0.02382119558751583, -0.10739007592201233], [-0.049302779138088226, -0.16640430688858032, -0.025968996807932854, 0.17768320441246033], [-0.052630867809057236, -0.3611451983451843, -0.02241533249616623, 0.4620620012283325], [-0.05985376983880997, -0.16571372747421265, -0.013174092397093773, 0.16239890456199646], [-0.06316804885864258, 0.02959432080388069, -0.009926114231348038, -0.1344108134508133], [-0.06257615983486176, -0.16538405418395996, -0.012614330276846886, 0.15512411296367645], [-0.06588383764028549, 0.02991621568799019, -0.009511847980320454, -0.14151149988174438], [-0.06528551876544952, 0.22517310082912445, -0.012342077679932117, -0.4371800124645233], [-0.0607820525765419, 0.03022800013422966, -0.021085677668452263, -0.14841312170028687], [-0.06017749384045601, 0.22564545273780823, -0.024053940549492836, -0.44767287373542786], [-0.055664584040641785, 0.4210992753505707, -0.03300739824771881, -0.7478399276733398], [-0.047242600470781326, 0.22644785046577454, -0.047964196652173996, -0.46572428941726685], [-0.04271364212036133, 0.03203527256846428, -0.05727868154644966, -0.1885368674993515], [-0.04207293689250946, -0.16222241520881653, -0.06104942038655281, 0.08554107695817947], [-0.0453173853456974, -0.35641855001449585, -0.05933859944343567, 0.35835522413253784], [-0.052445754408836365, -0.5506489276885986, -0.0521714948117733, 0.6317527294158936], [-0.06345873326063156, -0.7450056672096252, -0.03953643888235092, 0.9075596928596497], [-0.07835885137319565, -0.9395707249641418, -0.02138524502515793, 1.1875585317611694], [-0.09715025871992111, -1.134408950805664, 0.0023659253492951393, 1.4734622240066528], [-0.11983843892812729, -0.9393160343170166, 0.031835172325372696, 1.1815192699432373], [-0.13862475752830505, -1.1348363161087036, 0.05546555668115616, 1.4840091466903687], [-0.1613214910030365, -0.9404328465461731, 0.0851457417011261, 1.209150791168213], [-0.18013015389442444, -1.136544942855835, 0.1093287542462349, 1.527255892753601], [-0.20286104083061218, -1.3328031301498413, 0.13987387716770172, 1.8519641160964966], [-0.2295171022415161, -1.5291591882705688, 0.17691315710544586, 2.1846108436584473], [-0.01027501281350851, 0.01324821263551712, 0.0358923077583313, 0.017890654504299164], [-0.010010048747062683, -0.18236960470676422, 0.036250121891498566, 0.3216784596443176], [-0.01365744136273861, -0.3779885172843933, 0.042683690786361694, 0.6255692839622498], [-0.021217212080955505, -0.573679506778717, 0.05519507825374603, 0.9313836097717285], [-0.03269080072641373, -0.37934410572052, 0.0738227516412735, 0.6565435528755188], [-0.04027768224477768, -0.5754119157791138, 0.08695361763238907, 0.9715283513069153], [-0.051785919815301895, -0.7715863585472107, 0.10638418793678284, 1.290210485458374], [-0.06721764802932739, -0.9678881764411926, 0.13218839466571808, 1.6142164468765259], [-0.08657541126012802, -0.7745506763458252, 0.16447272896766663, 1.3654905557632446], [-0.10206642746925354, -0.5818253755569458, 0.19178253412246704, 1.1284412145614624], [0.04747304692864418, 0.020594706758856773, -0.022415902465581894, 0.004318537190556526], [0.04788494110107422, -0.174198716878891, -0.022329531610012054, 0.2898455262184143], [0.04440096765756607, 0.021234409883618355, -0.016532622277736664, -0.00979540217667818], [0.04482565447688103, -0.17364658415317535, -0.016728529706597328, 0.27762576937675476], [0.04135272279381752, -0.3685259521007538, -0.011176014319062233, 0.5649859309196472], [0.033982206135988235, -0.1732489913702011, 0.00012370466720312834, 0.26880311965942383], [0.030517226085066795, -0.36837270855903625, 0.005499767139554024, 0.5615250468254089], [0.023149771615862846, -0.5635713934898376, 0.01673026941716671, 0.8559356331825256], [0.011878343299031258, -0.3686813712120056, 0.03384898230433464, 0.5685599446296692], [0.00450471555814147, -0.17405013740062714, 0.045220181345939636, 0.286730021238327], [0.0010237129172310233, -0.3697868287563324, 0.05095478147268295, 0.593325138092041], [-0.006372023839503527, -0.5655836462974548, 0.06282128393650055, 0.9016133546829224], [-0.017683696001768112, -0.7614978551864624, 0.08085355162620544, 1.2133623361587524], [-0.032913655042648315, -0.5675070285797119, 0.10512080043554306, 0.9470717310905457], [-0.044263795018196106, -0.3739456832408905, 0.12406223267316818, 0.6891810894012451], [-0.05174270644783974, -0.18074388802051544, 0.13784585893154144, 0.4379865825176239], [-0.05535758659243584, -0.37752023339271545, 0.14660558104515076, 0.7707496881484985], [-0.06290799379348755, -0.5743227601051331, 0.16202057898044586, 1.1057345867156982], [-0.07439444214105606, -0.3816584050655365, 0.18413527309894562, 0.8679487705230713], [-0.0820276141166687, -0.5787438154220581, 0.2014942467212677, 1.2124097347259521], [0.026511402800679207, -0.020933600142598152, -0.014680412597954273, -0.04812859371304512], [0.026092730462551117, -0.21584200859069824, -0.015642983838915825, 0.23988661170005798], [0.02177589014172554, -0.020500119775533676, -0.010845252312719822, -0.057689204812049866], [0.02136588841676712, -0.21546490490436554, -0.011999036185443401, 0.2315523326396942], [0.01705658994615078, -0.41041335463523865, -0.007367989514023066, 0.520426332950592], [0.008848322555422783, -0.21518847346305847, 0.003040537005290389, 0.22543077170848846], [0.004544552881270647, -0.020110104233026505, 0.007549152709543705, -0.06629150360822678], [0.004142350982874632, 0.1749027967453003, 0.006223322357982397, -0.3565830886363983], [0.007640406955033541, -0.02030707150697708, -0.0009083394543267787, -0.06194431334733963], [0.007234265562146902, -0.21541598439216614, -0.0021472256630659103, 0.23045188188552856], [0.0029259456787258387, -0.020263418555259705, 0.0024618119932711124, -0.06290757656097412], [0.002520677400752902, 0.17482315003871918, 0.0012036606203764677, -0.35481277108192444], [0.006017140578478575, -0.02031589485704899, -0.005892594810575247, -0.06175053492188454], [0.0056108226999640465, 0.17489004135131836, -0.007127605378627777, -0.35628676414489746], [0.00910862348973751, -0.020129848271608353, -0.014253340661525726, -0.06585986167192459], [0.008706026710569859, 0.17519351840019226, -0.015570538118481636, -0.36300551891326904], [0.012209896929562092, 0.370533287525177, -0.022830648347735405, -0.6605571508407593], [0.019620561972260475, 0.17573635280132294, -0.03604179248213768, -0.37514954805374146], [0.023135289549827576, -0.018855618312954903, -0.04354478418827057, -0.09404515475034714], [0.022758176550269127, -0.21332727372646332, -0.04542568698525429, 0.18458768725395203], [0.018491631373763084, -0.017585791647434235, -0.04173393175005913, -0.12207221239805222], [0.0181399155408144, 0.17810845375061035, -0.04417537525296211, -0.4276241958141327], [0.021702084690332413, -0.016360905021429062, -0.05272785946726799, -0.1491880714893341], [0.021374866366386414, -0.2106897085905075, -0.05571162328124046, 0.12640520930290222], [0.01716107316315174, -0.4049711227416992, -0.05318351835012436, 0.401004433631897], [0.00906165037304163, -0.2091367095708847, -0.04516343027353287, 0.0920395776629448], [0.004878916312009096, -0.013397494331002235, -0.04332263767719269, -0.2145433872938156], [0.0046109664253890514, 0.18231618404388428, -0.04761350527405739, -0.5205713510513306], [0.008257290348410606, 0.37807491421699524, -0.05802493169903755, -0.827869713306427], [0.01581878773868084, 0.5739402174949646, -0.07458232343196869, -1.1382229328155518], [0.027297591790556908, 0.7699539661407471, -0.09734678268432617, -1.4533331394195557], [0.042696673423051834, 0.5761529803276062, -0.12641344964504242, -1.1925827264785767], [0.05421973019838333, 0.38287460803985596, -0.15026509761810303, -0.9420452117919922], [0.06187722459435463, 0.5796669721603394, -0.16910600662231445, -1.2779192924499512], [0.07347056269645691, 0.38705533742904663, -0.1946643888950348, -1.042603611946106], [-0.04796016216278076, -0.03021615743637085, 0.009147790260612965, -0.01104249618947506], [-0.04856448248028755, 0.16477341949939728, 0.008926940150558949, -0.30082520842552185], [-0.04526901617646217, 0.35976698994636536, 0.002910436363890767, -0.5906794667243958], [-0.03807367384433746, 0.5548480749130249, -0.00890315230935812, -0.8824441432952881], [-0.02697671391069889, 0.35984817147254944, -0.02655203640460968, -0.5925734043121338], [-0.01977975107729435, 0.16510778665542603, -0.038403503596782684, -0.3083711564540863], [-0.016477594152092934, -0.029446519911289215, -0.0445709265768528, -0.028042715042829514], [-0.017066525295376778, -0.2239018976688385, -0.045131780207157135, 0.2502511441707611], [-0.0215445626527071, -0.02816547267138958, -0.04012675583362579, -0.056318748742341995], [-0.022107873111963272, 0.16750817000865936, -0.04125313088297844, -0.3613870441913605], [-0.018757708370685577, -0.02700386755168438, -0.04848087206482887, -0.08199220150709152], [-0.019297786056995392, 0.16877831518650055, -0.05012071877717972, -0.3895682096481323], [-0.015922220423817635, -0.025597751140594482, -0.057912081480026245, -0.1130995824933052], [-0.01643417589366436, -0.21984411776065826, -0.06017407402396202, 0.1607648730278015], [-0.02083105780184269, -0.4140552878379822, -0.05695877596735954, 0.43387386202812195], [-0.029112163931131363, -0.21817514300346375, -0.04828129708766937, 0.12379330396652222], [-0.033475667238235474, -0.41257333755493164, -0.0458054319024086, 0.40086159110069275], [-0.041727133095264435, -0.21683259308338165, -0.03778820112347603, 0.09409637004137039], [-0.04606378450989723, -0.4113931357860565, -0.03590627387166023, 0.37462174892425537], [-0.05429164692759514, -0.21578003466129303, -0.028413837775588036, 0.07083705067634583], [-0.05860724672675133, -0.02026248723268509, -0.026997096836566925, -0.2306734323501587], [-0.05901249870657921, 0.1752346307039261, -0.03161056712269783, -0.5317484140396118], [-0.055507805198431015, 0.3707866072654724, -0.0422455333173275, -0.8342218399047852], [-0.048092070966959, 0.5664594769477844, -0.05892996862530708, -1.1398857831954956], [-0.03676288202404976, 0.7623002529144287, -0.08172768354415894, -1.4504523277282715], [-0.02151687815785408, 0.9583259224891663, -0.11073673516511917, -1.7675106525421143], [-0.0023503585252910852, 0.7646154165267944, -0.1460869461297989, -1.5112147331237793], [0.012941950000822544, 0.5715339779853821, -0.17631123960018158, -1.2674744129180908], [0.024372629821300507, 0.37904688715934753, -0.20166072249412537, -1.0347872972488403]], "actions": [0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.005289780907332897, -0.19258074462413788, 0.014943109825253487, 0.3100881576538086], [-0.009141395799815655, -0.3879123628139496, 0.021144872531294823, 0.607446014881134], [-0.01689964346587658, -0.5833234786987305, 0.033293794840574265, 0.9067132472991943], [-0.028566112741827965, -0.7788800001144409, 0.05142805725336075, 1.2096720933914185], [-0.044143714010715485, -0.9746269583702087, 0.07562150061130524, 1.5180175304412842], [-0.06363625079393387, -0.7804966568946838, 0.10598184913396835, 1.2498657703399658], [-0.07924618571996689, -0.5868805646896362, 0.13097916543483734, 0.9921715259552002], [-0.0909838005900383, -0.7834887504577637, 0.15082259476184845, 1.32295560836792], [-0.10665357112884521, -0.9801596403121948, 0.1772817075252533, 1.6587868928909302], [-0.1262567639350891, -0.7874922156333923, 0.210457444190979, 1.4261635541915894], [-0.02082599699497223, -0.22355131804943085, 0.009241024032235146, 0.261749804019928], [-0.025297023355960846, -0.41880396008491516, 0.014476019889116287, 0.5573330521583557], [-0.03367310017347336, -0.6141260862350464, 0.02562268078327179, 0.8545413613319397], [-0.04595562443137169, -0.8095877170562744, 0.042713508009910583, 1.1551698446273804], [-0.06214737892150879, -1.0052398443222046, 0.06581690162420273, 1.4609342813491821], [-0.08225217461585999, -0.8109835982322693, 0.09503559023141861, 1.1895170211791992], [-0.09847184270620346, -1.007200002670288, 0.11882592737674713, 1.5104118585586548], [-0.11861584335565567, -0.813701331615448, 0.14903417229652405, 1.2570632696151733], [-0.1348898708820343, -1.010382890701294, 0.174175426363945, 1.592469334602356], [-0.15509752929210663, -0.817703366279602, 0.20602482557296753, 1.3587719202041626], [-0.171451598405838, -0.6256727576255798, 0.23320025205612183, 1.1369613409042358], [0.030687863007187843, 0.22607748210430145, 0.014527814462780952, -0.2655662000179291], [0.03520941361784935, 0.03075123205780983, 0.009216491132974625, 0.03166329860687256], [0.03582443669438362, 0.22573980689048767, 0.009849756956100464, -0.2580975294113159], [0.04033923149108887, 0.03047863580286503, 0.004687806125730276, 0.037675801664590836], [0.04094880446791649, -0.16471022367477417, 0.005441321991384029, 0.331834077835083], [0.03765460103750229, 0.030333854258060455, 0.012078003957867622, 0.040872037410736084], [0.038261279463768005, -0.16495919227600098, 0.01289544440805912, 0.3373410999774933], [0.03496209532022476, -0.3602622449398041, 0.019642265513539314, 0.6340624690055847], [0.02775684930384159, -0.16541972756385803, 0.03232351690530777, 0.34762951731681824], [0.0244484543800354, -0.3609861731529236, 0.039276108145713806, 0.6503273844718933], [0.017228731885552406, -0.16643266379833221, 0.052282653748989105, 0.3702664077281952], [0.01390007883310318, 0.02790900319814682, 0.059687983244657516, 0.09451635181903839], [0.014458258636295795, 0.22212691605091095, 0.061578311026096344, -0.17875388264656067], [0.0189007967710495, 0.026180295273661613, 0.05800323188304901, 0.1327015608549118], [0.019424403086304665, 0.22042548656463623, 0.06065726280212402, -0.14113284647464752], [0.023832913488149643, 0.41462862491607666, 0.05783460661768913, -0.4140795171260834], [0.03212548419833183, 0.6088851690292358, 0.04955301433801651, -0.6879832744598389], [0.04430318996310234, 0.8032855987548828, 0.035793352872133255, -0.9646633267402649], [0.06036889925599098, 0.6077015399932861, 0.016500083729624748, -0.6609541773796082], [0.07252293080091476, 0.4123539328575134, 0.003281000768765807, -0.3631218373775482], [0.08077000826597214, 0.6074290871620178, -0.003981436137109995, -0.6547684073448181], [0.09291858971118927, 0.8026062846183777, -0.017076803371310234, -0.948702335357666], [0.10897071659564972, 0.9979538917541504, -0.03605085238814354, -1.2467014789581299], [0.12892979383468628, 0.803312361240387, -0.06098487973213196, -0.9655255079269409], [0.1449960470199585, 0.6090602278709412, -0.0802953913807869, -0.6926074028015137], [0.15717725455760956, 0.4151386618614197, -0.09414754062891006, -0.42624372243881226], [0.16548001766204834, 0.221467524766922, -0.10267241299152374, -0.16466207802295685], [0.16990937292575836, 0.027953753247857094, -0.10596565157175064, 0.09394728392362595], [0.17046844959259033, 0.22442232072353363, -0.10408671200275421, -0.2301981896162033], [0.17495688796043396, 0.030929837375879288, -0.10869067162275314, 0.027923472225666046], [0.17557549476623535, 0.22742904722690582, -0.10813220590353012, -0.2969782054424286], [0.18012407422065735, 0.03400137275457382, -0.11407176405191422, -0.04026024043560028], [0.18080410361289978, 0.2305586040019989, -0.11487697064876556, -0.36664432287216187], [0.18541526794433594, 0.42710962891578674, -0.12220986187458038, -0.693227231502533], [0.19395746290683746, 0.23387590050697327, -0.13607440888881683, -0.44137877225875854], [0.19863498210906982, 0.43063464760780334, -0.14490197598934174, -0.7736712098121643], [0.20724767446517944, 0.23777173459529877, -0.16037540137767792, -0.5298608541488647], [0.21200311183929443, 0.434743195772171, -0.17097261548042297, -0.868475079536438], [0.22069796919822693, 0.24230815470218658, -0.1883421242237091, -0.634052574634552], [0.22554413974285126, 0.05024309083819389, -0.2010231763124466, -0.4060955047607422], [0.22654899954795837, 0.2475632131099701, -0.20914508402347565, -0.7548190355300903], [0.2315002679824829, 0.05584331974387169, -0.2242414653301239, -0.5345472693443298], [0.015413600020110607, -0.19138167798519135, -0.036070019006729126, 0.27738210558891296], [0.011585966683924198, 0.004235801286995411, -0.03052237629890442, -0.026455527171492577], [0.011670682579278946, 0.1997818648815155, -0.03105148673057556, -0.3286101818084717], [0.01566632091999054, 0.005115414969623089, -0.03762368857860565, -0.04587894305586815], [0.0157686285674572, -0.18944740295410156, -0.038541268557310104, 0.23469999432563782], [0.011979680508375168, 0.006203415337949991, -0.03384726867079735, -0.06988661736249924], [0.012103748507797718, 0.2017938643693924, -0.03524500131607056, -0.3730534613132477], [0.016139626502990723, 0.39739829301834106, -0.042706072330474854, -0.6766377687454224], [0.02408759295940399, 0.593086838722229, -0.05623882636427879, -0.9824546575546265], [0.03594932705163956, 0.39876168966293335, -0.07588791847229004, -0.7079533338546753], [0.04392456263303757, 0.5948482751846313, -0.09004698693752289, -1.0235263109207153], [0.05582152679562569, 0.791046679019928, -0.11051751673221588, -1.3430695533752441], [0.07164245843887329, 0.9873718619346619, -0.13737890124320984, -1.668186902999878], [0.09138990193605423, 1.1837979555130005, -0.17074264585971832, -2.000312566757202], [0.11506585776805878, 0.9908217787742615, -0.21074889600276947, -1.7650121450424194], [-3.473207834758796e-05, 0.2102275788784027, -0.0008071033516898751, -0.2590616047382355], [0.004169819410890341, 0.015117155387997627, -0.005988335236907005, 0.033366650342941284], [0.004472162574529648, -0.17991840839385986, -0.005321002099663019, 0.32415419816970825], [0.0008737943135201931, -0.3749642074108124, 0.0011620816076174378, 0.6151543855667114], [-0.006625489331781864, -0.1798585057258606, 0.01346516888588667, 0.3228376507759094], [-0.010222659446299076, 0.015069148503243923, 0.0199219211935997, 0.034431342035532], [-0.009921276941895485, -0.1803327351808548, 0.020610548555850983, 0.3333326578140259], [-0.013527931645512581, -0.3757418990135193, 0.027277201414108276, 0.6324431896209717], [-0.02104276977479458, -0.5712335705757141, 0.03992606699466705, 0.9335901141166687], [-0.03246743977069855, -0.37667232751846313, 0.0585978701710701, 0.6537160277366638], [-0.04000088572502136, -0.18241317570209503, 0.07167218625545502, 0.3800453245639801], [-0.04364915192127228, 0.011621693149209023, 0.07927309721708298, 0.11079384386539459], [-0.043416716158390045, 0.20552349090576172, 0.08148897439241409, -0.15586353838443756], [-0.03930624574422836, 0.009335072711110115, 0.07837170362472534, 0.1613737940788269], [-0.03911954537034035, -0.1868162900209427, 0.0815991759300232, 0.477715402841568], [-0.042855869978666306, 0.007064502220600843, 0.09115348756313324, 0.211825430393219], [-0.04271458089351654, -0.18923449516296387, 0.09538999199867249, 0.5318135023117065], [-0.04649927094578743, 0.004425440914928913, 0.10602626204490662, 0.2706463932991028], [-0.04641076177358627, -0.19203715026378632, 0.11143919080495834, 0.594798743724823], [-0.05025150626897812, -0.38852789998054504, 0.12333516776561737, 0.9204020500183105], [-0.058022063225507736, -0.5850814580917358, 0.14174321293830872, 1.2491614818572998], [-0.0697236955165863, -0.39203202724456787, 0.16672644019126892, 1.0040245056152344], [-0.07756433635950089, -0.19948191940784454, 0.18680693209171295, 0.7679951786994934], [-0.08155397325754166, -0.007355192676186562, 0.2021668255329132, 0.5394212603569031], [-0.08170107752084732, -0.2046590894460678, 0.21295525133609772, 0.888382613658905], [-0.04084847494959831, 0.2208612859249115, -0.033991895616054535, -0.3422156572341919], [-0.03643124923110008, 0.02623901702463627, -0.04083620756864548, -0.06044257804751396], [-0.03590647131204605, -0.16827435791492462, -0.04204506054520607, 0.21908172965049744], [-0.03927195817232132, -0.36277085542678833, -0.037663426250219345, 0.4982110559940338], [-0.046527374535799026, -0.16713868081569672, -0.02769920416176319, 0.193900465965271], [-0.04987014830112457, 0.028368324041366577, -0.02382119558751583, -0.10739007592201233], [-0.049302779138088226, -0.16640430688858032, -0.025968996807932854, 0.17768320441246033], [-0.052630867809057236, -0.3611451983451843, -0.02241533249616623, 0.4620620012283325], [-0.05985376983880997, -0.16571372747421265, -0.013174092397093773, 0.16239890456199646], [-0.06316804885864258, 0.02959432080388069, -0.009926114231348038, -0.1344108134508133], [-0.06257615983486176, -0.16538405418395996, -0.012614330276846886, 0.15512411296367645], [-0.06588383764028549, 0.02991621568799019, -0.009511847980320454, -0.14151149988174438], [-0.06528551876544952, 0.22517310082912445, -0.012342077679932117, -0.4371800124645233], [-0.0607820525765419, 0.03022800013422966, -0.021085677668452263, -0.14841312170028687], [-0.06017749384045601, 0.22564545273780823, -0.024053940549492836, -0.44767287373542786], [-0.055664584040641785, 0.4210992753505707, -0.03300739824771881, -0.7478399276733398], [-0.047242600470781326, 0.22644785046577454, -0.047964196652173996, -0.46572428941726685], [-0.04271364212036133, 0.03203527256846428, -0.05727868154644966, -0.1885368674993515], [-0.04207293689250946, -0.16222241520881653, -0.06104942038655281, 0.08554107695817947], [-0.0453173853456974, -0.35641855001449585, -0.05933859944343567, 0.35835522413253784], [-0.052445754408836365, -0.5506489276885986, -0.0521714948117733, 0.6317527294158936], [-0.06345873326063156, -0.7450056672096252, -0.03953643888235092, 0.9075596928596497], [-0.07835885137319565, -0.9395707249641418, -0.02138524502515793, 1.1875585317611694], [-0.09715025871992111, -1.134408950805664, 0.0023659253492951393, 1.4734622240066528], [-0.11983843892812729, -0.9393160343170166, 0.031835172325372696, 1.1815192699432373], [-0.13862475752830505, -1.1348363161087036, 0.05546555668115616, 1.4840091466903687], [-0.1613214910030365, -0.9404328465461731, 0.0851457417011261, 1.209150791168213], [-0.18013015389442444, -1.136544942855835, 0.1093287542462349, 1.527255892753601], [-0.20286104083061218, -1.3328031301498413, 0.13987387716770172, 1.8519641160964966], [-0.2295171022415161, -1.5291591882705688, 0.17691315710544586, 2.1846108436584473], [-0.2601003050804138, -1.3361397981643677, 0.22060537338256836, 1.9513423442840576], [-0.010010048747062683, -0.18236960470676422, 0.036250121891498566, 0.3216784596443176], [-0.01365744136273861, -0.3779885172843933, 0.042683690786361694, 0.6255692839622498], [-0.021217212080955505, -0.573679506778717, 0.05519507825374603, 0.9313836097717285], [-0.03269080072641373, -0.37934410572052, 0.0738227516412735, 0.6565435528755188], [-0.04027768224477768, -0.5754119157791138, 0.08695361763238907, 0.9715283513069153], [-0.051785919815301895, -0.7715863585472107, 0.10638418793678284, 1.290210485458374], [-0.06721764802932739, -0.9678881764411926, 0.13218839466571808, 1.6142164468765259], [-0.08657541126012802, -0.7745506763458252, 0.16447272896766663, 1.3654905557632446], [-0.10206642746925354, -0.5818253755569458, 0.19178253412246704, 1.1284412145614624], [-0.1137029305100441, -0.3896609842777252, 0.2143513560295105, 0.9015184044837952], [0.04788494110107422, -0.174198716878891, -0.022329531610012054, 0.2898455262184143], [0.04440096765756607, 0.021234409883618355, -0.016532622277736664, -0.00979540217667818], [0.04482565447688103, -0.17364658415317535, -0.016728529706597328, 0.27762576937675476], [0.04135272279381752, -0.3685259521007538, -0.011176014319062233, 0.5649859309196472], [0.033982206135988235, -0.1732489913702011, 0.00012370466720312834, 0.26880311965942383], [0.030517226085066795, -0.36837270855903625, 0.005499767139554024, 0.5615250468254089], [0.023149771615862846, -0.5635713934898376, 0.01673026941716671, 0.8559356331825256], [0.011878343299031258, -0.3686813712120056, 0.03384898230433464, 0.5685599446296692], [0.00450471555814147, -0.17405013740062714, 0.045220181345939636, 0.286730021238327], [0.0010237129172310233, -0.3697868287563324, 0.05095478147268295, 0.593325138092041], [-0.006372023839503527, -0.5655836462974548, 0.06282128393650055, 0.9016133546829224], [-0.017683696001768112, -0.7614978551864624, 0.08085355162620544, 1.2133623361587524], [-0.032913655042648315, -0.5675070285797119, 0.10512080043554306, 0.9470717310905457], [-0.044263795018196106, -0.3739456832408905, 0.12406223267316818, 0.6891810894012451], [-0.05174270644783974, -0.18074388802051544, 0.13784585893154144, 0.4379865825176239], [-0.05535758659243584, -0.37752023339271545, 0.14660558104515076, 0.7707496881484985], [-0.06290799379348755, -0.5743227601051331, 0.16202057898044586, 1.1057345867156982], [-0.07439444214105606, -0.3816584050655365, 0.18413527309894562, 0.8679487705230713], [-0.0820276141166687, -0.5787438154220581, 0.2014942467212677, 1.2124097347259521], [-0.0936024934053421, -0.3867097795009613, 0.22574244439601898, 0.9890255928039551], [0.026092730462551117, -0.21584200859069824, -0.015642983838915825, 0.23988661170005798], [0.02177589014172554, -0.020500119775533676, -0.010845252312719822, -0.057689204812049866], [0.02136588841676712, -0.21546490490436554, -0.011999036185443401, 0.2315523326396942], [0.01705658994615078, -0.41041335463523865, -0.007367989514023066, 0.520426332950592], [0.008848322555422783, -0.21518847346305847, 0.003040537005290389, 0.22543077170848846], [0.004544552881270647, -0.020110104233026505, 0.007549152709543705, -0.06629150360822678], [0.004142350982874632, 0.1749027967453003, 0.006223322357982397, -0.3565830886363983], [0.007640406955033541, -0.02030707150697708, -0.0009083394543267787, -0.06194431334733963], [0.007234265562146902, -0.21541598439216614, -0.0021472256630659103, 0.23045188188552856], [0.0029259456787258387, -0.020263418555259705, 0.0024618119932711124, -0.06290757656097412], [0.002520677400752902, 0.17482315003871918, 0.0012036606203764677, -0.35481277108192444], [0.006017140578478575, -0.02031589485704899, -0.005892594810575247, -0.06175053492188454], [0.0056108226999640465, 0.17489004135131836, -0.007127605378627777, -0.35628676414489746], [0.00910862348973751, -0.020129848271608353, -0.014253340661525726, -0.06585986167192459], [0.008706026710569859, 0.17519351840019226, -0.015570538118481636, -0.36300551891326904], [0.012209896929562092, 0.370533287525177, -0.022830648347735405, -0.6605571508407593], [0.019620561972260475, 0.17573635280132294, -0.03604179248213768, -0.37514954805374146], [0.023135289549827576, -0.018855618312954903, -0.04354478418827057, -0.09404515475034714], [0.022758176550269127, -0.21332727372646332, -0.04542568698525429, 0.18458768725395203], [0.018491631373763084, -0.017585791647434235, -0.04173393175005913, -0.12207221239805222], [0.0181399155408144, 0.17810845375061035, -0.04417537525296211, -0.4276241958141327], [0.021702084690332413, -0.016360905021429062, -0.05272785946726799, -0.1491880714893341], [0.021374866366386414, -0.2106897085905075, -0.05571162328124046, 0.12640520930290222], [0.01716107316315174, -0.4049711227416992, -0.05318351835012436, 0.401004433631897], [0.00906165037304163, -0.2091367095708847, -0.04516343027353287, 0.0920395776629448], [0.004878916312009096, -0.013397494331002235, -0.04332263767719269, -0.2145433872938156], [0.0046109664253890514, 0.18231618404388428, -0.04761350527405739, -0.5205713510513306], [0.008257290348410606, 0.37807491421699524, -0.05802493169903755, -0.827869713306427], [0.01581878773868084, 0.5739402174949646, -0.07458232343196869, -1.1382229328155518], [0.027297591790556908, 0.7699539661407471, -0.09734678268432617, -1.4533331394195557], [0.042696673423051834, 0.5761529803276062, -0.12641344964504242, -1.1925827264785767], [0.05421973019838333, 0.38287460803985596, -0.15026509761810303, -0.9420452117919922], [0.06187722459435463, 0.5796669721603394, -0.16910600662231445, -1.2779192924499512], [0.07347056269645691, 0.38705533742904663, -0.1946643888950348, -1.042603611946106], [0.08121167123317719, 0.19497592747211456, -0.21551646292209625, -0.8167968392372131], [-0.04856448248028755, 0.16477341949939728, 0.008926940150558949, -0.30082520842552185], [-0.04526901617646217, 0.35976698994636536, 0.002910436363890767, -0.5906794667243958], [-0.03807367384433746, 0.5548480749130249, -0.00890315230935812, -0.8824441432952881], [-0.02697671391069889, 0.35984817147254944, -0.02655203640460968, -0.5925734043121338], [-0.01977975107729435, 0.16510778665542603, -0.038403503596782684, -0.3083711564540863], [-0.016477594152092934, -0.029446519911289215, -0.0445709265768528, -0.028042715042829514], [-0.017066525295376778, -0.2239018976688385, -0.045131780207157135, 0.2502511441707611], [-0.0215445626527071, -0.02816547267138958, -0.04012675583362579, -0.056318748742341995], [-0.022107873111963272, 0.16750817000865936, -0.04125313088297844, -0.3613870441913605], [-0.018757708370685577, -0.02700386755168438, -0.04848087206482887, -0.08199220150709152], [-0.019297786056995392, 0.16877831518650055, -0.05012071877717972, -0.3895682096481323], [-0.015922220423817635, -0.025597751140594482, -0.057912081480026245, -0.1130995824933052], [-0.01643417589366436, -0.21984411776065826, -0.06017407402396202, 0.1607648730278015], [-0.02083105780184269, -0.4140552878379822, -0.05695877596735954, 0.43387386202812195], [-0.029112163931131363, -0.21817514300346375, -0.04828129708766937, 0.12379330396652222], [-0.033475667238235474, -0.41257333755493164, -0.0458054319024086, 0.40086159110069275], [-0.041727133095264435, -0.21683259308338165, -0.03778820112347603, 0.09409637004137039], [-0.04606378450989723, -0.4113931357860565, -0.03590627387166023, 0.37462174892425537], [-0.05429164692759514, -0.21578003466129303, -0.028413837775588036, 0.07083705067634583], [-0.05860724672675133, -0.02026248723268509, -0.026997096836566925, -0.2306734323501587], [-0.05901249870657921, 0.1752346307039261, -0.03161056712269783, -0.5317484140396118], [-0.055507805198431015, 0.3707866072654724, -0.0422455333173275, -0.8342218399047852], [-0.048092070966959, 0.5664594769477844, -0.05892996862530708, -1.1398857831954956], [-0.03676288202404976, 0.7623002529144287, -0.08172768354415894, -1.4504523277282715], [-0.02151687815785408, 0.9583259224891663, -0.11073673516511917, -1.7675106525421143], [-0.0023503585252910852, 0.7646154165267944, -0.1460869461297989, -1.5112147331237793], [0.012941950000822544, 0.5715339779853821, -0.17631123960018158, -1.2674744129180908], [0.024372629821300507, 0.37904688715934753, -0.20166072249412537, -1.0347872972488403], [0.031953565776348114, 0.18709351122379303, -0.22235646843910217, -0.8115792274475098]], "action_prob": [0.4999545216560364, 0.499300092458725, 0.49885618686676025, 0.4986256957054138, 0.498516321182251, 0.5015443563461304, 0.5015813112258911, 0.4984225928783417, 0.4983404874801636, 0.5017037391662598, 0.49995991587638855, 0.499303936958313, 0.49885454773902893, 0.4986222982406616, 0.498514860868454, 0.5015423893928528, 0.4984205961227417, 0.5016262531280518, 0.49832701683044434, 0.5017099380493164, 0.5017664432525635, 0.49998074769973755, 0.5006658434867859, 0.4999791085720062, 0.5006709098815918, 0.5000259280204773, 0.5006266832351685, 0.5000047087669373, 0.49935102462768555, 0.5010960102081299, 0.4992946684360504, 0.5011468529701233, 0.5007746815681458, 0.5001814961433411, 0.5004655122756958, 0.500224769115448, 0.49957287311553955, 0.49906817078590393, 0.49877554178237915, 0.5013696551322937, 0.5012907981872559, 0.49896934628486633, 0.4986632764339447, 0.4985232949256897, 0.5015397667884827, 0.50156170129776, 0.5015114545822144, 0.5013089179992676, 0.5008816123008728, 0.49972614645957947, 0.5009602904319763, 0.4996284246444702, 0.5010403394699097, 0.49952319264411926, 0.49887755513191223, 0.5015081167221069, 0.4987664520740509, 0.5015801787376404, 0.4986492395401001, 0.5016547441482544, 0.5014708042144775, 0.4989027976989746, 0.5015665888786316, 0.5000945329666138, 0.5005505084991455, 0.4998886287212372, 0.5007634162902832, 0.5001550316810608, 0.5004976987838745, 0.4998231828212738, 0.49918442964553833, 0.49877509474754333, 0.5014296174049377, 0.49869081377983093, 0.4985002875328064, 0.4984123110771179, 0.4983607828617096, 0.5016821026802063, 0.5000155568122864, 0.5006416440010071, 0.4999980628490448, 0.49935027956962585, 0.5010949373245239, 0.5006932616233826, 0.4999331831932068, 0.4992794990539551, 0.49883952736854553, 0.5013880133628845, 0.5012392997741699, 0.500887393951416, 0.5003137588500977, 0.5003294348716736, 0.49962547421455383, 0.500992476940155, 0.49953365325927734, 0.5010634064674377, 0.49943041801452637, 0.4988599121570587, 0.49854177236557007, 0.5016096830368042, 0.5015586018562317, 0.5013879537582397, 0.4989570677280426, 0.49987444281578064, 0.5007655620574951, 0.5001732707023621, 0.49951568245887756, 0.5009819865226746, 0.5004909038543701, 0.5001909732818604, 0.49952301383018494, 0.5009946823120117, 0.5004918575286865, 0.5001880526542664, 0.5004862546920776, 0.4998056888580322, 0.500792384147644, 0.49976953864097595, 0.49917250871658325, 0.5011942982673645, 0.5008976459503174, 0.5003684163093567, 0.4997122585773468, 0.49915748834609985, 0.49881646037101746, 0.4986441731452942, 0.4985596537590027, 0.5014917254447937, 0.498464435338974, 0.50157630443573, 0.49837324023246765, 0.49834364652633667, 0.49831798672676086, 0.5017104744911194, 0.49991923570632935, 0.49925822019577026, 0.49881479144096375, 0.5014114379882812, 0.4987317621707916, 0.49852028489112854, 0.49842408299446106, 0.5016294121742249, 0.5016761422157288, 0.5016911029815674, 0.5001119375228882, 0.5005383491516113, 0.5001168251037598, 0.4994617700576782, 0.5010074377059937, 0.49942997097969055, 0.49895650148391724, 0.5013005137443542, 0.5011122822761536, 0.4992992579936981, 0.49883532524108887, 0.49859657883644104, 0.5015144348144531, 0.5014946460723877, 0.5013701319694519, 0.4989345073699951, 0.4985530376434326, 0.5016201734542847, 0.4984501004219055, 0.5016982555389404, 0.500076949596405, 0.5005767345428467, 0.5000783801078796, 0.49942153692245483, 0.5010465383529663, 0.5006109476089478, 0.49996060132980347, 0.5006798505783081, 0.5000529289245605, 0.5006078481674194, 0.49995627999305725, 0.5006862282752991, 0.49993863701820374, 0.5007060766220093, 0.49991390109062195, 0.4992685616016388, 0.5011613368988037, 0.5007910132408142, 0.5001934766769409, 0.5004596710205078, 0.49977660179138184, 0.500855028629303, 0.5002833604812622, 0.4996277689933777, 0.5008877515792847, 0.5003610253334045, 0.4996645152568817, 0.4990692138671875, 0.4987102150917053, 0.4985297918319702, 0.5015628933906555, 0.5015694499015808, 0.49849584698677063, 0.5016510486602783, 0.5016064643859863, 0.5000933408737183, 0.49943849444389343, 0.49897482991218567, 0.5012789368629456, 0.5010925531387329, 0.5006844997406006, 0.5000624060630798, 0.5005776882171631, 0.4999123513698578, 0.5007429718971252, 0.4998589754104614, 0.5007898211479187, 0.500203549861908, 0.4995534121990204, 0.500943124294281, 0.4995640814304352, 0.500950038433075, 0.4995696544647217, 0.5009587407112122, 0.5004299283027649, 0.49973946809768677, 0.49915066361427307, 0.4987891912460327, 0.49860045313835144, 0.4984990954399109, 0.5015679001808167, 0.5016105771064758, 0.5016236305236816, 0.5015744566917419], "advantages": [9.561938285827637, 8.651209831237793, 7.730644226074219, 6.8000288009643555, 5.859424114227295, 4.908923149108887, 3.948042392730713, 2.977179527282715, 1.9978947639465332, 1.0083078145980835, 10.465890884399414, 9.564318656921387, 8.653058052062988, 7.731853485107422, 6.80074405670166, 5.859816074371338, 4.908472537994385, 3.948418140411377, 2.977861166000366, 1.9982532262802124, 1.0081079006195068, 34.434329986572266, 33.76930618286133, 33.103153228759766, 32.42466354370117, 31.744918823242188, 31.058202743530273, 30.359102249145508, 29.658401489257812, 28.949954986572266, 28.230236053466797, 27.50737190246582, 26.77316665649414, 26.030969619750977, 25.281145095825195, 24.5294246673584, 23.76441764831543, 22.99204444885254, 22.212488174438477, 21.425634384155273, 20.633285522460938, 19.83359718322754, 19.021926879882812, 18.202709197998047, 17.375717163085938, 16.541872024536133, 15.700037956237793, 14.850241661071777, 13.992399215698242, 13.126175880432129, 12.24555492401123, 11.361663818359375, 10.463253021240234, 9.56130599975586, 8.644765853881836, 7.7197184562683105, 6.7893218994140625, 5.845678806304932, 4.896145820617676, 3.9335670471191406, 2.964489221572876, 1.986096978187561, 0.9936341643333435, 13.99405288696289, 13.127979278564453, 12.247586250305176, 11.358391761779785, 10.465670585632324, 9.563987731933594, 8.64755630493164, 7.722048282623291, 6.787911415100098, 5.845099925994873, 4.895206928253174, 3.933306932449341, 2.962268114089966, 1.9817891120910645, 0.9916256666183472, 22.218156814575195, 21.429689407348633, 20.638851165771484, 19.839941024780273, 19.03233528137207, 18.212331771850586, 17.38347625732422, 16.551748275756836, 15.710954666137695, 14.860912322998047, 13.999622344970703, 13.129009246826172, 12.249049186706543, 11.360061645507812, 10.467784881591797, 9.566134452819824, 8.650362014770508, 7.730275630950928, 6.796093463897705, 5.85717248916626, 4.907859802246094, 3.9482173919677734, 2.977358818054199, 1.9963148832321167, 1.0048922300338745, 26.769136428833008, 26.026668548583984, 25.28205680847168, 24.530046463012695, 23.76999282836914, 22.997465133666992, 22.216732025146484, 21.433822631835938, 20.642608642578125, 19.838462829589844, 19.025856018066406, 18.21076202392578, 17.381715774536133, 16.544647216796875, 15.704174041748047, 14.850150108337402, 13.988266944885254, 13.121174812316895, 12.245966911315918, 11.362242698669434, 10.469355583190918, 9.56686019897461, 8.654646873474121, 7.732746601104736, 6.801201343536377, 5.85929536819458, 4.908864974975586, 3.9479029178619385, 2.978166103363037, 1.9983645677566528, 1.0084978342056274, 9.562023162841797, 8.651344299316406, 7.730794906616211, 6.800167083740234, 5.85748815536499, 4.907907962799072, 3.948125123977661, 2.9782514572143555, 1.9979941844940186, 1.0076334476470947, 18.209327697753906, 17.38585662841797, 16.548526763916016, 15.7083101272583, 14.859026908874512, 13.996749877929688, 13.130230903625488, 12.254217147827148, 11.366419792175293, 10.468988418579102, 9.566883087158203, 8.654866218566895, 7.733010292053223, 6.80031156539917, 5.857766628265381, 4.905168056488037, 3.9466466903686523, 2.977581024169922, 1.9967681169509888, 1.007840871810913, 29.654808044433594, 28.947004318237305, 28.2264404296875, 27.504226684570312, 26.774181365966797, 26.032194137573242, 25.282230377197266, 24.524826049804688, 23.76519012451172, 22.99794578552246, 22.21731948852539, 21.42894172668457, 20.638019561767578, 19.833667755126953, 19.0266056060791, 18.205961227416992, 17.377710342407227, 16.54514503479004, 15.704756736755371, 14.855998039245605, 13.992984771728516, 13.121519088745117, 12.246448516845703, 11.362749099731445, 10.46976375579834, 9.56273365020752, 8.646251678466797, 7.720954418182373, 6.78712272644043, 5.844577789306641, 4.893007278442383, 3.9327518939971924, 2.963104009628296, 1.9820772409439087, 0.9925652146339417, 25.282682418823242, 24.525236129760742, 23.7607479095459, 22.989269256591797, 22.212820053100586, 21.429203033447266, 20.638206481933594, 19.8392391204834, 19.026594161987305, 18.20589256286621, 17.382266998291016, 16.54497528076172, 15.704505920410156, 14.85571002960205, 13.997954368591309, 13.126593589782715, 12.251461029052734, 11.362433433532715, 10.46955394744873, 9.562511444091797, 8.646092414855957, 7.72089147567749, 6.787143230438232, 5.844657897949219, 4.893125534057617, 3.932271718978882, 2.962035894393921, 1.982165813446045, 0.9926379323005676], "value_targets": [9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [704766924, 704766924, 704766924, 704766924, 704766924, 704766924, 704766924, 704766924, 704766924, 704766924, 704766924, 704766924, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 949548093, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 988732540, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1186031101, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1712694865, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1617307986, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 1926379545, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 397575110, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 1500279124, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 429636314, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 1268666990, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502, 782944502], "obs": [[-0.0031250922475010157, -0.021380947902798653, -0.021721085533499718, -0.027043821290135384], [-0.0035527111031115055, -0.21618478000164032, -0.022261962294578552, 0.2587074935436249], [-0.00787640642374754, -0.4109819531440735, -0.01708781160414219, 0.5442863702774048], [-0.016096046194434166, -0.605859637260437, -0.006202084012329578, 0.8315367102622986], [-0.02821323834359646, -0.8008962869644165, 0.010428650304675102, 1.1222625970840454], [-0.04423116520047188, -0.6059126257896423, 0.03287390246987343, 0.8328689932823181], [-0.05634941905736923, -0.801468014717102, 0.04953128471970558, 1.1357067823410034], [-0.07237877696752548, -0.9972017407417297, 0.07224541902542114, 1.443503499031067], [-0.09232281148433685, -1.1931347846984863, 0.10111548751592636, 1.7578580379486084], [-0.1161855086684227, -0.999293327331543, 0.13627265393733978, 1.498258352279663], [-0.1361713707447052, -0.806065022945404, 0.16623781621456146, 1.2510433197021484], [-0.1522926688194275, -0.6134167909622192, 0.19125868380069733, 1.0147037506103516], [0.03721551597118378, 0.007522519677877426, 0.005587015300989151, -0.03599095344543457], [0.03736596554517746, 0.20256391167640686, 0.004867196083068848, -0.32690590620040894], [0.04141724482178688, 0.0073730009607970715, -0.0016709218034520745, -0.03269205242395401], [0.0415647067129612, -0.18772494792938232, -0.0023247627541422844, 0.25946322083473206], [0.03781020641326904, 0.007430113386362791, 0.002864501439034939, -0.03395206853747368], [0.03795880824327469, 0.20251086354255676, 0.0021854599472135305, -0.3257298469543457], [0.04200902581214905, 0.3976016342639923, -0.004329136572778225, -0.617722749710083], [0.04996106028556824, 0.20254042744636536, -0.016683591529726982, -0.32640644907951355], [0.05401186645030975, 0.0076599325984716415, -0.02321172133088112, -0.039031144231557846], [0.0541650652885437, -0.18712159991264343, -0.023992344737052917, 0.2462388277053833], [0.050422634929418564, 0.008334648795425892, -0.019067566841840744, -0.053914252668619156], [0.05058932676911354, 0.20372474193572998, -0.020145852118730545, -0.3525516390800476], [0.054663822054862976, 0.3991272747516632, -0.027196886017918587, -0.6515184640884399], [0.06264636665582657, 0.5946172475814819, -0.0402272529900074, -0.9526398777961731], [0.0745387151837349, 0.7902567386627197, -0.05928005278110504, -1.2576853036880493], [0.09034384787082672, 0.9860851168632507, -0.08443375676870346, -1.5683300495147705], [0.11006554961204529, 1.182107925415039, -0.11580035835504532, -1.886110782623291], [0.1337077021598816, 0.9884200692176819, -0.1535225808620453, -1.6314940452575684], [0.15347610414028168, 1.1849758625030518, -0.18615245819091797, -1.9678186178207397], [-0.01071529183536768, -0.019362231716513634, 0.020720381289720535, 0.0027254936285316944], [-0.01110253669321537, 0.17545652389526367, 0.02077489160001278, -0.28334856033325195], [-0.007593405898660421, -0.019955486059188843, 0.01510792039334774, 0.015813587233424187], [-0.00799251627177, 0.17494657635688782, 0.015424191951751709, -0.27206459641456604], [-0.004493584390729666, 0.36984509229660034, 0.009982900694012642, -0.5598430037498474], [0.0029033173341304064, 0.5648254752159119, -0.001213960349559784, -0.849364161491394], [0.014199827797710896, 0.7599639892578125, -0.01820124313235283, -1.1424286365509033], [0.02939910627901554, 0.9553189873695374, -0.04104981571435928, -1.4407634735107422], [0.04850548878312111, 1.1509218215942383, -0.06986508518457413, -1.745985746383667], [0.07152391970157623, 0.9566602110862732, -0.10478480160236359, -1.4758278131484985], [0.09065712988376617, 1.1528946161270142, -0.1343013495206833, -1.799315333366394], [0.1137150228023529, 0.9595064520835876, -0.17028766870498657, -1.5512112379074097], [0.13290515542030334, 1.1562124490737915, -0.2013118863105774, -1.8918254375457764], [0.04792596772313118, 0.04012172296643257, -0.025692787021398544, -0.0028587777633219957], [0.04872840270400047, 0.23560254275798798, -0.025749962776899338, -0.3035360872745514], [0.05344045162200928, 0.04085685312747955, -0.03182068467140198, -0.019084040075540543], [0.0542575903236866, -0.15379464626312256, -0.03220236673951149, 0.2633917033672333], [0.051181696355342865, 0.04177180305123329, -0.026934532448649406, -0.039271749556064606], [0.05201713368296623, 0.23726943135261536, -0.02771996706724167, -0.3403296172618866], [0.05676252022385597, 0.042552635073661804, -0.034526560455560684, -0.05651526153087616], [0.05761357396841049, 0.23815219104290009, -0.03565686568617821, -0.3598885238170624], [0.06237661838531494, 0.43376240134239197, -0.042854636907577515, -0.6635982394218445], [0.07105186581611633, 0.6294534802436829, -0.05612659826874733, -0.9694607853889465], [0.0836409330368042, 0.4351280927658081, -0.07551581412553787, -0.6949242353439331], [0.09234349429607391, 0.6312117576599121, -0.08941429853439331, -1.0103920698165894], [0.10496773570775986, 0.43738943338394165, -0.10962214320898056, -0.7470727562904358], [0.1137155219912529, 0.2439369261264801, -0.12456359714269638, -0.4908002018928528], [0.11859425902366638, 0.44057556986808777, -0.13437959551811218, -0.8199999332427979], [0.1274057775735855, 0.24752336740493774, -0.1507796049118042, -0.5724210739135742], [0.13235624134540558, 0.4444020390510559, -0.16222801804542542, -0.9085499048233032], [0.14124427735805511, 0.2518036365509033, -0.18039901554584503, -0.6709316372871399], [0.14628034830093384, 0.44891393184661865, -0.1938176453113556, -1.0145491361618042], [-0.006987347267568111, 0.019807280972599983, 0.04687238484621048, -0.03075495921075344], [-0.006591201759874821, 0.21422681212425232, 0.04625728353857994, -0.3082885146141052], [-0.002306665526703, 0.018477320671081543, 0.040091514587402344, -0.0013835744466632605], [-0.0019371192902326584, 0.2130020558834076, 0.04006384313106537, -0.2811524569988251], [0.0023229217622429132, 0.4075303077697754, 0.034440793097019196, -0.5609350800514221], [0.010473527945578098, 0.602152407169342, 0.023222092539072037, -0.842571496963501], [0.02251657471060753, 0.7969498038291931, 0.0063706631772220135, -1.1278622150421143], [0.038455571979284286, 0.6017450094223022, -0.016186580061912537, -0.8331878781318665], [0.050490472465753555, 0.7970843315124512, -0.03285033628344536, -1.1309171915054321], [0.0664321556687355, 0.9926206469535828, -0.05546868219971657, -1.4337196350097656], [0.0862845703959465, 0.7982251048088074, -0.08414307236671448, -1.158874273300171], [0.10224907100200653, 0.9943366646766663, -0.10732056200504303, -1.4767097234725952], [0.12213580310344696, 0.800676703453064, -0.13685475289821625, -1.2193827629089355], [0.13814933598041534, 0.6075581312179565, -0.16124241054058075, -0.9725232720375061], [0.1503005027770996, 0.8044332265853882, -0.1806928813457489, -1.3112053871154785], [0.16638916730880737, 0.6119999885559082, -0.20691698789596558, -1.0800899267196655], [-0.01564539037644863, 0.04950530454516411, -0.019894389435648918, 0.02746976539492607], [-0.014655284583568573, -0.14532577991485596, -0.01934499479830265, 0.31380999088287354], [-0.01756179891526699, 0.050066329538822174, -0.013068795204162598, 0.01508959848433733], [-0.016560472548007965, 0.24537323415279388, -0.012767002917826176, -0.28168785572052], [-0.011653007939457893, 0.44067496061325073, -0.018400760367512703, -0.5783699750900269], [-0.0028395093977451324, 0.24581564962863922, -0.029968159273266792, -0.2915400266647339], [0.002076803706586361, 0.05113353952765465, -0.03579895943403244, -0.008457282558083534], [0.0030994745902717113, 0.2467501312494278, -0.0359681062400341, -0.31221678853034973], [0.0080344770103693, 0.44236552715301514, -0.04221244156360626, -0.6160224676132202], [0.01688178814947605, 0.6380510330200195, -0.054532889276742935, -0.9216960072517395], [0.029642809182405472, 0.833865761756897, -0.0729668140411377, -1.2310062646865845], [0.046320125460624695, 1.029846429824829, -0.09758693724870682, -1.545628309249878], [0.0669170543551445, 1.2259957790374756, -0.12849950790405273, -1.8670973777770996], [0.091436967253685, 1.0324931144714355, -0.16584144532680511, -1.61691153049469], [0.11208683252334595, 1.2291369438171387, -0.1981796771287918, -1.956364393234253], [0.04756912216544151, 0.0037067648954689503, -0.025916757062077522, -0.049291208386421204], [0.047643259167671204, -0.19103416800498962, -0.0269025806337595, 0.23510341346263885], [0.043822575360536575, 0.004461625590920448, -0.022200511768460274, -0.06594256311655045], [0.043911807239055634, 0.1998947262763977, -0.0235193632543087, -0.3655463755130768], [0.047909703105688095, 0.005114762112498283, -0.030830292031168938, -0.08037130534648895], [0.04801199585199356, -0.18955197930335999, -0.03243771567940712, 0.20242737233638763], [0.04422095790505409, -0.38419535756111145, -0.02838917076587677, 0.48470383882522583], [0.0365370512008667, -0.5789054036140442, -0.01869509369134903, 0.7683059573173523], [0.024958942085504532, -0.3835311830043793, -0.003328974125906825, 0.4697997570037842], [0.017288317903876305, -0.18836236000061035, 0.006067021284252405, 0.176069438457489], [0.013521070592105389, -0.3835706114768982, 0.009588410146534443, 0.47066012024879456], [0.005849658045917749, -0.18858540058135986, 0.019001612439751625, 0.18101470172405243], [0.0020779501646757126, 0.006259563844650984, 0.02262190729379654, -0.10561385005712509], [0.002203141339123249, -0.18917915225028992, 0.0205096285790205, 0.19411948323249817], [-0.0015804414870217443, 0.005643508862704039, 0.024392019957304, -0.09202363342046738], [-0.001467571360990405, 0.2004075050354004, 0.02255154587328434, -0.3769121766090393], [0.00254057883284986, 0.39520201086997986, 0.01501330267637968, -0.6624000668525696], [0.010444619692862034, 0.5901119112968445, 0.001765301451086998, -0.9503182172775269], [0.02224685810506344, 0.7852100729942322, -0.017241062596440315, -1.242445945739746], [0.03795105963945389, 0.9805489778518677, -0.042089980095624924, -1.5404794216156006], [0.05756203830242157, 1.176151156425476, -0.07289957255125046, -1.8459935188293457], [0.08108506351709366, 0.9819042086601257, -0.1098194420337677, -1.576810598373413], [0.10072314739227295, 1.1781501770019531, -0.14135564863681793, -1.9016282558441162], [0.12428614497184753, 1.3744902610778809, -0.17938822507858276, -2.234621286392212], [-0.039395298808813095, 0.031996726989746094, -0.0179740060120821, -0.03963232785463333], [-0.03875536471605301, -0.16286292672157288, -0.018766652792692184, 0.2473258674144745], [-0.04201262444257736, -0.35771191120147705, -0.013820135965943336, 0.5340307950973511], [-0.04916686192154884, -0.5526368021965027, -0.003139520063996315, 0.822327196598053], [-0.060219597071409225, -0.7477156519889832, 0.013307024724781513, 1.1140210628509521], [-0.07517390698194504, -0.5527709126472473, 0.03558744490146637, 0.8255420327186584], [-0.08622933179140091, -0.7483610510826111, 0.05209828540682793, 1.129201889038086], [-0.10119654983282089, -0.5539587140083313, 0.0746823251247406, 0.8533040285110474], [-0.11227572709321976, -0.3599298894405365, 0.09174840152263641, 0.5850082635879517], [-0.11947432160377502, -0.16620475053787231, 0.10344856977462769, 0.32257896661758423], [-0.12279842048883438, -0.362635999917984, 0.10990014672279358, 0.6460102796554565], [-0.1300511360168457, -0.5591038465499878, 0.12282035499811172, 0.9711797833442688], [-0.14123322069644928, -0.36582517623901367, 0.14224395155906677, 0.7194641828536987], [-0.14854972064495087, -0.1729278713464737, 0.15663322806358337, 0.4747193455696106], [-0.1520082801580429, -0.36987465620040894, 0.16612762212753296, 0.812385082244873], [-0.15940576791763306, -0.5668349266052246, 0.18237532675266266, 1.1523752212524414], [-0.170742467045784, -0.3744988739490509, 0.20542283356189728, 0.9219774007797241], [0.02307797595858574, -0.024393772706389427, 0.021981889382004738, 0.03712058812379837], [0.02259010076522827, -0.2198239415884018, 0.022724300622940063, 0.33665716648101807], [0.018193623051047325, -0.025032619014382362, 0.029457444325089455, 0.05122600123286247], [0.017692970111966133, -0.22056430578231812, 0.030481964349746704, 0.35305550694465637], [0.013281683437526226, -0.02588876150548458, 0.037543073296546936, 0.07013816386461258], [0.012763909064233303, -0.22152827680110931, 0.03894583880901337, 0.3744257390499115], [0.008333343081176281, -0.41718119382858276, 0.046434350311756134, 0.6791297197341919], [-1.0280592505296227e-05, -0.6129163503646851, 0.060016945004463196, 0.9860628247261047], [-0.012268607504665852, -0.41864731907844543, 0.07973819971084595, 0.7128183245658875], [-0.02064155414700508, -0.22471463680267334, 0.09399456530809402, 0.44626179337501526], [-0.025135846808552742, -0.4210319221019745, 0.102919802069664, 0.7670315504074097], [-0.033556483685970306, -0.6174088716506958, 0.11826043576002121, 1.0902432203292847], [-0.04590466246008873, -0.8138741254806519, 0.1400652974843979, 1.4175703525543213], [-0.062182143330574036, -0.6207364797592163, 0.16841670870780945, 1.171745777130127], [-0.07459687441587448, -0.4281558394432068, 0.1918516308069229, 0.9362426996231079], [-0.004526657052338123, -0.03037251904606819, -0.04130048677325249, -0.012527158483862877], [-0.005134107545018196, 0.1653166562318802, -0.04155103117227554, -0.317949503660202], [-0.0018277744529768825, 0.3610050082206726, -0.047910019755363464, -0.6234411597251892], [0.005392326042056084, 0.5567619800567627, -0.06037884205579758, -0.9308198690414429], [0.016527565196156502, 0.36250463128089905, -0.0789952427148819, -0.6577053666114807], [0.023777658119797707, 0.16856592893600464, -0.09214934706687927, -0.3909049928188324], [0.027148976922035217, 0.3648666441440582, -0.09996744990348816, -0.7111603617668152], [0.03444631025195122, 0.17126068472862244, -0.11419065296649933, -0.45154282450675964], [0.037871524691581726, -0.02207680605351925, -0.1232215091586113, -0.19692444801330566], [0.037429988384246826, -0.21524055302143097, -0.1271599978208542, 0.05448874831199646], [0.03312517702579498, -0.018546363338828087, -0.12607023119926453, -0.2754547595977783], [0.03275424987077713, 0.1781277060508728, -0.13157932460308075, -0.6050910949707031], [0.036316804587841034, -0.014932616613805294, -0.143681138753891, -0.3565766513347626], [0.03601815178990364, -0.20775070786476135, -0.15081267058849335, -0.11242686957120895], [0.03186313807964325, -0.010825635865330696, -0.15306121110916138, -0.4486326575279236], [0.03164662420749664, 0.18609243631362915, -0.16203387081623077, -0.785381019115448], [0.03536847233772278, 0.3830256164073944, -0.17774148285388947, -1.1243412494659424], [0.04302898421883583, 0.19062143564224243, -0.20022831857204437, -0.8922630548477173], [0.014936696738004684, -0.038504235446453094, 0.019000763073563576, 0.04666405916213989], [0.014166612178087234, 0.15634018182754517, 0.019934043288230896, -0.23996391892433167], [0.01729341596364975, 0.3511717617511749, 0.015134764835238457, -0.5262930393218994], [0.024316851049661636, 0.15584015846252441, 0.004608904477208853, -0.22887971997261047], [0.02743365429341793, -0.039347343146800995, 3.1310180929722264e-05, 0.06525345146656036], [0.026646707206964493, 0.15577416121959686, 0.001336379093118012, -0.22741959989070892], [0.029762189835309982, -0.039366867393255234, -0.003212012816220522, 0.06568457186222076], [0.028974853456020355, 0.1558009833097458, -0.001898321439512074, -0.22801002860069275], [0.03209087252616882, -0.03929378092288971, -0.0064585222862660885, 0.06407348811626434], [0.03130499646067619, -0.23432254791259766, -0.005177052225917578, 0.35471174120903015], [0.02661854587495327, -0.03912736475467682, 0.0019171824678778648, 0.06040084734559059], [0.025835998356342316, 0.15596704185009003, 0.0031251993495970964, -0.23167657852172852], [0.02895534038543701, 0.3510442078113556, -0.0015083322068676353, -0.5233720541000366], [0.03597622364759445, 0.5461873412132263, -0.011975773610174656, -0.8165299296379089], [0.04689997062087059, 0.3512313961982727, -0.028306372463703156, -0.5276377201080322], [0.053924597799777985, 0.15651890635490417, -0.03885912522673607, -0.24400697648525238], [0.05705497786402702, 0.35217371582984924, -0.04373926669359207, -0.5486893653869629], [0.06409845501184464, 0.5478819608688354, -0.05471305176615715, -0.8548261523246765], [0.07505609095096588, 0.743705153465271, -0.07180957496166229, -1.1641991138458252], [0.08993019163608551, 0.9396847486495972, -0.09509355574846268, -1.4785046577453613], [0.10872388631105423, 1.1358304023742676, -0.12466365098953247, -1.799309253692627], [0.13144049048423767, 0.9423040151596069, -0.160649836063385, -1.5478287935256958], [0.15028657019138336, 1.1389484405517578, -0.19160641729831696, -1.8860254287719727], [-0.04220907390117645, -0.047612931579351425, -0.0030526963528245687, -0.021378139033913612], [-0.04316133260726929, -0.24269096553325653, -0.003480259096249938, 0.27034005522727966], [-0.04801515117287636, -0.04751953110098839, 0.0019265421433374286, -0.02343851886689663], [-0.04896554350852966, 0.14757473766803741, 0.0014577718684449792, -0.3155129849910736], [-0.04601404815912247, -0.0475679449737072, -0.004852487705647945, -0.022370673716068268], [-0.046965405344963074, -0.24261997640132904, -0.005299901124089956, 0.2687772810459137], [-0.05181780457496643, -0.4376658797264099, 7.564473344245926e-05, 0.5597838759422302], [-0.06057112291455269, -0.2425449937582016, 0.011271323077380657, 0.26712480187416077], [-0.06542202085256577, -0.4378259778022766, 0.01661381870508194, 0.5633413791656494], [-0.074178546667099, -0.24294105172157288, 0.027880646288394928, 0.2759385406970978], [-0.07903736084699631, -0.048227742314338684, 0.033399417996406555, -0.007822053506970406], [-0.08000192046165466, -0.24381236732006073, 0.03324297443032265, 0.2952088713645935], [-0.08487816900014877, -0.43939208984375, 0.03914715349674225, 0.5981879830360413], [-0.09366600960493088, -0.2448391318321228, 0.05111091211438179, 0.31808847188949585], [-0.09856279194355011, -0.4406503736972809, 0.05747268348932266, 0.6264418363571167], [-0.10737580060958862, -0.24637576937675476, 0.070001520216465, 0.35239875316619873], [-0.11230331659317017, -0.05231545493006706, 0.07704949378967285, 0.08258484303951263], [-0.11334962397813797, 0.14162229001522064, 0.0787011906504631, -0.18482856452465057], [-0.11051717400550842, 0.3355351388454437, 0.07500462234020233, -0.4516831934452057], [-0.10380647331476212, 0.1394370198249817, 0.06597095727920532, -0.13633234798908234], [-0.10101773589849472, -0.05656478926539421, 0.06324431300163269, 0.1764122098684311], [-0.10214903205633163, 0.1375977247953415, 0.06677255779504776, -0.09566786140203476], [-0.09939707815647125, -0.05841454491019249, 0.06485919654369354, 0.21731188893318176], [-0.1005653664469719, -0.2544008493423462, 0.06920543313026428, 0.5297284126281738], [-0.10565338283777237, -0.060317203402519226, 0.07980000227689743, 0.259630024433136], [-0.1068597286939621, 0.13358023762702942, 0.08499260246753693, -0.006854258012026548], [-0.10418812185525894, 0.3273869454860687, 0.08485551923513412, -0.27155718207359314], [-0.09764038026332855, 0.521202027797699, 0.07942437380552292, -0.5363161563873291], [-0.0872163400053978, 0.3250584006309509, 0.06869805604219437, -0.21970199048519135], [-0.08071517199277878, 0.519134521484375, 0.06430400907993317, -0.48994818329811096], [-0.07033248245716095, 0.3231671452522278, 0.05450505018234253, -0.1777123063802719], [-0.06386914104223251, 0.5174684524536133, 0.050950802862644196, -0.4527148902416229], [-0.05351977422833443, 0.32166439294815063, 0.041896503418684006, -0.1444169133901596], [-0.04708648473024368, 0.12596827745437622, 0.03900816664099693, 0.1611836701631546], [-0.04456711933016777, -0.0696897804737091, 0.04223183915019035, 0.46591296792030334], [-0.045960914343595505, -0.26538223028182983, 0.05155009776353836, 0.7716023921966553], [-0.0512685589492321, -0.4611741900444031, 0.06698215007781982, 1.0800492763519287], [-0.06049204245209694, -0.26699748635292053, 0.08858313411474228, 0.8091152906417847], [-0.0658319965004921, -0.46321433782577515, 0.10476543754339218, 1.1282960176467896], [-0.07509627938270569, -0.6595408320426941, 0.12733136117458344, 1.4519157409667969], [-0.08828709274530411, -0.8559762835502625, 0.1563696712255478, 1.7815178632736206], [-0.10540661960840225, -1.052473545074463, 0.19200003147125244, 2.118453025817871]], "actions": [0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.0035527111031115055, -0.21618478000164032, -0.022261962294578552, 0.2587074935436249], [-0.00787640642374754, -0.4109819531440735, -0.01708781160414219, 0.5442863702774048], [-0.016096046194434166, -0.605859637260437, -0.006202084012329578, 0.8315367102622986], [-0.02821323834359646, -0.8008962869644165, 0.010428650304675102, 1.1222625970840454], [-0.04423116520047188, -0.6059126257896423, 0.03287390246987343, 0.8328689932823181], [-0.05634941905736923, -0.801468014717102, 0.04953128471970558, 1.1357067823410034], [-0.07237877696752548, -0.9972017407417297, 0.07224541902542114, 1.443503499031067], [-0.09232281148433685, -1.1931347846984863, 0.10111548751592636, 1.7578580379486084], [-0.1161855086684227, -0.999293327331543, 0.13627265393733978, 1.498258352279663], [-0.1361713707447052, -0.806065022945404, 0.16623781621456146, 1.2510433197021484], [-0.1522926688194275, -0.6134167909622192, 0.19125868380069733, 1.0147037506103516], [-0.16456100344657898, -0.421288400888443, 0.21155275404453278, 0.7876540422439575], [0.03736596554517746, 0.20256391167640686, 0.004867196083068848, -0.32690590620040894], [0.04141724482178688, 0.0073730009607970715, -0.0016709218034520745, -0.03269205242395401], [0.0415647067129612, -0.18772494792938232, -0.0023247627541422844, 0.25946322083473206], [0.03781020641326904, 0.007430113386362791, 0.002864501439034939, -0.03395206853747368], [0.03795880824327469, 0.20251086354255676, 0.0021854599472135305, -0.3257298469543457], [0.04200902581214905, 0.3976016342639923, -0.004329136572778225, -0.617722749710083], [0.04996106028556824, 0.20254042744636536, -0.016683591529726982, -0.32640644907951355], [0.05401186645030975, 0.0076599325984716415, -0.02321172133088112, -0.039031144231557846], [0.0541650652885437, -0.18712159991264343, -0.023992344737052917, 0.2462388277053833], [0.050422634929418564, 0.008334648795425892, -0.019067566841840744, -0.053914252668619156], [0.05058932676911354, 0.20372474193572998, -0.020145852118730545, -0.3525516390800476], [0.054663822054862976, 0.3991272747516632, -0.027196886017918587, -0.6515184640884399], [0.06264636665582657, 0.5946172475814819, -0.0402272529900074, -0.9526398777961731], [0.0745387151837349, 0.7902567386627197, -0.05928005278110504, -1.2576853036880493], [0.09034384787082672, 0.9860851168632507, -0.08443375676870346, -1.5683300495147705], [0.11006554961204529, 1.182107925415039, -0.11580035835504532, -1.886110782623291], [0.1337077021598816, 0.9884200692176819, -0.1535225808620453, -1.6314940452575684], [0.15347610414028168, 1.1849758625030518, -0.18615245819091797, -1.9678186178207397], [0.1771756261587143, 0.9922462105751038, -0.22550882399082184, -1.7381319999694824], [-0.01110253669321537, 0.17545652389526367, 0.02077489160001278, -0.28334856033325195], [-0.007593405898660421, -0.019955486059188843, 0.01510792039334774, 0.015813587233424187], [-0.00799251627177, 0.17494657635688782, 0.015424191951751709, -0.27206459641456604], [-0.004493584390729666, 0.36984509229660034, 0.009982900694012642, -0.5598430037498474], [0.0029033173341304064, 0.5648254752159119, -0.001213960349559784, -0.849364161491394], [0.014199827797710896, 0.7599639892578125, -0.01820124313235283, -1.1424286365509033], [0.02939910627901554, 0.9553189873695374, -0.04104981571435928, -1.4407634735107422], [0.04850548878312111, 1.1509218215942383, -0.06986508518457413, -1.745985746383667], [0.07152391970157623, 0.9566602110862732, -0.10478480160236359, -1.4758278131484985], [0.09065712988376617, 1.1528946161270142, -0.1343013495206833, -1.799315333366394], [0.1137150228023529, 0.9595064520835876, -0.17028766870498657, -1.5512112379074097], [0.13290515542030334, 1.1562124490737915, -0.2013118863105774, -1.8918254375457764], [0.15602940320968628, 1.3528705835342407, -0.23914839327335358, -2.2396421432495117], [0.04872840270400047, 0.23560254275798798, -0.025749962776899338, -0.3035360872745514], [0.05344045162200928, 0.04085685312747955, -0.03182068467140198, -0.019084040075540543], [0.0542575903236866, -0.15379464626312256, -0.03220236673951149, 0.2633917033672333], [0.051181696355342865, 0.04177180305123329, -0.026934532448649406, -0.039271749556064606], [0.05201713368296623, 0.23726943135261536, -0.02771996706724167, -0.3403296172618866], [0.05676252022385597, 0.042552635073661804, -0.034526560455560684, -0.05651526153087616], [0.05761357396841049, 0.23815219104290009, -0.03565686568617821, -0.3598885238170624], [0.06237661838531494, 0.43376240134239197, -0.042854636907577515, -0.6635982394218445], [0.07105186581611633, 0.6294534802436829, -0.05612659826874733, -0.9694607853889465], [0.0836409330368042, 0.4351280927658081, -0.07551581412553787, -0.6949242353439331], [0.09234349429607391, 0.6312117576599121, -0.08941429853439331, -1.0103920698165894], [0.10496773570775986, 0.43738943338394165, -0.10962214320898056, -0.7470727562904358], [0.1137155219912529, 0.2439369261264801, -0.12456359714269638, -0.4908002018928528], [0.11859425902366638, 0.44057556986808777, -0.13437959551811218, -0.8199999332427979], [0.1274057775735855, 0.24752336740493774, -0.1507796049118042, -0.5724210739135742], [0.13235624134540558, 0.4444020390510559, -0.16222801804542542, -0.9085499048233032], [0.14124427735805511, 0.2518036365509033, -0.18039901554584503, -0.6709316372871399], [0.14628034830093384, 0.44891393184661865, -0.1938176453113556, -1.0145491361618042], [0.15525862574577332, 0.6460179686546326, -0.2141086310148239, -1.3612957000732422], [-0.006591201759874821, 0.21422681212425232, 0.04625728353857994, -0.3082885146141052], [-0.002306665526703, 0.018477320671081543, 0.040091514587402344, -0.0013835744466632605], [-0.0019371192902326584, 0.2130020558834076, 0.04006384313106537, -0.2811524569988251], [0.0023229217622429132, 0.4075303077697754, 0.034440793097019196, -0.5609350800514221], [0.010473527945578098, 0.602152407169342, 0.023222092539072037, -0.842571496963501], [0.02251657471060753, 0.7969498038291931, 0.0063706631772220135, -1.1278622150421143], [0.038455571979284286, 0.6017450094223022, -0.016186580061912537, -0.8331878781318665], [0.050490472465753555, 0.7970843315124512, -0.03285033628344536, -1.1309171915054321], [0.0664321556687355, 0.9926206469535828, -0.05546868219971657, -1.4337196350097656], [0.0862845703959465, 0.7982251048088074, -0.08414307236671448, -1.158874273300171], [0.10224907100200653, 0.9943366646766663, -0.10732056200504303, -1.4767097234725952], [0.12213580310344696, 0.800676703453064, -0.13685475289821625, -1.2193827629089355], [0.13814933598041534, 0.6075581312179565, -0.16124241054058075, -0.9725232720375061], [0.1503005027770996, 0.8044332265853882, -0.1806928813457489, -1.3112053871154785], [0.16638916730880737, 0.6119999885559082, -0.20691698789596558, -1.0800899267196655], [0.17862917482852936, 0.8091627359390259, -0.2285187840461731, -1.4299260377883911], [-0.014655284583568573, -0.14532577991485596, -0.01934499479830265, 0.31380999088287354], [-0.01756179891526699, 0.050066329538822174, -0.013068795204162598, 0.01508959848433733], [-0.016560472548007965, 0.24537323415279388, -0.012767002917826176, -0.28168785572052], [-0.011653007939457893, 0.44067496061325073, -0.018400760367512703, -0.5783699750900269], [-0.0028395093977451324, 0.24581564962863922, -0.029968159273266792, -0.2915400266647339], [0.002076803706586361, 0.05113353952765465, -0.03579895943403244, -0.008457282558083534], [0.0030994745902717113, 0.2467501312494278, -0.0359681062400341, -0.31221678853034973], [0.0080344770103693, 0.44236552715301514, -0.04221244156360626, -0.6160224676132202], [0.01688178814947605, 0.6380510330200195, -0.054532889276742935, -0.9216960072517395], [0.029642809182405472, 0.833865761756897, -0.0729668140411377, -1.2310062646865845], [0.046320125460624695, 1.029846429824829, -0.09758693724870682, -1.545628309249878], [0.0669170543551445, 1.2259957790374756, -0.12849950790405273, -1.8670973777770996], [0.091436967253685, 1.0324931144714355, -0.16584144532680511, -1.61691153049469], [0.11208683252334595, 1.2291369438171387, -0.1981796771287918, -1.956364393234253], [0.1366695761680603, 1.036594271659851, -0.23730696737766266, -1.7310876846313477], [0.047643259167671204, -0.19103416800498962, -0.0269025806337595, 0.23510341346263885], [0.043822575360536575, 0.004461625590920448, -0.022200511768460274, -0.06594256311655045], [0.043911807239055634, 0.1998947262763977, -0.0235193632543087, -0.3655463755130768], [0.047909703105688095, 0.005114762112498283, -0.030830292031168938, -0.08037130534648895], [0.04801199585199356, -0.18955197930335999, -0.03243771567940712, 0.20242737233638763], [0.04422095790505409, -0.38419535756111145, -0.02838917076587677, 0.48470383882522583], [0.0365370512008667, -0.5789054036140442, -0.01869509369134903, 0.7683059573173523], [0.024958942085504532, -0.3835311830043793, -0.003328974125906825, 0.4697997570037842], [0.017288317903876305, -0.18836236000061035, 0.006067021284252405, 0.176069438457489], [0.013521070592105389, -0.3835706114768982, 0.009588410146534443, 0.47066012024879456], [0.005849658045917749, -0.18858540058135986, 0.019001612439751625, 0.18101470172405243], [0.0020779501646757126, 0.006259563844650984, 0.02262190729379654, -0.10561385005712509], [0.002203141339123249, -0.18917915225028992, 0.0205096285790205, 0.19411948323249817], [-0.0015804414870217443, 0.005643508862704039, 0.024392019957304, -0.09202363342046738], [-0.001467571360990405, 0.2004075050354004, 0.02255154587328434, -0.3769121766090393], [0.00254057883284986, 0.39520201086997986, 0.01501330267637968, -0.6624000668525696], [0.010444619692862034, 0.5901119112968445, 0.001765301451086998, -0.9503182172775269], [0.02224685810506344, 0.7852100729942322, -0.017241062596440315, -1.242445945739746], [0.03795105963945389, 0.9805489778518677, -0.042089980095624924, -1.5404794216156006], [0.05756203830242157, 1.176151156425476, -0.07289957255125046, -1.8459935188293457], [0.08108506351709366, 0.9819042086601257, -0.1098194420337677, -1.576810598373413], [0.10072314739227295, 1.1781501770019531, -0.14135564863681793, -1.9016282558441162], [0.12428614497184753, 1.3744902610778809, -0.17938822507858276, -2.234621286392212], [0.15177595615386963, 1.5708035230636597, -0.2240806370973587, -2.5768234729766846], [-0.03875536471605301, -0.16286292672157288, -0.018766652792692184, 0.2473258674144745], [-0.04201262444257736, -0.35771191120147705, -0.013820135965943336, 0.5340307950973511], [-0.04916686192154884, -0.5526368021965027, -0.003139520063996315, 0.822327196598053], [-0.060219597071409225, -0.7477156519889832, 0.013307024724781513, 1.1140210628509521], [-0.07517390698194504, -0.5527709126472473, 0.03558744490146637, 0.8255420327186584], [-0.08622933179140091, -0.7483610510826111, 0.05209828540682793, 1.129201889038086], [-0.10119654983282089, -0.5539587140083313, 0.0746823251247406, 0.8533040285110474], [-0.11227572709321976, -0.3599298894405365, 0.09174840152263641, 0.5850082635879517], [-0.11947432160377502, -0.16620475053787231, 0.10344856977462769, 0.32257896661758423], [-0.12279842048883438, -0.362635999917984, 0.10990014672279358, 0.6460102796554565], [-0.1300511360168457, -0.5591038465499878, 0.12282035499811172, 0.9711797833442688], [-0.14123322069644928, -0.36582517623901367, 0.14224395155906677, 0.7194641828536987], [-0.14854972064495087, -0.1729278713464737, 0.15663322806358337, 0.4747193455696106], [-0.1520082801580429, -0.36987465620040894, 0.16612762212753296, 0.812385082244873], [-0.15940576791763306, -0.5668349266052246, 0.18237532675266266, 1.1523752212524414], [-0.170742467045784, -0.3744988739490509, 0.20542283356189728, 0.9219774007797241], [-0.17823244631290436, -0.5717151165008545, 0.22386237978935242, 1.2715524435043335], [0.02259010076522827, -0.2198239415884018, 0.022724300622940063, 0.33665716648101807], [0.018193623051047325, -0.025032619014382362, 0.029457444325089455, 0.05122600123286247], [0.017692970111966133, -0.22056430578231812, 0.030481964349746704, 0.35305550694465637], [0.013281683437526226, -0.02588876150548458, 0.037543073296546936, 0.07013816386461258], [0.012763909064233303, -0.22152827680110931, 0.03894583880901337, 0.3744257390499115], [0.008333343081176281, -0.41718119382858276, 0.046434350311756134, 0.6791297197341919], [-1.0280592505296227e-05, -0.6129163503646851, 0.060016945004463196, 0.9860628247261047], [-0.012268607504665852, -0.41864731907844543, 0.07973819971084595, 0.7128183245658875], [-0.02064155414700508, -0.22471463680267334, 0.09399456530809402, 0.44626179337501526], [-0.025135846808552742, -0.4210319221019745, 0.102919802069664, 0.7670315504074097], [-0.033556483685970306, -0.6174088716506958, 0.11826043576002121, 1.0902432203292847], [-0.04590466246008873, -0.8138741254806519, 0.1400652974843979, 1.4175703525543213], [-0.062182143330574036, -0.6207364797592163, 0.16841670870780945, 1.171745777130127], [-0.07459687441587448, -0.4281558394432068, 0.1918516308069229, 0.9362426996231079], [-0.08315999060869217, -0.6252747774124146, 0.21057647466659546, 1.2825552225112915], [-0.005134107545018196, 0.1653166562318802, -0.04155103117227554, -0.317949503660202], [-0.0018277744529768825, 0.3610050082206726, -0.047910019755363464, -0.6234411597251892], [0.005392326042056084, 0.5567619800567627, -0.06037884205579758, -0.9308198690414429], [0.016527565196156502, 0.36250463128089905, -0.0789952427148819, -0.6577053666114807], [0.023777658119797707, 0.16856592893600464, -0.09214934706687927, -0.3909049928188324], [0.027148976922035217, 0.3648666441440582, -0.09996744990348816, -0.7111603617668152], [0.03444631025195122, 0.17126068472862244, -0.11419065296649933, -0.45154282450675964], [0.037871524691581726, -0.02207680605351925, -0.1232215091586113, -0.19692444801330566], [0.037429988384246826, -0.21524055302143097, -0.1271599978208542, 0.05448874831199646], [0.03312517702579498, -0.018546363338828087, -0.12607023119926453, -0.2754547595977783], [0.03275424987077713, 0.1781277060508728, -0.13157932460308075, -0.6050910949707031], [0.036316804587841034, -0.014932616613805294, -0.143681138753891, -0.3565766513347626], [0.03601815178990364, -0.20775070786476135, -0.15081267058849335, -0.11242686957120895], [0.03186313807964325, -0.010825635865330696, -0.15306121110916138, -0.4486326575279236], [0.03164662420749664, 0.18609243631362915, -0.16203387081623077, -0.785381019115448], [0.03536847233772278, 0.3830256164073944, -0.17774148285388947, -1.1243412494659424], [0.04302898421883583, 0.19062143564224243, -0.20022831857204437, -0.8922630548477173], [0.04684141278266907, -0.001304033794440329, -0.21807357668876648, -0.6686010360717773], [0.014166612178087234, 0.15634018182754517, 0.019934043288230896, -0.23996391892433167], [0.01729341596364975, 0.3511717617511749, 0.015134764835238457, -0.5262930393218994], [0.024316851049661636, 0.15584015846252441, 0.004608904477208853, -0.22887971997261047], [0.02743365429341793, -0.039347343146800995, 3.1310180929722264e-05, 0.06525345146656036], [0.026646707206964493, 0.15577416121959686, 0.001336379093118012, -0.22741959989070892], [0.029762189835309982, -0.039366867393255234, -0.003212012816220522, 0.06568457186222076], [0.028974853456020355, 0.1558009833097458, -0.001898321439512074, -0.22801002860069275], [0.03209087252616882, -0.03929378092288971, -0.0064585222862660885, 0.06407348811626434], [0.03130499646067619, -0.23432254791259766, -0.005177052225917578, 0.35471174120903015], [0.02661854587495327, -0.03912736475467682, 0.0019171824678778648, 0.06040084734559059], [0.025835998356342316, 0.15596704185009003, 0.0031251993495970964, -0.23167657852172852], [0.02895534038543701, 0.3510442078113556, -0.0015083322068676353, -0.5233720541000366], [0.03597622364759445, 0.5461873412132263, -0.011975773610174656, -0.8165299296379089], [0.04689997062087059, 0.3512313961982727, -0.028306372463703156, -0.5276377201080322], [0.053924597799777985, 0.15651890635490417, -0.03885912522673607, -0.24400697648525238], [0.05705497786402702, 0.35217371582984924, -0.04373926669359207, -0.5486893653869629], [0.06409845501184464, 0.5478819608688354, -0.05471305176615715, -0.8548261523246765], [0.07505609095096588, 0.743705153465271, -0.07180957496166229, -1.1641991138458252], [0.08993019163608551, 0.9396847486495972, -0.09509355574846268, -1.4785046577453613], [0.10872388631105423, 1.1358304023742676, -0.12466365098953247, -1.799309253692627], [0.13144049048423767, 0.9423040151596069, -0.160649836063385, -1.5478287935256958], [0.15028657019138336, 1.1389484405517578, -0.19160641729831696, -1.8860254287719727], [0.17306554317474365, 1.335568904876709, -0.22932691872119904, -2.2315468788146973], [-0.04316133260726929, -0.24269096553325653, -0.003480259096249938, 0.27034005522727966], [-0.04801515117287636, -0.04751953110098839, 0.0019265421433374286, -0.02343851886689663], [-0.04896554350852966, 0.14757473766803741, 0.0014577718684449792, -0.3155129849910736], [-0.04601404815912247, -0.0475679449737072, -0.004852487705647945, -0.022370673716068268], [-0.046965405344963074, -0.24261997640132904, -0.005299901124089956, 0.2687772810459137], [-0.05181780457496643, -0.4376658797264099, 7.564473344245926e-05, 0.5597838759422302], [-0.06057112291455269, -0.2425449937582016, 0.011271323077380657, 0.26712480187416077], [-0.06542202085256577, -0.4378259778022766, 0.01661381870508194, 0.5633413791656494], [-0.074178546667099, -0.24294105172157288, 0.027880646288394928, 0.2759385406970978], [-0.07903736084699631, -0.048227742314338684, 0.033399417996406555, -0.007822053506970406], [-0.08000192046165466, -0.24381236732006073, 0.03324297443032265, 0.2952088713645935], [-0.08487816900014877, -0.43939208984375, 0.03914715349674225, 0.5981879830360413], [-0.09366600960493088, -0.2448391318321228, 0.05111091211438179, 0.31808847188949585], [-0.09856279194355011, -0.4406503736972809, 0.05747268348932266, 0.6264418363571167], [-0.10737580060958862, -0.24637576937675476, 0.070001520216465, 0.35239875316619873], [-0.11230331659317017, -0.05231545493006706, 0.07704949378967285, 0.08258484303951263], [-0.11334962397813797, 0.14162229001522064, 0.0787011906504631, -0.18482856452465057], [-0.11051717400550842, 0.3355351388454437, 0.07500462234020233, -0.4516831934452057], [-0.10380647331476212, 0.1394370198249817, 0.06597095727920532, -0.13633234798908234], [-0.10101773589849472, -0.05656478926539421, 0.06324431300163269, 0.1764122098684311], [-0.10214903205633163, 0.1375977247953415, 0.06677255779504776, -0.09566786140203476], [-0.09939707815647125, -0.05841454491019249, 0.06485919654369354, 0.21731188893318176], [-0.1005653664469719, -0.2544008493423462, 0.06920543313026428, 0.5297284126281738], [-0.10565338283777237, -0.060317203402519226, 0.07980000227689743, 0.259630024433136], [-0.1068597286939621, 0.13358023762702942, 0.08499260246753693, -0.006854258012026548], [-0.10418812185525894, 0.3273869454860687, 0.08485551923513412, -0.27155718207359314], [-0.09764038026332855, 0.521202027797699, 0.07942437380552292, -0.5363161563873291], [-0.0872163400053978, 0.3250584006309509, 0.06869805604219437, -0.21970199048519135], [-0.08071517199277878, 0.519134521484375, 0.06430400907993317, -0.48994818329811096], [-0.07033248245716095, 0.3231671452522278, 0.05450505018234253, -0.1777123063802719], [-0.06386914104223251, 0.5174684524536133, 0.050950802862644196, -0.4527148902416229], [-0.05351977422833443, 0.32166439294815063, 0.041896503418684006, -0.1444169133901596], [-0.04708648473024368, 0.12596827745437622, 0.03900816664099693, 0.1611836701631546], [-0.04456711933016777, -0.0696897804737091, 0.04223183915019035, 0.46591296792030334], [-0.045960914343595505, -0.26538223028182983, 0.05155009776353836, 0.7716023921966553], [-0.0512685589492321, -0.4611741900444031, 0.06698215007781982, 1.0800492763519287], [-0.06049204245209694, -0.26699748635292053, 0.08858313411474228, 0.8091152906417847], [-0.0658319965004921, -0.46321433782577515, 0.10476543754339218, 1.1282960176467896], [-0.07509627938270569, -0.6595408320426941, 0.12733136117458344, 1.4519157409667969], [-0.08828709274530411, -0.8559762835502625, 0.1563696712255478, 1.7815178632736206], [-0.10540661960840225, -1.052473545074463, 0.19200003147125244, 2.118453025817871], [-0.1264560967683792, -0.85971599817276, 0.23436909914016724, 1.8907318115234375]], "action_prob": [0.5000396966934204, 0.4993916451931, 0.4989362955093384, 0.4986914396286011, 0.5014268159866333, 0.49861031770706177, 0.4985005557537079, 0.4984441101551056, 0.5015977621078491, 0.5016566514968872, 0.5017049908638, 0.5017200112342834, 0.4999227225780487, 0.5007179379463196, 0.5000907182693481, 0.5005698204040527, 0.4999195337295532, 0.4992777109146118, 0.5011541843414307, 0.5007684230804443, 0.5001524090766907, 0.5005026459693909, 0.4998387098312378, 0.4991983473300934, 0.49878033995628357, 0.49857014417648315, 0.4984724819660187, 0.4984182119369507, 0.5016247630119324, 0.4983113408088684, 0.5017238259315491, 0.5000860691070557, 0.5005670189857483, 0.5000900030136108, 0.49943262338638306, 0.49896135926246643, 0.4987039864063263, 0.49857810139656067, 0.49850937724113464, 0.5015413165092468, 0.4984051585197449, 0.5016361474990845, 0.4983026385307312, 0.4982692301273346, 0.49983927607536316, 0.5008067488670349, 0.5001992583274841, 0.500456690788269, 0.4997851848602295, 0.5008493065834045, 0.49974244832992554, 0.4991128146648407, 0.49871864914894104, 0.5014716982841492, 0.4986359477043152, 0.501539945602417, 0.5014538168907166, 0.4987978935241699, 0.5015250444412231, 0.4986862540245056, 0.5015994906425476, 0.4985705018043518, 0.4983237385749817, 0.5000268816947937, 0.5006012320518494, 0.500049352645874, 0.4994119107723236, 0.4989648163318634, 0.49872130155563354, 0.5013990998268127, 0.4986417591571808, 0.49852800369262695, 0.5015315413475037, 0.49843448400497437, 0.5016146898269653, 0.5016583800315857, 0.49833598732948303, 0.5017321705818176, 0.4982452094554901, 0.5000752210617065, 0.5005792379379272, 0.4999232292175293, 0.4992787837982178, 0.501149594783783, 0.5007750391960144, 0.49983030557632446, 0.49918821454048157, 0.49877622723579407, 0.4985732436180115, 0.4984799921512604, 0.49842724204063416, 0.5016157031059265, 0.49832308292388916, 0.5017113089561462, 0.5001590847969055, 0.5004963874816895, 0.49982893466949463, 0.5008097290992737, 0.5002108812332153, 0.4995521306991577, 0.49905824661254883, 0.5012219548225403, 0.5009923577308655, 0.4994826912879944, 0.5010253190994263, 0.5005576014518738, 0.5001012682914734, 0.5005788207054138, 0.49992337822914124, 0.49930259585380554, 0.4988909065723419, 0.49867305159568787, 0.49856409430503845, 0.49850010871887207, 0.5015506148338318, 0.4983920753002167, 0.49835023283958435, 0.4983091950416565, 0.5001083612442017, 0.49944519996643066, 0.49895644187927246, 0.49868708848953247, 0.5014421939849854, 0.4986068308353424, 0.5015142560005188, 0.5014781951904297, 0.5013108849525452, 0.49906694889068604, 0.4986197352409363, 0.5015910863876343, 0.5014786124229431, 0.4988095462322235, 0.49844279885292053, 0.5017172694206238, 0.49834027886390686, 0.49988627433776855, 0.5007532835006714, 0.4998484253883362, 0.5007880330085754, 0.49980291724205017, 0.4991716742515564, 0.4987739026546478, 0.5014235377311707, 0.5013114809989929, 0.4989793598651886, 0.49862080812454224, 0.4984545111656189, 0.5016233325004578, 0.5016427040100098, 0.4984004497528076, 0.4999559223651886, 0.49928757548332214, 0.4988330602645874, 0.5014013648033142, 0.5012518763542175, 0.4990956783294678, 0.5013197660446167, 0.5010082125663757, 0.5004822611808777, 0.5001457333564758, 0.4994201958179474, 0.5011554956436157, 0.5007075071334839, 0.4998927414417267, 0.4991838335990906, 0.4986911118030548, 0.5015702247619629, 0.5014224052429199, 0.5001499652862549, 0.4994848370552063, 0.5010105967521667, 0.5005402565002441, 0.5001268982887268, 0.5005467534065247, 0.5001190900802612, 0.5005556344985962, 0.49989140033721924, 0.5007287263870239, 0.5001248121261597, 0.4994523823261261, 0.49895256757736206, 0.5013222098350525, 0.501111626625061, 0.49933430552482605, 0.49884024262428284, 0.4985814094543457, 0.49846476316452026, 0.4984064996242523, 0.5016352534294128, 0.4983031451702118, 0.4982691705226898, 0.49991971254348755, 0.5007243752479553, 0.500092089176178, 0.500566303730011, 0.49992161989212036, 0.4992777109146118, 0.5011584162712097, 0.49923714995384216, 0.5011990070343018, 0.5008141398429871, 0.4997991621494293, 0.49915164709091187, 0.5012691617012024, 0.4990849196910858, 0.5013229846954346, 0.5009932518005371, 0.500434398651123, 0.4997897446155548, 0.5007290840148926, 0.5001832246780396, 0.5005191564559937, 0.5001317858695984, 0.49942830204963684, 0.5011317133903503, 0.5006560683250427, 0.5000220537185669, 0.4994378089904785, 0.5009573698043823, 0.4994432330131531, 0.5009747743606567, 0.4994446635246277, 0.5009925365447998, 0.5005584955215454, 0.4998975396156311, 0.499240905046463, 0.49879443645477295, 0.5014453530311584, 0.49870479106903076, 0.4984791874885559, 0.4983651041984558, 0.4982963800430298, 0.5017574429512024], "advantages": [11.361226081848145, 10.468610763549805, 9.56643295288086, 8.65444278717041, 7.732664108276367, 6.799712657928467, 5.8592352867126465, 4.908825874328613, 3.948538303375244, 2.9781546592712402, 1.9977998733520508, 1.0073068141937256, 17.382863998413086, 16.54562759399414, 15.705423355102539, 14.856743812561035, 13.993903160095215, 13.12242603302002, 12.242766380310059, 11.358478546142578, 10.465818405151367, 9.564162254333496, 8.647789001464844, 7.722278118133545, 6.788087844848633, 5.845207214355469, 4.893375396728516, 3.932313919067383, 2.9617855548858643, 1.9816913604736328, 0.9914916753768921, 12.2479829788208, 11.358880043029785, 10.46636962890625, 9.559244155883789, 8.643515586853027, 7.719254970550537, 6.786245346069336, 5.844217777252197, 4.8929362297058105, 3.9324493408203125, 2.961867570877075, 1.9818034172058105, 0.9915605187416077, 17.383066177368164, 16.545732498168945, 15.705450057983398, 14.856690406799316, 13.993758201599121, 13.122227668762207, 12.247320175170898, 11.35815143585205, 10.460701942443848, 9.554941177368164, 8.642561912536621, 7.718461990356445, 6.7874016761779785, 5.847463607788086, 4.89451789855957, 3.935262680053711, 2.9631705284118652, 1.9841879606246948, 0.9925976395606995, 14.854034423828125, 13.991369247436523, 13.125489234924316, 12.245315551757812, 11.35680103302002, 10.459986686706543, 9.554665565490723, 8.642053604125977, 7.71831750869751, 6.785671710968018, 5.844588279724121, 4.893021106719971, 3.9327287673950195, 2.9630045890808105, 1.9820164442062378, 0.9924274682998657, 13.994292259216309, 13.128256797790527, 12.247926712036133, 11.358760833740234, 10.461241722106934, 9.55893325805664, 8.648054122924805, 7.722494602203369, 6.788265705108643, 5.845364570617676, 4.893526077270508, 3.932462453842163, 2.96193265914917, 1.981833815574646, 0.99163419008255, 21.431724548339844, 20.640836715698242, 19.836332321166992, 19.023845672607422, 18.208547592163086, 17.38511085510254, 16.552873611450195, 15.71153736114502, 14.858412742614746, 13.99596881866455, 13.129634857177734, 12.249763488769531, 11.360603332519531, 10.468153953552246, 9.561007499694824, 8.644890785217285, 7.720168113708496, 6.786792755126953, 5.844515323638916, 4.8930745124816895, 3.932248592376709, 2.961998224258423, 1.9816784858703613, 0.9915996789932251, 15.70518684387207, 14.85649299621582, 13.998723983764648, 13.131585121154785, 12.255085945129395, 11.36777114868164, 10.47348690032959, 9.568258285522461, 8.653375625610352, 7.728664875030518, 6.798981189727783, 5.859041213989258, 4.907001972198486, 3.944838523864746, 2.9766383171081543, 1.9977821111679077, 1.0071159601211548, 13.994617462158203, 13.128626823425293, 12.248493194580078, 11.364863395690918, 10.466958045959473, 9.565323829650879, 8.653846740722656, 7.7324018478393555, 6.7992777824401855, 5.856154918670654, 4.907124996185303, 3.947714328765869, 2.9780611991882324, 1.997639775276184, 1.007041573524475, 16.548425674438477, 15.70262622833252, 14.848958015441895, 13.987458229064941, 13.119897842407227, 12.244172096252441, 11.355659484863281, 10.461952209472656, 9.559764862060547, 8.648710250854492, 7.722814559936523, 6.788177013397217, 5.848565101623535, 4.899868488311768, 3.936253309249878, 2.9637725353240967, 1.9823906421661377, 0.9931284785270691, 20.63910675048828, 19.834712982177734, 19.022695541381836, 18.2071475982666, 17.38381004333496, 16.546470642089844, 15.706352233886719, 14.852060317993164, 13.994815826416016, 13.128718376159668, 12.248530387878418, 11.35932731628418, 10.461645126342773, 9.55562686920166, 8.643667221069336, 7.723163604736328, 6.788688659667969, 5.84556245803833, 4.893565654754639, 3.932403087615967, 2.9618167877197266, 1.9817627668380737, 0.9915125966072083, 34.433868408203125, 33.774349212646484, 33.10260009765625, 32.42413330078125, 31.744312286376953, 31.05762481689453, 30.363433837890625, 29.65777587890625, 28.949485778808594, 28.22959327697754, 27.501930236816406, 26.772478103637695, 26.035032272338867, 25.285823822021484, 24.533349990844727, 23.769075393676758, 22.99655532836914, 22.216127395629883, 21.42823028564453, 20.637239456176758, 19.838640213012695, 19.026247024536133, 18.211374282836914, 17.38780975341797, 16.55109405517578, 15.70556354522705, 14.851648330688477, 13.989655494689941, 13.123246192932129, 12.243660926818848, 11.3596773147583, 10.462167739868164, 9.56023120880127, 8.649641036987305, 7.729616165161133, 6.79954195022583, 5.859302997589111, 4.90733003616333, 3.9479310512542725, 2.978276491165161, 1.9984782934188843, 1.0085840225219727], "value_targets": [11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [844192110, 844192110, 844192110, 844192110, 844192110, 844192110, 844192110, 844192110, 844192110, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1461604849, 1180112290, 1180112290, 1180112290, 1180112290, 1180112290, 1180112290, 1180112290, 1180112290, 1180112290, 1180112290, 1180112290, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1785535566, 1762956862, 1762956862, 1762956862, 1762956862, 1762956862, 1762956862, 1762956862, 1762956862, 1762956862, 1762956862, 1762956862, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 160206712, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 1019827568, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 543086147, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1355069864, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 1140140742, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908, 443992908], "obs": [[-0.0170515775680542, 0.0380326546728611, -0.013067979365587234, -0.0007819504826329648], [-0.016290925443172455, 0.2333395630121231, -0.013083619065582752, -0.2975591719150543], [-0.011624133214354515, 0.4286455512046814, -0.01903480291366577, -0.5943395495414734], [-0.0030512227676808834, 0.6240286827087402, -0.03092159330844879, -0.8929570317268372], [0.009429351426661015, 0.8195561170578003, -0.048780735582113266, -1.1951974630355835], [0.025820473209023476, 1.0152745246887207, -0.07268468290567398, -1.502761721611023], [0.04612596333026886, 1.2111996412277222, -0.10273991525173187, -1.8172239065170288], [0.07034995406866074, 1.4073033332824707, -0.13908439874649048, -2.1399807929992676], [0.09849601984024048, 1.603498935699463, -0.1818840056657791, -2.472191333770752], [0.03944617882370949, 0.04734145477414131, -0.00785142369568348, 0.042204808443784714], [0.04039300978183746, 0.24257510900497437, -0.007007327396422625, -0.2529449462890625], [0.04524451121687889, 0.437796413898468, -0.012066226452589035, -0.5478298664093018], [0.05400043725967407, 0.6330857872962952, -0.02302282303571701, -0.8442899584770203], [0.06666215509176254, 0.4382854402065277, -0.039908621460199356, -0.5589349865913391], [0.07542786002159119, 0.24374572932720184, -0.05108732357621193, -0.27908778190612793], [0.08030277490615845, 0.04938837140798569, -0.05666907876729965, -0.002945263171568513], [0.08129054307937622, 0.2452753186225891, -0.05672798305749893, -0.3129557967185974], [0.08619605004787445, 0.051005467772483826, -0.06298709660768509, -0.03868886083364487], [0.08721616119146347, 0.24697145819664001, -0.06376087665557861, -0.35056090354919434], [0.0921555906534195, 0.44293949007987976, -0.07077209651470184, -0.662648618221283], [0.1010143831372261, 0.6389710307121277, -0.0840250700712204, -0.9767494797706604], [0.11379379779100418, 0.8351131677627563, -0.10356005281209946, -1.294598937034607], [0.1304960697889328, 0.6414481997489929, -0.12945203483104706, -1.0360502004623413], [0.14332503080368042, 0.448262482881546, -0.15017303824424744, -0.7866489291191101], [0.15229026973247528, 0.2554874122142792, -0.16590601205825806, -0.5447258949279785], [0.15740002691745758, 0.06303761154413223, -0.17680053412914276, -0.3085678815841675], [0.15866078436374664, 0.2601800560951233, -0.18297189474105835, -0.6513807773590088], [0.1638643741607666, 0.0680142194032669, -0.19599950313568115, -0.42143774032592773], [0.16522465646266937, 0.2652944326400757, -0.2044282704591751, -0.7689478397369385], [-0.020616576075553894, -0.01619887910783291, 0.0003790059417951852, -0.03443345054984093], [-0.02094055339694023, -0.2113262563943863, -0.00030966303893364966, 0.2583690285682678], [-0.025167079642415047, -0.4064438045024872, 0.004857717547565699, 0.550954282283783], [-0.03329595550894737, -0.601633608341217, 0.015876803547143936, 0.8451637625694275], [-0.04532862827181816, -0.7969685792922974, 0.03278007730841637, 1.1427967548370361], [-0.061267998069524765, -0.9925031661987305, 0.05563601478934288, 1.445576786994934], [-0.08111806213855743, -0.7981081008911133, 0.08454754948616028, 1.1707838773727417], [-0.09708022326231003, -0.994221568107605, 0.10796322673559189, 1.4887306690216064], [-0.11696465313434601, -0.8005675077438354, 0.13773784041404724, 1.23162043094635], [-0.1329760104417801, -0.9971655011177063, 0.1623702496290207, 1.5640915632247925], [-0.15291932225227356, -0.8043144345283508, 0.19365207850933075, 1.3261470794677734], [-0.03104867786169052, 0.010100197046995163, -0.013139110989868641, -0.00025123709929175675], [-0.030846673995256424, -0.18483087420463562, -0.013144136406481266, 0.288257360458374], [-0.03454329073429108, 0.010476022027432919, -0.007378988899290562, -0.008541958406567574], [-0.03433376923203468, -0.184539332985878, -0.0075498283840715885, 0.281803697347641], [-0.03802455589175224, 0.010689492337405682, -0.0019137541530653834, -0.013250813819468021], [-0.03781076893210411, 0.20583884418010712, -0.002178770489990711, -0.3065369427204132], [-0.03369399160146713, 0.4009917676448822, -0.008309509605169296, -0.5999062061309814], [-0.025674154981970787, 0.5962289571762085, -0.02030763402581215, -0.8951948881149292], [-0.013749576173722744, 0.7916203141212463, -0.038211531937122345, -1.1941914558410645], [0.0020828302949666977, 0.9872156977653503, -0.06209535896778107, -1.4986019134521484], [0.02182714454829693, 1.1830347776412964, -0.09206739813089371, -1.8100086450576782], [0.045487839728593826, 0.989051878452301, -0.1282675713300705, -1.5472962856292725], [0.065268874168396, 1.1854593753814697, -0.15921349823474884, -1.8770945072174072], [0.08897806704044342, 1.3819199800491333, -0.19675537943840027, -2.2146694660186768], [0.019721126183867455, -0.015018705278635025, 0.03985356539487839, 0.00945441797375679], [0.019420752301812172, -0.21068887412548065, 0.04004265367984772, 0.31444045901298523], [0.015206974931061268, -0.40635767579078674, 0.046331461519002914, 0.6194778084754944], [0.0070798215456306934, -0.6020950675010681, 0.058721017092466354, 0.9263854026794434], [-0.004962080158293247, -0.407813161611557, 0.07724872976541519, 0.6527189016342163], [-0.01311834342777729, -0.6039210557937622, 0.09030310064554214, 0.9686920046806335], [-0.02519676461815834, -0.410119891166687, 0.10967694222927094, 0.7056878209114075], [-0.03339916095137596, -0.6065768003463745, 0.1237906962633133, 1.03078293800354], [-0.04553069919347763, -0.8031087517738342, 0.14440636336803436, 1.3596266508102417], [-0.06159287318587303, -0.9997156262397766, 0.1715988963842392, 1.6937752962112427], [-0.08158718794584274, -0.806939959526062, 0.205474391579628, 1.459061622619629], [-0.04156394302845001, 0.004897077102214098, -0.03142695128917694, -0.032406486570835114], [-0.04146600142121315, -0.18976043164730072, -0.03207508102059364, 0.2501975893974304], [-0.0452612079679966, 0.005804532207548618, -0.02707112953066826, -0.052427422255277634], [-0.04514511674642563, -0.18891900777816772, -0.028119677677750587, 0.23159292340278625], [-0.04892349615693092, -0.38362810015678406, -0.023487819358706474, 0.5152750015258789], [-0.0565960593521595, -0.5784115195274353, -0.013182319700717926, 0.8004648089408875], [-0.06816428899765015, -0.7733502388000488, 0.0028269763570278883, 1.0889719724655151], [-0.08363129198551178, -0.5782656669616699, 0.024606414139270782, 0.7971773743629456], [-0.09519661217927933, -0.7737164497375488, 0.04054996371269226, 1.0974984169006348], [-0.11067093908786774, -0.969348132610321, 0.06249992921948433, 1.4026230573654175], [-0.1300579011440277, -0.7750557661056519, 0.09055238962173462, 1.130116581916809], [-0.14555901288986206, -0.9712392687797546, 0.11315472424030304, 1.4497721195220947], [-0.16498379409313202, -0.7776753306388855, 0.1421501636505127, 1.1944795846939087], [-0.18053731322288513, -0.5846509337425232, 0.16603976488113403, 0.9495149254798889], [-0.19223032891750336, -0.39210617542266846, 0.18503005802631378, 0.713261604309082], [-0.20007245242595673, -0.5892420411109924, 0.1992952972650528, 1.0580068826675415], [0.015441014431416988, -0.023111725226044655, 0.00963112898170948, -0.03835587576031685], [0.014978780411183834, 0.17187079787254333, 0.008864011615514755, -0.32798460125923157], [0.01841619610786438, -0.023376213386654854, 0.002304319990798831, -0.032519590109586716], [0.01794867217540741, 0.17171262204647064, 0.0016539280768483877, -0.32447460293769836], [0.021382924169301987, 0.36681097745895386, -0.004835563711822033, -0.6166355013847351], [0.028719143941998482, 0.5620001554489136, -0.01716827228665352, -0.9108374714851379], [0.039959147572517395, 0.7573501467704773, -0.035385023802518845, -1.2088664770126343], [0.05510615184903145, 0.952910840511322, -0.05956235155463219, -1.5124249458312988], [0.07416436821222305, 0.7585586309432983, -0.08981084823608398, -1.2389144897460938], [0.08933553844690323, 0.5646975636482239, -0.1145891398191452, -0.9756638407707214], [0.10062948614358902, 0.7611544132232666, -0.13410241901874542, -1.3020321130752563], [0.11585257947444916, 0.957698404788971, -0.16014306247234344, -1.6335091590881348], [0.13500654697418213, 0.7647778987884521, -0.19281324744224548, -1.394712209701538], [-0.008968932554125786, -0.003059974405914545, 0.02374747209250927, -0.030294144526124], [-0.009030132554471493, -0.19851428270339966, 0.023141589015722275, 0.2697857618331909], [-0.01300041750073433, -0.39395871758461, 0.02853730320930481, 0.56967693567276], [-0.0208795927464962, -0.19924835860729218, 0.03993084281682968, 0.28611913323402405], [-0.02486455999314785, -0.3949163556098938, 0.04565322399139404, 0.5911237597465515], [-0.032762885093688965, -0.20046231150627136, 0.057475700974464417, 0.31316396594047546], [-0.03677213191986084, -0.006204243749380112, 0.06373897939920425, 0.03914656490087509], [-0.03689621761441231, -0.20217955112457275, 0.0645219087600708, 0.3512391746044159], [-0.0409398078918457, -0.39815691113471985, 0.07154669612646103, 0.6635497808456421], [-0.04890294745564461, -0.5941974520683289, 0.08481769263744354, 0.9778750538825989], [-0.0607868954539299, -0.40030884742736816, 0.1043751910328865, 0.7129942178726196], [-0.06879307329654694, -0.2067749798297882, 0.11863507330417633, 0.45490387082099915], [-0.07292857021093369, -0.40335702896118164, 0.12773315608501434, 0.7825012803077698], [-0.08099571615457535, -0.21020033955574036, 0.1433831751346588, 0.53257817029953], [-0.08519972115755081, -0.017355220392346382, 0.15403473377227783, 0.28828921914100647], [-0.0855468213558197, 0.1752730756998062, 0.15980052947998047, 0.04787518084049225], [-0.08204136043787003, 0.367785781621933, 0.16075803339481354, -0.19043301045894623], [-0.07468564808368683, 0.17077283561229706, 0.15694937109947205, 0.14833559095859528], [-0.07127019017934799, 0.3633398115634918, 0.15991607308387756, -0.09101060032844543], [-0.06400339305400848, 0.5558513402938843, 0.15809586644172668, -0.32927823066711426], [-0.052886366844177246, 0.7484109401702881, 0.1515102982521057, -0.5682287216186523], [-0.03791814669966698, 0.9411194920539856, 0.14014573395252228, -0.8096062541007996], [-0.019095757976174355, 0.7443840503692627, 0.12395360320806503, -0.4763283133506775], [-0.004208077676594257, 0.9375578165054321, 0.11442703753709793, -0.7275166511535645], [0.014543077908456326, 1.1309274435043335, 0.09987670183181763, -0.9821061491966248], [0.03716162592172623, 0.9346193075180054, 0.0802345797419548, -0.6597963571548462], [0.05585401505231857, 0.7384778261184692, 0.0670386552810669, -0.3429670035839081], [0.07062356919050217, 0.5424693822860718, 0.06017931550741196, -0.02992013283073902], [0.0814729556441307, 0.7366790175437927, 0.059580910950899124, -0.30302518606185913], [0.09620653837919235, 0.930903434753418, 0.053520407527685165, -0.5763384699821472], [0.11482460796833038, 1.125235915184021, 0.0419936403632164, -0.8516923189163208], [0.1373293250799179, 0.9295673966407776, 0.02495979331433773, -0.5461057424545288], [0.15592066943645477, 0.734103798866272, 0.014037678018212318, -0.24566426873207092], [0.17060275375843048, 0.5387842059135437, 0.0091243926435709, 0.05141320452094078], [0.18137843906879425, 0.34353259205818176, 0.010152656584978104, 0.3469609320163727], [0.18824908137321472, 0.5385086536407471, 0.01709187589585781, 0.05749671533703804], [0.19901925325393677, 0.733381450176239, 0.01824180968105793, -0.22974497079849243], [0.21368688344955444, 0.928238034248352, 0.013646909967064857, -0.5166184306144714], [0.23225164413452148, 0.732926607131958, 0.0033145416527986526, -0.2196665108203888], [0.2469101846218109, 0.9280010461807251, -0.001078788423910737, -0.5113020539283752], [0.2654702067375183, 0.7328943014144897, -0.011304829269647598, -0.2189592719078064], [0.2801280915737152, 0.537935733795166, -0.015684014186263084, 0.07013630867004395], [0.290886789560318, 0.3430421054363251, -0.014281288720667362, 0.35782986879348755], [0.2977476418018341, 0.5383641719818115, -0.007124691270291805, 0.060678139328956604], [0.30851492285728455, 0.7335875034332275, -0.005911128595471382, -0.23424413800239563], [0.3231866657733917, 0.5385505557060242, -0.010596010833978653, 0.056568387895822525], [0.3339576721191406, 0.7338228225708008, -0.009464642964303493, -0.2394387423992157], [0.34863415360450745, 0.9290786981582642, -0.01425341796129942, -0.5350919961929321], [0.36721572279930115, 1.124398112297058, -0.024955257773399353, -0.8322317600250244], [0.3897036910057068, 1.3198519945144653, -0.04159989207983017, -1.1326574087142944], [0.41610071063041687, 1.1252986192703247, -0.06425303965806961, -0.8533065915107727], [0.4386066794395447, 0.9311085343360901, -0.0813191756606102, -0.5814999938011169], [0.4572288691997528, 1.1272701025009155, -0.09294917434453964, -0.8986514806747437], [0.47977426648139954, 1.323520541191101, -0.1109222024679184, -1.2190442085266113], [0.5062446594238281, 1.5198837518692017, -0.1353030949831009, -1.5443230867385864], [0.5366423726081848, 1.716347098350525, -0.1661895513534546, -1.875982642173767], [0.57096928358078, 1.9128473997116089, -0.2037092000246048, -2.2153072357177734], [-0.049672070890665054, -0.048218391835689545, 0.010871964506804943, 0.029155798256397247], [-0.05063644051551819, 0.1467459797859192, 0.011455080471932888, -0.26007717847824097], [-0.04770151898264885, -0.048537611961364746, 0.006253537256270647, 0.03619671240448952], [-0.04867227375507355, -0.24374867975711823, 0.006977471522986889, 0.3308461010456085], [-0.053547244518995285, -0.4389692544937134, 0.013594393618404865, 0.6257212162017822], [-0.06232663244009018, -0.6342782974243164, 0.026108818128705025, 0.9226543307304382], [-0.0750121995806694, -0.8297430872917175, 0.044561903923749924, 1.2234266996383667], [-0.09160705655813217, -0.6352225542068481, 0.06903044134378433, 0.9450324773788452], [-0.1043115109205246, -0.4410949647426605, 0.0879310891032219, 0.6748133897781372], [-0.11313340812921524, -0.24729792773723602, 0.1014273539185524, 0.4110593795776367], [-0.11807937175035477, -0.053749144077301025, 0.10964854806661606, 0.15199680626392365], [-0.11915434896945953, -0.25025638937950134, 0.11268848180770874, 0.47715964913368225], [-0.12415947765111923, -0.4467740058898926, 0.12223167717456818, 0.8031267523765564], [-0.13309496641159058, -0.2535211145877838, 0.13829420506954193, 0.5512568950653076], [-0.13816538453102112, -0.06058473140001297, 0.1493193507194519, 0.30514439940452576], [-0.13937707245349884, 0.13212889432907104, 0.15542224049568176, 0.0630275085568428], [-0.1367345005273819, -0.06484036147594452, 0.1566827893257141, 0.40043047070503235], [-0.13803130388259888, -0.2617974579334259, 0.16469138860702515, 0.7381235957145691], [-0.14326725900173187, -0.06928642094135284, 0.17945386469364166, 0.5014650225639343], [-0.14465297758579254, -0.266423761844635, 0.1894831657409668, 0.8448991179466248], [-0.14998145401477814, -0.4635556936264038, 0.206381157040596, 1.1906797885894775], [-0.0113771241158247, -0.011821405962109566, -0.0301225446164608, 0.037884220480918884], [-0.011613552458584309, -0.20649874210357666, -0.02936485968530178, 0.32091304659843445], [-0.015743527561426163, -0.40119045972824097, -0.022946598008275032, 0.6041927337646484], [-0.023767337203025818, -0.5959841012954712, -0.01086274441331625, 0.8895605802536011], [-0.03568701818585396, -0.4007164537906647, 0.006928466726094484, 0.5934827923774719], [-0.04370134696364403, -0.20569217205047607, 0.01879812218248844, 0.3029903173446655], [-0.047815192490816116, -0.010843103751540184, 0.024857928976416588, 0.016294676810503006], [-0.04803205281496048, 0.1839136928319931, 0.025183822959661484, -0.2684427797794342], [-0.044353779405355453, 0.37866735458374023, 0.01981496624648571, -0.5530773997306824], [-0.03678043186664581, 0.1832728385925293, 0.008753418922424316, -0.2542179226875305], [-0.033114977180957794, 0.3782687187194824, 0.003669060068204999, -0.5441270470619202], [-0.025549601763486862, 0.18309539556503296, -0.0072134812362492085, -0.2502903640270233], [-0.02188769355416298, -0.011922803707420826, -0.012219288386404514, 0.040108587592840195], [-0.022126149386167526, 0.18337221443653107, -0.011417116969823837, -0.25640445947647095], [-0.01845870539546013, 0.3786553144454956, -0.016545206308364868, -0.5526665449142456], [-0.010885599069297314, 0.574005663394928, -0.027598537504673004, -0.8505160212516785], [0.0005945139564573765, 0.37927067279815674, -0.04460885748267174, -0.5666377544403076], [0.008179927244782448, 0.5749890804290771, -0.055941611528396606, -0.8730339407920837], [0.019679708406329155, 0.7708252668380737, -0.0734022930264473, -1.1827670335769653], [0.03509621322154999, 0.5767285227775574, -0.09705763310194016, -0.9139667749404907], [0.04663078486919403, 0.38304391503334045, -0.11533696949481964, -0.6532973051071167], [0.05429166555404663, 0.1897008717060089, -0.1284029185771942, -0.3990435302257538], [0.05808568000793457, 0.38638827204704285, -0.1363837867975235, -0.729292631149292], [0.06581344455480576, 0.5831053853034973, -0.15096963942050934, -1.061600923538208], [0.07747555524110794, 0.7798686623573303, -0.17220164835453033, -1.3976054191589355], [0.09307292848825455, 0.5872551202774048, -0.20015376806259155, -1.1633356809616089], [-0.017174551263451576, -0.04119570180773735, 0.004096720367670059, 0.02791690081357956], [-0.01799846440553665, 0.15386725962162018, 0.004655058030039072, -0.2634706497192383], [-0.014921119436621666, -0.04132082313299179, -0.0006143549107946455, 0.030676884576678276], [-0.015747535973787308, -0.2364339530467987, -8.172331718014902e-07, 0.3231659233570099], [-0.020476214587688446, -0.4315558969974518, 0.006462500896304846, 0.6158486008644104], [-0.029107334092259407, -0.23652483522891998, 0.01877947337925434, 0.32520803809165955], [-0.033837828785181046, -0.43190905451774597, 0.025283632799983025, 0.623753547668457], [-0.04247600957751274, -0.6273747086524963, 0.03775870427489281, 0.9242909550666809], [-0.05502350628376007, -0.822985827922821, 0.05624452233314514, 1.228596806526184], [-0.07148322463035583, -1.0187846422195435, 0.08081646263599396, 1.5383578538894653], [-0.09185891598463058, -0.8247228264808655, 0.11158362030982971, 1.2719494104385376], [-0.10835336893796921, -1.0210778713226318, 0.13702259957790375, 1.5973879098892212], [-0.12877492606639862, -1.2175321578979492, 0.16897036135196686, 1.9294660091400146], [-0.1531255692243576, -1.414014220237732, 0.20755968987941742, 2.26943302154541]], "actions": [1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.016290925443172455, 0.2333395630121231, -0.013083619065582752, -0.2975591719150543], [-0.011624133214354515, 0.4286455512046814, -0.01903480291366577, -0.5943395495414734], [-0.0030512227676808834, 0.6240286827087402, -0.03092159330844879, -0.8929570317268372], [0.009429351426661015, 0.8195561170578003, -0.048780735582113266, -1.1951974630355835], [0.025820473209023476, 1.0152745246887207, -0.07268468290567398, -1.502761721611023], [0.04612596333026886, 1.2111996412277222, -0.10273991525173187, -1.8172239065170288], [0.07034995406866074, 1.4073033332824707, -0.13908439874649048, -2.1399807929992676], [0.09849601984024048, 1.603498935699463, -0.1818840056657791, -2.472191333770752], [0.13056600093841553, 1.410312294960022, -0.2313278317451477, -2.240370988845825], [0.04039300978183746, 0.24257510900497437, -0.007007327396422625, -0.2529449462890625], [0.04524451121687889, 0.437796413898468, -0.012066226452589035, -0.5478298664093018], [0.05400043725967407, 0.6330857872962952, -0.02302282303571701, -0.8442899584770203], [0.06666215509176254, 0.4382854402065277, -0.039908621460199356, -0.5589349865913391], [0.07542786002159119, 0.24374572932720184, -0.05108732357621193, -0.27908778190612793], [0.08030277490615845, 0.04938837140798569, -0.05666907876729965, -0.002945263171568513], [0.08129054307937622, 0.2452753186225891, -0.05672798305749893, -0.3129557967185974], [0.08619605004787445, 0.051005467772483826, -0.06298709660768509, -0.03868886083364487], [0.08721616119146347, 0.24697145819664001, -0.06376087665557861, -0.35056090354919434], [0.0921555906534195, 0.44293949007987976, -0.07077209651470184, -0.662648618221283], [0.1010143831372261, 0.6389710307121277, -0.0840250700712204, -0.9767494797706604], [0.11379379779100418, 0.8351131677627563, -0.10356005281209946, -1.294598937034607], [0.1304960697889328, 0.6414481997489929, -0.12945203483104706, -1.0360502004623413], [0.14332503080368042, 0.448262482881546, -0.15017303824424744, -0.7866489291191101], [0.15229026973247528, 0.2554874122142792, -0.16590601205825806, -0.5447258949279785], [0.15740002691745758, 0.06303761154413223, -0.17680053412914276, -0.3085678815841675], [0.15866078436374664, 0.2601800560951233, -0.18297189474105835, -0.6513807773590088], [0.1638643741607666, 0.0680142194032669, -0.19599950313568115, -0.42143774032592773], [0.16522465646266937, 0.2652944326400757, -0.2044282704591751, -0.7689478397369385], [0.1705305576324463, 0.4625552296638489, -0.2198072224855423, -1.1183619499206543], [-0.02094055339694023, -0.2113262563943863, -0.00030966303893364966, 0.2583690285682678], [-0.025167079642415047, -0.4064438045024872, 0.004857717547565699, 0.550954282283783], [-0.03329595550894737, -0.601633608341217, 0.015876803547143936, 0.8451637625694275], [-0.04532862827181816, -0.7969685792922974, 0.03278007730841637, 1.1427967548370361], [-0.061267998069524765, -0.9925031661987305, 0.05563601478934288, 1.445576786994934], [-0.08111806213855743, -0.7981081008911133, 0.08454754948616028, 1.1707838773727417], [-0.09708022326231003, -0.994221568107605, 0.10796322673559189, 1.4887306690216064], [-0.11696465313434601, -0.8005675077438354, 0.13773784041404724, 1.23162043094635], [-0.1329760104417801, -0.9971655011177063, 0.1623702496290207, 1.5640915632247925], [-0.15291932225227356, -0.8043144345283508, 0.19365207850933075, 1.3261470794677734], [-0.1690056025981903, -1.0012807846069336, 0.22017502784729004, 1.6726526021957397], [-0.030846673995256424, -0.18483087420463562, -0.013144136406481266, 0.288257360458374], [-0.03454329073429108, 0.010476022027432919, -0.007378988899290562, -0.008541958406567574], [-0.03433376923203468, -0.184539332985878, -0.0075498283840715885, 0.281803697347641], [-0.03802455589175224, 0.010689492337405682, -0.0019137541530653834, -0.013250813819468021], [-0.03781076893210411, 0.20583884418010712, -0.002178770489990711, -0.3065369427204132], [-0.03369399160146713, 0.4009917676448822, -0.008309509605169296, -0.5999062061309814], [-0.025674154981970787, 0.5962289571762085, -0.02030763402581215, -0.8951948881149292], [-0.013749576173722744, 0.7916203141212463, -0.038211531937122345, -1.1941914558410645], [0.0020828302949666977, 0.9872156977653503, -0.06209535896778107, -1.4986019134521484], [0.02182714454829693, 1.1830347776412964, -0.09206739813089371, -1.8100086450576782], [0.045487839728593826, 0.989051878452301, -0.1282675713300705, -1.5472962856292725], [0.065268874168396, 1.1854593753814697, -0.15921349823474884, -1.8770945072174072], [0.08897806704044342, 1.3819199800491333, -0.19675537943840027, -2.2146694660186768], [0.11661646515130997, 1.1891510486602783, -0.24104878306388855, -1.988568663597107], [0.019420752301812172, -0.21068887412548065, 0.04004265367984772, 0.31444045901298523], [0.015206974931061268, -0.40635767579078674, 0.046331461519002914, 0.6194778084754944], [0.0070798215456306934, -0.6020950675010681, 0.058721017092466354, 0.9263854026794434], [-0.004962080158293247, -0.407813161611557, 0.07724872976541519, 0.6527189016342163], [-0.01311834342777729, -0.6039210557937622, 0.09030310064554214, 0.9686920046806335], [-0.02519676461815834, -0.410119891166687, 0.10967694222927094, 0.7056878209114075], [-0.03339916095137596, -0.6065768003463745, 0.1237906962633133, 1.03078293800354], [-0.04553069919347763, -0.8031087517738342, 0.14440636336803436, 1.3596266508102417], [-0.06159287318587303, -0.9997156262397766, 0.1715988963842392, 1.6937752962112427], [-0.08158718794584274, -0.806939959526062, 0.205474391579628, 1.459061622619629], [-0.09772598743438721, -0.6148439049720764, 0.23465563356876373, 1.236964225769043], [-0.04146600142121315, -0.18976043164730072, -0.03207508102059364, 0.2501975893974304], [-0.0452612079679966, 0.005804532207548618, -0.02707112953066826, -0.052427422255277634], [-0.04514511674642563, -0.18891900777816772, -0.028119677677750587, 0.23159292340278625], [-0.04892349615693092, -0.38362810015678406, -0.023487819358706474, 0.5152750015258789], [-0.0565960593521595, -0.5784115195274353, -0.013182319700717926, 0.8004648089408875], [-0.06816428899765015, -0.7733502388000488, 0.0028269763570278883, 1.0889719724655151], [-0.08363129198551178, -0.5782656669616699, 0.024606414139270782, 0.7971773743629456], [-0.09519661217927933, -0.7737164497375488, 0.04054996371269226, 1.0974984169006348], [-0.11067093908786774, -0.969348132610321, 0.06249992921948433, 1.4026230573654175], [-0.1300579011440277, -0.7750557661056519, 0.09055238962173462, 1.130116581916809], [-0.14555901288986206, -0.9712392687797546, 0.11315472424030304, 1.4497721195220947], [-0.16498379409313202, -0.7776753306388855, 0.1421501636505127, 1.1944795846939087], [-0.18053731322288513, -0.5846509337425232, 0.16603976488113403, 0.9495149254798889], [-0.19223032891750336, -0.39210617542266846, 0.18503005802631378, 0.713261604309082], [-0.20007245242595673, -0.5892420411109924, 0.1992952972650528, 1.0580068826675415], [-0.21185728907585144, -0.7863655090332031, 0.22045543789863586, 1.4060451984405518], [0.014978780411183834, 0.17187079787254333, 0.008864011615514755, -0.32798460125923157], [0.01841619610786438, -0.023376213386654854, 0.002304319990798831, -0.032519590109586716], [0.01794867217540741, 0.17171262204647064, 0.0016539280768483877, -0.32447460293769836], [0.021382924169301987, 0.36681097745895386, -0.004835563711822033, -0.6166355013847351], [0.028719143941998482, 0.5620001554489136, -0.01716827228665352, -0.9108374714851379], [0.039959147572517395, 0.7573501467704773, -0.035385023802518845, -1.2088664770126343], [0.05510615184903145, 0.952910840511322, -0.05956235155463219, -1.5124249458312988], [0.07416436821222305, 0.7585586309432983, -0.08981084823608398, -1.2389144897460938], [0.08933553844690323, 0.5646975636482239, -0.1145891398191452, -0.9756638407707214], [0.10062948614358902, 0.7611544132232666, -0.13410241901874542, -1.3020321130752563], [0.11585257947444916, 0.957698404788971, -0.16014306247234344, -1.6335091590881348], [0.13500654697418213, 0.7647778987884521, -0.19281324744224548, -1.394712209701538], [0.15030209720134735, 0.5725060701370239, -0.2207074910402298, -1.167985439300537], [-0.009030132554471493, -0.19851428270339966, 0.023141589015722275, 0.2697857618331909], [-0.01300041750073433, -0.39395871758461, 0.02853730320930481, 0.56967693567276], [-0.0208795927464962, -0.19924835860729218, 0.03993084281682968, 0.28611913323402405], [-0.02486455999314785, -0.3949163556098938, 0.04565322399139404, 0.5911237597465515], [-0.032762885093688965, -0.20046231150627136, 0.057475700974464417, 0.31316396594047546], [-0.03677213191986084, -0.006204243749380112, 0.06373897939920425, 0.03914656490087509], [-0.03689621761441231, -0.20217955112457275, 0.0645219087600708, 0.3512391746044159], [-0.0409398078918457, -0.39815691113471985, 0.07154669612646103, 0.6635497808456421], [-0.04890294745564461, -0.5941974520683289, 0.08481769263744354, 0.9778750538825989], [-0.0607868954539299, -0.40030884742736816, 0.1043751910328865, 0.7129942178726196], [-0.06879307329654694, -0.2067749798297882, 0.11863507330417633, 0.45490387082099915], [-0.07292857021093369, -0.40335702896118164, 0.12773315608501434, 0.7825012803077698], [-0.08099571615457535, -0.21020033955574036, 0.1433831751346588, 0.53257817029953], [-0.08519972115755081, -0.017355220392346382, 0.15403473377227783, 0.28828921914100647], [-0.0855468213558197, 0.1752730756998062, 0.15980052947998047, 0.04787518084049225], [-0.08204136043787003, 0.367785781621933, 0.16075803339481354, -0.19043301045894623], [-0.07468564808368683, 0.17077283561229706, 0.15694937109947205, 0.14833559095859528], [-0.07127019017934799, 0.3633398115634918, 0.15991607308387756, -0.09101060032844543], [-0.06400339305400848, 0.5558513402938843, 0.15809586644172668, -0.32927823066711426], [-0.052886366844177246, 0.7484109401702881, 0.1515102982521057, -0.5682287216186523], [-0.03791814669966698, 0.9411194920539856, 0.14014573395252228, -0.8096062541007996], [-0.019095757976174355, 0.7443840503692627, 0.12395360320806503, -0.4763283133506775], [-0.004208077676594257, 0.9375578165054321, 0.11442703753709793, -0.7275166511535645], [0.014543077908456326, 1.1309274435043335, 0.09987670183181763, -0.9821061491966248], [0.03716162592172623, 0.9346193075180054, 0.0802345797419548, -0.6597963571548462], [0.05585401505231857, 0.7384778261184692, 0.0670386552810669, -0.3429670035839081], [0.07062356919050217, 0.5424693822860718, 0.06017931550741196, -0.02992013283073902], [0.0814729556441307, 0.7366790175437927, 0.059580910950899124, -0.30302518606185913], [0.09620653837919235, 0.930903434753418, 0.053520407527685165, -0.5763384699821472], [0.11482460796833038, 1.125235915184021, 0.0419936403632164, -0.8516923189163208], [0.1373293250799179, 0.9295673966407776, 0.02495979331433773, -0.5461057424545288], [0.15592066943645477, 0.734103798866272, 0.014037678018212318, -0.24566426873207092], [0.17060275375843048, 0.5387842059135437, 0.0091243926435709, 0.05141320452094078], [0.18137843906879425, 0.34353259205818176, 0.010152656584978104, 0.3469609320163727], [0.18824908137321472, 0.5385086536407471, 0.01709187589585781, 0.05749671533703804], [0.19901925325393677, 0.733381450176239, 0.01824180968105793, -0.22974497079849243], [0.21368688344955444, 0.928238034248352, 0.013646909967064857, -0.5166184306144714], [0.23225164413452148, 0.732926607131958, 0.0033145416527986526, -0.2196665108203888], [0.2469101846218109, 0.9280010461807251, -0.001078788423910737, -0.5113020539283752], [0.2654702067375183, 0.7328943014144897, -0.011304829269647598, -0.2189592719078064], [0.2801280915737152, 0.537935733795166, -0.015684014186263084, 0.07013630867004395], [0.290886789560318, 0.3430421054363251, -0.014281288720667362, 0.35782986879348755], [0.2977476418018341, 0.5383641719818115, -0.007124691270291805, 0.060678139328956604], [0.30851492285728455, 0.7335875034332275, -0.005911128595471382, -0.23424413800239563], [0.3231866657733917, 0.5385505557060242, -0.010596010833978653, 0.056568387895822525], [0.3339576721191406, 0.7338228225708008, -0.009464642964303493, -0.2394387423992157], [0.34863415360450745, 0.9290786981582642, -0.01425341796129942, -0.5350919961929321], [0.36721572279930115, 1.124398112297058, -0.024955257773399353, -0.8322317600250244], [0.3897036910057068, 1.3198519945144653, -0.04159989207983017, -1.1326574087142944], [0.41610071063041687, 1.1252986192703247, -0.06425303965806961, -0.8533065915107727], [0.4386066794395447, 0.9311085343360901, -0.0813191756606102, -0.5814999938011169], [0.4572288691997528, 1.1272701025009155, -0.09294917434453964, -0.8986514806747437], [0.47977426648139954, 1.323520541191101, -0.1109222024679184, -1.2190442085266113], [0.5062446594238281, 1.5198837518692017, -0.1353030949831009, -1.5443230867385864], [0.5366423726081848, 1.716347098350525, -0.1661895513534546, -1.875982642173767], [0.57096928358078, 1.9128473997116089, -0.2037092000246048, -2.2153072357177734], [0.6092262268066406, 2.1092538833618164, -0.24801534414291382, -2.563302516937256], [-0.05063644051551819, 0.1467459797859192, 0.011455080471932888, -0.26007717847824097], [-0.04770151898264885, -0.048537611961364746, 0.006253537256270647, 0.03619671240448952], [-0.04867227375507355, -0.24374867975711823, 0.006977471522986889, 0.3308461010456085], [-0.053547244518995285, -0.4389692544937134, 0.013594393618404865, 0.6257212162017822], [-0.06232663244009018, -0.6342782974243164, 0.026108818128705025, 0.9226543307304382], [-0.0750121995806694, -0.8297430872917175, 0.044561903923749924, 1.2234266996383667], [-0.09160705655813217, -0.6352225542068481, 0.06903044134378433, 0.9450324773788452], [-0.1043115109205246, -0.4410949647426605, 0.0879310891032219, 0.6748133897781372], [-0.11313340812921524, -0.24729792773723602, 0.1014273539185524, 0.4110593795776367], [-0.11807937175035477, -0.053749144077301025, 0.10964854806661606, 0.15199680626392365], [-0.11915434896945953, -0.25025638937950134, 0.11268848180770874, 0.47715964913368225], [-0.12415947765111923, -0.4467740058898926, 0.12223167717456818, 0.8031267523765564], [-0.13309496641159058, -0.2535211145877838, 0.13829420506954193, 0.5512568950653076], [-0.13816538453102112, -0.06058473140001297, 0.1493193507194519, 0.30514439940452576], [-0.13937707245349884, 0.13212889432907104, 0.15542224049568176, 0.0630275085568428], [-0.1367345005273819, -0.06484036147594452, 0.1566827893257141, 0.40043047070503235], [-0.13803130388259888, -0.2617974579334259, 0.16469138860702515, 0.7381235957145691], [-0.14326725900173187, -0.06928642094135284, 0.17945386469364166, 0.5014650225639343], [-0.14465297758579254, -0.266423761844635, 0.1894831657409668, 0.8448991179466248], [-0.14998145401477814, -0.4635556936264038, 0.206381157040596, 1.1906797885894775], [-0.1592525690793991, -0.6606650352478027, 0.23019474744796753, 1.5403157472610474], [-0.011613552458584309, -0.20649874210357666, -0.02936485968530178, 0.32091304659843445], [-0.015743527561426163, -0.40119045972824097, -0.022946598008275032, 0.6041927337646484], [-0.023767337203025818, -0.5959841012954712, -0.01086274441331625, 0.8895605802536011], [-0.03568701818585396, -0.4007164537906647, 0.006928466726094484, 0.5934827923774719], [-0.04370134696364403, -0.20569217205047607, 0.01879812218248844, 0.3029903173446655], [-0.047815192490816116, -0.010843103751540184, 0.024857928976416588, 0.016294676810503006], [-0.04803205281496048, 0.1839136928319931, 0.025183822959661484, -0.2684427797794342], [-0.044353779405355453, 0.37866735458374023, 0.01981496624648571, -0.5530773997306824], [-0.03678043186664581, 0.1832728385925293, 0.008753418922424316, -0.2542179226875305], [-0.033114977180957794, 0.3782687187194824, 0.003669060068204999, -0.5441270470619202], [-0.025549601763486862, 0.18309539556503296, -0.0072134812362492085, -0.2502903640270233], [-0.02188769355416298, -0.011922803707420826, -0.012219288386404514, 0.040108587592840195], [-0.022126149386167526, 0.18337221443653107, -0.011417116969823837, -0.25640445947647095], [-0.01845870539546013, 0.3786553144454956, -0.016545206308364868, -0.5526665449142456], [-0.010885599069297314, 0.574005663394928, -0.027598537504673004, -0.8505160212516785], [0.0005945139564573765, 0.37927067279815674, -0.04460885748267174, -0.5666377544403076], [0.008179927244782448, 0.5749890804290771, -0.055941611528396606, -0.8730339407920837], [0.019679708406329155, 0.7708252668380737, -0.0734022930264473, -1.1827670335769653], [0.03509621322154999, 0.5767285227775574, -0.09705763310194016, -0.9139667749404907], [0.04663078486919403, 0.38304391503334045, -0.11533696949481964, -0.6532973051071167], [0.05429166555404663, 0.1897008717060089, -0.1284029185771942, -0.3990435302257538], [0.05808568000793457, 0.38638827204704285, -0.1363837867975235, -0.729292631149292], [0.06581344455480576, 0.5831053853034973, -0.15096963942050934, -1.061600923538208], [0.07747555524110794, 0.7798686623573303, -0.17220164835453033, -1.3976054191589355], [0.09307292848825455, 0.5872551202774048, -0.20015376806259155, -1.1633356809616089], [0.10481803119182587, 0.7843389511108398, -0.22342047095298767, -1.5115126371383667], [-0.01799846440553665, 0.15386725962162018, 0.004655058030039072, -0.2634706497192383], [-0.014921119436621666, -0.04132082313299179, -0.0006143549107946455, 0.030676884576678276], [-0.015747535973787308, -0.2364339530467987, -8.172331718014902e-07, 0.3231659233570099], [-0.020476214587688446, -0.4315558969974518, 0.006462500896304846, 0.6158486008644104], [-0.029107334092259407, -0.23652483522891998, 0.01877947337925434, 0.32520803809165955], [-0.033837828785181046, -0.43190905451774597, 0.025283632799983025, 0.623753547668457], [-0.04247600957751274, -0.6273747086524963, 0.03775870427489281, 0.9242909550666809], [-0.05502350628376007, -0.822985827922821, 0.05624452233314514, 1.228596806526184], [-0.07148322463035583, -1.0187846422195435, 0.08081646263599396, 1.5383578538894653], [-0.09185891598463058, -0.8247228264808655, 0.11158362030982971, 1.2719494104385376], [-0.10835336893796921, -1.0210778713226318, 0.13702259957790375, 1.5973879098892212], [-0.12877492606639862, -1.2175321578979492, 0.16897036135196686, 1.9294660091400146], [-0.1531255692243576, -1.414014220237732, 0.20755968987941742, 2.26943302154541], [-0.18140585720539093, -1.6103824377059937, 0.2529483437538147, 2.618248701095581]], "action_prob": [0.4999227523803711, 0.4992787539958954, 0.4988511800765991, 0.4986320734024048, 0.49852797389030457, 0.49846911430358887, 0.4984223246574402, 0.4983769953250885, 0.501667857170105, 0.4999271035194397, 0.49927517771720886, 0.49883198738098145, 0.501394510269165, 0.5012378692626953, 0.5008631348609924, 0.49973613023757935, 0.5009119510650635, 0.49967101216316223, 0.499034583568573, 0.498644083738327, 0.49846351146698, 0.5016133189201355, 0.5016270279884338, 0.5015623569488525, 0.5013492107391357, 0.4990663230419159, 0.5014444589614868, 0.49891388416290283, 0.498462438583374, 0.4999995529651642, 0.49934259057044983, 0.49888473749160767, 0.4986439645290375, 0.49853113293647766, 0.501528799533844, 0.4984370172023773, 0.5016126036643982, 0.49834346771240234, 0.501695990562439, 0.4982500672340393, 0.5000185966491699, 0.5006340146064758, 0.5000154972076416, 0.5006405711174011, 0.49999186396598816, 0.49934566020965576, 0.49890682101249695, 0.4986751973628998, 0.49856171011924744, 0.4984966516494751, 0.5015542507171631, 0.49839073419570923, 0.49834904074668884, 0.5016916990280151, 0.499898761510849, 0.49924424290657043, 0.4988133907318115, 0.5014039874076843, 0.4987294673919678, 0.5014723539352417, 0.49863773584365845, 0.4984561502933502, 0.4983748495578766, 0.5016729235649109, 0.5017268061637878, 0.5000790953636169, 0.5005733966827393, 0.5000944137573242, 0.4994371235370636, 0.4989551603794098, 0.49869030714035034, 0.501436173915863, 0.4986124634742737, 0.4984932839870453, 0.5015641450881958, 0.4984017014503479, 0.5016450881958008, 0.5016894936561584, 0.5016914010047913, 0.49840235710144043, 0.4982388913631439, 0.4999966621398926, 0.500651478767395, 0.49998751282691956, 0.49933603405952454, 0.4988865852355957, 0.49864816665649414, 0.4985329806804657, 0.5015307068824768, 0.501564621925354, 0.49844714999198914, 0.49835705757141113, 0.5016903281211853, 0.5017423033714294, 0.49997884035110474, 0.4993135929107666, 0.5011454820632935, 0.49925440549850464, 0.5011959075927734, 0.5008165836334229, 0.4997827708721161, 0.4991288185119629, 0.498712420463562, 0.5014891624450684, 0.5013778805732727, 0.4989110827445984, 0.5014500021934509, 0.501201868057251, 0.5007451772689819, 0.5001441240310669, 0.5004259943962097, 0.5002568364143372, 0.49966371059417725, 0.4992116689682007, 0.4989306330680847, 0.5012292861938477, 0.4988832473754883, 0.498708575963974, 0.5013887286186218, 0.5013687014579773, 0.5012205243110657, 0.4991588890552521, 0.4987643361091614, 0.49855509400367737, 0.5015432834625244, 0.5015102028846741, 0.5013332366943359, 0.5009231567382812, 0.499699205160141, 0.4990856349468231, 0.4986536502838135, 0.5015711188316345, 0.49861499667167664, 0.5016105771064758, 0.5014267563819885, 0.5010128021240234, 0.4995969831943512, 0.4989835321903229, 0.5014489889144897, 0.498960018157959, 0.4985295832157135, 0.49831491708755493, 0.49823981523513794, 0.5017749071121216, 0.5018271803855896, 0.4981759190559387, 0.4981287717819214, 0.4981386661529541, 0.49815836548805237, 0.4981713891029358, 0.4981752634048462, 0.5001794695854187, 0.5004860162734985, 0.49982190132141113, 0.4991926848888397, 0.4987863004207611, 0.4985833466053009, 0.5015102028846741, 0.5015037059783936, 0.5013963580131531, 0.5011049509048462, 0.4994105100631714, 0.4988175630569458, 0.5015089511871338, 0.5012899041175842, 0.5008614659309387, 0.4997284412384033, 0.4990272521972656, 0.5014406442642212, 0.4988901913166046, 0.4984722435474396, 0.4982728958129883, 0.49998295307159424, 0.4993498921394348, 0.4989171326160431, 0.5013140439987183, 0.5011442303657532, 0.5007490515708923, 0.5001271367073059, 0.4994756579399109, 0.5009920597076416, 0.4994503855705261, 0.5010242462158203, 0.5005853772163391, 0.5000643134117126, 0.4993968605995178, 0.4989232122898102, 0.5013299584388733, 0.49885088205337524, 0.4986073672771454, 0.5015051364898682, 0.5014820694923401, 0.5013493895530701, 0.49897056818008423, 0.49857577681541443, 0.49839648604393005, 0.501681923866272, 0.498299777507782, 0.5001266598701477, 0.5005404353141785, 0.49988090991973877, 0.4992488622665405, 0.5011657476425171, 0.4992005527019501, 0.49878814816474915, 0.4985823631286621, 0.498487263917923, 0.5015659332275391, 0.4983905255794525, 0.49834713339805603, 0.4983113408088684, 0.4982749819755554], "advantages": [8.648172378540039, 7.72265625, 6.788433074951172, 5.845515727996826, 4.893653869628906, 3.9325673580169678, 2.9620180130004883, 1.9818116426467896, 0.991786539554596, 18.209674835205078, 17.380699157714844, 16.543916702270508, 15.699410438537598, 14.849394798278809, 13.991435050964355, 13.125296592712402, 12.244879722595215, 11.361051559448242, 10.46284008026123, 9.556272506713867, 8.641336441040039, 7.71775484085083, 6.7862162590026855, 5.8456315994262695, 4.8960113525390625, 3.93729829788208, 2.9643943309783936, 1.9859397411346436, 0.9935905933380127, 10.465849876403809, 9.564258575439453, 8.652997016906738, 7.7318034172058105, 6.8007073402404785, 5.8597917556762695, 4.908419609069824, 3.9483842849731445, 2.977795124053955, 1.9982131719589233, 1.0080348253250122, 13.125330924987793, 12.250551223754883, 11.361358642578125, 10.468785285949707, 9.561605453491211, 8.645350456237793, 7.72047758102417, 6.786997318267822, 5.844661712646484, 4.893192291259766, 3.9323532581329346, 2.9621036052703857, 1.9817770719528198, 0.9916948080062866, 10.46640682220459, 9.56485652923584, 8.653512001037598, 7.732182025909424, 6.798948287963867, 5.858850955963135, 4.906827449798584, 3.947540760040283, 2.9779672622680664, 1.9982271194458008, 1.0081579685211182, 14.853784561157227, 13.996441841125488, 13.12480354309082, 12.250021934509277, 11.365923881530762, 10.472208976745605, 9.568876266479492, 8.654369354248047, 7.7327189445495605, 6.801302909851074, 5.859380722045898, 4.909029483795166, 3.9480934143066406, 2.97717022895813, 1.9960688352584839, 1.0075480937957764, 12.247615814208984, 11.358514785766602, 10.465930938720703, 9.558808326721191, 8.643142700195312, 7.718957901000977, 6.786014556884766, 5.844038486480713, 4.893361568450928, 3.933379650115967, 2.9622321128845215, 1.9816941022872925, 0.9918243288993835, 43.609256744384766, 43.042503356933594, 42.46942138671875, 41.886146545410156, 41.3013801574707, 40.706398010253906, 40.10488510131836, 39.50275421142578, 38.8938102722168, 38.277915954589844, 37.6533317565918, 37.02189254760742, 36.387725830078125, 35.74369430541992, 35.09262466430664, 34.434635162353516, 33.77007293701172, 33.10429000854492, 32.42622375488281, 31.74163246154785, 31.05060577392578, 30.353052139282227, 29.651268005371094, 28.93939208984375, 28.220731735229492, 27.496976852416992, 26.766542434692383, 26.029361724853516, 25.27996253967285, 24.52351951599121, 23.75992774963379, 22.991281509399414, 22.215442657470703, 21.432268142700195, 20.641332626342773, 19.83710289001465, 19.024953842163086, 18.20509147644043, 17.380950927734375, 16.5444278717041, 15.703495979309082, 14.85449504852295, 13.997016906738281, 13.125635147094727, 12.24562931060791, 11.361700057983398, 10.463871002197266, 9.557443618774414, 8.64238452911377, 7.718536853790283, 6.787384986877441, 5.847218036651611, 4.894622802734375, 3.932905673980713, 2.9618613719940186, 1.981292486190796, 0.9910222291946411, 19.027494430541992, 18.206823348999023, 17.383472442626953, 16.551694869995117, 15.710872650146484, 14.860836029052734, 14.001648902893066, 13.132206916809082, 12.253522872924805, 11.365391731262207, 10.467756271362305, 9.566187858581543, 8.65464973449707, 7.730498313903809, 6.7964768409729, 5.852658748626709, 4.90480375289917, 3.9465534687042236, 2.9747207164764404, 1.9967372417449951, 1.0079593658447266, 22.99595069885254, 22.220779418945312, 21.437185287475586, 20.644990921020508, 19.84193229675293, 19.03006935119629, 18.209468841552734, 17.38059425354004, 16.54391098022461, 15.703227996826172, 14.84953784942627, 13.991717338562012, 13.125738143920898, 12.245392799377441, 11.356738090515137, 10.45986270904541, 9.556879997253418, 8.641816139221191, 7.718142032623291, 6.786762237548828, 5.846421718597412, 4.897131443023682, 3.934380054473877, 2.962770462036133, 1.981959581375122, 0.9922758340835571, 13.125704765319824, 12.245399475097656, 11.361815452575684, 10.469194412231445, 9.566920280456543, 8.651344299316406, 7.730740070343018, 6.8000946044921875, 5.8594746589660645, 4.9089674949646, 3.9481048583984375, 2.9782679080963135, 1.9983844757080078, 1.0084586143493652], "value_targets": [8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 1159698636, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 946821005, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 514900772, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1405949296, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 1939384189, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 123852729, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 1325793438, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 745346269, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 593399454, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 250215783, 1489924340, 1489924340, 1489924340, 1489924340, 1489924340, 1489924340, 1489924340, 1489924340, 1489924340, 1489924340], "obs": [[-0.014189225621521473, 0.0036457327660173178, -0.043428272008895874, 0.011530174873769283], [-0.014116310514509678, -0.1908273547887802, -0.043197669088840485, 0.2902008891105652], [-0.01793285831809044, 0.004883083514869213, -0.03739364817738533, -0.015787094831466675], [-0.01783519610762596, -0.189683198928833, -0.03770939260721207, 0.2648671269416809], [-0.021628860384225845, 0.005956120323389769, -0.03241204842925072, -0.03946715220808983], [-0.021509738638997078, -0.18868641555309296, -0.033201392740011215, 0.24281582236289978], [-0.025283467024564743, 0.006893666461110115, -0.028345076367259026, -0.06015202775597572], [-0.02514559216797352, 0.20241032540798187, -0.02954811602830887, -0.361641526222229], [-0.02109738625586033, 0.007720548659563065, -0.036780945956707, -0.0784202367067337], [-0.02094297483563423, 0.20334993302822113, -0.03834935277700424, -0.3824770152568817], [-0.01687597669661045, 0.3989948332309723, -0.045998893678188324, -0.6870005130767822], [-0.008896080777049065, 0.5947240591049194, -0.059738900512456894, -0.9938027858734131], [0.002998401178047061, 0.7905921339988708, -0.07961495965719223, -1.3046334981918335], [0.018810244277119637, 0.9866282343864441, -0.10570763051509857, -1.621138334274292], [0.03854280710220337, 0.7928982973098755, -0.13813039660453796, -1.3631856441497803], [0.05440077558159828, 0.5997505784034729, -0.1653941124677658, -1.1167049407958984], [0.06639578938484192, 0.4071393311023712, -0.18772821128368378, -0.8801352381706238], [0.07453857362270355, 0.6042473912239075, -0.20533090829849243, -1.2254712581634521], [-0.015102613717317581, 0.03577321022748947, -0.0003087593649979681, 9.740804671309888e-05], [-0.01438714936375618, 0.23089958727359772, -0.00030681121279485524, -0.2926829159259796], [-0.009769157506525517, 0.03578201308846474, -0.006160469725728035, -9.677329944679514e-05], [-0.009053518064320087, 0.23099176585674286, -0.006162405014038086, -0.294717013835907], [-0.0044336821883916855, 0.4262010455131531, -0.01205674558877945, -0.5893371105194092], [0.004090338479727507, 0.6214897036552429, -0.023843487724661827, -0.8857934474945068], [0.01652013324201107, 0.8169271349906921, -0.041559357196092606, -1.1858755350112915], [0.032858673483133316, 0.6223680377006531, -0.0652768686413765, -0.9065038561820984], [0.04530603438615799, 0.4281877875328064, -0.08340694010257721, -0.6350315809249878], [0.05386979132890701, 0.23432214558124542, -0.09610757231712341, -0.3697372376918793], [0.05855623632669449, 0.04068771377205849, -0.1035023182630539, -0.10883810371160507], [0.05936998873949051, 0.2371288388967514, -0.10567907989025116, -0.4322982728481293], [0.06411256641149521, 0.43357595801353455, -0.11432504653930664, -0.7563368678092957], [0.07278408855199814, 0.24019980430603027, -0.12945178151130676, -0.5017045736312866], [0.07758808135986328, 0.0471174493432045, -0.13948588073253632, -0.25245699286460876], [0.07853043079376221, 0.2439269721508026, -0.14453501999378204, -0.5856800079345703], [0.08340896666049957, 0.4407460391521454, -0.15624861419200897, -0.9201757907867432], [0.0922238901257515, 0.6375951766967773, -0.1746521294116974, -1.2576029300689697], [0.10497579723596573, 0.8344681859016418, -0.1998041868209839, -1.5995069742202759], [-0.03472517430782318, -0.030197905376553535, -0.0166822150349617, 0.035872459411621094], [-0.03532912954688072, 0.16515925526618958, -0.015964766964316368, -0.262026846408844], [-0.03202594444155693, 0.3605054020881653, -0.021205302327871323, -0.5597021579742432], [-0.024815836921334267, 0.1656874120235443, -0.03239934518933296, -0.27377477288246155], [-0.021502088755369186, 0.36125630140304565, -0.037874843925237656, -0.5764979124069214], [-0.014276963658630848, 0.5568881034851074, -0.049404799938201904, -0.8808677196502686], [-0.0031392008531838655, 0.7526451349258423, -0.06702215224504471, -1.1886640787124634], [0.011913701891899109, 0.5584529042243958, -0.09079543501138687, -0.9177194833755493], [0.023082759231328964, 0.3646680414676666, -0.10914982855319977, -0.6548966765403748], [0.030376121401786804, 0.17122143507003784, -0.12224775552749634, -0.3984799087047577], [0.03380054980516434, -0.02197340875864029, -0.13021735846996307, -0.14670175313949585], [0.033361081033945084, -0.21501345932483673, -0.13315139710903168, 0.10223101824522018], [0.029060812667012215, -0.018259504809975624, -0.13110676407814026, -0.22931848466396332], [0.028695622459053993, 0.1784685105085373, -0.13569314777851105, -0.5603130459785461], [0.03226499259471893, -0.014514226466417313, -0.14689940214157104, -0.31327131390571594], [0.031974706798791885, 0.1823616474866867, -0.1531648337841034, -0.6484377384185791], [0.03562194108963013, -0.010332281701266766, -0.1661335825920105, -0.4076352119445801], [0.035415295511484146, 0.18670758605003357, -0.17428629100322723, -0.7477445006370544], [0.0391494482755661, 0.3837506175041199, -0.1892411708831787, -1.0898125171661377], [0.04073445498943329, 0.007214659359306097, 0.01475654635578394, 0.01804453507065773], [0.040878746658563614, 0.20212191343307495, 0.015117437578737736, -0.26994624733924866], [0.044921185821294785, 0.39702489972114563, 0.009718512184917927, -0.5578229427337646], [0.05286168307065964, 0.5920090675354004, -0.0014379468047991395, -0.8474282622337341], [0.0647018626332283, 0.3969067931175232, -0.018386511132121086, -0.5551978349685669], [0.07264000177383423, 0.5922819972038269, -0.02949046902358532, -0.85361647605896], [0.08448564261198044, 0.39757415652275085, -0.0465627983212471, -0.5703506469726562], [0.09243712574243546, 0.20313508808612823, -0.05796980857849121, -0.292692631483078], [0.09649982303380966, 0.008885509334504604, -0.06382366269826889, -0.01884131133556366], [0.09667753428220749, 0.20486195385456085, -0.0642004907131195, -0.33095887303352356], [0.10077477246522903, 0.010709813795983791, -0.0708196684718132, -0.05919261649250984], [0.10098896920681, 0.20677195489406586, -0.07200352102518082, -0.3733522295951843], [0.10512440651655197, 0.01274277176707983, -0.07947055995464325, -0.10421332716941833], [0.10537926852703094, 0.208908349275589, -0.0815548300743103, -0.4208727777004242], [0.10955743491649628, 0.015030905604362488, -0.08997228741645813, -0.15497374534606934], [0.10985805094242096, 0.21131817996501923, -0.09307175874710083, -0.4746299386024475], [0.11408441513776779, 0.40762272477149963, -0.10256435722112656, -0.7951359748840332], [0.12223687022924423, 0.6039915680885315, -0.11846707761287689, -1.1182423830032349], [0.13431669771671295, 0.8004516363143921, -0.14083191752433777, -1.4456149339675903], [0.1503257304430008, 0.6073150634765625, -0.16974422335624695, -1.2000460624694824], [0.16247203946113586, 0.8041765093803406, -0.19374515116214752, -1.540759801864624], [-0.043295323848724365, -0.0486668236553669, -0.02703801542520523, -0.04195248335599899], [-0.0442686602473259, 0.1468321979045868, -0.027877066284418106, -0.3430420458316803], [-0.04133201390504837, 0.342339426279068, -0.034737907350063324, -0.6443837285041809], [-0.03448522835969925, 0.5379278659820557, -0.047625582665205, -0.9478002190589905], [-0.02372667007148266, 0.7336575984954834, -0.06658158451318741, -1.2550586462020874], [-0.009053518064320087, 0.9295659065246582, -0.09168276190757751, -1.5678304433822632], [0.009537800215184689, 0.7356508374214172, -0.1230393648147583, -1.3050965070724487], [0.0242508165538311, 0.5422848463058472, -0.14914129674434662, -1.053322672843933], [0.03509651497006416, 0.3494209945201874, -0.17020775377750397, -0.8109234571456909], [0.04208493232727051, 0.15698851644992828, -0.18642622232437134, -0.5762456059455872], [0.04522470384836197, -0.03509852662682533, -0.19795113801956177, -0.34759992361068726], [0.0445227324962616, -0.22693544626235962, -0.20490312576293945, -0.12328223884105682], [0.039984025061130524, -0.029557397589087486, -0.20736877620220184, -0.4729766547679901], [0.0019082191865891218, -0.046380624175071716, 0.03479662910103798, 0.04208206757903099], [0.0009806066518649459, 0.14822551608085632, 0.035638272762298584, -0.23942230641841888], [0.003945116885006428, -0.04738694056868553, 0.030849825590848923, 0.064285509288311], [0.0029973783530294895, 0.14727942645549774, 0.03213553503155708, -0.21850669384002686], [0.005942966789007187, 0.3419276177883148, 0.02776540257036686, -0.5008820295333862], [0.012781519442796707, 0.1464255005121231, 0.01774776168167591, -0.1995798796415329], [0.015710029751062393, 0.3412891626358032, 0.013756164349615574, -0.4866117835044861], [0.022535813972353935, 0.5362143516540527, 0.004023928195238113, -0.7749276757240295], [0.033260099589824677, 0.3410372734069824, -0.011474626138806343, -0.4809814393520355], [0.04008084535598755, 0.1460791677236557, -0.02109425514936447, -0.19193698465824127], [0.043002430349588394, 0.34149643778800964, -0.024932993575930595, -0.49119892716407776], [0.049832358956336975, 0.14673489332199097, -0.03475697338581085, -0.20647695660591125], [0.052767056971788406, -0.04787324368953705, -0.03888651356101036, 0.07504244893789291], [0.05180959030985832, -0.24241676926612854, -0.03738566115498543, 0.3552073836326599], [0.04696125537157059, -0.4369877576828003, -0.030281515792012215, 0.6358711123466492], [0.03822150081396103, -0.24145685136318207, -0.017564093694090843, 0.3338077962398529], [0.03339236229658127, -0.046089380979537964, -0.010887937620282173, 0.03563821315765381], [0.03247057646512985, -0.2410535216331482, -0.010175173170864582, 0.32486608624458313], [0.02764950506389141, -0.4360291361808777, -0.003677851054817438, 0.6143229007720947], [0.018928922712802887, -0.24085597693920135, 0.008608607575297356, 0.32048389315605164], [0.014111802913248539, -0.04585767164826393, 0.015018284320831299, 0.03052816540002823], [0.01319464948028326, -0.24119172990322113, 0.01562884822487831, 0.3279114365577698], [0.008370814844965935, -0.4365326464176178, 0.02218707650899887, 0.6254817247390747], [-0.00035983853740617633, -0.6319571733474731, 0.03469671308994293, 0.9250688552856445], [-0.012998982332646847, -0.43732061982154846, 0.053198087960481644, 0.6434885263442993], [-0.02174539491534233, -0.24297890067100525, 0.06606785953044891, 0.368021160364151], [-0.026604972779750824, -0.43897438049316406, 0.07342828065156937, 0.6807827949523926], [-0.03538446128368378, -0.24494494497776031, 0.08704394102096558, 0.4120914340019226], [-0.040283359587192535, -0.05115779861807823, 0.09528576582670212, 0.148069828748703], [-0.0413065142929554, -0.24750594794750214, 0.09824716299772263, 0.46922767162323], [-0.04625663533806801, -0.05389918386936188, 0.10763171315193176, 0.20905621349811554], [-0.047334618866443634, -0.25038236379623413, 0.11181283742189407, 0.5336581468582153], [-0.05234226584434509, -0.05699579790234566, 0.12248600274324417, 0.27819424867630005], [-0.05348218232393265, 0.13618525862693787, 0.12804989516735077, 0.026514552533626556], [-0.0507584773004055, -0.060518309473991394, 0.12858018279075623, 0.35669809579849243], [-0.05196884274482727, -0.25721147656440735, 0.13571414351463318, 0.6870008111000061], [-0.05711307004094124, -0.45393016934394836, 0.14945416152477264, 1.0191431045532227], [-0.0661916732788086, -0.6506936550140381, 0.16983701288700104, 1.3547743558883667], [-0.07920555025339127, -0.8474907279014587, 0.19693250954151154, 1.6954151391983032], [-0.03062400035560131, 0.03386823460459709, 0.03472475707530975, 0.047242987900972366], [-0.02994663454592228, 0.22847549617290497, 0.03566961735486984, -0.2342848926782608], [-0.025377124547958374, 0.03286253660917282, 0.03098391927778721, 0.06943254172801971], [-0.024719875305891037, -0.16268961131572723, 0.032372571527957916, 0.3717277944087982], [-0.027973666787147522, -0.35825616121292114, 0.03980712592601776, 0.6744397878646851], [-0.03513878956437111, -0.5539080500602722, 0.05329592153429985, 0.9793853163719177], [-0.046216949820518494, -0.7497023940086365, 0.07288362830877304, 1.2883213758468628], [-0.061210997402668, -0.555579423904419, 0.09865006059408188, 1.0193188190460205], [-0.07232258468866348, -0.3619007170200348, 0.11903643608093262, 0.759169340133667], [-0.07956060022115707, -0.5584441423416138, 0.13421982526779175, 1.0868123769760132], [-0.0907294824719429, -0.7550561428070068, 0.15595607459545135, 1.4184201955795288], [-0.1058306097984314, -0.9517266154289246, 0.1843244731426239, 1.755510926246643], [0.047721315175294876, 0.028775136917829514, -0.024130048230290413, -0.046346478164196014], [0.048296816647052765, 0.22423464059829712, -0.025056978687644005, -0.34654393792152405], [0.05278151109814644, 0.419703871011734, -0.031987857073545456, -0.6470217108726501], [0.06117558851838112, 0.22504186630249023, -0.04492828994989395, -0.3645809292793274], [0.06567642092704773, 0.42077258229255676, -0.05221990868449211, -0.6710851788520813], [0.07409187406301498, 0.22641399502754211, -0.0656416118144989, -0.3952903747558594], [0.07862015813589096, 0.03228185325860977, -0.07354742288589478, -0.12400409579277039], [0.07926579564809799, 0.22837620973587036, -0.07602750509977341, -0.4389539062976837], [0.08383331447839737, 0.42448723316192627, -0.08480658382177353, -0.754601240158081], [0.09232306480407715, 0.6206695437431335, -0.09989860653877258, -1.0727204084396362], [0.10473645478487015, 0.8169598579406738, -0.12135301530361176, -1.3950092792510986], [0.12107565253973007, 1.0133647918701172, -0.14925320446491241, -1.723040223121643], [0.14134295284748077, 1.2098469734191895, -0.18371400237083435, -2.0582046508789062], [-0.01383152138441801, -0.035649556666612625, 0.022591322660446167, -0.04871153086423874], [-0.014544513076543808, -0.2310880422592163, 0.021617092192173004, 0.2510126829147339], [-0.01916627399623394, -0.036281343549489975, 0.026637345552444458, -0.03477416932582855], [-0.019891900941729546, 0.1584486961364746, 0.025941861793398857, -0.3189351558685303], [-0.01672292686998844, 0.3531917631626129, 0.019563158974051476, -0.6033254265785217], [-0.009659091010689735, 0.15780173242092133, 0.007496650796383619, -0.30454525351524353], [-0.006503056734800339, 0.35281604528427124, 0.0014057457447052002, -0.5948545336723328], [0.0005532640498131514, 0.15767444670200348, -0.010491344146430492, -0.30172911286354065], [0.003706753021106124, -0.037296414375305176, -0.01652592606842518, -0.012373306788504124], [0.002960824640467763, -0.2321775108575821, -0.016773393377661705, 0.27505001425743103], [-0.001682725502178073, -0.4270561933517456, -0.011272392235696316, 0.5623957514762878], [-0.01022384874522686, -0.6220181584358215, -2.447709812258836e-05, 0.8515061140060425], [-0.022664211690425873, -0.817139744758606, 0.017005644738674164, 1.1441813707351685], [-0.03900700807571411, -0.6222440600395203, 0.039889272302389145, 0.856879472732544], [-0.05145188793540001, -0.8178861141204834, 0.05702686309814453, 1.1618335247039795], [-0.06780961155891418, -1.0137025117874146, 0.08026353269815445, 1.4718375205993652], [-0.0880836620926857, -0.8196486234664917, 0.1097002774477005, 1.205265760421753], [-0.10447663813829422, -1.0160038471221924, 0.13380560278892517, 1.5302153825759888], [-0.12479671090841293, -1.2124613523483276, 0.16440990567207336, 1.861489176750183], [-0.1490459442138672, -1.0194799900054932, 0.20163968205451965, 1.624039649963379], [-0.02344769425690174, -0.0008192180539481342, -0.025171592831611633, 0.028134983032941818], [-0.023464078083634377, -0.19557131826877594, -0.02460889331996441, 0.31277093291282654], [-0.02737550437450409, -0.00010758837743196636, -0.018353473395109177, 0.012429819442331791], [-0.02737765572965145, -0.1949615776538849, -0.018104877322912216, 0.29926598072052], [-0.0312768891453743, -0.3898208439350128, -0.01211955863982439, 0.5861844420433044], [-0.03907330706715584, -0.19453126192092896, -0.000395869865315035, 0.2897084951400757], [-0.04296392947435379, -0.38964757323265076, 0.005398300010710955, 0.5822665691375732], [-0.05075688287615776, -0.584844708442688, 0.01704363152384758, 0.8766451478004456], [-0.062453776597976685, -0.7801941633224487, 0.03457653149962425, 1.1746371984481812], [-0.078057661652565, -0.5855381488800049, 0.05806927755475044, 0.892991304397583], [-0.0897684246301651, -0.3912498652935028, 0.07592910528182983, 0.6191128492355347], [-0.09759341925382614, -0.5873456597328186, 0.08831135928630829, 0.9347107410430908], [-0.10934033244848251, -0.3935187757015228, 0.10700557380914688, 0.6710332036018372], [-0.11721070855855942, -0.20003432035446167, 0.1204262375831604, 0.41386616230010986], [-0.12121139466762543, -0.006806789431720972, 0.12870356440544128, 0.161443829536438], [-0.12134753167629242, 0.18626022338867188, 0.13193243741989136, -0.0880269780755043], [-0.11762232333421707, -0.010481828823685646, 0.13017189502716064, 0.24319714307785034], [-0.11783196032047272, -0.2071996033191681, 0.13503584265708923, 0.573939859867096], [-0.12197595834732056, -0.40393054485321045, 0.1465146392583847, 0.9059298634529114], [-0.1300545632839203, -0.21106377243995667, 0.16463324427604675, 0.6626506447792053], [-0.13427583873271942, -0.40804702043533325, 0.1778862476348877, 1.0023140907287598], [-0.14243678748607635, -0.2156900018453598, 0.19793252646923065, 0.7703548669815063], [0.011439342051744461, 0.03256664425134659, 0.022343695163726807, 0.004964124411344528], [0.012090674601495266, -0.16286849975585938, 0.022442977875471115, 0.3046121597290039], [0.008833304978907108, -0.3583029806613922, 0.02853522077202797, 0.6042877435684204], [0.0016672450583428144, -0.5538121461868286, 0.04062097519636154, 0.9058203101158142], [-0.009408997371792793, -0.3592630624771118, 0.0587373822927475, 0.6261767148971558], [-0.016594259068369865, -0.5551536083221436, 0.07126091420650482, 0.936764657497406], [-0.027697332203388214, -0.7511604428291321, 0.08999621123075485, 1.2509616613388062], [-0.04272054135799408, -0.9473129510879517, 0.11501544713973999, 1.570422887802124], [-0.06166679784655571, -1.1436046361923218, 0.14642390608787537, 1.8966550827026367], [-0.08453889191150665, -1.3399786949157715, 0.18435700237751007, 2.230959177017212]], "actions": [0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.014116310514509678, -0.1908273547887802, -0.043197669088840485, 0.2902008891105652], [-0.01793285831809044, 0.004883083514869213, -0.03739364817738533, -0.015787094831466675], [-0.01783519610762596, -0.189683198928833, -0.03770939260721207, 0.2648671269416809], [-0.021628860384225845, 0.005956120323389769, -0.03241204842925072, -0.03946715220808983], [-0.021509738638997078, -0.18868641555309296, -0.033201392740011215, 0.24281582236289978], [-0.025283467024564743, 0.006893666461110115, -0.028345076367259026, -0.06015202775597572], [-0.02514559216797352, 0.20241032540798187, -0.02954811602830887, -0.361641526222229], [-0.02109738625586033, 0.007720548659563065, -0.036780945956707, -0.0784202367067337], [-0.02094297483563423, 0.20334993302822113, -0.03834935277700424, -0.3824770152568817], [-0.01687597669661045, 0.3989948332309723, -0.045998893678188324, -0.6870005130767822], [-0.008896080777049065, 0.5947240591049194, -0.059738900512456894, -0.9938027858734131], [0.002998401178047061, 0.7905921339988708, -0.07961495965719223, -1.3046334981918335], [0.018810244277119637, 0.9866282343864441, -0.10570763051509857, -1.621138334274292], [0.03854280710220337, 0.7928982973098755, -0.13813039660453796, -1.3631856441497803], [0.05440077558159828, 0.5997505784034729, -0.1653941124677658, -1.1167049407958984], [0.06639578938484192, 0.4071393311023712, -0.18772821128368378, -0.8801352381706238], [0.07453857362270355, 0.6042473912239075, -0.20533090829849243, -1.2254712581634521], [0.08662351965904236, 0.4122733175754547, -0.22984033823013306, -1.0035032033920288], [-0.01438714936375618, 0.23089958727359772, -0.00030681121279485524, -0.2926829159259796], [-0.009769157506525517, 0.03578201308846474, -0.006160469725728035, -9.677329944679514e-05], [-0.009053518064320087, 0.23099176585674286, -0.006162405014038086, -0.294717013835907], [-0.0044336821883916855, 0.4262010455131531, -0.01205674558877945, -0.5893371105194092], [0.004090338479727507, 0.6214897036552429, -0.023843487724661827, -0.8857934474945068], [0.01652013324201107, 0.8169271349906921, -0.041559357196092606, -1.1858755350112915], [0.032858673483133316, 0.6223680377006531, -0.0652768686413765, -0.9065038561820984], [0.04530603438615799, 0.4281877875328064, -0.08340694010257721, -0.6350315809249878], [0.05386979132890701, 0.23432214558124542, -0.09610757231712341, -0.3697372376918793], [0.05855623632669449, 0.04068771377205849, -0.1035023182630539, -0.10883810371160507], [0.05936998873949051, 0.2371288388967514, -0.10567907989025116, -0.4322982728481293], [0.06411256641149521, 0.43357595801353455, -0.11432504653930664, -0.7563368678092957], [0.07278408855199814, 0.24019980430603027, -0.12945178151130676, -0.5017045736312866], [0.07758808135986328, 0.0471174493432045, -0.13948588073253632, -0.25245699286460876], [0.07853043079376221, 0.2439269721508026, -0.14453501999378204, -0.5856800079345703], [0.08340896666049957, 0.4407460391521454, -0.15624861419200897, -0.9201757907867432], [0.0922238901257515, 0.6375951766967773, -0.1746521294116974, -1.2576029300689697], [0.10497579723596573, 0.8344681859016418, -0.1998041868209839, -1.5995069742202759], [0.12166515737771988, 0.642194926738739, -0.2317943274974823, -1.3751871585845947], [-0.03532912954688072, 0.16515925526618958, -0.015964766964316368, -0.262026846408844], [-0.03202594444155693, 0.3605054020881653, -0.021205302327871323, -0.5597021579742432], [-0.024815836921334267, 0.1656874120235443, -0.03239934518933296, -0.27377477288246155], [-0.021502088755369186, 0.36125630140304565, -0.037874843925237656, -0.5764979124069214], [-0.014276963658630848, 0.5568881034851074, -0.049404799938201904, -0.8808677196502686], [-0.0031392008531838655, 0.7526451349258423, -0.06702215224504471, -1.1886640787124634], [0.011913701891899109, 0.5584529042243958, -0.09079543501138687, -0.9177194833755493], [0.023082759231328964, 0.3646680414676666, -0.10914982855319977, -0.6548966765403748], [0.030376121401786804, 0.17122143507003784, -0.12224775552749634, -0.3984799087047577], [0.03380054980516434, -0.02197340875864029, -0.13021735846996307, -0.14670175313949585], [0.033361081033945084, -0.21501345932483673, -0.13315139710903168, 0.10223101824522018], [0.029060812667012215, -0.018259504809975624, -0.13110676407814026, -0.22931848466396332], [0.028695622459053993, 0.1784685105085373, -0.13569314777851105, -0.5603130459785461], [0.03226499259471893, -0.014514226466417313, -0.14689940214157104, -0.31327131390571594], [0.031974706798791885, 0.1823616474866867, -0.1531648337841034, -0.6484377384185791], [0.03562194108963013, -0.010332281701266766, -0.1661335825920105, -0.4076352119445801], [0.035415295511484146, 0.18670758605003357, -0.17428629100322723, -0.7477445006370544], [0.0391494482755661, 0.3837506175041199, -0.1892411708831787, -1.0898125171661377], [0.04682445898652077, 0.5807940363883972, -0.21103742718696594, -1.4354064464569092], [0.040878746658563614, 0.20212191343307495, 0.015117437578737736, -0.26994624733924866], [0.044921185821294785, 0.39702489972114563, 0.009718512184917927, -0.5578229427337646], [0.05286168307065964, 0.5920090675354004, -0.0014379468047991395, -0.8474282622337341], [0.0647018626332283, 0.3969067931175232, -0.018386511132121086, -0.5551978349685669], [0.07264000177383423, 0.5922819972038269, -0.02949046902358532, -0.85361647605896], [0.08448564261198044, 0.39757415652275085, -0.0465627983212471, -0.5703506469726562], [0.09243712574243546, 0.20313508808612823, -0.05796980857849121, -0.292692631483078], [0.09649982303380966, 0.008885509334504604, -0.06382366269826889, -0.01884131133556366], [0.09667753428220749, 0.20486195385456085, -0.0642004907131195, -0.33095887303352356], [0.10077477246522903, 0.010709813795983791, -0.0708196684718132, -0.05919261649250984], [0.10098896920681, 0.20677195489406586, -0.07200352102518082, -0.3733522295951843], [0.10512440651655197, 0.01274277176707983, -0.07947055995464325, -0.10421332716941833], [0.10537926852703094, 0.208908349275589, -0.0815548300743103, -0.4208727777004242], [0.10955743491649628, 0.015030905604362488, -0.08997228741645813, -0.15497374534606934], [0.10985805094242096, 0.21131817996501923, -0.09307175874710083, -0.4746299386024475], [0.11408441513776779, 0.40762272477149963, -0.10256435722112656, -0.7951359748840332], [0.12223687022924423, 0.6039915680885315, -0.11846707761287689, -1.1182423830032349], [0.13431669771671295, 0.8004516363143921, -0.14083191752433777, -1.4456149339675903], [0.1503257304430008, 0.6073150634765625, -0.16974422335624695, -1.2000460624694824], [0.16247203946113586, 0.8041765093803406, -0.19374515116214752, -1.540759801864624], [0.17855556309223175, 0.6118398904800415, -0.22456033527851105, -1.3142582178115845], [-0.0442686602473259, 0.1468321979045868, -0.027877066284418106, -0.3430420458316803], [-0.04133201390504837, 0.342339426279068, -0.034737907350063324, -0.6443837285041809], [-0.03448522835969925, 0.5379278659820557, -0.047625582665205, -0.9478002190589905], [-0.02372667007148266, 0.7336575984954834, -0.06658158451318741, -1.2550586462020874], [-0.009053518064320087, 0.9295659065246582, -0.09168276190757751, -1.5678304433822632], [0.009537800215184689, 0.7356508374214172, -0.1230393648147583, -1.3050965070724487], [0.0242508165538311, 0.5422848463058472, -0.14914129674434662, -1.053322672843933], [0.03509651497006416, 0.3494209945201874, -0.17020775377750397, -0.8109234571456909], [0.04208493232727051, 0.15698851644992828, -0.18642622232437134, -0.5762456059455872], [0.04522470384836197, -0.03509852662682533, -0.19795113801956177, -0.34759992361068726], [0.0445227324962616, -0.22693544626235962, -0.20490312576293945, -0.12328223884105682], [0.039984025061130524, -0.029557397589087486, -0.20736877620220184, -0.4729766547679901], [0.039392877370119095, 0.16779693961143494, -0.21682830154895782, -0.8231964111328125], [0.0009806066518649459, 0.14822551608085632, 0.035638272762298584, -0.23942230641841888], [0.003945116885006428, -0.04738694056868553, 0.030849825590848923, 0.064285509288311], [0.0029973783530294895, 0.14727942645549774, 0.03213553503155708, -0.21850669384002686], [0.005942966789007187, 0.3419276177883148, 0.02776540257036686, -0.5008820295333862], [0.012781519442796707, 0.1464255005121231, 0.01774776168167591, -0.1995798796415329], [0.015710029751062393, 0.3412891626358032, 0.013756164349615574, -0.4866117835044861], [0.022535813972353935, 0.5362143516540527, 0.004023928195238113, -0.7749276757240295], [0.033260099589824677, 0.3410372734069824, -0.011474626138806343, -0.4809814393520355], [0.04008084535598755, 0.1460791677236557, -0.02109425514936447, -0.19193698465824127], [0.043002430349588394, 0.34149643778800964, -0.024932993575930595, -0.49119892716407776], [0.049832358956336975, 0.14673489332199097, -0.03475697338581085, -0.20647695660591125], [0.052767056971788406, -0.04787324368953705, -0.03888651356101036, 0.07504244893789291], [0.05180959030985832, -0.24241676926612854, -0.03738566115498543, 0.3552073836326599], [0.04696125537157059, -0.4369877576828003, -0.030281515792012215, 0.6358711123466492], [0.03822150081396103, -0.24145685136318207, -0.017564093694090843, 0.3338077962398529], [0.03339236229658127, -0.046089380979537964, -0.010887937620282173, 0.03563821315765381], [0.03247057646512985, -0.2410535216331482, -0.010175173170864582, 0.32486608624458313], [0.02764950506389141, -0.4360291361808777, -0.003677851054817438, 0.6143229007720947], [0.018928922712802887, -0.24085597693920135, 0.008608607575297356, 0.32048389315605164], [0.014111802913248539, -0.04585767164826393, 0.015018284320831299, 0.03052816540002823], [0.01319464948028326, -0.24119172990322113, 0.01562884822487831, 0.3279114365577698], [0.008370814844965935, -0.4365326464176178, 0.02218707650899887, 0.6254817247390747], [-0.00035983853740617633, -0.6319571733474731, 0.03469671308994293, 0.9250688552856445], [-0.012998982332646847, -0.43732061982154846, 0.053198087960481644, 0.6434885263442993], [-0.02174539491534233, -0.24297890067100525, 0.06606785953044891, 0.368021160364151], [-0.026604972779750824, -0.43897438049316406, 0.07342828065156937, 0.6807827949523926], [-0.03538446128368378, -0.24494494497776031, 0.08704394102096558, 0.4120914340019226], [-0.040283359587192535, -0.05115779861807823, 0.09528576582670212, 0.148069828748703], [-0.0413065142929554, -0.24750594794750214, 0.09824716299772263, 0.46922767162323], [-0.04625663533806801, -0.05389918386936188, 0.10763171315193176, 0.20905621349811554], [-0.047334618866443634, -0.25038236379623413, 0.11181283742189407, 0.5336581468582153], [-0.05234226584434509, -0.05699579790234566, 0.12248600274324417, 0.27819424867630005], [-0.05348218232393265, 0.13618525862693787, 0.12804989516735077, 0.026514552533626556], [-0.0507584773004055, -0.060518309473991394, 0.12858018279075623, 0.35669809579849243], [-0.05196884274482727, -0.25721147656440735, 0.13571414351463318, 0.6870008111000061], [-0.05711307004094124, -0.45393016934394836, 0.14945416152477264, 1.0191431045532227], [-0.0661916732788086, -0.6506936550140381, 0.16983701288700104, 1.3547743558883667], [-0.07920555025339127, -0.8474907279014587, 0.19693250954151154, 1.6954151391983032], [-0.09615536034107208, -0.6551108360290527, 0.23084081709384918, 1.4699475765228271], [-0.02994663454592228, 0.22847549617290497, 0.03566961735486984, -0.2342848926782608], [-0.025377124547958374, 0.03286253660917282, 0.03098391927778721, 0.06943254172801971], [-0.024719875305891037, -0.16268961131572723, 0.032372571527957916, 0.3717277944087982], [-0.027973666787147522, -0.35825616121292114, 0.03980712592601776, 0.6744397878646851], [-0.03513878956437111, -0.5539080500602722, 0.05329592153429985, 0.9793853163719177], [-0.046216949820518494, -0.7497023940086365, 0.07288362830877304, 1.2883213758468628], [-0.061210997402668, -0.555579423904419, 0.09865006059408188, 1.0193188190460205], [-0.07232258468866348, -0.3619007170200348, 0.11903643608093262, 0.759169340133667], [-0.07956060022115707, -0.5584441423416138, 0.13421982526779175, 1.0868123769760132], [-0.0907294824719429, -0.7550561428070068, 0.15595607459545135, 1.4184201955795288], [-0.1058306097984314, -0.9517266154289246, 0.1843244731426239, 1.755510926246643], [-0.12486513704061508, -1.1483980417251587, 0.2194346934556961, 2.0994057655334473], [0.048296816647052765, 0.22423464059829712, -0.025056978687644005, -0.34654393792152405], [0.05278151109814644, 0.419703871011734, -0.031987857073545456, -0.6470217108726501], [0.06117558851838112, 0.22504186630249023, -0.04492828994989395, -0.3645809292793274], [0.06567642092704773, 0.42077258229255676, -0.05221990868449211, -0.6710851788520813], [0.07409187406301498, 0.22641399502754211, -0.0656416118144989, -0.3952903747558594], [0.07862015813589096, 0.03228185325860977, -0.07354742288589478, -0.12400409579277039], [0.07926579564809799, 0.22837620973587036, -0.07602750509977341, -0.4389539062976837], [0.08383331447839737, 0.42448723316192627, -0.08480658382177353, -0.754601240158081], [0.09232306480407715, 0.6206695437431335, -0.09989860653877258, -1.0727204084396362], [0.10473645478487015, 0.8169598579406738, -0.12135301530361176, -1.3950092792510986], [0.12107565253973007, 1.0133647918701172, -0.14925320446491241, -1.723040223121643], [0.14134295284748077, 1.2098469734191895, -0.18371400237083435, -2.0582046508789062], [0.16553989052772522, 1.406309962272644, -0.22487810254096985, -2.401648759841919], [-0.014544513076543808, -0.2310880422592163, 0.021617092192173004, 0.2510126829147339], [-0.01916627399623394, -0.036281343549489975, 0.026637345552444458, -0.03477416932582855], [-0.019891900941729546, 0.1584486961364746, 0.025941861793398857, -0.3189351558685303], [-0.01672292686998844, 0.3531917631626129, 0.019563158974051476, -0.6033254265785217], [-0.009659091010689735, 0.15780173242092133, 0.007496650796383619, -0.30454525351524353], [-0.006503056734800339, 0.35281604528427124, 0.0014057457447052002, -0.5948545336723328], [0.0005532640498131514, 0.15767444670200348, -0.010491344146430492, -0.30172911286354065], [0.003706753021106124, -0.037296414375305176, -0.01652592606842518, -0.012373306788504124], [0.002960824640467763, -0.2321775108575821, -0.016773393377661705, 0.27505001425743103], [-0.001682725502178073, -0.4270561933517456, -0.011272392235696316, 0.5623957514762878], [-0.01022384874522686, -0.6220181584358215, -2.447709812258836e-05, 0.8515061140060425], [-0.022664211690425873, -0.817139744758606, 0.017005644738674164, 1.1441813707351685], [-0.03900700807571411, -0.6222440600395203, 0.039889272302389145, 0.856879472732544], [-0.05145188793540001, -0.8178861141204834, 0.05702686309814453, 1.1618335247039795], [-0.06780961155891418, -1.0137025117874146, 0.08026353269815445, 1.4718375205993652], [-0.0880836620926857, -0.8196486234664917, 0.1097002774477005, 1.205265760421753], [-0.10447663813829422, -1.0160038471221924, 0.13380560278892517, 1.5302153825759888], [-0.12479671090841293, -1.2124613523483276, 0.16440990567207336, 1.861489176750183], [-0.1490459442138672, -1.0194799900054932, 0.20163968205451965, 1.624039649963379], [-0.1694355309009552, -1.216322898864746, 0.2341204732656479, 1.972203016281128], [-0.023464078083634377, -0.19557131826877594, -0.02460889331996441, 0.31277093291282654], [-0.02737550437450409, -0.00010758837743196636, -0.018353473395109177, 0.012429819442331791], [-0.02737765572965145, -0.1949615776538849, -0.018104877322912216, 0.29926598072052], [-0.0312768891453743, -0.3898208439350128, -0.01211955863982439, 0.5861844420433044], [-0.03907330706715584, -0.19453126192092896, -0.000395869865315035, 0.2897084951400757], [-0.04296392947435379, -0.38964757323265076, 0.005398300010710955, 0.5822665691375732], [-0.05075688287615776, -0.584844708442688, 0.01704363152384758, 0.8766451478004456], [-0.062453776597976685, -0.7801941633224487, 0.03457653149962425, 1.1746371984481812], [-0.078057661652565, -0.5855381488800049, 0.05806927755475044, 0.892991304397583], [-0.0897684246301651, -0.3912498652935028, 0.07592910528182983, 0.6191128492355347], [-0.09759341925382614, -0.5873456597328186, 0.08831135928630829, 0.9347107410430908], [-0.10934033244848251, -0.3935187757015228, 0.10700557380914688, 0.6710332036018372], [-0.11721070855855942, -0.20003432035446167, 0.1204262375831604, 0.41386616230010986], [-0.12121139466762543, -0.006806789431720972, 0.12870356440544128, 0.161443829536438], [-0.12134753167629242, 0.18626022338867188, 0.13193243741989136, -0.0880269780755043], [-0.11762232333421707, -0.010481828823685646, 0.13017189502716064, 0.24319714307785034], [-0.11783196032047272, -0.2071996033191681, 0.13503584265708923, 0.573939859867096], [-0.12197595834732056, -0.40393054485321045, 0.1465146392583847, 0.9059298634529114], [-0.1300545632839203, -0.21106377243995667, 0.16463324427604675, 0.6626506447792053], [-0.13427583873271942, -0.40804702043533325, 0.1778862476348877, 1.0023140907287598], [-0.14243678748607635, -0.2156900018453598, 0.19793252646923065, 0.7703548669815063], [-0.1467505842447281, -0.02376232109963894, 0.21333962678909302, 0.5458973050117493], [0.012090674601495266, -0.16286849975585938, 0.022442977875471115, 0.3046121597290039], [0.008833304978907108, -0.3583029806613922, 0.02853522077202797, 0.6042877435684204], [0.0016672450583428144, -0.5538121461868286, 0.04062097519636154, 0.9058203101158142], [-0.009408997371792793, -0.3592630624771118, 0.0587373822927475, 0.6261767148971558], [-0.016594259068369865, -0.5551536083221436, 0.07126091420650482, 0.936764657497406], [-0.027697332203388214, -0.7511604428291321, 0.08999621123075485, 1.2509616613388062], [-0.04272054135799408, -0.9473129510879517, 0.11501544713973999, 1.570422887802124], [-0.06166679784655571, -1.1436046361923218, 0.14642390608787537, 1.8966550827026367], [-0.08453889191150665, -1.3399786949157715, 0.18435700237751007, 2.230959177017212], [-0.11133846640586853, -1.536312222480774, 0.22897619009017944, 2.5743632316589355]], "action_prob": [0.5000669360160828, 0.5005732774734497, 0.5000888109207153, 0.5005590319633484, 0.5001078844070435, 0.5005459189414978, 0.4998753070831299, 0.5007645487785339, 0.49983054399490356, 0.499195396900177, 0.4987909495830536, 0.4985875189304352, 0.49848881363868713, 0.5015701651573181, 0.5016130208969116, 0.5016245245933533, 0.49843457341194153, 0.5017023682594299, 0.49995163083076477, 0.5006906390190125, 0.4999353885650635, 0.4992917478084564, 0.49886131286621094, 0.498639315366745, 0.5014662742614746, 0.501447319984436, 0.501319944858551, 0.5010002255439758, 0.4995422065258026, 0.49892377853393555, 0.5014312863349915, 0.5011831521987915, 0.49927929043769836, 0.49872931838035583, 0.49844375252723694, 0.4983188509941101, 0.5017423629760742, 0.5000908374786377, 0.49941927194595337, 0.5010615587234497, 0.49936580657958984, 0.49889078736305237, 0.4986400902271271, 0.5014790892601013, 0.5014498829841614, 0.5013077259063721, 0.5009752511978149, 0.5004327893257141, 0.5001922249794006, 0.4994652271270752, 0.5011308193206787, 0.4993336796760559, 0.5012220144271851, 0.49919411540031433, 0.49868521094322205, 0.4984181523323059, 0.5000078082084656, 0.49935615062713623, 0.49889853596687317, 0.5013450384140015, 0.498835951089859, 0.5014036297798157, 0.501236081123352, 0.5008480548858643, 0.4997563660144806, 0.5009019374847412, 0.49968501925468445, 0.5009607672691345, 0.4996050000190735, 0.5010248422622681, 0.4995152950286865, 0.49890556931495667, 0.49855250120162964, 0.49839192628860474, 0.501680314540863, 0.49829524755477905, 0.5017669796943665, 0.5000087022781372, 0.49934685230255127, 0.4988928735256195, 0.49865174293518066, 0.4985322952270508, 0.5015366077423096, 0.5015692114830017, 0.501560389995575, 0.5014634728431702, 0.5012142658233643, 0.50077223777771, 0.4998064339160919, 0.4990893602371216, 0.5001992583274841, 0.500461220741272, 0.5002195239067078, 0.4995550215244293, 0.5009539127349854, 0.49954161047935486, 0.4990231692790985, 0.5012715458869934, 0.5010321140289307, 0.4994529187679291, 0.5010708570480347, 0.5005987882614136, 0.4999448359012604, 0.49933838844299316, 0.5010614395141602, 0.5006896257400513, 0.49992603063583374, 0.49930036067962646, 0.5011119246482849, 0.5007420182228088, 0.4998655915260315, 0.4992327094078064, 0.49882328510284424, 0.5013836026191711, 0.5012539625167847, 0.4990718960762024, 0.5013137459754944, 0.5010165572166443, 0.4995078444480896, 0.50108802318573, 0.499402791261673, 0.5011643171310425, 0.5007124543190002, 0.499900221824646, 0.4991908669471741, 0.4986979365348816, 0.49844735860824585, 0.498331218957901, 0.5017327070236206, 0.500097393989563, 0.5005472898483276, 0.4998844265937805, 0.4992324709892273, 0.49880021810531616, 0.4985787272453308, 0.5015271902084351, 0.5015139579772949, 0.49859780073165894, 0.49841195344924927, 0.49832725524902344, 0.4982772767543793, 0.49980616569519043, 0.4991697371006012, 0.5012391805648804, 0.4991050362586975, 0.5012935996055603, 0.500971794128418, 0.4995806813240051, 0.4989672303199768, 0.4986065924167633, 0.4984404444694519, 0.49836552143096924, 0.4983207583427429, 0.49828189611434937, 0.49994608759880066, 0.5007141828536987, 0.5000851154327393, 0.4994376599788666, 0.5010216236114502, 0.49940943717956543, 0.5010565519332886, 0.5006304383277893, 0.4999893009662628, 0.49934789538383484, 0.49890846014022827, 0.4986761808395386, 0.5014357566833496, 0.498593270778656, 0.4984905421733856, 0.501563549041748, 0.4983966052532196, 0.4983530044555664, 0.5016811490058899, 0.4982524812221527, 0.4999942481517792, 0.5006458163261414, 0.49999871850013733, 0.49935293197631836, 0.5010954141616821, 0.4993198812007904, 0.49886733293533325, 0.4986300468444824, 0.501481294631958, 0.5014550089836121, 0.49869173765182495, 0.5015209317207336, 0.5013983249664307, 0.5010881423950195, 0.5005631446838379, 0.5000594258308411, 0.4993364214897156, 0.4987615942955017, 0.5015497803688049, 0.4986477196216583, 0.5016275644302368, 0.5014687776565552, 0.5000126957893372, 0.49934667348861694, 0.498883992433548, 0.5013602375984192, 0.49880552291870117, 0.49857330322265625, 0.4984651505947113, 0.4984056055545807, 0.4983595013618469, 0.4983154237270355], "advantages": [16.548593521118164, 15.708296775817871, 14.853951454162598, 13.996578216552734, 13.124938011169434, 12.250131607055664, 11.360848426818848, 10.462762832641602, 9.560944557189941, 8.644686698913574, 7.719914436340332, 6.786563396453857, 5.844343185424805, 4.892965316772461, 3.9325332641601562, 2.962611675262451, 1.983189582824707, 0.9921531081199646, 17.383081436157227, 16.545822143554688, 15.70561408996582, 14.851396560668945, 13.989177703857422, 13.11898422241211, 12.240577697753906, 11.3549165725708, 10.460785865783691, 9.558209419250488, 8.647043228149414, 7.721452713012695, 6.787357807159424, 5.8473615646362305, 4.898414134979248, 3.9351861476898193, 2.9631731510162354, 1.98210608959198, 0.9916216731071472, 17.383407592773438, 16.54606056213379, 15.700847625732422, 14.851531982421875, 13.989197731018066, 13.118938446044922, 12.240513801574707, 11.35481071472168, 10.460613250732422, 9.557943344116211, 8.646668434143066, 7.726369380950928, 6.791123867034912, 5.846968173980713, 4.897911071777344, 3.9348092079162598, 2.966228723526001, 1.983832836151123, 0.9924691319465637, 19.027462005615234, 18.20680809020996, 17.3784122467041, 16.5423526763916, 15.700919151306152, 14.847867965698242, 13.989251136779785, 13.122599601745605, 12.247672080993652, 11.358366012573242, 10.465563774108887, 9.55828857421875, 8.647233009338379, 7.7216362953186035, 6.791938304901123, 5.847664833068848, 4.894689559936523, 3.9328808784484863, 2.961914539337158, 1.9821423292160034, 0.9915592074394226, 12.247437477111816, 11.358269691467285, 10.460808753967285, 9.555057525634766, 8.64074420928955, 7.717578411102295, 6.7857279777526855, 5.844707489013672, 4.8945231437683105, 3.935187339782715, 2.9666502475738525, 1.9886751174926758, 0.9955840110778809, 32.42761993408203, 31.74234962463379, 31.05581283569336, 30.356660842895508, 29.650907516479492, 28.942798614501953, 28.22269630432129, 27.49602699279785, 26.765405654907227, 26.02808380126953, 25.2784366607666, 24.526042938232422, 23.766429901123047, 22.99893569946289, 22.223051071166992, 21.435302734375, 20.638959884643555, 19.839998245239258, 19.032323837280273, 18.212360382080078, 17.383522033691406, 16.551748275756836, 15.710901260375977, 14.860821723937988, 13.999545097351074, 13.128947257995605, 12.253523826599121, 11.365415573120117, 10.467769622802734, 9.566134452819824, 8.650437355041504, 7.730342864990234, 6.796253204345703, 5.85235071182251, 4.904443740844727, 3.946194887161255, 2.9773497581481934, 1.998039722442627, 1.0084166526794434, 11.361961364746094, 10.463930130004883, 9.5624418258667, 8.65170669555664, 7.731070041656494, 6.800365924835205, 5.859682083129883, 4.908125877380371, 3.946549415588379, 2.9775192737579346, 1.99810791015625, 1.008436918258667, 12.247442245483398, 11.358282089233398, 10.460816383361816, 9.558382034301758, 8.642738342285156, 7.721839904785156, 6.79220724105835, 5.847942352294922, 4.894941806793213, 3.933096408843994, 2.9620938301086426, 1.9816386699676514, 0.9914913177490234, 18.208938598632812, 17.385616302490234, 16.54838752746582, 15.702773094177246, 14.849209785461426, 13.991338729858398, 13.120423316955566, 12.245060920715332, 11.36139965057373, 10.468778610229492, 9.56656265258789, 8.654529571533203, 7.732716083526611, 6.799818515777588, 5.859298229217529, 4.908857822418213, 3.947934865951538, 2.9781646728515625, 1.9983237981796265, 1.0083366632461548, 19.83710289001465, 19.03005599975586, 18.209335327148438, 17.385881423950195, 16.553529739379883, 15.70837688446045, 14.859138488769531, 14.000593185424805, 13.132786750793457, 12.254478454589844, 11.366793632507324, 10.47298812866211, 9.567444801330566, 8.652199745178223, 7.727199077606201, 6.792670249938965, 5.854387283325195, 4.906095027923584, 3.9472954273223877, 2.975817918777466, 1.9973341226577759, 1.0063831806182861, 9.561878204345703, 8.651180267333984, 7.730645179748535, 6.800041675567627, 5.857285976409912, 4.907748699188232, 3.948000431060791, 2.9781527519226074, 1.9982625246047974, 1.0083345174789429], "value_targets": [16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 70774560, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 825865911, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 882575134, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 274608080, 491321481, 491321481, 491321481, 491321481, 491321481, 491321481, 491321481, 491321481, 491321481, 491321481, 491321481, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 315217980, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1172250884, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1688245362, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1798773449, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995, 1867501995], "obs": [[-0.00091463269200176, 0.03423618897795677, 0.01201606448739767, 0.03835877776145935], [-0.00022990892466623336, -0.16105599701404572, 0.012783240526914597, 0.3348085284233093], [-0.0034510288387537003, -0.35635751485824585, 0.019479410722851753, 0.6314950585365295], [-0.01057817880064249, -0.16151268780231476, 0.03210931271314621, 0.34500986337661743], [-0.013808432966470718, 0.033138126134872437, 0.03900951147079468, 0.06262264400720596], [-0.013145670294761658, -0.16252078115940094, 0.04026196151971817, 0.367353618144989], [-0.016396086663007736, -0.35819104313850403, 0.047609034925699234, 0.6724549531936646], [-0.02355990745127201, -0.5539413094520569, 0.06105813384056091, 0.9797394275665283], [-0.03463873267173767, -0.3596886098384857, 0.08065292239189148, 0.7068433165550232], [-0.04183250665664673, -0.5558298230171204, 0.0947897881269455, 1.0237849950790405], [-0.052949100732803345, -0.3620893657207489, 0.11526548862457275, 0.7623053789138794], [-0.06019088998436928, -0.1687278300523758, 0.1305115967988968, 0.5080007910728455], [-0.0635654479265213, -0.3654237985610962, 0.14067161083221436, 0.8387970924377441], [-0.07087392359972, -0.17247407138347626, 0.15744756162166595, 0.5934526324272156], [-0.07432340085506439, 0.02013436146080494, 0.1693166047334671, 0.3542121648788452], [-0.07392071932554245, 0.21249516308307648, 0.17640085518360138, 0.11933863908052444], [-0.06967081129550934, 0.40470874309539795, 0.17878761887550354, -0.11291416734457016], [-0.061576638370752335, 0.2075354903936386, 0.17652933299541473, 0.23041526973247528], [-0.05742592737078667, 0.010388102382421494, 0.18113765120506287, 0.573171079158783], [-0.05721816420555115, 0.2025700956583023, 0.1926010698080063, 0.34257814288139343], [-0.05316676199436188, 0.005304535385221243, 0.19945262372493744, 0.6892805099487305], [-0.011392524465918541, 0.012708257883787155, 0.021807152777910233, 0.00696406839415431], [-0.01113835908472538, -0.18271954357624054, 0.021946433931589127, 0.3064468502998352], [-0.014792749658226967, -0.3781472444534302, 0.02807537093758583, 0.6059695482254028], [-0.022355694323778152, -0.18342888355255127, 0.040194761008024216, 0.32226020097732544], [-0.02602427266538143, -0.3790994882583618, 0.04663996770977974, 0.6273431181907654], [-0.033606261014938354, -0.1846584677696228, 0.05918682739138603, 0.34970593452453613], [-0.03729943186044693, 0.009573966264724731, 0.06618094444274902, 0.07625821232795715], [-0.03710795193910599, -0.18643124401569366, 0.06770610809326172, 0.3890654146671295], [-0.040836576372385025, 0.007667649071663618, 0.075487419962883, 0.11847452074289322], [-0.04068322479724884, -0.1884501427412033, 0.07785691320896149, 0.4339856803417206], [-0.044452227652072906, 0.005488177295774221, 0.08653662353754044, 0.1668262630701065], [-0.044342461973428726, 0.19927167892456055, 0.08987314999103546, -0.09735127538442612], [-0.04035703092813492, 0.39299827814102173, 0.08792611956596375, -0.36038124561309814], [-0.032497063279151917, 0.5867675542831421, 0.080718494951725, -0.6240953207015991], [-0.02076171338558197, 0.7806752920150757, 0.0682365894317627, -0.890304446220398], [-0.005148207303136587, 0.5846971273422241, 0.050430502742528915, -0.576975405216217], [0.006545735523104668, 0.38890594244003296, 0.03889099508523941, -0.2688416838645935], [0.014323854818940163, 0.19325119256973267, 0.03351416066288948, 0.03584960848093033], [0.018188878893852234, -0.0023349265102297068, 0.03423115238547325, 0.3389153778553009], [0.018142180517315865, -0.1979268193244934, 0.041009459644556046, 0.6421933174133301], [0.014183643274009228, -0.39359569549560547, 0.05385332554578781, 0.9475032687187195], [0.006311730016022921, -0.5893998146057129, 0.07280339300632477, 1.2566088438034058], [-0.005476266611367464, -0.3952813744544983, 0.09793557226657867, 0.9875878691673279], [-0.013381894677877426, -0.20159746706485748, 0.11768732964992523, 0.7272011637687683], [-0.017413843423128128, -0.008282216265797615, 0.13223135471343994, 0.4737543761730194], [-0.017579488456249237, 0.18474870920181274, 0.1417064368724823, 0.2254984825849533], [-0.013884513638913631, 0.3775910437107086, 0.14621640741825104, -0.019343148916959763], [-0.00633269315585494, 0.18070773780345917, 0.14582954347133636, 0.3156651258468628], [-0.0027185382787138224, -0.016157792881131172, 0.15214285254478455, 0.6505511403083801], [-0.003041693940758705, -0.2130347192287445, 0.1651538759469986, 0.9870128035545349], [-0.007302388548851013, -0.02046307362616062, 0.1848941296339035, 0.7504206299781799], [-0.007711649872362614, -0.2175881564617157, 0.19990253448486328, 1.0951181650161743], [-0.03296623006463051, -0.04057500511407852, 0.010318961925804615, 0.03681466728448868], [-0.03377773240208626, 0.15439745783805847, 0.011055255308747292, -0.2525947391986847], [-0.03068978153169155, 0.34935981035232544, 0.006003360729664564, -0.5417702198028564], [-0.023702586069703102, 0.15415401756763458, -0.004832043778151274, -0.2472018152475357], [-0.020619504153728485, 0.3493446409702301, -0.009776080027222633, -0.5414049625396729], [-0.01363261230289936, 0.544602632522583, -0.020604180172085762, -0.8371520638465881], [-0.0027405598666518927, 0.7399998307228088, -0.0373472198843956, -1.1362428665161133], [0.012059437111020088, 0.5453858375549316, -0.060072075575590134, -0.8555029034614563], [0.022967152297496796, 0.3511316776275635, -0.07718213647603989, -0.5822978615760803], [0.029989786446094513, 0.5472453236579895, -0.08882809430360794, -0.8982616066932678], [0.040934693068265915, 0.743451714515686, -0.10679332911968231, -1.2174919843673706], [0.055803727358579636, 0.5498564839363098, -0.13114316761493683, -0.9600911140441895], [0.06680085510015488, 0.35671791434288025, -0.15034498274326324, -0.7113165855407715], [0.07393521815538406, 0.5535666346549988, -0.16457131505012512, -1.0472939014434814], [0.08500654995441437, 0.7504444122314453, -0.18551719188690186, -1.3867863416671753], [0.04066140949726105, 0.015569309704005718, 0.04847016930580139, -0.020681651309132576], [0.04097279533743858, 0.2099638432264328, 0.04805653542280197, -0.2976863384246826], [0.0451720729470253, 0.4043689966201782, 0.04210280999541283, -0.5748342275619507], [0.05325945466756821, 0.2086828649044037, 0.03060612641274929, -0.26919057965278625], [0.0574331097304821, 0.4033549726009369, 0.02522231452167034, -0.5520651936531067], [0.06550020724534988, 0.5981137752532959, 0.01418101042509079, -0.8366959095001221], [0.07746248692274094, 0.7930392026901245, -0.002552908379584551, -1.1248855590820312], [0.09332326799631119, 0.9881945252418518, -0.02505061961710453, -1.4183682203292847], [0.11308716237545013, 1.1836174726486206, -0.053417984396219254, -1.718774676322937], [0.13675950467586517, 0.9891468286514282, -0.08779347687959671, -1.4431822299957275], [0.15654245018959045, 1.1852328777313232, -0.11665712296962738, -1.761956810951233], [0.18024709820747375, 0.9916082620620728, -0.15189625322818756, -1.5077131986618042], [0.2000792771577835, 1.188210368156433, -0.18205052614212036, -1.8437068462371826], [-0.022016160190105438, -0.03953339904546738, 0.0190452728420496, 0.012752422131597996], [-0.02280682884156704, 0.15531031787395477, 0.019300322979688644, -0.2738611698150635], [-0.01970062218606472, 0.3501516282558441, 0.013823098503053188, -0.5603947639465332], [-0.01269758865237236, 0.5450769066810608, 0.0026152029167860746, -0.8486908674240112], [-0.0017960512777790427, 0.7401630878448486, -0.014358614571392536, -1.1405502557754517], [0.013007209636271, 0.5452317595481873, -0.037169620394706726, -0.8524047136306763], [0.023911844938993454, 0.7408401370048523, -0.05421771481633186, -1.156540036201477], [0.03872864693403244, 0.9366253614425659, -0.07734851539134979, -1.4657185077667236], [0.05746115371584892, 1.1326045989990234, -0.10666288435459137, -1.7815262079238892], [0.0801132470369339, 1.3287523984909058, -0.14229340851306915, -2.105375289916992], [0.10668829083442688, 1.1353150606155396, -0.18440091609954834, -1.8598449230194092], [-0.01675986684858799, -0.010181896388530731, 0.03850333392620087, -0.04938904941082001], [-0.016963506117463112, 0.18436740338802338, 0.0375155545771122, -0.3296795189380646], [-0.013276156969368458, -0.011267955414950848, 0.03092196397483349, -0.02540598250925541], [-0.013501516543328762, -0.20681940019130707, 0.03041384369134903, 0.2768705487251282], [-0.01763790473341942, -0.40236175060272217, 0.03595125675201416, 0.5789887309074402], [-0.025685139000415802, -0.597968578338623, 0.04753103107213974, 0.8827767968177795], [-0.037644512951374054, -0.4035232961177826, 0.06518656760454178, 0.6054071187973022], [-0.045714978128671646, -0.20937055349349976, 0.07729470729827881, 0.3339478075504303], [-0.04990238696336746, -0.40550264716148376, 0.08397366106510162, 0.6499695777893066], [-0.05801244080066681, -0.21164456009864807, 0.09697305411100388, 0.3848663568496704], [-0.06224533170461655, -0.018023459240794182, 0.10467038303613663, 0.12426463514566422], [-0.06260579824447632, -0.21447710692882538, 0.10715567320585251, 0.44804927706718445], [-0.06689534336328506, -0.41093870997428894, 0.11611665785312653, 0.772494912147522], [-0.07511411607265472, -0.21758955717086792, 0.13156655430793762, 0.5184858441352844], [-0.07946591079235077, -0.414294570684433, 0.1419362723827362, 0.849562406539917], [-0.08775179833173752, -0.6110371947288513, 0.1589275300502777, 1.1832979917526245], [-0.09997254610061646, -0.4182933270931244, 0.1825934797525406, 0.9443539977073669], [-0.10833840817213058, -0.22603805363178253, 0.20148056745529175, 0.7141498327255249], [0.03634027764201164, 0.007280356250703335, -0.0425717756152153, 0.0034441109746694565], [0.03648588806390762, 0.20298618078231812, -0.04250289499759674, -0.3023609519004822], [0.04054560884833336, 0.008494946174323559, -0.048550114035606384, -0.023379679769277573], [0.04071550816297531, -0.18589834868907928, -0.049017708748579025, 0.25359854102134705], [0.03699754178524017, 0.009887998923659325, -0.043945737183094025, -0.054133664816617966], [0.03719530254602432, 0.20561161637306213, -0.045028410851955414, -0.3603515326976776], [0.04130753502249718, 0.011157696135342121, -0.0522354394197464, -0.08220018446445465], [0.04153068736195564, 0.20698800683021545, -0.05387944355607033, -0.3908952474594116], [0.04567044973373413, 0.012670484371483326, -0.061697348952293396, -0.11567481607198715], [0.045923858880996704, -0.1815156638622284, -0.06401084363460541, 0.15692268311977386], [0.04229354485869408, -0.3756655156612396, -0.0608723908662796, 0.42874470353126526], [0.03478023409843445, -0.1797366887331009, -0.052297499030828476, 0.1175103634595871], [0.03118550032377243, -0.3740718364715576, -0.04994729161262512, 0.3932460844516754], [0.023704063147306442, -0.5684507489204407, -0.042082369327545166, 0.6697724461555481], [0.012335048988461494, -0.7629631161689758, -0.028686920180916786, 0.948914110660553], [-0.002924213418737054, -0.9576873183250427, -0.009708639234304428, 1.2324475049972534], [-0.022077960893511772, -0.762441873550415, 0.014940310269594193, 0.9367387890815735], [-0.03732679784297943, -0.5675245523452759, 0.03367508575320244, 0.6487877368927002], [-0.04867728799581528, -0.7630990743637085, 0.04665084183216095, 0.9518817663192749], [-0.06393927335739136, -0.5686349272727966, 0.06568847596645355, 0.6742132306098938], [-0.07531196624040604, -0.7646053433418274, 0.07917274534702301, 0.986833393573761], [-0.09060407429933548, -0.9606931209564209, 0.0989094078540802, 1.3032962083816528], [-0.10981793701648712, -0.7669550180435181, 0.12497533112764359, 1.0431413650512695], [-0.12515704333782196, -0.9634948968887329, 0.1458381563425064, 1.372299075126648], [-0.14442694187164307, -1.1601080894470215, 0.1732841432094574, 1.7068127393722534], [-0.16762909293174744, -1.3567478656768799, 0.20742039382457733, 2.048046112060547], [-0.04269209876656532, 0.022726716473698616, -0.029326491057872772, 0.029817404225468636], [-0.04223756119608879, 0.21825668215751648, -0.02873014286160469, -0.2719721794128418], [-0.03787242993712425, 0.023556223139166832, -0.03416958823800087, 0.011512481607496738], [-0.03740130364894867, -0.17105945944786072, -0.033939339220523834, 0.29322168231010437], [-0.04082249477505684, -0.3656814992427826, -0.028074903413653374, 0.575010359287262], [-0.04813612252473831, -0.5603988170623779, -0.016574695706367493, 0.8587183952331543], [-0.0593441016972065, -0.3650550842285156, 0.0005996706895530224, 0.5608702301979065], [-0.06664520502090454, -0.560185432434082, 0.011817075312137604, 0.8537420034408569], [-0.07784891128540039, -0.36522653698921204, 0.02889191545546055, 0.5647982358932495], [-0.08515343815088272, -0.560741662979126, 0.04018788039684296, 0.8664416074752808], [-0.09636827558279037, -0.7563868165016174, 0.057516712695360184, 1.1714844703674316], [-0.11149600893259048, -0.9522075057029724, 0.08094640076160431, 1.4816303253173828], [-0.1305401623249054, -1.1482183933258057, 0.1105790063738823, 1.798456072807312], [-0.15350453555583954, -1.3443902730941772, 0.14654812216758728, 2.1233606338500977], [-0.1803923398256302, -1.1509994268417358, 0.18901534378528595, 1.8793151378631592], [0.036379627883434296, -0.040967877954244614, 0.02609533816576004, -0.012006140314042568], [0.03556027263402939, -0.23645415902137756, 0.02585521526634693, 0.288794606924057], [0.030831187963485718, -0.4319351017475128, 0.03163110837340355, 0.5895186066627502], [0.022192485630512238, -0.23726999759674072, 0.04342147707939148, 0.3069649934768677], [0.017447086051106453, -0.4329829216003418, 0.049560777842998505, 0.613019585609436], [0.00878742802888155, -0.23858731985092163, 0.06182117015123367, 0.33634912967681885], [0.004015681333839893, -0.04439713805913925, 0.06854815036058426, 0.0637841522693634], [0.0031277386005967855, -0.2404315322637558, 0.06982383877038956, 0.3772825300693512], [-0.0016808919608592987, -0.04636712744832039, 0.07736948877573013, 0.10740678012371063], [-0.002608234528452158, 0.14756575226783752, 0.07951762527227402, -0.15989835560321808], [0.0003430804063100368, -0.0485992506146431, 0.07631965726613998, 0.1567729115486145], [-0.0006289046141318977, 0.14535173773765564, 0.07945511490106583, -0.11089050024747849], [0.0022781300358474255, 0.3392505347728729, 0.07723730057477951, -0.37748590111732483], [0.00906314142048359, 0.533195436000824, 0.06968758255243301, -0.6448507308959961], [0.01972704939544201, 0.3371751010417938, 0.05679057165980339, -0.33106228709220886], [0.026470551267266273, 0.5314446091651917, 0.05016932636499405, -0.6053093075752258], [0.0370994433760643, 0.7258304357528687, 0.03806313872337341, -0.8817775845527649], [0.05161605030298233, 0.9204152822494507, 0.020427586510777473, -1.1622555255889893], [0.07002435624599457, 1.1152652502059937, -0.0028175238985568285, -1.4484643936157227], [0.09232966601848602, 0.9201781153678894, -0.03178681060671806, -1.1566630601882935], [0.11073322594165802, 0.7254846096038818, -0.054920073598623276, -0.8741141557693481], [0.1252429187297821, 0.5311506390571594, -0.07240235805511475, -0.5991910696029663], [0.1358659267425537, 0.3371123969554901, -0.0843861773610115, -0.3301638960838318], [0.142608180642128, 0.5333278775215149, -0.09098945558071136, -0.648219883441925], [0.15327472984790802, 0.7295917272567749, -0.10395385324954987, -0.9681118726730347], [0.1678665727376938, 0.5360075235366821, -0.12331609427928925, -0.7098105549812317], [0.17858672142028809, 0.3427897095680237, -0.13751229643821716, -0.45834779739379883], [0.18544252216815948, 0.5395603775978088, -0.14667925238609314, -0.7910189032554626], [0.19623371958732605, 0.7363590598106384, -0.16249963641166687, -1.1260162591934204], [0.21096090972423553, 0.5436956286430359, -0.18501995503902435, -0.8883932828903198], [0.22183482348918915, 0.3515012860298157, -0.2027878314256668, -0.6591082215309143], [0.023674143478274345, -0.043896500021219254, -0.011729965917766094, -0.04553337022662163], [0.022796213626861572, 0.1513916701078415, -0.01264063362032175, -0.3418940007686615], [0.02582404762506485, 0.34669116139411926, -0.019478512927889824, -0.6385360956192017], [0.032757870852947235, 0.15184615552425385, -0.03224923461675644, -0.3520503342151642], [0.03579479455947876, -0.042802710086107254, -0.03929024189710617, -0.06970848888158798], [0.034938737750053406, -0.23733998835086823, -0.04068441316485405, 0.21032385528087616], [0.03019193932414055, -0.43185731768608093, -0.03647793456912041, 0.48990049958229065], [0.021554792299866676, -0.6264461874961853, -0.026679925620555878, 0.7708674669265747], [0.009025868959724903, -0.43096742033958435, -0.011262575164437294, 0.46991074085235596], [0.00040652044117450714, -0.625928521156311, -0.0018643602961674333, 0.7590226531028748], [-0.012112049385905266, -0.8210247159004211, 0.013316093012690544, 1.0511183738708496], [-0.028532544150948524, -1.0163207054138184, 0.03433845937252045, 1.3479511737823486], [-0.04885895922780037, -0.8216467499732971, 0.06129748374223709, 1.0662059783935547], [-0.06529189646244049, -0.6273871064186096, 0.08262160420417786, 0.7933739423751831], [-0.07783963531255722, -0.4334906339645386, 0.09848908334970474, 0.5277844667434692], [-0.08650945127010345, -0.6298503279685974, 0.10904476791620255, 0.8498055934906006], [-0.09910645335912704, -0.436370849609375, 0.12604087591171265, 0.5933058261871338], [-0.1078338697552681, -0.2432176023721695, 0.1379069983959198, 0.3428322374820709], [-0.11269822716712952, -0.44000446796417236, 0.14476364850997925, 0.6756263375282288], [-0.12149831652641296, -0.2471591681241989, 0.15827617049217224, 0.431796133518219], [-0.12644149363040924, -0.05459078773856163, 0.16691209375858307, 0.19289325177669525], [-0.12753331661224365, 0.13779908418655396, 0.17076995968818665, -0.04283633083105087], [-0.12477733194828033, -0.059307798743247986, 0.16991323232650757, 0.2984860837459564], [-0.125963494181633, 0.13303625583648682, 0.175882950425148, 0.06383926421403885], [-0.12330276519060135, -0.064114049077034, 0.17715974152088165, 0.40644580125808716], [-0.12458503991365433, 0.1281115561723709, 0.18528865277767181, 0.17443333566188812], [-0.12202281504869461, -0.06911203265190125, 0.18877732753753662, 0.5193686485290527], [-0.12340505421161652, 0.12292099744081497, 0.19916468858718872, 0.29160791635513306], [-0.12094663083553314, 0.31472861766815186, 0.20499685406684875, 0.06775201857089996], [-0.11465205997228622, 0.11734775453805923, 0.2063518911600113, 0.41747188568115234]], "actions": [0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.00022990892466623336, -0.16105599701404572, 0.012783240526914597, 0.3348085284233093], [-0.0034510288387537003, -0.35635751485824585, 0.019479410722851753, 0.6314950585365295], [-0.01057817880064249, -0.16151268780231476, 0.03210931271314621, 0.34500986337661743], [-0.013808432966470718, 0.033138126134872437, 0.03900951147079468, 0.06262264400720596], [-0.013145670294761658, -0.16252078115940094, 0.04026196151971817, 0.367353618144989], [-0.016396086663007736, -0.35819104313850403, 0.047609034925699234, 0.6724549531936646], [-0.02355990745127201, -0.5539413094520569, 0.06105813384056091, 0.9797394275665283], [-0.03463873267173767, -0.3596886098384857, 0.08065292239189148, 0.7068433165550232], [-0.04183250665664673, -0.5558298230171204, 0.0947897881269455, 1.0237849950790405], [-0.052949100732803345, -0.3620893657207489, 0.11526548862457275, 0.7623053789138794], [-0.06019088998436928, -0.1687278300523758, 0.1305115967988968, 0.5080007910728455], [-0.0635654479265213, -0.3654237985610962, 0.14067161083221436, 0.8387970924377441], [-0.07087392359972, -0.17247407138347626, 0.15744756162166595, 0.5934526324272156], [-0.07432340085506439, 0.02013436146080494, 0.1693166047334671, 0.3542121648788452], [-0.07392071932554245, 0.21249516308307648, 0.17640085518360138, 0.11933863908052444], [-0.06967081129550934, 0.40470874309539795, 0.17878761887550354, -0.11291416734457016], [-0.061576638370752335, 0.2075354903936386, 0.17652933299541473, 0.23041526973247528], [-0.05742592737078667, 0.010388102382421494, 0.18113765120506287, 0.573171079158783], [-0.05721816420555115, 0.2025700956583023, 0.1926010698080063, 0.34257814288139343], [-0.05316676199436188, 0.005304535385221243, 0.19945262372493744, 0.6892805099487305], [-0.05306067317724228, -0.1919441819190979, 0.21323823928833008, 1.037539005279541], [-0.01113835908472538, -0.18271954357624054, 0.021946433931589127, 0.3064468502998352], [-0.014792749658226967, -0.3781472444534302, 0.02807537093758583, 0.6059695482254028], [-0.022355694323778152, -0.18342888355255127, 0.040194761008024216, 0.32226020097732544], [-0.02602427266538143, -0.3790994882583618, 0.04663996770977974, 0.6273431181907654], [-0.033606261014938354, -0.1846584677696228, 0.05918682739138603, 0.34970593452453613], [-0.03729943186044693, 0.009573966264724731, 0.06618094444274902, 0.07625821232795715], [-0.03710795193910599, -0.18643124401569366, 0.06770610809326172, 0.3890654146671295], [-0.040836576372385025, 0.007667649071663618, 0.075487419962883, 0.11847452074289322], [-0.04068322479724884, -0.1884501427412033, 0.07785691320896149, 0.4339856803417206], [-0.044452227652072906, 0.005488177295774221, 0.08653662353754044, 0.1668262630701065], [-0.044342461973428726, 0.19927167892456055, 0.08987314999103546, -0.09735127538442612], [-0.04035703092813492, 0.39299827814102173, 0.08792611956596375, -0.36038124561309814], [-0.032497063279151917, 0.5867675542831421, 0.080718494951725, -0.6240953207015991], [-0.02076171338558197, 0.7806752920150757, 0.0682365894317627, -0.890304446220398], [-0.005148207303136587, 0.5846971273422241, 0.050430502742528915, -0.576975405216217], [0.006545735523104668, 0.38890594244003296, 0.03889099508523941, -0.2688416838645935], [0.014323854818940163, 0.19325119256973267, 0.03351416066288948, 0.03584960848093033], [0.018188878893852234, -0.0023349265102297068, 0.03423115238547325, 0.3389153778553009], [0.018142180517315865, -0.1979268193244934, 0.041009459644556046, 0.6421933174133301], [0.014183643274009228, -0.39359569549560547, 0.05385332554578781, 0.9475032687187195], [0.006311730016022921, -0.5893998146057129, 0.07280339300632477, 1.2566088438034058], [-0.005476266611367464, -0.3952813744544983, 0.09793557226657867, 0.9875878691673279], [-0.013381894677877426, -0.20159746706485748, 0.11768732964992523, 0.7272011637687683], [-0.017413843423128128, -0.008282216265797615, 0.13223135471343994, 0.4737543761730194], [-0.017579488456249237, 0.18474870920181274, 0.1417064368724823, 0.2254984825849533], [-0.013884513638913631, 0.3775910437107086, 0.14621640741825104, -0.019343148916959763], [-0.00633269315585494, 0.18070773780345917, 0.14582954347133636, 0.3156651258468628], [-0.0027185382787138224, -0.016157792881131172, 0.15214285254478455, 0.6505511403083801], [-0.003041693940758705, -0.2130347192287445, 0.1651538759469986, 0.9870128035545349], [-0.007302388548851013, -0.02046307362616062, 0.1848941296339035, 0.7504206299781799], [-0.007711649872362614, -0.2175881564617157, 0.19990253448486328, 1.0951181650161743], [-0.012063412927091122, -0.02557898685336113, 0.2218049019575119, 0.8712206482887268], [-0.03377773240208626, 0.15439745783805847, 0.011055255308747292, -0.2525947391986847], [-0.03068978153169155, 0.34935981035232544, 0.006003360729664564, -0.5417702198028564], [-0.023702586069703102, 0.15415401756763458, -0.004832043778151274, -0.2472018152475357], [-0.020619504153728485, 0.3493446409702301, -0.009776080027222633, -0.5414049625396729], [-0.01363261230289936, 0.544602632522583, -0.020604180172085762, -0.8371520638465881], [-0.0027405598666518927, 0.7399998307228088, -0.0373472198843956, -1.1362428665161133], [0.012059437111020088, 0.5453858375549316, -0.060072075575590134, -0.8555029034614563], [0.022967152297496796, 0.3511316776275635, -0.07718213647603989, -0.5822978615760803], [0.029989786446094513, 0.5472453236579895, -0.08882809430360794, -0.8982616066932678], [0.040934693068265915, 0.743451714515686, -0.10679332911968231, -1.2174919843673706], [0.055803727358579636, 0.5498564839363098, -0.13114316761493683, -0.9600911140441895], [0.06680085510015488, 0.35671791434288025, -0.15034498274326324, -0.7113165855407715], [0.07393521815538406, 0.5535666346549988, -0.16457131505012512, -1.0472939014434814], [0.08500654995441437, 0.7504444122314453, -0.18551719188690186, -1.3867863416671753], [0.10001543909311295, 0.9473300576210022, -0.21325291693210602, -1.7312769889831543], [0.04097279533743858, 0.2099638432264328, 0.04805653542280197, -0.2976863384246826], [0.0451720729470253, 0.4043689966201782, 0.04210280999541283, -0.5748342275619507], [0.05325945466756821, 0.2086828649044037, 0.03060612641274929, -0.26919057965278625], [0.0574331097304821, 0.4033549726009369, 0.02522231452167034, -0.5520651936531067], [0.06550020724534988, 0.5981137752532959, 0.01418101042509079, -0.8366959095001221], [0.07746248692274094, 0.7930392026901245, -0.002552908379584551, -1.1248855590820312], [0.09332326799631119, 0.9881945252418518, -0.02505061961710453, -1.4183682203292847], [0.11308716237545013, 1.1836174726486206, -0.053417984396219254, -1.718774676322937], [0.13675950467586517, 0.9891468286514282, -0.08779347687959671, -1.4431822299957275], [0.15654245018959045, 1.1852328777313232, -0.11665712296962738, -1.761956810951233], [0.18024709820747375, 0.9916082620620728, -0.15189625322818756, -1.5077131986618042], [0.2000792771577835, 1.188210368156433, -0.18205052614212036, -1.8437068462371826], [0.22384348511695862, 0.9955037236213684, -0.2189246565103531, -1.6126514673233032], [-0.02280682884156704, 0.15531031787395477, 0.019300322979688644, -0.2738611698150635], [-0.01970062218606472, 0.3501516282558441, 0.013823098503053188, -0.5603947639465332], [-0.01269758865237236, 0.5450769066810608, 0.0026152029167860746, -0.8486908674240112], [-0.0017960512777790427, 0.7401630878448486, -0.014358614571392536, -1.1405502557754517], [0.013007209636271, 0.5452317595481873, -0.037169620394706726, -0.8524047136306763], [0.023911844938993454, 0.7408401370048523, -0.05421771481633186, -1.156540036201477], [0.03872864693403244, 0.9366253614425659, -0.07734851539134979, -1.4657185077667236], [0.05746115371584892, 1.1326045989990234, -0.10666288435459137, -1.7815262079238892], [0.0801132470369339, 1.3287523984909058, -0.14229340851306915, -2.105375289916992], [0.10668829083442688, 1.1353150606155396, -0.18440091609954834, -1.8598449230194092], [0.12939459085464478, 0.942633330821991, -0.2215978056192398, -1.6296296119689941], [-0.016963506117463112, 0.18436740338802338, 0.0375155545771122, -0.3296795189380646], [-0.013276156969368458, -0.011267955414950848, 0.03092196397483349, -0.02540598250925541], [-0.013501516543328762, -0.20681940019130707, 0.03041384369134903, 0.2768705487251282], [-0.01763790473341942, -0.40236175060272217, 0.03595125675201416, 0.5789887309074402], [-0.025685139000415802, -0.597968578338623, 0.04753103107213974, 0.8827767968177795], [-0.037644512951374054, -0.4035232961177826, 0.06518656760454178, 0.6054071187973022], [-0.045714978128671646, -0.20937055349349976, 0.07729470729827881, 0.3339478075504303], [-0.04990238696336746, -0.40550264716148376, 0.08397366106510162, 0.6499695777893066], [-0.05801244080066681, -0.21164456009864807, 0.09697305411100388, 0.3848663568496704], [-0.06224533170461655, -0.018023459240794182, 0.10467038303613663, 0.12426463514566422], [-0.06260579824447632, -0.21447710692882538, 0.10715567320585251, 0.44804927706718445], [-0.06689534336328506, -0.41093870997428894, 0.11611665785312653, 0.772494912147522], [-0.07511411607265472, -0.21758955717086792, 0.13156655430793762, 0.5184858441352844], [-0.07946591079235077, -0.414294570684433, 0.1419362723827362, 0.849562406539917], [-0.08775179833173752, -0.6110371947288513, 0.1589275300502777, 1.1832979917526245], [-0.09997254610061646, -0.4182933270931244, 0.1825934797525406, 0.9443539977073669], [-0.10833840817213058, -0.22603805363178253, 0.20148056745529175, 0.7141498327255249], [-0.11285917460918427, -0.4232943654060364, 0.21576355397701263, 1.0628842115402222], [0.03648588806390762, 0.20298618078231812, -0.04250289499759674, -0.3023609519004822], [0.04054560884833336, 0.008494946174323559, -0.048550114035606384, -0.023379679769277573], [0.04071550816297531, -0.18589834868907928, -0.049017708748579025, 0.25359854102134705], [0.03699754178524017, 0.009887998923659325, -0.043945737183094025, -0.054133664816617966], [0.03719530254602432, 0.20561161637306213, -0.045028410851955414, -0.3603515326976776], [0.04130753502249718, 0.011157696135342121, -0.0522354394197464, -0.08220018446445465], [0.04153068736195564, 0.20698800683021545, -0.05387944355607033, -0.3908952474594116], [0.04567044973373413, 0.012670484371483326, -0.061697348952293396, -0.11567481607198715], [0.045923858880996704, -0.1815156638622284, -0.06401084363460541, 0.15692268311977386], [0.04229354485869408, -0.3756655156612396, -0.0608723908662796, 0.42874470353126526], [0.03478023409843445, -0.1797366887331009, -0.052297499030828476, 0.1175103634595871], [0.03118550032377243, -0.3740718364715576, -0.04994729161262512, 0.3932460844516754], [0.023704063147306442, -0.5684507489204407, -0.042082369327545166, 0.6697724461555481], [0.012335048988461494, -0.7629631161689758, -0.028686920180916786, 0.948914110660553], [-0.002924213418737054, -0.9576873183250427, -0.009708639234304428, 1.2324475049972534], [-0.022077960893511772, -0.762441873550415, 0.014940310269594193, 0.9367387890815735], [-0.03732679784297943, -0.5675245523452759, 0.03367508575320244, 0.6487877368927002], [-0.04867728799581528, -0.7630990743637085, 0.04665084183216095, 0.9518817663192749], [-0.06393927335739136, -0.5686349272727966, 0.06568847596645355, 0.6742132306098938], [-0.07531196624040604, -0.7646053433418274, 0.07917274534702301, 0.986833393573761], [-0.09060407429933548, -0.9606931209564209, 0.0989094078540802, 1.3032962083816528], [-0.10981793701648712, -0.7669550180435181, 0.12497533112764359, 1.0431413650512695], [-0.12515704333782196, -0.9634948968887329, 0.1458381563425064, 1.372299075126648], [-0.14442694187164307, -1.1601080894470215, 0.1732841432094574, 1.7068127393722534], [-0.16762909293174744, -1.3567478656768799, 0.20742039382457733, 2.048046112060547], [-0.19476406276226044, -1.553307294845581, 0.24838131666183472, 2.3971107006073], [-0.04223756119608879, 0.21825668215751648, -0.02873014286160469, -0.2719721794128418], [-0.03787242993712425, 0.023556223139166832, -0.03416958823800087, 0.011512481607496738], [-0.03740130364894867, -0.17105945944786072, -0.033939339220523834, 0.29322168231010437], [-0.04082249477505684, -0.3656814992427826, -0.028074903413653374, 0.575010359287262], [-0.04813612252473831, -0.5603988170623779, -0.016574695706367493, 0.8587183952331543], [-0.0593441016972065, -0.3650550842285156, 0.0005996706895530224, 0.5608702301979065], [-0.06664520502090454, -0.560185432434082, 0.011817075312137604, 0.8537420034408569], [-0.07784891128540039, -0.36522653698921204, 0.02889191545546055, 0.5647982358932495], [-0.08515343815088272, -0.560741662979126, 0.04018788039684296, 0.8664416074752808], [-0.09636827558279037, -0.7563868165016174, 0.057516712695360184, 1.1714844703674316], [-0.11149600893259048, -0.9522075057029724, 0.08094640076160431, 1.4816303253173828], [-0.1305401623249054, -1.1482183933258057, 0.1105790063738823, 1.798456072807312], [-0.15350453555583954, -1.3443902730941772, 0.14654812216758728, 2.1233606338500977], [-0.1803923398256302, -1.1509994268417358, 0.18901534378528595, 1.8793151378631592], [-0.20341232419013977, -0.9583743214607239, 0.22660164535045624, 1.6507636308670044], [0.03556027263402939, -0.23645415902137756, 0.02585521526634693, 0.288794606924057], [0.030831187963485718, -0.4319351017475128, 0.03163110837340355, 0.5895186066627502], [0.022192485630512238, -0.23726999759674072, 0.04342147707939148, 0.3069649934768677], [0.017447086051106453, -0.4329829216003418, 0.049560777842998505, 0.613019585609436], [0.00878742802888155, -0.23858731985092163, 0.06182117015123367, 0.33634912967681885], [0.004015681333839893, -0.04439713805913925, 0.06854815036058426, 0.0637841522693634], [0.0031277386005967855, -0.2404315322637558, 0.06982383877038956, 0.3772825300693512], [-0.0016808919608592987, -0.04636712744832039, 0.07736948877573013, 0.10740678012371063], [-0.002608234528452158, 0.14756575226783752, 0.07951762527227402, -0.15989835560321808], [0.0003430804063100368, -0.0485992506146431, 0.07631965726613998, 0.1567729115486145], [-0.0006289046141318977, 0.14535173773765564, 0.07945511490106583, -0.11089050024747849], [0.0022781300358474255, 0.3392505347728729, 0.07723730057477951, -0.37748590111732483], [0.00906314142048359, 0.533195436000824, 0.06968758255243301, -0.6448507308959961], [0.01972704939544201, 0.3371751010417938, 0.05679057165980339, -0.33106228709220886], [0.026470551267266273, 0.5314446091651917, 0.05016932636499405, -0.6053093075752258], [0.0370994433760643, 0.7258304357528687, 0.03806313872337341, -0.8817775845527649], [0.05161605030298233, 0.9204152822494507, 0.020427586510777473, -1.1622555255889893], [0.07002435624599457, 1.1152652502059937, -0.0028175238985568285, -1.4484643936157227], [0.09232966601848602, 0.9201781153678894, -0.03178681060671806, -1.1566630601882935], [0.11073322594165802, 0.7254846096038818, -0.054920073598623276, -0.8741141557693481], [0.1252429187297821, 0.5311506390571594, -0.07240235805511475, -0.5991910696029663], [0.1358659267425537, 0.3371123969554901, -0.0843861773610115, -0.3301638960838318], [0.142608180642128, 0.5333278775215149, -0.09098945558071136, -0.648219883441925], [0.15327472984790802, 0.7295917272567749, -0.10395385324954987, -0.9681118726730347], [0.1678665727376938, 0.5360075235366821, -0.12331609427928925, -0.7098105549812317], [0.17858672142028809, 0.3427897095680237, -0.13751229643821716, -0.45834779739379883], [0.18544252216815948, 0.5395603775978088, -0.14667925238609314, -0.7910189032554626], [0.19623371958732605, 0.7363590598106384, -0.16249963641166687, -1.1260162591934204], [0.21096090972423553, 0.5436956286430359, -0.18501995503902435, -0.8883932828903198], [0.22183482348918915, 0.3515012860298157, -0.2027878314256668, -0.6591082215309143], [0.228864848613739, 0.5487815737724304, -0.2159699946641922, -1.0081766843795776], [0.022796213626861572, 0.1513916701078415, -0.01264063362032175, -0.3418940007686615], [0.02582404762506485, 0.34669116139411926, -0.019478512927889824, -0.6385360956192017], [0.032757870852947235, 0.15184615552425385, -0.03224923461675644, -0.3520503342151642], [0.03579479455947876, -0.042802710086107254, -0.03929024189710617, -0.06970848888158798], [0.034938737750053406, -0.23733998835086823, -0.04068441316485405, 0.21032385528087616], [0.03019193932414055, -0.43185731768608093, -0.03647793456912041, 0.48990049958229065], [0.021554792299866676, -0.6264461874961853, -0.026679925620555878, 0.7708674669265747], [0.009025868959724903, -0.43096742033958435, -0.011262575164437294, 0.46991074085235596], [0.00040652044117450714, -0.625928521156311, -0.0018643602961674333, 0.7590226531028748], [-0.012112049385905266, -0.8210247159004211, 0.013316093012690544, 1.0511183738708496], [-0.028532544150948524, -1.0163207054138184, 0.03433845937252045, 1.3479511737823486], [-0.04885895922780037, -0.8216467499732971, 0.06129748374223709, 1.0662059783935547], [-0.06529189646244049, -0.6273871064186096, 0.08262160420417786, 0.7933739423751831], [-0.07783963531255722, -0.4334906339645386, 0.09848908334970474, 0.5277844667434692], [-0.08650945127010345, -0.6298503279685974, 0.10904476791620255, 0.8498055934906006], [-0.09910645335912704, -0.436370849609375, 0.12604087591171265, 0.5933058261871338], [-0.1078338697552681, -0.2432176023721695, 0.1379069983959198, 0.3428322374820709], [-0.11269822716712952, -0.44000446796417236, 0.14476364850997925, 0.6756263375282288], [-0.12149831652641296, -0.2471591681241989, 0.15827617049217224, 0.431796133518219], [-0.12644149363040924, -0.05459078773856163, 0.16691209375858307, 0.19289325177669525], [-0.12753331661224365, 0.13779908418655396, 0.17076995968818665, -0.04283633083105087], [-0.12477733194828033, -0.059307798743247986, 0.16991323232650757, 0.2984860837459564], [-0.125963494181633, 0.13303625583648682, 0.175882950425148, 0.06383926421403885], [-0.12330276519060135, -0.064114049077034, 0.17715974152088165, 0.40644580125808716], [-0.12458503991365433, 0.1281115561723709, 0.18528865277767181, 0.17443333566188812], [-0.12202281504869461, -0.06911203265190125, 0.18877732753753662, 0.5193686485290527], [-0.12340505421161652, 0.12292099744081497, 0.19916468858718872, 0.29160791635513306], [-0.12094663083553314, 0.31472861766815186, 0.20499685406684875, 0.06775201857089996], [-0.11465205997228622, 0.11734775453805923, 0.2063518911600113, 0.41747188568115234], [-0.11230510473251343, 0.3090396225452423, 0.2147013247013092, 0.19627203047275543]], "action_prob": [0.49998369812965393, 0.49932730197906494, 0.5011230707168579, 0.5007285475730896, 0.499886691570282, 0.49923115968704224, 0.49879735708236694, 0.501424252986908, 0.498711496591568, 0.5014951229095459, 0.50138258934021, 0.49890193343162537, 0.5014584064483643, 0.5012155175209045, 0.5007724761962891, 0.5001837611198425, 0.5003885626792908, 0.49969086050987244, 0.5009872913360596, 0.4995364248752594, 0.49889957904815674, 0.4999595880508423, 0.4992991089820862, 0.5011516809463501, 0.4992387294769287, 0.5012035369873047, 0.500834047794342, 0.49975696206092834, 0.5008909702301025, 0.4996797442436218, 0.5009536743164062, 0.5004076957702637, 0.4997641146183014, 0.4992353320121765, 0.4989074766635895, 0.5012667179107666, 0.5011471509933472, 0.5008166432380676, 0.5002250075340271, 0.49953362345695496, 0.4989977478981018, 0.4986867606639862, 0.5014740824699402, 0.5014073848724365, 0.5012102127075195, 0.500819742679596, 0.5002484321594238, 0.5003588795661926, 0.4996453523635864, 0.49900853633880615, 0.5013912916183472, 0.4988844096660614, 0.5014782547950745, 0.5001620054244995, 0.4994959831237793, 0.5009946227073669, 0.4994630217552185, 0.4989694356918335, 0.49869853258132935, 0.5014331340789795, 0.5013866424560547, 0.4987921416759491, 0.49854692816734314, 0.5015630125999451, 0.5015460252761841, 0.4985731840133667, 0.49838024377822876, 0.49829715490341187, 0.5000118613243103, 0.4993802309036255, 0.5010610222816467, 0.4993676245212555, 0.4989131987094879, 0.49866917729377747, 0.49855318665504456, 0.49849218130111694, 0.5015523433685303, 0.4983904957771301, 0.5016441345214844, 0.49829182028770447, 0.5017341375350952, 0.5001383423805237, 0.4994787275791168, 0.4989980459213257, 0.49873086810112, 0.5014021396636963, 0.498648464679718, 0.4985237121582031, 0.49845799803733826, 0.498410165309906, 0.5016346573829651, 0.5017021298408508, 0.5000444650650024, 0.5005895495414734, 0.49994102120399475, 0.49927738308906555, 0.4988265335559845, 0.5014034509658813, 0.5012527108192444, 0.49910444021224976, 0.5013147592544556, 0.5009900331497192, 0.49955546855926514, 0.49893277883529663, 0.5014283657073975, 0.4988245964050293, 0.4984976351261139, 0.5016476511955261, 0.5016022324562073, 0.4985645115375519, 0.49987781047821045, 0.500784158706665, 0.5001737475395203, 0.5004717707633972, 0.4997968077659607, 0.500847578048706, 0.49973928928375244, 0.5008965134620667, 0.5003272891044617, 0.4996747076511383, 0.5008407235145569, 0.49969083070755005, 0.49915701150894165, 0.4988367557525635, 0.4986734092235565, 0.5014118552207947, 0.501413106918335, 0.4986737370491028, 0.5014776587486267, 0.49859514832496643, 0.4984571933746338, 0.5016014575958252, 0.49837014079093933, 0.4983241856098175, 0.49829617142677307, 0.498268187046051, 0.4999755918979645, 0.5006838440895081, 0.5000627040863037, 0.4994151294231415, 0.49895134568214417, 0.50130295753479, 0.4988953471183777, 0.5013593435287476, 0.4988294541835785, 0.49858081340789795, 0.4984685182571411, 0.49841225147247314, 0.4983716309070587, 0.5016674995422363, 0.5017392635345459, 0.4999236762523651, 0.4992750883102417, 0.501154363155365, 0.4992124140262604, 0.5012070536613464, 0.5008618831634521, 0.49971112608909607, 0.5009194612503052, 0.5003686547279358, 0.5002808570861816, 0.5004288554191589, 0.49977919459342957, 0.4992297291755676, 0.5011138916015625, 0.4992179572582245, 0.49885571002960205, 0.4986693263053894, 0.4985772371292114, 0.5014781355857849, 0.5015175342559814, 0.5015172362327576, 0.501417338848114, 0.498870313167572, 0.49852389097213745, 0.5016202330589294, 0.5015624761581421, 0.4986484944820404, 0.4983709156513214, 0.5017310380935669, 0.5017198324203491, 0.4984011650085449, 0.4999731481075287, 0.4993158280849457, 0.501136839389801, 0.500740110874176, 0.5001240372657776, 0.49947863817214966, 0.4990125894546509, 0.50124591588974, 0.49896326661109924, 0.498701810836792, 0.4985770583152771, 0.5014885663986206, 0.5015137791633606, 0.5014830827713013, 0.4986727237701416, 0.5015462040901184, 0.5014205574989319, 0.4988935887813568, 0.5014941096305847, 0.5012289881706238, 0.5007548332214355, 0.49984607100486755, 0.5008812546730042, 0.49970051646232605, 0.5010046362876892, 0.49954479932785034, 0.5011244416236877, 0.5006187558174133, 0.4999704360961914, 0.5007603168487549], "advantages": [19.027559280395508, 18.212419509887695, 17.38839340209961, 16.551855087280273, 15.706303596496582, 14.857648849487305, 13.999709129333496, 13.132323265075684, 12.253694534301758, 11.368634223937988, 10.47232723236084, 9.566438674926758, 8.654839515686035, 7.730796813964844, 6.7968974113464355, 5.8531904220581055, 4.899947166442871, 3.9425837993621826, 2.975149631500244, 1.9931491613388062, 1.00577974319458, 27.502059936523438, 26.772573471069336, 26.035079956054688, 25.285863876342773, 24.53335189819336, 23.769058227539062, 22.996498107910156, 22.221519470214844, 21.43340492248535, 20.642587661743164, 19.838619232177734, 19.026304244995117, 18.20608139038086, 17.37815284729004, 16.54242515563965, 15.700922966003418, 14.851645469665527, 13.994391441345215, 13.128499984741211, 12.253236770629883, 11.368326187133789, 10.473838806152344, 9.568830490112305, 8.654231071472168, 7.7298359870910645, 6.795599460601807, 5.851750373840332, 4.903895854949951, 3.9458861351013184, 2.9772427082061768, 1.9960846900939941, 1.0075349807739258, 13.994527816772461, 13.12300968170166, 12.24323558807373, 11.359121322631836, 10.461485862731934, 9.555535316467285, 8.641053199768066, 7.719120979309082, 6.788394451141357, 5.845343589782715, 4.893431663513184, 3.933436155319214, 2.964141845703125, 1.9826695919036865, 0.9919284582138062, 12.247872352600098, 11.358863830566406, 10.461411476135254, 9.55935001373291, 8.643627166748047, 7.719335079193115, 6.786276340484619, 5.844198226928711, 4.892873287200928, 3.9324331283569336, 2.9617996215820312, 1.9817816019058228, 0.9914819002151489, 10.466353416442871, 9.559237480163574, 8.643515586853027, 7.719260215759277, 6.786256790161133, 5.8456244468688965, 4.893668174743652, 3.932527780532837, 2.961951732635498, 1.9817345142364502, 0.9916364550590515, 16.548259735107422, 15.702699661254883, 14.85406494140625, 13.996865272521973, 13.130385398864746, 12.25438117980957, 11.366695404052734, 10.469425201416016, 9.567273139953613, 8.651965141296387, 7.7268781661987305, 6.797651767730713, 5.858184337615967, 4.905731201171875, 3.9470107555389404, 2.9778037071228027, 1.9970875978469849, 1.006084680557251, 22.99564552307129, 22.214948654174805, 21.431888580322266, 20.640926361083984, 19.836368560791016, 19.02382469177246, 18.208459854125977, 17.379493713378906, 16.547452926635742, 15.707168579101562, 14.858009338378906, 13.995319366455078, 13.128962516784668, 12.253214836120605, 11.368014335632324, 10.473418235778809, 9.568327903747559, 8.653605461120605, 7.732184410095215, 6.798994064331055, 5.858832836151123, 4.908627986907959, 3.947537899017334, 2.977980852127075, 1.998268961906433, 1.0084419250488281, 13.994281768798828, 13.122699737548828, 12.24783992767334, 11.364137649536133, 10.47097110748291, 9.568096160888672, 8.653036117553711, 7.731869220733643, 6.798306941986084, 5.858438014984131, 4.908443927764893, 3.9484164714813232, 2.9784114360809326, 1.9984374046325684, 1.008541226387024, 26.769710540771484, 26.03281593322754, 25.287822723388672, 24.53110122680664, 23.77092933654785, 22.998979568481445, 22.21867561340332, 21.43581199645996, 20.63979721069336, 19.835552215576172, 19.028881072998047, 18.208358764648438, 17.379817962646484, 16.54349708557129, 15.702689170837402, 14.84929370880127, 13.987896919250488, 13.118285179138184, 12.240233421325684, 11.354290008544922, 10.459758758544922, 9.556680679321289, 8.645060539245605, 7.720086574554443, 6.78655481338501, 5.846121788024902, 4.896688938140869, 3.934054136276245, 2.9625024795532227, 1.983106017112732, 0.994195282459259, 26.029590606689453, 25.27964973449707, 24.52277946472168, 23.762466430664062, 22.99503517150879, 22.219905853271484, 21.43644905090332, 20.644405364990234, 19.841108322143555, 19.03303337097168, 18.216190338134766, 17.390663146972656, 16.555646896362305, 15.711819648742676, 14.858964920043945, 14.000614166259766, 13.130632400512695, 12.251331329345703, 11.367254257202148, 10.470341682434082, 9.563886642456055, 8.64803695678711, 7.728550910949707, 6.794217586517334, 5.855900287628174, 4.902772426605225, 3.9451744556427, 2.972929000854492, 1.9906282424926758, 1.0038609504699707], "value_targets": [19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 895596278, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 460298866, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 963400219, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 1966176880, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 182903451, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1427096865, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309, 1857050309], "obs": [[0.04360872134566307, 0.015283504500985146, -0.03838257119059563, -0.005857521202415228], [0.043914392590522766, -0.17926757037639618, -0.03849972411990166, 0.2744724452495575], [0.040329042822122574, 0.016381945461034775, -0.033010274171829224, -0.030100475996732712], [0.040656678378582, 0.21196134388446808, -0.03361228480935097, -0.33301302790641785], [0.04489590600132942, 0.017333533614873886, -0.0402725450694561, -0.05111634358763695], [0.04524257779121399, -0.17718850076198578, -0.041294872760772705, 0.22859320044517517], [0.04169880598783493, 0.018498495221138, -0.03672300651669502, -0.07682429999113083], [0.04206877574324608, -0.17607828974723816, -0.03825949504971504, 0.2040499597787857], [0.03854721039533615, 0.01956932619214058, -0.03417849540710449, -0.1004522517323494], [0.03893859684467316, 0.21516402065753937, -0.036187540739774704, -0.4037194550037384], [0.04324187710881233, 0.020573480054736137, -0.04426192864775658, -0.12266156077384949], [0.043653346598148346, -0.17388731241226196, -0.046715158969163895, 0.15573517978191376], [0.040175601840019226, 0.021871287375688553, -0.043600454926490784, -0.15131163597106934], [0.04061302915215492, 0.21758955717086792, -0.04662668704986572, -0.457424521446228], [0.04496482014656067, 0.023156728595495224, -0.05577518045902252, -0.1797955185174942], [0.04542795196175575, 0.21903061866760254, -0.059371087700128555, -0.48953887820243835], [0.0498085655272007, 0.41493770480155945, -0.06916186958551407, -0.8003265857696533], [0.058107320219278336, 0.22082911431789398, -0.08516839891672134, -0.5301771759986877], [0.06252390146255493, 0.4170393943786621, -0.09577193856239319, -0.8484350442886353], [0.07086469233036041, 0.6133279800415039, -0.1127406433224678, -1.1696325540542603], [0.08313124626874924, 0.8097211122512817, -0.13613329827785492, -1.4954276084899902], [0.09932567179203033, 0.6164917945861816, -0.16604185104370117, -1.2481648921966553], [0.11165551096200943, 0.4238414466381073, -0.191005140542984, -1.0117560625076294], [-0.0029231072403490543, 0.04152971878647804, 0.035796016454696655, 0.011828417889773846], [-0.0020925127901136875, -0.15408682823181152, 0.03603258728981018, 0.31558704376220703], [-0.0051742494106292725, 0.040503837168216705, 0.04234432801604271, 0.03448180481791496], [-0.004364172462373972, 0.23499378561973572, 0.043033961206674576, -0.2445461004972458], [0.000335703109158203, 0.42947548627853394, 0.03814304247498512, -0.5233504772186279], [0.008925213478505611, 0.2338380515575409, 0.02767603099346161, -0.21889644861221313], [0.013601974584162235, 0.42855367064476013, 0.023298101499676704, -0.5027223229408264], [0.022173047065734863, 0.23311123251914978, 0.013243655674159527, -0.20278918743133545], [0.02683527208864689, 0.4280413091182709, 0.009187871590256691, -0.49126511812210083], [0.03539609909057617, 0.6230324506759644, -0.0006374308723025024, -0.7810382843017578], [0.04785674810409546, 0.42791926860809326, -0.016258196905255318, -0.48855599761009216], [0.0564151331782341, 0.23303042352199554, -0.02602931670844555, -0.2010410726070404], [0.061075739562511444, 0.4285147786140442, -0.030050138011574745, -0.5018200278282166], [0.06964603811502457, 0.23382902145385742, -0.0400865375995636, -0.21875664591789246], [0.07432261854410172, 0.42950037121772766, -0.04446167126297951, -0.5238102078437805], [0.0829126238822937, 0.23503145575523376, -0.054937876760959625, -0.24546249210834503], [0.08761325478553772, 0.04073544219136238, -0.05984712392091751, 0.029398202896118164], [0.08842796087265015, -0.1534794718027115, -0.05925916135311127, 0.3026144802570343], [0.08535837382078171, -0.3477090001106262, -0.05320687219500542, 0.5760353207588196], [0.07840419560670853, -0.15188315510749817, -0.04168616607785225, 0.26707684993743896], [0.07536652684211731, -0.3463861346244812, -0.036344628781080246, 0.54632568359375], [0.0684388056397438, -0.15077289938926697, -0.0254181157797575, 0.2424166053533554], [0.06542334705591202, 0.04470273479819298, -0.020569782704114914, -0.058174245059490204], [0.06631740182638168, 0.24011348187923431, -0.021733267232775688, -0.35727545619010925], [0.07111967355012894, 0.04530715197324753, -0.028878776356577873, -0.07152403146028519], [0.07202581316232681, -0.1493891328573227, -0.03030925802886486, 0.2119094431400299], [0.0690380334854126, -0.3440649211406708, -0.02607106789946556, 0.49487945437431335], [0.062156736850738525, -0.5388096570968628, -0.016173480078577995, 0.7792332768440247], [0.05138054117560387, -0.34346914291381836, -0.0005888136220164597, 0.48150601983070374], [0.044511158019304276, -0.5385828018188477, 0.00904130656272173, 0.7740033268928528], [0.03373950347304344, -0.7338279485702515, 0.024521373212337494, 1.0695171356201172], [0.019062945619225502, -0.5390387177467346, 0.04591171443462372, 0.784629762172699], [0.008282170630991459, -0.7347604632377625, 0.06160430982708931, 1.0913963317871094], [-0.006413038820028305, -0.930637776851654, 0.08343223482370377, 1.4027551412582397], [-0.02502579428255558, -0.7366454601287842, 0.11148734390735626, 1.1372795104980469], [-0.03975870460271835, -0.9330348372459412, 0.13423292338848114, 1.462744116783142], [-0.058419398963451385, -1.1295219659805298, 0.16348780691623688, 1.794169545173645], [-0.08100984245538712, -0.9365659356117249, 0.19937120378017426, 1.5564465522766113], [0.011267504654824734, -0.011888597160577774, 0.03088000789284706, -0.0363457053899765], [0.011029733344912529, 0.18277722597122192, 0.030153093859553337, -0.3191279470920563], [0.014685277827084064, 0.37745705246925354, 0.023770535364747047, -0.6021512746810913], [0.022234419360756874, 0.572238564491272, 0.011727509088814259, -0.8872531652450562], [0.03367919102311134, 0.3769594430923462, -0.006017553620040417, -0.5909067392349243], [0.04121837764978409, 0.5721651315689087, -0.017835689708590508, -0.8854791522026062], [0.052661679685115814, 0.3772898018360138, -0.03554527088999748, -0.598456084728241], [0.06020747870206833, 0.18268275260925293, -0.04751439392566681, -0.31717798113822937], [0.06386113166809082, -0.011731371283531189, -0.0538579523563385, -0.039849910885095596], [0.06362650543451309, -0.20604129135608673, -0.05465495213866234, 0.23536576330661774], [0.059505678713321686, -0.4003415107727051, -0.04994763433933258, 0.5103203058242798], [0.05149884894490242, -0.5947255492210388, -0.03974122926592827, 0.7868542671203613], [0.03960433602333069, -0.3990808427333832, -0.024004144594073296, 0.48193809390068054], [0.03162271901965141, -0.5938559174537659, -0.014365381561219692, 0.7669599652290344], [0.0197456032037735, -0.7887771725654602, 0.0009738172520883381, 1.0550884008407593], [0.0039700595661997795, -0.5936681628227234, 0.022075586020946503, 0.7627112865447998], [-0.007903303019702435, -0.7890870571136475, 0.03732981160283089, 1.062258005142212], [-0.023685045540332794, -0.5944787263870239, 0.058574970811605453, 0.7815212607383728], [-0.035574618726968765, -0.4002087712287903, 0.07420539855957031, 0.5078272819519043], [-0.043578796088695526, -0.5962935090065002, 0.08436194062232971, 0.8229413032531738], [-0.05550466477870941, -0.7924619913101196, 0.10082077234983444, 1.140920639038086], [-0.07135390490293503, -0.9887468218803406, 0.12363918125629425, 1.4634437561035156], [-0.09112884104251862, -0.7953375577926636, 0.152908056974411, 1.2118018865585327], [-0.10703559219837189, -0.6024836897850037, 0.1771440953016281, 0.9706763029098511], [-0.11908526718616486, -0.4101244807243347, 0.19655762612819672, 0.7384613156318665], [0.015904536470770836, 0.02349567413330078, 0.00691257556900382, -0.0054565658792853355], [0.01637444831430912, -0.17172472178936005, 0.006803444121032953, 0.28939932584762573], [0.012939954176545143, -0.36694303154945374, 0.01259143091738224, 0.5842201709747314], [0.005601094104349613, -0.1719997078180313, 0.02427583374083042, 0.29553017020225525], [0.0021610998082906008, 0.02276790142059326, 0.03018643707036972, 0.010601237416267395], [0.002616457873955369, 0.21744422614574432, 0.03039846196770668, -0.27240675687789917], [0.006965342443436384, 0.02190200239419937, 0.02495032735168934, 0.02970684878528118], [0.007403382565826178, 0.21665742993354797, 0.025544464588165283, -0.2550007402896881], [0.011736530810594559, 0.02118024416267872, 0.02044445089995861, 0.04562864080071449], [0.012160136364400387, 0.2160031646490097, 0.02135702222585678, -0.24053440988063812], [0.01648019813001156, 0.020582735538482666, 0.016546335071325302, 0.0588078647851944], [0.016891853883862495, 0.2154635787010193, 0.017722491174936295, -0.22860899567604065], [0.021201126277446747, 0.020092912018299103, 0.013150312006473541, 0.06961113214492798], [0.02160298451781273, 0.21502389013767242, 0.014542534947395325, -0.21889396011829376], [0.02590346150100231, 0.40993496775627136, 0.01016465574502945, -0.5069543123245239], [0.03410216048359871, 0.6049122214317322, 2.5568986529833637e-05, -0.7964167594909668], [0.046200405806303024, 0.8000338077545166, -0.015902765095233917, -1.0890916585922241], [0.062201082706451416, 0.9953618049621582, -0.037684597074985504, -1.3867217302322388], [0.08210831880569458, 1.1909326314926147, -0.0654190331697464, -1.6909464597702026], [0.10592696815729141, 1.3867465257644653, -0.09923796355724335, -2.003258466720581], [0.1336618959903717, 1.5827537775039673, -0.13930313289165497, -2.324950695037842], [0.16531698405742645, 1.778838872909546, -0.1858021467924118, -2.6570520401000977], [0.009698866866528988, -0.03878827020525932, 0.0012264170218259096, -0.04481720179319382], [0.008923102170228958, -0.23392778635025024, 0.00033007300226017833, 0.24825242161750793], [0.004244545940309763, -0.038810551166534424, 0.00529512157663703, -0.044326379895210266], [0.0034683351404964924, -0.2340080291032791, 0.004408593755215406, 0.2500225007534027], [-0.0012118255253881216, -0.4291926622390747, 0.009409043937921524, 0.5440927147865295], [-0.009795678779482841, -0.23420418798923492, 0.02029089815914631, 0.2543891668319702], [-0.014479762874543667, -0.42960989475250244, 0.02537868171930313, 0.5534024834632874], [-0.023071959614753723, -0.6250788569450378, 0.03644673153758049, 0.8539720773696899], [-0.03557353839278221, -0.43047213554382324, 0.053526174277067184, 0.5729687809944153], [-0.04418297857046127, -0.2361399233341217, 0.06498555094003677, 0.2976171374320984], [-0.04890577867627144, -0.0420016311109066, 0.07093789428472519, 0.02611670456826687], [-0.04974580928683281, 0.15203510224819183, 0.07146022468805313, -0.24336811900138855], [-0.046705108135938644, -0.04403094947338104, 0.06659286469221115, 0.0709717869758606], [-0.047585729509592056, -0.24004128575325012, 0.0680122971534729, 0.383899450302124], [-0.05238655209541321, -0.045947544276714325, 0.07569028437137604, 0.11341213434934616], [-0.053305502980947495, -0.2420678585767746, 0.07795853167772293, 0.4289820194244385], [-0.05814686045050621, -0.048131510615348816, 0.0865381732583046, 0.16185764968395233], [-0.05910949036478996, 0.14565183222293854, 0.08977532386779785, -0.1023191511631012], [-0.05619645491242409, 0.339380145072937, 0.08772893995046616, -0.3653828799724579], [-0.04940885305404663, 0.1431281417608261, 0.08042128384113312, -0.046377718448638916], [-0.04654628783464432, 0.33701032400131226, 0.07949373126029968, -0.3126426339149475], [-0.03980608284473419, 0.1408511847257614, 0.07324087619781494, 0.004013403318822384], [-0.036989059299230576, 0.3348504900932312, 0.0733211413025856, -0.26469185948371887], [-0.030292049050331116, 0.13876278698444366, 0.0680273100733757, 0.050186559557914734], [-0.027516793459653854, 0.33284667134284973, 0.06903103739023209, -0.22028131783008575], [-0.020859859883785248, 0.5269174575805664, 0.06462541222572327, -0.49041515588760376], [-0.010321510955691338, 0.7210710644721985, 0.05481711030006409, -0.762050986289978], [0.004099910147488117, 0.9153968095779419, 0.03957608714699745, -1.0369936227798462], [0.02240784652531147, 0.7197718024253845, 0.018836217001080513, -0.7321534752845764], [0.03680328279733658, 0.9146284461021423, 0.004193147644400597, -1.0188491344451904], [0.0550958514213562, 1.109694242477417, -0.01618383452296257, -1.31021249294281], [0.07728973776102066, 0.9147809743881226, -0.04238808527588844, -1.0226386785507202], [0.09558535367250443, 1.1104412078857422, -0.06284085661172867, -1.3283237218856812], [0.11779417842626572, 0.9161660671234131, -0.08940733224153519, -1.055949330329895], [0.13611750304698944, 0.7223354578018188, -0.11052632331848145, -0.7926154136657715], [0.15056420862674713, 0.5288903117179871, -0.1263786256313324, -0.5366469025611877], [0.1611420214176178, 0.7255414724349976, -0.13711155951023102, -0.866327702999115], [0.17565284669399261, 0.5325251221656799, -0.15443812310695648, -0.6197049617767334], [0.18630334734916687, 0.7294283509254456, -0.16683222353458405, -0.9567690491676331], [0.20089191198349, 0.9263531565666199, -0.1859675943851471, -1.2968764305114746], [0.036388099193573, 0.019063998013734818, -0.021909575909376144, -0.0377533957362175], [0.036769378930330276, 0.21449317038059235, -0.022664643824100494, -0.3372676968574524], [0.04105924442410469, 0.01970095746219158, -0.029409999027848244, -0.05181725695729256], [0.04145326092839241, 0.2152319997549057, -0.03044634312391281, -0.35363227128982544], [0.045757900923490524, 0.020555909723043442, -0.03751898929476738, -0.07070332020521164], [0.04616902023553848, 0.21619510650634766, -0.038933057337999344, -0.37498360872268677], [0.05049292370676994, 0.021647177636623383, -0.046432726085186005, -0.09482626616954803], [0.05092586576938629, 0.21740281581878662, -0.04832925274968147, -0.4017895758152008], [0.05527392402291298, 0.022998491302132607, -0.05636504292488098, -0.12472683191299438], [0.05573389306664467, -0.17127256095409393, -0.058859579265117645, 0.14965440332889557], [0.05230844020843506, -0.3655044138431549, -0.05586649104952812, 0.4232029616832733], [0.044998351484537125, -0.5597922801971436, -0.047402434051036835, 0.6977638602256775], [0.03380250930786133, -0.7542259693145752, -0.033447157591581345, 0.9751557111740112], [0.018717987462878227, -0.9488837122917175, -0.013944041915237904, 1.2571473121643066], [-0.0002596861741039902, -0.7535860538482666, 0.011198905296623707, 0.960129976272583], [-0.015331408008933067, -0.5586164593696594, 0.030401505529880524, 0.6709862947463989], [-0.026503736153244972, -0.3639300465583801, 0.04382123053073883, 0.38802826404571533], [-0.03378233686089516, -0.5596457123756409, 0.05158179625868797, 0.6941993236541748], [-0.04497525095939636, -0.3652758002281189, 0.0654657781124115, 0.41819047927856445], [-0.052280768752098083, -0.5612614154815674, 0.07382959127426147, 0.7307723760604858], [-0.06350599229335785, -0.3672332465648651, 0.0884450376033783, 0.46220916509628296], [-0.0708506628870964, -0.1734653264284134, 0.09768921881914139, 0.19866232573986053], [-0.07431996613740921, 0.02013351023197174, 0.10166247189044952, -0.061676397919654846], [-0.07391729950904846, -0.17628799378871918, 0.10042893886566162, 0.2612719237804413], [-0.07744305580854416, -0.37268945574760437, 0.10565438121557236, 0.5838661789894104], [-0.08489684760570526, -0.1791938692331314, 0.11733170598745346, 0.32624590396881104], [-0.08848072588443756, -0.3757738471031189, 0.12385661900043488, 0.6535049676895142], [-0.0959962010383606, -0.18257436156272888, 0.13692672550678253, 0.40224650502204895], [-0.09964768588542938, -0.37934577465057373, 0.14497165381908417, 0.7347717881202698], [-0.10723460465669632, -0.18649233877658844, 0.15966708958148956, 0.4909987151622772], [-0.11096444725990295, 0.006059728097170591, 0.16948705911636353, 0.25258734822273254], [-0.11084325611591339, 0.1984073370695114, 0.17453880608081818, 0.017791016027331352], [-0.10687510669231415, 0.0012678105849772692, 0.17489463090896606, 0.36006176471710205], [-0.10684975236654282, 0.1935284286737442, 0.18209585547447205, 0.1272275745868683], [-0.10297918319702148, -0.0036716482136398554, 0.18464040756225586, 0.47137781977653503], [-0.10305261611938477, -0.20085571706295013, 0.19406796991825104, 0.8161028027534485], [0.02159099467098713, -0.0410957932472229, -0.018057698383927345, -0.017980942502617836], [0.02076908014714718, 0.1542804092168808, -0.018417317420244217, -0.31630614399909973], [0.023854687809944153, -0.04057443141937256, -0.024743441492319107, -0.02948783151805401], [0.023043198511004448, -0.23533296585083008, -0.02533319778740406, 0.25528672337532043], [0.018336540088057518, -0.430084228515625, -0.02022746205329895, 0.5398727059364319], [0.00973485503345728, -0.23468387126922607, -0.009430008940398693, 0.2408856600522995], [0.005041177850216627, -0.4296698570251465, -0.004612295888364315, 0.5305792689323425], [-0.003552219131961465, -0.23448331654071808, 0.005999289453029633, 0.2364465594291687], [-0.008241885341703892, -0.0394475944340229, 0.010728220455348492, -0.054337985813617706], [-0.009030837565660477, 0.15551890432834625, 0.009641461074352264, -0.34361687302589417], [-0.005920459516346455, 0.3505023717880249, 0.0027691235300153494, -0.6332439184188843], [0.0010895880404859781, 0.15534189343452454, -0.009895754978060722, -0.339690238237381], [0.004196425899863243, 0.35060325264930725, -0.016689559444785118, -0.6354771852493286], [0.011208491399884224, 0.5459539294242859, -0.029399104416370392, -0.933368980884552], [0.02212757058441639, 0.7414599657058716, -0.048066481947898865, -1.2351433038711548], [0.03695676848292351, 0.9371656179428101, -0.07276935130357742, -1.5424888134002686], [0.05570008233189583, 0.7429899573326111, -0.10361912846565247, -1.2733714580535889], [0.07055988162755966, 0.93927001953125, -0.12908655405044556, -1.5966219902038574], [0.089345283806324, 0.7458931803703308, -0.1610189974308014, -1.3468163013458252], [0.10426314175128937, 0.5531196594238281, -0.1879553198814392, -1.1085317134857178]], "actions": [0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[0.043914392590522766, -0.17926757037639618, -0.03849972411990166, 0.2744724452495575], [0.040329042822122574, 0.016381945461034775, -0.033010274171829224, -0.030100475996732712], [0.040656678378582, 0.21196134388446808, -0.03361228480935097, -0.33301302790641785], [0.04489590600132942, 0.017333533614873886, -0.0402725450694561, -0.05111634358763695], [0.04524257779121399, -0.17718850076198578, -0.041294872760772705, 0.22859320044517517], [0.04169880598783493, 0.018498495221138, -0.03672300651669502, -0.07682429999113083], [0.04206877574324608, -0.17607828974723816, -0.03825949504971504, 0.2040499597787857], [0.03854721039533615, 0.01956932619214058, -0.03417849540710449, -0.1004522517323494], [0.03893859684467316, 0.21516402065753937, -0.036187540739774704, -0.4037194550037384], [0.04324187710881233, 0.020573480054736137, -0.04426192864775658, -0.12266156077384949], [0.043653346598148346, -0.17388731241226196, -0.046715158969163895, 0.15573517978191376], [0.040175601840019226, 0.021871287375688553, -0.043600454926490784, -0.15131163597106934], [0.04061302915215492, 0.21758955717086792, -0.04662668704986572, -0.457424521446228], [0.04496482014656067, 0.023156728595495224, -0.05577518045902252, -0.1797955185174942], [0.04542795196175575, 0.21903061866760254, -0.059371087700128555, -0.48953887820243835], [0.0498085655272007, 0.41493770480155945, -0.06916186958551407, -0.8003265857696533], [0.058107320219278336, 0.22082911431789398, -0.08516839891672134, -0.5301771759986877], [0.06252390146255493, 0.4170393943786621, -0.09577193856239319, -0.8484350442886353], [0.07086469233036041, 0.6133279800415039, -0.1127406433224678, -1.1696325540542603], [0.08313124626874924, 0.8097211122512817, -0.13613329827785492, -1.4954276084899902], [0.09932567179203033, 0.6164917945861816, -0.16604185104370117, -1.2481648921966553], [0.11165551096200943, 0.4238414466381073, -0.191005140542984, -1.0117560625076294], [0.12013233453035355, 0.23170973360538483, -0.2112402617931366, -0.7846143841743469], [-0.0020925127901136875, -0.15408682823181152, 0.03603258728981018, 0.31558704376220703], [-0.0051742494106292725, 0.040503837168216705, 0.04234432801604271, 0.03448180481791496], [-0.004364172462373972, 0.23499378561973572, 0.043033961206674576, -0.2445461004972458], [0.000335703109158203, 0.42947548627853394, 0.03814304247498512, -0.5233504772186279], [0.008925213478505611, 0.2338380515575409, 0.02767603099346161, -0.21889644861221313], [0.013601974584162235, 0.42855367064476013, 0.023298101499676704, -0.5027223229408264], [0.022173047065734863, 0.23311123251914978, 0.013243655674159527, -0.20278918743133545], [0.02683527208864689, 0.4280413091182709, 0.009187871590256691, -0.49126511812210083], [0.03539609909057617, 0.6230324506759644, -0.0006374308723025024, -0.7810382843017578], [0.04785674810409546, 0.42791926860809326, -0.016258196905255318, -0.48855599761009216], [0.0564151331782341, 0.23303042352199554, -0.02602931670844555, -0.2010410726070404], [0.061075739562511444, 0.4285147786140442, -0.030050138011574745, -0.5018200278282166], [0.06964603811502457, 0.23382902145385742, -0.0400865375995636, -0.21875664591789246], [0.07432261854410172, 0.42950037121772766, -0.04446167126297951, -0.5238102078437805], [0.0829126238822937, 0.23503145575523376, -0.054937876760959625, -0.24546249210834503], [0.08761325478553772, 0.04073544219136238, -0.05984712392091751, 0.029398202896118164], [0.08842796087265015, -0.1534794718027115, -0.05925916135311127, 0.3026144802570343], [0.08535837382078171, -0.3477090001106262, -0.05320687219500542, 0.5760353207588196], [0.07840419560670853, -0.15188315510749817, -0.04168616607785225, 0.26707684993743896], [0.07536652684211731, -0.3463861346244812, -0.036344628781080246, 0.54632568359375], [0.0684388056397438, -0.15077289938926697, -0.0254181157797575, 0.2424166053533554], [0.06542334705591202, 0.04470273479819298, -0.020569782704114914, -0.058174245059490204], [0.06631740182638168, 0.24011348187923431, -0.021733267232775688, -0.35727545619010925], [0.07111967355012894, 0.04530715197324753, -0.028878776356577873, -0.07152403146028519], [0.07202581316232681, -0.1493891328573227, -0.03030925802886486, 0.2119094431400299], [0.0690380334854126, -0.3440649211406708, -0.02607106789946556, 0.49487945437431335], [0.062156736850738525, -0.5388096570968628, -0.016173480078577995, 0.7792332768440247], [0.05138054117560387, -0.34346914291381836, -0.0005888136220164597, 0.48150601983070374], [0.044511158019304276, -0.5385828018188477, 0.00904130656272173, 0.7740033268928528], [0.03373950347304344, -0.7338279485702515, 0.024521373212337494, 1.0695171356201172], [0.019062945619225502, -0.5390387177467346, 0.04591171443462372, 0.784629762172699], [0.008282170630991459, -0.7347604632377625, 0.06160430982708931, 1.0913963317871094], [-0.006413038820028305, -0.930637776851654, 0.08343223482370377, 1.4027551412582397], [-0.02502579428255558, -0.7366454601287842, 0.11148734390735626, 1.1372795104980469], [-0.03975870460271835, -0.9330348372459412, 0.13423292338848114, 1.462744116783142], [-0.058419398963451385, -1.1295219659805298, 0.16348780691623688, 1.794169545173645], [-0.08100984245538712, -0.9365659356117249, 0.19937120378017426, 1.5564465522766113], [-0.09974116086959839, -0.7443118095397949, 0.23050013184547424, 1.3320053815841675], [0.011029733344912529, 0.18277722597122192, 0.030153093859553337, -0.3191279470920563], [0.014685277827084064, 0.37745705246925354, 0.023770535364747047, -0.6021512746810913], [0.022234419360756874, 0.572238564491272, 0.011727509088814259, -0.8872531652450562], [0.03367919102311134, 0.3769594430923462, -0.006017553620040417, -0.5909067392349243], [0.04121837764978409, 0.5721651315689087, -0.017835689708590508, -0.8854791522026062], [0.052661679685115814, 0.3772898018360138, -0.03554527088999748, -0.598456084728241], [0.06020747870206833, 0.18268275260925293, -0.04751439392566681, -0.31717798113822937], [0.06386113166809082, -0.011731371283531189, -0.0538579523563385, -0.039849910885095596], [0.06362650543451309, -0.20604129135608673, -0.05465495213866234, 0.23536576330661774], [0.059505678713321686, -0.4003415107727051, -0.04994763433933258, 0.5103203058242798], [0.05149884894490242, -0.5947255492210388, -0.03974122926592827, 0.7868542671203613], [0.03960433602333069, -0.3990808427333832, -0.024004144594073296, 0.48193809390068054], [0.03162271901965141, -0.5938559174537659, -0.014365381561219692, 0.7669599652290344], [0.0197456032037735, -0.7887771725654602, 0.0009738172520883381, 1.0550884008407593], [0.0039700595661997795, -0.5936681628227234, 0.022075586020946503, 0.7627112865447998], [-0.007903303019702435, -0.7890870571136475, 0.03732981160283089, 1.062258005142212], [-0.023685045540332794, -0.5944787263870239, 0.058574970811605453, 0.7815212607383728], [-0.035574618726968765, -0.4002087712287903, 0.07420539855957031, 0.5078272819519043], [-0.043578796088695526, -0.5962935090065002, 0.08436194062232971, 0.8229413032531738], [-0.05550466477870941, -0.7924619913101196, 0.10082077234983444, 1.140920639038086], [-0.07135390490293503, -0.9887468218803406, 0.12363918125629425, 1.4634437561035156], [-0.09112884104251862, -0.7953375577926636, 0.152908056974411, 1.2118018865585327], [-0.10703559219837189, -0.6024836897850037, 0.1771440953016281, 0.9706763029098511], [-0.11908526718616486, -0.4101244807243347, 0.19655762612819672, 0.7384613156318665], [-0.12728776037693024, -0.6073390245437622, 0.21132685244083405, 1.0860035419464111], [0.01637444831430912, -0.17172472178936005, 0.006803444121032953, 0.28939932584762573], [0.012939954176545143, -0.36694303154945374, 0.01259143091738224, 0.5842201709747314], [0.005601094104349613, -0.1719997078180313, 0.02427583374083042, 0.29553017020225525], [0.0021610998082906008, 0.02276790142059326, 0.03018643707036972, 0.010601237416267395], [0.002616457873955369, 0.21744422614574432, 0.03039846196770668, -0.27240675687789917], [0.006965342443436384, 0.02190200239419937, 0.02495032735168934, 0.02970684878528118], [0.007403382565826178, 0.21665742993354797, 0.025544464588165283, -0.2550007402896881], [0.011736530810594559, 0.02118024416267872, 0.02044445089995861, 0.04562864080071449], [0.012160136364400387, 0.2160031646490097, 0.02135702222585678, -0.24053440988063812], [0.01648019813001156, 0.020582735538482666, 0.016546335071325302, 0.0588078647851944], [0.016891853883862495, 0.2154635787010193, 0.017722491174936295, -0.22860899567604065], [0.021201126277446747, 0.020092912018299103, 0.013150312006473541, 0.06961113214492798], [0.02160298451781273, 0.21502389013767242, 0.014542534947395325, -0.21889396011829376], [0.02590346150100231, 0.40993496775627136, 0.01016465574502945, -0.5069543123245239], [0.03410216048359871, 0.6049122214317322, 2.5568986529833637e-05, -0.7964167594909668], [0.046200405806303024, 0.8000338077545166, -0.015902765095233917, -1.0890916585922241], [0.062201082706451416, 0.9953618049621582, -0.037684597074985504, -1.3867217302322388], [0.08210831880569458, 1.1909326314926147, -0.0654190331697464, -1.6909464597702026], [0.10592696815729141, 1.3867465257644653, -0.09923796355724335, -2.003258466720581], [0.1336618959903717, 1.5827537775039673, -0.13930313289165497, -2.324950695037842], [0.16531698405742645, 1.778838872909546, -0.1858021467924118, -2.6570520401000977], [0.20089375972747803, 1.974802851676941, -0.2389431893825531, -3.000250816345215], [0.008923102170228958, -0.23392778635025024, 0.00033007300226017833, 0.24825242161750793], [0.004244545940309763, -0.038810551166534424, 0.00529512157663703, -0.044326379895210266], [0.0034683351404964924, -0.2340080291032791, 0.004408593755215406, 0.2500225007534027], [-0.0012118255253881216, -0.4291926622390747, 0.009409043937921524, 0.5440927147865295], [-0.009795678779482841, -0.23420418798923492, 0.02029089815914631, 0.2543891668319702], [-0.014479762874543667, -0.42960989475250244, 0.02537868171930313, 0.5534024834632874], [-0.023071959614753723, -0.6250788569450378, 0.03644673153758049, 0.8539720773696899], [-0.03557353839278221, -0.43047213554382324, 0.053526174277067184, 0.5729687809944153], [-0.04418297857046127, -0.2361399233341217, 0.06498555094003677, 0.2976171374320984], [-0.04890577867627144, -0.0420016311109066, 0.07093789428472519, 0.02611670456826687], [-0.04974580928683281, 0.15203510224819183, 0.07146022468805313, -0.24336811900138855], [-0.046705108135938644, -0.04403094947338104, 0.06659286469221115, 0.0709717869758606], [-0.047585729509592056, -0.24004128575325012, 0.0680122971534729, 0.383899450302124], [-0.05238655209541321, -0.045947544276714325, 0.07569028437137604, 0.11341213434934616], [-0.053305502980947495, -0.2420678585767746, 0.07795853167772293, 0.4289820194244385], [-0.05814686045050621, -0.048131510615348816, 0.0865381732583046, 0.16185764968395233], [-0.05910949036478996, 0.14565183222293854, 0.08977532386779785, -0.1023191511631012], [-0.05619645491242409, 0.339380145072937, 0.08772893995046616, -0.3653828799724579], [-0.04940885305404663, 0.1431281417608261, 0.08042128384113312, -0.046377718448638916], [-0.04654628783464432, 0.33701032400131226, 0.07949373126029968, -0.3126426339149475], [-0.03980608284473419, 0.1408511847257614, 0.07324087619781494, 0.004013403318822384], [-0.036989059299230576, 0.3348504900932312, 0.0733211413025856, -0.26469185948371887], [-0.030292049050331116, 0.13876278698444366, 0.0680273100733757, 0.050186559557914734], [-0.027516793459653854, 0.33284667134284973, 0.06903103739023209, -0.22028131783008575], [-0.020859859883785248, 0.5269174575805664, 0.06462541222572327, -0.49041515588760376], [-0.010321510955691338, 0.7210710644721985, 0.05481711030006409, -0.762050986289978], [0.004099910147488117, 0.9153968095779419, 0.03957608714699745, -1.0369936227798462], [0.02240784652531147, 0.7197718024253845, 0.018836217001080513, -0.7321534752845764], [0.03680328279733658, 0.9146284461021423, 0.004193147644400597, -1.0188491344451904], [0.0550958514213562, 1.109694242477417, -0.01618383452296257, -1.31021249294281], [0.07728973776102066, 0.9147809743881226, -0.04238808527588844, -1.0226386785507202], [0.09558535367250443, 1.1104412078857422, -0.06284085661172867, -1.3283237218856812], [0.11779417842626572, 0.9161660671234131, -0.08940733224153519, -1.055949330329895], [0.13611750304698944, 0.7223354578018188, -0.11052632331848145, -0.7926154136657715], [0.15056420862674713, 0.5288903117179871, -0.1263786256313324, -0.5366469025611877], [0.1611420214176178, 0.7255414724349976, -0.13711155951023102, -0.866327702999115], [0.17565284669399261, 0.5325251221656799, -0.15443812310695648, -0.6197049617767334], [0.18630334734916687, 0.7294283509254456, -0.16683222353458405, -0.9567690491676331], [0.20089191198349, 0.9263531565666199, -0.1859675943851471, -1.2968764305114746], [0.2194189727306366, 1.1232850551605225, -0.21190513670444489, -1.6415408849716187], [0.036769378930330276, 0.21449317038059235, -0.022664643824100494, -0.3372676968574524], [0.04105924442410469, 0.01970095746219158, -0.029409999027848244, -0.05181725695729256], [0.04145326092839241, 0.2152319997549057, -0.03044634312391281, -0.35363227128982544], [0.045757900923490524, 0.020555909723043442, -0.03751898929476738, -0.07070332020521164], [0.04616902023553848, 0.21619510650634766, -0.038933057337999344, -0.37498360872268677], [0.05049292370676994, 0.021647177636623383, -0.046432726085186005, -0.09482626616954803], [0.05092586576938629, 0.21740281581878662, -0.04832925274968147, -0.4017895758152008], [0.05527392402291298, 0.022998491302132607, -0.05636504292488098, -0.12472683191299438], [0.05573389306664467, -0.17127256095409393, -0.058859579265117645, 0.14965440332889557], [0.05230844020843506, -0.3655044138431549, -0.05586649104952812, 0.4232029616832733], [0.044998351484537125, -0.5597922801971436, -0.047402434051036835, 0.6977638602256775], [0.03380250930786133, -0.7542259693145752, -0.033447157591581345, 0.9751557111740112], [0.018717987462878227, -0.9488837122917175, -0.013944041915237904, 1.2571473121643066], [-0.0002596861741039902, -0.7535860538482666, 0.011198905296623707, 0.960129976272583], [-0.015331408008933067, -0.5586164593696594, 0.030401505529880524, 0.6709862947463989], [-0.026503736153244972, -0.3639300465583801, 0.04382123053073883, 0.38802826404571533], [-0.03378233686089516, -0.5596457123756409, 0.05158179625868797, 0.6941993236541748], [-0.04497525095939636, -0.3652758002281189, 0.0654657781124115, 0.41819047927856445], [-0.052280768752098083, -0.5612614154815674, 0.07382959127426147, 0.7307723760604858], [-0.06350599229335785, -0.3672332465648651, 0.0884450376033783, 0.46220916509628296], [-0.0708506628870964, -0.1734653264284134, 0.09768921881914139, 0.19866232573986053], [-0.07431996613740921, 0.02013351023197174, 0.10166247189044952, -0.061676397919654846], [-0.07391729950904846, -0.17628799378871918, 0.10042893886566162, 0.2612719237804413], [-0.07744305580854416, -0.37268945574760437, 0.10565438121557236, 0.5838661789894104], [-0.08489684760570526, -0.1791938692331314, 0.11733170598745346, 0.32624590396881104], [-0.08848072588443756, -0.3757738471031189, 0.12385661900043488, 0.6535049676895142], [-0.0959962010383606, -0.18257436156272888, 0.13692672550678253, 0.40224650502204895], [-0.09964768588542938, -0.37934577465057373, 0.14497165381908417, 0.7347717881202698], [-0.10723460465669632, -0.18649233877658844, 0.15966708958148956, 0.4909987151622772], [-0.11096444725990295, 0.006059728097170591, 0.16948705911636353, 0.25258734822273254], [-0.11084325611591339, 0.1984073370695114, 0.17453880608081818, 0.017791016027331352], [-0.10687510669231415, 0.0012678105849772692, 0.17489463090896606, 0.36006176471710205], [-0.10684975236654282, 0.1935284286737442, 0.18209585547447205, 0.1272275745868683], [-0.10297918319702148, -0.0036716482136398554, 0.18464040756225586, 0.47137781977653503], [-0.10305261611938477, -0.20085571706295013, 0.19406796991825104, 0.8161028027534485], [-0.10706973075866699, -0.398029625415802, 0.21039003133773804, 1.1630101203918457], [0.02076908014714718, 0.1542804092168808, -0.018417317420244217, -0.31630614399909973], [0.023854687809944153, -0.04057443141937256, -0.024743441492319107, -0.02948783151805401], [0.023043198511004448, -0.23533296585083008, -0.02533319778740406, 0.25528672337532043], [0.018336540088057518, -0.430084228515625, -0.02022746205329895, 0.5398727059364319], [0.00973485503345728, -0.23468387126922607, -0.009430008940398693, 0.2408856600522995], [0.005041177850216627, -0.4296698570251465, -0.004612295888364315, 0.5305792689323425], [-0.003552219131961465, -0.23448331654071808, 0.005999289453029633, 0.2364465594291687], [-0.008241885341703892, -0.0394475944340229, 0.010728220455348492, -0.054337985813617706], [-0.009030837565660477, 0.15551890432834625, 0.009641461074352264, -0.34361687302589417], [-0.005920459516346455, 0.3505023717880249, 0.0027691235300153494, -0.6332439184188843], [0.0010895880404859781, 0.15534189343452454, -0.009895754978060722, -0.339690238237381], [0.004196425899863243, 0.35060325264930725, -0.016689559444785118, -0.6354771852493286], [0.011208491399884224, 0.5459539294242859, -0.029399104416370392, -0.933368980884552], [0.02212757058441639, 0.7414599657058716, -0.048066481947898865, -1.2351433038711548], [0.03695676848292351, 0.9371656179428101, -0.07276935130357742, -1.5424888134002686], [0.05570008233189583, 0.7429899573326111, -0.10361912846565247, -1.2733714580535889], [0.07055988162755966, 0.93927001953125, -0.12908655405044556, -1.5966219902038574], [0.089345283806324, 0.7458931803703308, -0.1610189974308014, -1.3468163013458252], [0.10426314175128937, 0.5531196594238281, -0.1879553198814392, -1.1085317134857178], [0.11532554030418396, 0.3608972430229187, -0.21012595295906067, -0.8802102208137512]], "action_prob": [0.500144898891449, 0.500501811504364, 0.499835729598999, 0.5008118748664856, 0.5002107620239258, 0.5004433393478394, 0.5002355575561523, 0.50042325258255, 0.4997405409812927, 0.5008828043937683, 0.5003125071525574, 0.5003477334976196, 0.4996538460254669, 0.5009505748748779, 0.4995894730091095, 0.49899590015411377, 0.501352071762085, 0.49890828132629395, 0.49858030676841736, 0.498427152633667, 0.5016476511955261, 0.5016722083091736, 0.5016381740570068, 0.4999805986881256, 0.5006897449493408, 0.5000648498535156, 0.4994259178638458, 0.5010260939598083, 0.49941372871398926, 0.501050591468811, 0.49939313530921936, 0.4989210367202759, 0.5013319849967957, 0.5011382102966309, 0.49929237365722656, 0.5011801719665527, 0.499235600233078, 0.5012273788452148, 0.5008317232131958, 0.5002203583717346, 0.49958324432373047, 0.5008840560913086, 0.49958091974258423, 0.5009030103683472, 0.5004306435585022, 0.4997577667236328, 0.5008680820465088, 0.5002811551094055, 0.4996178150177002, 0.49910834431648254, 0.5011872053146362, 0.4990571439266205, 0.4987601041793823, 0.5013870000839233, 0.49867868423461914, 0.4985411465167999, 0.5015289783477783, 0.4984467029571533, 0.49838754534721375, 0.5016543865203857, 0.5017146468162537, 0.5000262260437012, 0.499386191368103, 0.49893996119499207, 0.5013019442558289, 0.49887967109680176, 0.5013609528541565, 0.501190185546875, 0.5007992386817932, 0.5001899600028992, 0.4995485246181488, 0.4990783929824829, 0.5011894106864929, 0.49903404712677, 0.49876004457473755, 0.5013759136199951, 0.49868249893188477, 0.5014462471008301, 0.5013993978500366, 0.4987850785255432, 0.49853816628456116, 0.4984329342842102, 0.5016177892684937, 0.5016595125198364, 0.5016636252403259, 0.49841776490211487, 0.5000452995300293, 0.4993833303451538, 0.5010817050933838, 0.5006657838821411, 0.5000340938568115, 0.5006076693534851, 0.5000455975532532, 0.5006020665168762, 0.5000542402267456, 0.5005980730056763, 0.5000604391098022, 0.5005956888198853, 0.5000644326210022, 0.49940523505210876, 0.49893099069595337, 0.49867546558380127, 0.4985547959804535, 0.4984920918941498, 0.4984467625617981, 0.4984036982059479, 0.4983600676059723, 0.4983176589012146, 0.49999743700027466, 0.500655472278595, 0.4999842643737793, 0.4993303716182709, 0.5011191368103027, 0.499284565448761, 0.49883773922920227, 0.5013903379440308, 0.5012369751930237, 0.5008723139762878, 0.5002844333648682, 0.5003599524497986, 0.4996660053730011, 0.5009623765945435, 0.4995875954627991, 0.5010242462158203, 0.5005006790161133, 0.4998566508293152, 0.5006927847862244, 0.4999021589756012, 0.5006699562072754, 0.49994590878486633, 0.500645101070404, 0.49998846650123596, 0.499381959438324, 0.4989680051803589, 0.49874264001846313, 0.5013712048530579, 0.4986681044101715, 0.4985584020614624, 0.5014998912811279, 0.4984700381755829, 0.5015770792961121, 0.5016149878501892, 0.5016098618507385, 0.49849942326545715, 0.5016684532165527, 0.4984081983566284, 0.4982715845108032, 0.49823230504989624, 0.49984681606292725, 0.5007953643798828, 0.4998091459274292, 0.5008298754692078, 0.4997639060020447, 0.5008699297904968, 0.4997102916240692, 0.5009160041809082, 0.5003525614738464, 0.4996970295906067, 0.4991736114025116, 0.4988597631454468, 0.4986971616744995, 0.5013903379440308, 0.5013906359672546, 0.5013047456741333, 0.4989554286003113, 0.5013596415519714, 0.49887967109680176, 0.5014185309410095, 0.5012056827545166, 0.5007681250572205, 0.4998500943183899, 0.49915412068367004, 0.5013178586959839, 0.4990460276603699, 0.5013906359672546, 0.4989292621612549, 0.5014668703079224, 0.5011940598487854, 0.5007163286209106, 0.49988386034965515, 0.5008432269096375, 0.49973708391189575, 0.49903249740600586, 0.4985611140727997, 0.4999925196170807, 0.5006721019744873, 0.500038206577301, 0.4993961751461029, 0.5010507106781006, 0.4993702173233032, 0.5010833740234375, 0.5006653666496277, 0.5000249147415161, 0.49937674403190613, 0.5010733604431152, 0.49933528900146484, 0.49888378381729126, 0.4986441135406494, 0.4985271990299225, 0.5015386343002319, 0.49842771887779236, 0.5016289949417114, 0.501672625541687, 0.5016801953315735], "advantages": [20.638458251953125, 19.839492797851562, 19.026885986328125, 18.20616340637207, 17.382604598999023, 16.550785064697266, 15.704916954040527, 14.85617733001709, 13.993186950683594, 13.121712684631348, 12.246697425842285, 11.363025665283203, 10.464713096618652, 9.557663917541504, 8.646533012390137, 7.721145153045654, 6.787222862243652, 5.847266674041748, 4.894478797912598, 3.932813882827759, 2.961942195892334, 1.9821118116378784, 0.9926413893699646, 31.74469566345215, 31.0580997467041, 30.35905647277832, 29.652942657470703, 28.940214157104492, 28.224853515625, 27.497615814208984, 26.767688751220703, 26.025667190551758, 25.276851654052734, 24.523752212524414, 23.763710021972656, 22.991252899169922, 22.215673446655273, 21.427579879760742, 20.63612937927246, 19.83712387084961, 19.029972076416016, 18.214109420776367, 17.385635375976562, 16.553272247314453, 15.708002090454102, 14.853675842285156, 13.990864753723145, 13.124733924865723, 12.249951362609863, 11.3658447265625, 10.472101211547852, 9.56607723236084, 8.654221534729004, 7.732516765594482, 6.799525737762451, 5.859103202819824, 4.908712387084961, 3.947740316390991, 2.978013515472412, 1.9981924295425415, 1.0081778764724731, 22.21763801574707, 21.429302215576172, 20.63358497619629, 19.830520629882812, 19.022239685058594, 18.202836990356445, 17.37805938720703, 16.545610427856445, 15.705268859863281, 14.856450080871582, 13.998549461364746, 13.131319046020508, 12.252137184143066, 11.367363929748535, 10.47305679321289, 9.567687034606934, 8.65524673461914, 7.7315802574157715, 6.798043727874756, 5.858274459838867, 4.9083251953125, 3.948310613632202, 2.977725028991699, 1.9970821142196655, 1.0061932802200317, 19.83690643310547, 19.029966354370117, 18.21426773071289, 17.38597297668457, 16.548778533935547, 15.70314884185791, 14.854546546936035, 13.991771697998047, 13.125883102416992, 12.245621681213379, 11.36209487915039, 10.463996887207031, 9.562470436096191, 8.646178245544434, 7.721130847930908, 6.787444591522217, 5.8449273109436035, 4.893316268920898, 3.9323740005493164, 2.961902618408203, 1.9817357063293457, 0.9917305707931519, 33.10247039794922, 32.429527282714844, 31.74419403076172, 31.057540893554688, 30.363374710083008, 29.65774154663086, 28.949460983276367, 28.233272552490234, 27.506921768188477, 26.772605895996094, 26.030366897583008, 25.280595779418945, 24.528879165649414, 23.769363403320312, 22.996898651123047, 22.221858978271484, 21.43385887145996, 20.637653350830078, 19.83368492126465, 19.02678871154785, 18.20644760131836, 17.38316535949707, 16.546144485473633, 15.70612907409668, 14.852109909057617, 13.989964485168457, 13.119726181030273, 12.241214752197266, 11.35590648651123, 10.459485054016113, 9.554424285888672, 8.641484260559082, 7.718023777008057, 6.786465167999268, 5.845848560333252, 4.89618444442749, 3.9338626861572266, 2.964705467224121, 1.9830141067504883, 0.9920801520347595, 30.35830307006836, 29.652074813842773, 28.94415855407715, 28.22364616394043, 27.501258850097656, 26.766178131103516, 26.029016494750977, 25.27907943725586, 24.526832580566406, 23.767168045043945, 22.999448776245117, 22.223325729370117, 21.438772201538086, 20.645854949951172, 19.84355354309082, 19.03266716003418, 18.21297264099121, 17.38875389099121, 16.552547454833984, 15.711528778076172, 14.858503341674805, 13.996281623840332, 13.125004768371582, 12.25055980682373, 11.366640090942383, 10.46941089630127, 9.567378044128418, 8.652154922485352, 7.731610298156738, 6.798051834106445, 5.854562282562256, 4.901265621185303, 3.943890333175659, 2.9713807106018066, 1.9943698644638062, 1.006574273109436, 18.209165573120117, 17.380184173583984, 16.548362731933594, 15.708123207092285, 14.858839988708496, 13.99651050567627, 13.13000202178955, 12.250229835510254, 11.36107349395752, 10.463041305541992, 9.556570053100586, 8.645134925842285, 7.720257759094238, 6.786786079406738, 5.844465255737305, 4.893013000488281, 3.9326839447021484, 2.9619405269622803, 1.982016921043396, 0.9924078583717346], "value_targets": [20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [2755081, 2755081, 2755081, 2755081, 2755081, 2755081, 2755081, 2755081, 2755081, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 578045844, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 625175134, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 1617312608, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 626142221, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 99979342, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851, 704409851], "obs": [[-0.038227278739213943, 0.03421524912118912, -0.023869682103395462, 0.042771004140377045], [-0.03754297271370888, 0.22967121005058289, -0.023014262318611145, -0.25734642148017883], [-0.032949548214673996, 0.4251140356063843, -0.028161190450191498, -0.5571986436843872], [-0.02444726787507534, 0.6206197738647461, -0.03930516541004181, -0.8586192727088928], [-0.01203487254679203, 0.8162544965744019, -0.05647755041718483, -1.1633974313735962], [0.004290217068046331, 1.0120644569396973, -0.07974550127983093, -1.4732396602630615], [0.02453150600194931, 1.2080656290054321, -0.1092102900147438, -1.7897273302078247], [0.048692818731069565, 1.4042302370071411, -0.14500483870506287, -2.1142654418945312], [0.07677742093801498, 1.6004726886749268, -0.18729014694690704, -2.4480221271514893], [-0.01498539187014103, -0.0029599731788039207, 0.01599946804344654, -0.027393843978643417], [-0.015044591389596462, 0.1919289231300354, 0.015451591461896896, -0.31498613953590393], [-0.011206013150513172, 0.38682740926742554, 0.009151868522167206, -0.6027563810348511], [-0.0034694650676101446, 0.5818201303482056, -0.002903258427977562, -0.8925426602363586], [0.008166938088834286, 0.3867377042770386, -0.02075411193072796, -0.6007737517356873], [0.01590169221162796, 0.5821437239646912, -0.0327695868909359, -0.8999209403991699], [0.027544567361474037, 0.7776941061019897, -0.05076800659298897, -1.2027214765548706], [0.04309844970703125, 0.5832639932632446, -0.07482243329286575, -0.9263715147972107], [0.054763730615377426, 0.38922786712646484, -0.0933498665690422, -0.6581089496612549], [0.06254828721284866, 0.585516631603241, -0.10651204735040665, -0.9786651730537415], [0.07425861805677414, 0.3919714093208313, -0.1260853409767151, -0.7212479710578918], [0.08209804445505142, 0.5885911583900452, -0.14051030576229095, -1.0508073568344116], [0.09386987239122391, 0.3955840468406677, -0.16152645647525787, -0.805324137210846], [0.10178155452013016, 0.5925080180168152, -0.17763294279575348, -1.144147515296936], [0.1136317104101181, 0.40009424090385437, -0.20051588118076324, -0.9120182991027832], [-0.03759820759296417, 0.022775495424866676, -0.023352809250354767, 0.0025434771087020636], [-0.03714269772171974, 0.218224436044693, -0.02330193854868412, -0.2974151074886322], [-0.03277820721268654, 0.41367068886756897, -0.029250241816043854, -0.5973550081253052], [-0.02450479380786419, 0.21896998584270477, -0.041197340935468674, -0.31402724981307983], [-0.02012539468705654, 0.024458374828100204, -0.04747788608074188, -0.03461599349975586], [-0.019636226817965508, -0.16995170712471008, -0.04817020520567894, 0.24271726608276367], [-0.023035261780023575, -0.3643536865711212, -0.043315861374139786, 0.5198253989219666], [-0.03032233566045761, -0.5588399171829224, -0.03291935473680496, 0.7985502481460571], [-0.04149913415312767, -0.363282173871994, -0.01694834791123867, 0.4956960380077362], [-0.048764776438474655, -0.5581610798835754, -0.0070344265550374985, 0.7829898595809937], [-0.05992799997329712, -0.7531856894493103, 0.008625369518995285, 1.0734513998031616], [-0.07499171048402786, -0.948420524597168, 0.030094396322965622, 1.3688286542892456], [-0.09396012127399445, -1.1439058780670166, 0.05747096985578537, 1.670770287513733], [-0.116838239133358, -0.949496865272522, 0.09088637679815292, 1.396525263786316], [-0.1358281821012497, -1.1456241607666016, 0.11881688237190247, 1.7161859273910522], [-0.15874065458774567, -1.3418917655944824, 0.1531406044960022, 2.0433616638183594], [-0.18557849526405334, -1.5382200479507446, 0.19400782883167267, 2.3792552947998047], [-0.027703123167157173, -0.007142084650695324, 0.005460320971906185, 0.04905525594949722], [-0.027845963835716248, -0.20234189927577972, 0.0064414264634251595, 0.3434559404850006], [-0.0318928025662899, -0.007312180940061808, 0.01331054512411356, 0.05281119793653488], [-0.03203904628753662, -0.2026224285364151, 0.01436676923185587, 0.3496638238430023], [-0.03609149530529976, -0.007707725279033184, 0.021360045298933983, 0.06154560297727585], [-0.03624564781785011, 0.1871015578508377, 0.022590957581996918, -0.22432228922843933], [-0.03250361606478691, 0.38189348578453064, 0.018104512244462967, -0.5097944140434265], [-0.02486574836075306, 0.18652120232582092, 0.007908623665571213, -0.2114616185426712], [-0.021135324612259865, 0.38152918219566345, 0.003679390763863921, -0.5016393661499023], [-0.01350474078208208, 0.1863555759191513, -0.006353395991027355, -0.20779915153980255], [-0.009777628816664219, 0.3815678060054779, -0.010509379208087921, -0.5024794340133667], [-0.0021462731529027224, 0.5768362879753113, -0.02055896818637848, -0.7984557151794434], [0.00939045287668705, 0.7722342014312744, -0.0365280844271183, -1.0975345373153687], [0.02483513578772545, 0.9678175449371338, -0.05847877264022827, -1.401450753211975], [0.04419148713350296, 0.7734689116477966, -0.08650778979063034, -1.127609133720398], [0.059660863131284714, 0.5795801281929016, -0.10905996710062027, -0.8632650971412659], [0.07125246524810791, 0.3860985040664673, -0.12632526457309723, -0.606766939163208], [0.07897444069385529, 0.1929481029510498, -0.13846060633659363, -0.35639098286628723], [0.08283340185880661, 3.8383463106583804e-05, -0.14558842778205872, -0.11037318408489227], [0.0828341692686081, -0.1927298605442047, -0.1477959007024765, 0.13306820392608643], [0.07897957414388657, -0.38545966148376465, -0.14513452351093292, 0.37571725249290466], [0.07127037644386292, -0.5782541632652283, -0.13762018084526062, 0.6193485856056213], [0.05970529466867447, -0.7712128758430481, -0.1252332180738449, 0.8657174110412598], [0.04428103566169739, -0.5746293663978577, -0.1079188659787178, 0.5364290475845337], [0.03278845176100731, -0.7680816054344177, -0.09719028323888779, 0.7932526469230652], [0.01742681860923767, -0.5717693567276001, -0.0813252329826355, 0.4716450273990631], [0.005991430953145027, -0.7656541466712952, -0.07189232856035233, 0.7376277446746826], [-0.009321652352809906, -0.5696168541908264, -0.05713977664709091, 0.4232132136821747], [-0.020713988691568375, -0.3737339377403259, -0.04867551103234291, 0.11307841539382935], [-0.028188668191432953, -0.17794953286647797, -0.04641394317150116, -0.19455531239509583], [-0.03174765780568123, -0.372377872467041, -0.05030504986643791, 0.08313234150409698], [-0.039195217192173004, -0.5667439699172974, -0.04864240065217018, 0.3595292270183563], [-0.050530094653367996, -0.7611419558525085, -0.041451819241046906, 0.6364859938621521], [-0.06575293093919754, -0.9556620121002197, -0.028722098097205162, 0.9158321619033813], [-0.08486617356538773, -0.7601636648178101, -0.010405454784631729, 0.6142624616622925], [-0.10006944835186005, -0.564897894859314, 0.00187979475595057, 0.31832048296928406], [-0.11136740446090698, -0.7600465416908264, 0.008246204815804958, 0.611595630645752], [-0.12656833231449127, -0.5650408267974854, 0.02047811634838581, 0.3215213418006897], [-0.13786914944648743, -0.37021639943122864, 0.026908542960882187, 0.03536610305309296], [-0.14527347683906555, -0.56571364402771, 0.0276158656924963, 0.3364160358905792], [-0.15658774971961975, -0.7612175345420837, 0.03434418514370918, 0.6376780271530151], [-0.17181210219860077, -0.5665909051895142, 0.04709774628281593, 0.3560054302215576], [-0.18314392864704132, -0.3721691071987152, 0.054217856377363205, 0.07853776961565018], [-0.19058731198310852, -0.5680246949195862, 0.05578861013054848, 0.38782167434692383], [-0.20194779336452484, -0.3737371861934662, 0.06354504823684692, 0.1132371798157692], [-0.2094225436449051, -0.5697094202041626, 0.06580978631973267, 0.4252718687057495], [-0.2208167314529419, -0.3755783438682556, 0.07431522756814957, 0.15403978526592255], [-0.22832830250263214, -0.5716813802719116, 0.07739602029323578, 0.4692109525203705], [-0.23976191878318787, -0.37773317098617554, 0.08678024262189865, 0.20189130306243896], [-0.24731658399105072, -0.5739821195602417, 0.09081806987524033, 0.5206384062767029], [-0.25879624485969543, -0.770257294178009, 0.10123083740472794, 0.840501606464386], [-0.274201363325119, -0.5766522884368896, 0.11804086714982986, 0.5812918543815613], [-0.2857344150543213, -0.38336482644081116, 0.12966670095920563, 0.3280017673969269], [-0.29340171813964844, -0.19030433893203735, 0.13622674345970154, 0.07885738462209702], [-0.2972078025341034, -0.3870895206928253, 0.13780388236045837, 0.41122737526893616], [-0.3049495816230774, -0.19416266679763794, 0.14602842926979065, 0.16496673226356506], [-0.3088328540325165, -0.3910403549671173, 0.14932776987552643, 0.4999200999736786], [-0.31665366888046265, -0.19830414652824402, 0.15932616591453552, 0.2577725350856781], [-0.32061973214149475, -0.005773007404059172, 0.16448162496089935, 0.019277557730674744], [-0.3207351863384247, 0.18665491044521332, 0.16486717760562897, -0.2173287719488144], [-0.3170020878314972, -0.010392938740551472, 0.16052059829235077, 0.12248675525188446], [-0.31720995903015137, -0.20740704238414764, 0.16297033429145813, 0.46119940280914307], [-0.3213581144809723, -0.014918265864253044, 0.17219431698322296, 0.22399349510669708], [-0.3216564655303955, 0.17737798392772675, 0.17667418718338013, -0.009809797629714012], [-0.3181089162826538, -0.019779687747359276, 0.17647799849510193, 0.33299559354782104], [-0.3185045123100281, -0.2169167697429657, 0.183137908577919, 0.6757239699363708], [-0.3228428363800049, -0.41404733061790466, 0.1966523826122284, 1.0200170278549194], [0.00201775343157351, -0.017038404941558838, 0.022872230038046837, -0.032315559685230255], [0.0016769854119047523, -0.21248075366020203, 0.022225920110940933, 0.26749515533447266], [-0.0025726298335939646, -0.017682945355772972, 0.027575822547078133, -0.018095528706908226], [-0.002926288638263941, 0.17703290283679962, 0.027213912457227707, -0.3019520044326782], [0.000614369404502213, -0.018466128036379814, 0.021174872294068336, -0.0008121278369799256], [0.0002450468600727618, -0.21388526260852814, 0.021158630028367043, 0.29847580194473267], [-0.004032658413052559, -0.019071202725172043, 0.027128145098686218, 0.012540300376713276], [-0.004414082504808903, -0.2145714908838272, 0.027378952130675316, 0.3136575222015381], [-0.008705511689186096, -0.41007256507873535, 0.03365210071206093, 0.6148476004600525], [-0.016906963661313057, -0.6056481599807739, 0.0459490530192852, 0.9179368019104004], [-0.029019925743341446, -0.41117650270462036, 0.0643077865242958, 0.6400414705276489], [-0.03724345564842224, -0.21700727939605713, 0.07710862159729004, 0.36828312277793884], [-0.041583601385354996, -0.4131353497505188, 0.08447428047657013, 0.6842485666275024], [-0.049846310168504715, -0.6093223094940186, 0.09815925359725952, 1.0022854804992676], [-0.062032755464315414, -0.41563913226127625, 0.11820496618747711, 0.7419717907905579], [-0.07034553587436676, -0.22233004868030548, 0.13304439187049866, 0.4887029230594635], [-0.07479213923215866, -0.41905340552330017, 0.14281845092773438, 0.8201799392700195], [-0.08317320793867111, -0.615810751914978, 0.1592220515012741, 1.1541571617126465], [-0.09548941999673843, -0.4230823516845703, 0.1823052018880844, 0.9153350591659546], [-0.10395106673240662, -0.2308315485715866, 0.2006119042634964, 0.6850390434265137], [-0.013644421473145485, -0.02747584693133831, 0.0031195832416415215, 0.017488138750195503], [-0.014193938113749027, -0.22264239192008972, 0.003469345858320594, 0.31115370988845825], [-0.018646785989403725, -0.41781359910964966, 0.0096924202516675, 0.604928731918335], [-0.027003059163689613, -0.22282852232456207, 0.021790994331240654, 0.315314382314682], [-0.03145962953567505, -0.41825398802757263, 0.028097281232476234, 0.6147890090942383], [-0.0398247092962265, -0.2235356718301773, 0.04039306193590164, 0.33108633756637573], [-0.04429542273283005, -0.4192086160182953, 0.047014787793159485, 0.6362286806106567], [-0.05267959460616112, -0.22477279603481293, 0.0597393624484539, 0.3587144911289215], [-0.05717505142092705, -0.03054872713983059, 0.0669136494398117, 0.08545100688934326], [-0.05778602510690689, -0.22656285762786865, 0.06862267106771469, 0.3984721601009369], [-0.06231728196144104, -0.4225878119468689, 0.07659211754798889, 0.7119767665863037], [-0.0707690417766571, -0.2286052703857422, 0.09083165228366852, 0.44435209035873413], [-0.07534114271402359, -0.03487798571586609, 0.09971869736909866, 0.18162688612937927], [-0.07603870332241058, 0.15868614614009857, 0.10335122793912888, -0.07800820469856262], [-0.07286497950553894, 0.3521863520145416, 0.10179106891155243, -0.3363785147666931], [-0.06582125276327133, 0.15577423572540283, 0.09506350010633469, -0.013410455547273159], [-0.06270577013492584, 0.3494133949279785, 0.09479528665542603, -0.2746511399745941], [-0.055717501789331436, 0.15307573974132538, 0.08930226415395737, 0.04636117443442345], [-0.052655987441539764, 0.3468112051486969, 0.09022948890924454, -0.21686403453350067], [-0.04571976140141487, 0.5405352115631104, 0.0858922079205513, -0.47977644205093384], [-0.03490905836224556, 0.3443123996257782, 0.07629667967557907, -0.16130603849887848], [-0.02802281081676483, 0.14818578958511353, 0.07307055592536926, 0.15443748235702515], [-0.02505909465253353, -0.04790220037102699, 0.07615930587053299, 0.4692482352256775], [-0.026017138734459877, -0.2440127581357956, 0.08554427325725555, 0.7849305272102356], [-0.030897393822669983, -0.05016384273767471, 0.10124288499355316, 0.5203397870063782], [-0.03190067037940025, 0.14339806139469147, 0.11164967715740204, 0.2611982822418213], [-0.029032710939645767, -0.05312591418623924, 0.11687364429235458, 0.5869056582450867], [-0.030095228925347328, -0.24967403709888458, 0.128611758351326, 0.9139992594718933], [-0.035088710486888885, -0.056504279375076294, 0.1468917429447174, 0.6643454432487488], [-0.0362187959253788, 0.13630200922489166, 0.16017864644527435, 0.4212816059589386], [-0.03349275514483452, 0.3288350999355316, 0.1686042845249176, 0.1830703467130661], [-0.026916053146123886, 0.5211937427520752, 0.1722656935453415, -0.05204097926616669], [-0.016492178663611412, 0.7134807705879211, 0.17122487723827362, -0.28580644726753235], [-0.0022225631400942802, 0.9057998657226562, 0.16550874710083008, -0.5199720859527588], [0.01589343324303627, 1.098252534866333, 0.15510930120944977, -0.7562684416770935], [0.03785848245024681, 0.9013715982437134, 0.13998393714427948, -0.4190730154514313], [0.0558859147131443, 0.7045724391937256, 0.1316024661064148, -0.08574084937572479], [0.06997736543416977, 0.897586464881897, 0.129887655377388, -0.3341788649559021], [0.08792909234762192, 0.7008782029151917, 0.1232040748000145, -0.0035222333390265703], [0.10194665938615799, 0.8940376043319702, 0.12313362956047058, -0.2549346685409546], [0.11982740461826324, 1.0872060060501099, 0.11803493648767471, -0.5063835382461548], [0.1415715217590332, 0.8906358480453491, 0.1079072654247284, -0.1789582073688507], [0.15938425064086914, 1.0840613842010498, 0.10432810336351395, -0.43574586510658264], [0.18106546998023987, 1.2775636911392212, 0.09561318159103394, -0.6938042640686035], [0.20661674439907074, 1.0812546014785767, 0.08173710107803345, -0.3726181387901306], [0.22824184596538544, 1.2751260995864868, 0.07428473979234695, -0.6384504437446594], [0.25374436378479004, 1.0790512561798096, 0.06151572987437248, -0.3233296275138855], [0.27532538771629333, 0.8831097483634949, 0.05504913628101349, -0.01189910527318716], [0.292987585067749, 1.077400803565979, 0.054811153560876846, -0.28671789169311523], [0.31453558802604675, 1.2716999053955078, 0.04907679557800293, -0.5616225600242615], [0.33996960520744324, 1.4661000967025757, 0.03784434497356415, -0.8384488821029663], [0.36929160356521606, 1.2704823017120361, 0.02107536606490612, -0.5341087579727173], [0.3947012424468994, 1.4653016328811646, 0.010393191128969193, -0.8200771808624268], [0.42400726675987244, 1.6602798700332642, -0.0060083516873419285, -1.1094731092453003], [0.4572128653526306, 1.4652373790740967, -0.028197813779115677, -0.8186811208724976], [0.48651760816574097, 1.660733699798584, -0.04457143694162369, -1.1200981140136719], [0.5197322964668274, 1.8564109802246094, -0.06697339564561844, -1.4264222383499146], [0.5568605065345764, 2.052293539047241, -0.0955018401145935, -1.7392628192901611], [0.5979064106941223, 1.8583805561065674, -0.13028709590435028, -1.4777536392211914], [0.6350740194320679, 1.6650680303573608, -0.15984217822551727, -1.2284384965896606], [0.6683753728866577, 1.8618444204330444, -0.1844109445810318, -1.566634178161621], [0.042271215468645096, -0.03714655712246895, -0.035471681505441666, -0.030315125361084938], [0.041528284549713135, -0.23174233734607697, -0.03607798367738724, 0.25096845626831055], [0.036893438547849655, -0.03612427040934563, -0.031058616936206818, -0.052872344851493835], [0.03617095202207565, -0.23078742623329163, -0.03211606293916702, 0.22985181212425232], [0.03155520558357239, -0.03522161394357681, -0.027519026771187782, -0.07278614491224289], [0.03085077367722988, -0.22993846237659454, -0.028974749147892, 0.21108895540237427], [0.026252003386616707, -0.4246343970298767, -0.024752970784902573, 0.49449291825294495], [0.01775931566953659, -0.6193986535072327, -0.014863112010061741, 0.7792732119560242], [0.005371341947466135, -0.8143131732940674, 0.0007223517168313265, 1.067242980003357], [-0.010914920829236507, -0.6192007660865784, 0.02206721156835556, 0.7747868895530701], [-0.02329893596470356, -0.42438921332359314, 0.03756295144557953, 0.4891279339790344], [-0.0317867211997509, -0.6200203895568848, 0.04734550788998604, 0.7934086322784424], [-0.04418712854385376, -0.8157591819763184, 0.06321368366479874, 1.100602149963379], [-0.0605023130774498, -1.0116534233093262, 0.08522572368383408, 1.4124290943145752], [-0.08073538541793823, -0.8176850080490112, 0.11347430944442749, 1.147558569908142], [-0.09708908200263977, -0.6242125630378723, 0.13642548024654388, 0.8925061821937561], [-0.10957333445549011, -0.8208949565887451, 0.15427561104297638, 1.2247734069824219], [-0.12599124014377594, -1.0176297426223755, 0.17877106368541718, 1.561547875404358]], "actions": [1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.03754297271370888, 0.22967121005058289, -0.023014262318611145, -0.25734642148017883], [-0.032949548214673996, 0.4251140356063843, -0.028161190450191498, -0.5571986436843872], [-0.02444726787507534, 0.6206197738647461, -0.03930516541004181, -0.8586192727088928], [-0.01203487254679203, 0.8162544965744019, -0.05647755041718483, -1.1633974313735962], [0.004290217068046331, 1.0120644569396973, -0.07974550127983093, -1.4732396602630615], [0.02453150600194931, 1.2080656290054321, -0.1092102900147438, -1.7897273302078247], [0.048692818731069565, 1.4042302370071411, -0.14500483870506287, -2.1142654418945312], [0.07677742093801498, 1.6004726886749268, -0.18729014694690704, -2.4480221271514893], [0.10878688097000122, 1.407375693321228, -0.23625057935714722, -2.2181835174560547], [-0.015044591389596462, 0.1919289231300354, 0.015451591461896896, -0.31498613953590393], [-0.011206013150513172, 0.38682740926742554, 0.009151868522167206, -0.6027563810348511], [-0.0034694650676101446, 0.5818201303482056, -0.002903258427977562, -0.8925426602363586], [0.008166938088834286, 0.3867377042770386, -0.02075411193072796, -0.6007737517356873], [0.01590169221162796, 0.5821437239646912, -0.0327695868909359, -0.8999209403991699], [0.027544567361474037, 0.7776941061019897, -0.05076800659298897, -1.2027214765548706], [0.04309844970703125, 0.5832639932632446, -0.07482243329286575, -0.9263715147972107], [0.054763730615377426, 0.38922786712646484, -0.0933498665690422, -0.6581089496612549], [0.06254828721284866, 0.585516631603241, -0.10651204735040665, -0.9786651730537415], [0.07425861805677414, 0.3919714093208313, -0.1260853409767151, -0.7212479710578918], [0.08209804445505142, 0.5885911583900452, -0.14051030576229095, -1.0508073568344116], [0.09386987239122391, 0.3955840468406677, -0.16152645647525787, -0.805324137210846], [0.10178155452013016, 0.5925080180168152, -0.17763294279575348, -1.144147515296936], [0.1136317104101181, 0.40009424090385437, -0.20051588118076324, -0.9120182991027832], [0.12163359671831131, 0.5972813963890076, -0.21875625848770142, -1.2604302167892456], [-0.03714269772171974, 0.218224436044693, -0.02330193854868412, -0.2974151074886322], [-0.03277820721268654, 0.41367068886756897, -0.029250241816043854, -0.5973550081253052], [-0.02450479380786419, 0.21896998584270477, -0.041197340935468674, -0.31402724981307983], [-0.02012539468705654, 0.024458374828100204, -0.04747788608074188, -0.03461599349975586], [-0.019636226817965508, -0.16995170712471008, -0.04817020520567894, 0.24271726608276367], [-0.023035261780023575, -0.3643536865711212, -0.043315861374139786, 0.5198253989219666], [-0.03032233566045761, -0.5588399171829224, -0.03291935473680496, 0.7985502481460571], [-0.04149913415312767, -0.363282173871994, -0.01694834791123867, 0.4956960380077362], [-0.048764776438474655, -0.5581610798835754, -0.0070344265550374985, 0.7829898595809937], [-0.05992799997329712, -0.7531856894493103, 0.008625369518995285, 1.0734513998031616], [-0.07499171048402786, -0.948420524597168, 0.030094396322965622, 1.3688286542892456], [-0.09396012127399445, -1.1439058780670166, 0.05747096985578537, 1.670770287513733], [-0.116838239133358, -0.949496865272522, 0.09088637679815292, 1.396525263786316], [-0.1358281821012497, -1.1456241607666016, 0.11881688237190247, 1.7161859273910522], [-0.15874065458774567, -1.3418917655944824, 0.1531406044960022, 2.0433616638183594], [-0.18557849526405334, -1.5382200479507446, 0.19400782883167267, 2.3792552947998047], [-0.21634289622306824, -1.3452712297439575, 0.24159292876720428, 2.151942729949951], [-0.027845963835716248, -0.20234189927577972, 0.0064414264634251595, 0.3434559404850006], [-0.0318928025662899, -0.007312180940061808, 0.01331054512411356, 0.05281119793653488], [-0.03203904628753662, -0.2026224285364151, 0.01436676923185587, 0.3496638238430023], [-0.03609149530529976, -0.007707725279033184, 0.021360045298933983, 0.06154560297727585], [-0.03624564781785011, 0.1871015578508377, 0.022590957581996918, -0.22432228922843933], [-0.03250361606478691, 0.38189348578453064, 0.018104512244462967, -0.5097944140434265], [-0.02486574836075306, 0.18652120232582092, 0.007908623665571213, -0.2114616185426712], [-0.021135324612259865, 0.38152918219566345, 0.003679390763863921, -0.5016393661499023], [-0.01350474078208208, 0.1863555759191513, -0.006353395991027355, -0.20779915153980255], [-0.009777628816664219, 0.3815678060054779, -0.010509379208087921, -0.5024794340133667], [-0.0021462731529027224, 0.5768362879753113, -0.02055896818637848, -0.7984557151794434], [0.00939045287668705, 0.7722342014312744, -0.0365280844271183, -1.0975345373153687], [0.02483513578772545, 0.9678175449371338, -0.05847877264022827, -1.401450753211975], [0.04419148713350296, 0.7734689116477966, -0.08650778979063034, -1.127609133720398], [0.059660863131284714, 0.5795801281929016, -0.10905996710062027, -0.8632650971412659], [0.07125246524810791, 0.3860985040664673, -0.12632526457309723, -0.606766939163208], [0.07897444069385529, 0.1929481029510498, -0.13846060633659363, -0.35639098286628723], [0.08283340185880661, 3.8383463106583804e-05, -0.14558842778205872, -0.11037318408489227], [0.0828341692686081, -0.1927298605442047, -0.1477959007024765, 0.13306820392608643], [0.07897957414388657, -0.38545966148376465, -0.14513452351093292, 0.37571725249290466], [0.07127037644386292, -0.5782541632652283, -0.13762018084526062, 0.6193485856056213], [0.05970529466867447, -0.7712128758430481, -0.1252332180738449, 0.8657174110412598], [0.04428103566169739, -0.5746293663978577, -0.1079188659787178, 0.5364290475845337], [0.03278845176100731, -0.7680816054344177, -0.09719028323888779, 0.7932526469230652], [0.01742681860923767, -0.5717693567276001, -0.0813252329826355, 0.4716450273990631], [0.005991430953145027, -0.7656541466712952, -0.07189232856035233, 0.7376277446746826], [-0.009321652352809906, -0.5696168541908264, -0.05713977664709091, 0.4232132136821747], [-0.020713988691568375, -0.3737339377403259, -0.04867551103234291, 0.11307841539382935], [-0.028188668191432953, -0.17794953286647797, -0.04641394317150116, -0.19455531239509583], [-0.03174765780568123, -0.372377872467041, -0.05030504986643791, 0.08313234150409698], [-0.039195217192173004, -0.5667439699172974, -0.04864240065217018, 0.3595292270183563], [-0.050530094653367996, -0.7611419558525085, -0.041451819241046906, 0.6364859938621521], [-0.06575293093919754, -0.9556620121002197, -0.028722098097205162, 0.9158321619033813], [-0.08486617356538773, -0.7601636648178101, -0.010405454784631729, 0.6142624616622925], [-0.10006944835186005, -0.564897894859314, 0.00187979475595057, 0.31832048296928406], [-0.11136740446090698, -0.7600465416908264, 0.008246204815804958, 0.611595630645752], [-0.12656833231449127, -0.5650408267974854, 0.02047811634838581, 0.3215213418006897], [-0.13786914944648743, -0.37021639943122864, 0.026908542960882187, 0.03536610305309296], [-0.14527347683906555, -0.56571364402771, 0.0276158656924963, 0.3364160358905792], [-0.15658774971961975, -0.7612175345420837, 0.03434418514370918, 0.6376780271530151], [-0.17181210219860077, -0.5665909051895142, 0.04709774628281593, 0.3560054302215576], [-0.18314392864704132, -0.3721691071987152, 0.054217856377363205, 0.07853776961565018], [-0.19058731198310852, -0.5680246949195862, 0.05578861013054848, 0.38782167434692383], [-0.20194779336452484, -0.3737371861934662, 0.06354504823684692, 0.1132371798157692], [-0.2094225436449051, -0.5697094202041626, 0.06580978631973267, 0.4252718687057495], [-0.2208167314529419, -0.3755783438682556, 0.07431522756814957, 0.15403978526592255], [-0.22832830250263214, -0.5716813802719116, 0.07739602029323578, 0.4692109525203705], [-0.23976191878318787, -0.37773317098617554, 0.08678024262189865, 0.20189130306243896], [-0.24731658399105072, -0.5739821195602417, 0.09081806987524033, 0.5206384062767029], [-0.25879624485969543, -0.770257294178009, 0.10123083740472794, 0.840501606464386], [-0.274201363325119, -0.5766522884368896, 0.11804086714982986, 0.5812918543815613], [-0.2857344150543213, -0.38336482644081116, 0.12966670095920563, 0.3280017673969269], [-0.29340171813964844, -0.19030433893203735, 0.13622674345970154, 0.07885738462209702], [-0.2972078025341034, -0.3870895206928253, 0.13780388236045837, 0.41122737526893616], [-0.3049495816230774, -0.19416266679763794, 0.14602842926979065, 0.16496673226356506], [-0.3088328540325165, -0.3910403549671173, 0.14932776987552643, 0.4999200999736786], [-0.31665366888046265, -0.19830414652824402, 0.15932616591453552, 0.2577725350856781], [-0.32061973214149475, -0.005773007404059172, 0.16448162496089935, 0.019277557730674744], [-0.3207351863384247, 0.18665491044521332, 0.16486717760562897, -0.2173287719488144], [-0.3170020878314972, -0.010392938740551472, 0.16052059829235077, 0.12248675525188446], [-0.31720995903015137, -0.20740704238414764, 0.16297033429145813, 0.46119940280914307], [-0.3213581144809723, -0.014918265864253044, 0.17219431698322296, 0.22399349510669708], [-0.3216564655303955, 0.17737798392772675, 0.17667418718338013, -0.009809797629714012], [-0.3181089162826538, -0.019779687747359276, 0.17647799849510193, 0.33299559354782104], [-0.3185045123100281, -0.2169167697429657, 0.183137908577919, 0.6757239699363708], [-0.3228428363800049, -0.41404733061790466, 0.1966523826122284, 1.0200170278549194], [-0.3311237692832947, -0.22201161086559296, 0.21705272793769836, 0.7949591875076294], [0.0016769854119047523, -0.21248075366020203, 0.022225920110940933, 0.26749515533447266], [-0.0025726298335939646, -0.017682945355772972, 0.027575822547078133, -0.018095528706908226], [-0.002926288638263941, 0.17703290283679962, 0.027213912457227707, -0.3019520044326782], [0.000614369404502213, -0.018466128036379814, 0.021174872294068336, -0.0008121278369799256], [0.0002450468600727618, -0.21388526260852814, 0.021158630028367043, 0.29847580194473267], [-0.004032658413052559, -0.019071202725172043, 0.027128145098686218, 0.012540300376713276], [-0.004414082504808903, -0.2145714908838272, 0.027378952130675316, 0.3136575222015381], [-0.008705511689186096, -0.41007256507873535, 0.03365210071206093, 0.6148476004600525], [-0.016906963661313057, -0.6056481599807739, 0.0459490530192852, 0.9179368019104004], [-0.029019925743341446, -0.41117650270462036, 0.0643077865242958, 0.6400414705276489], [-0.03724345564842224, -0.21700727939605713, 0.07710862159729004, 0.36828312277793884], [-0.041583601385354996, -0.4131353497505188, 0.08447428047657013, 0.6842485666275024], [-0.049846310168504715, -0.6093223094940186, 0.09815925359725952, 1.0022854804992676], [-0.062032755464315414, -0.41563913226127625, 0.11820496618747711, 0.7419717907905579], [-0.07034553587436676, -0.22233004868030548, 0.13304439187049866, 0.4887029230594635], [-0.07479213923215866, -0.41905340552330017, 0.14281845092773438, 0.8201799392700195], [-0.08317320793867111, -0.615810751914978, 0.1592220515012741, 1.1541571617126465], [-0.09548941999673843, -0.4230823516845703, 0.1823052018880844, 0.9153350591659546], [-0.10395106673240662, -0.2308315485715866, 0.2006119042634964, 0.6850390434265137], [-0.10856769979000092, -0.4280896484851837, 0.21431268751621246, 1.0335772037506104], [-0.014193938113749027, -0.22264239192008972, 0.003469345858320594, 0.31115370988845825], [-0.018646785989403725, -0.41781359910964966, 0.0096924202516675, 0.604928731918335], [-0.027003059163689613, -0.22282852232456207, 0.021790994331240654, 0.315314382314682], [-0.03145962953567505, -0.41825398802757263, 0.028097281232476234, 0.6147890090942383], [-0.0398247092962265, -0.2235356718301773, 0.04039306193590164, 0.33108633756637573], [-0.04429542273283005, -0.4192086160182953, 0.047014787793159485, 0.6362286806106567], [-0.05267959460616112, -0.22477279603481293, 0.0597393624484539, 0.3587144911289215], [-0.05717505142092705, -0.03054872713983059, 0.0669136494398117, 0.08545100688934326], [-0.05778602510690689, -0.22656285762786865, 0.06862267106771469, 0.3984721601009369], [-0.06231728196144104, -0.4225878119468689, 0.07659211754798889, 0.7119767665863037], [-0.0707690417766571, -0.2286052703857422, 0.09083165228366852, 0.44435209035873413], [-0.07534114271402359, -0.03487798571586609, 0.09971869736909866, 0.18162688612937927], [-0.07603870332241058, 0.15868614614009857, 0.10335122793912888, -0.07800820469856262], [-0.07286497950553894, 0.3521863520145416, 0.10179106891155243, -0.3363785147666931], [-0.06582125276327133, 0.15577423572540283, 0.09506350010633469, -0.013410455547273159], [-0.06270577013492584, 0.3494133949279785, 0.09479528665542603, -0.2746511399745941], [-0.055717501789331436, 0.15307573974132538, 0.08930226415395737, 0.04636117443442345], [-0.052655987441539764, 0.3468112051486969, 0.09022948890924454, -0.21686403453350067], [-0.04571976140141487, 0.5405352115631104, 0.0858922079205513, -0.47977644205093384], [-0.03490905836224556, 0.3443123996257782, 0.07629667967557907, -0.16130603849887848], [-0.02802281081676483, 0.14818578958511353, 0.07307055592536926, 0.15443748235702515], [-0.02505909465253353, -0.04790220037102699, 0.07615930587053299, 0.4692482352256775], [-0.026017138734459877, -0.2440127581357956, 0.08554427325725555, 0.7849305272102356], [-0.030897393822669983, -0.05016384273767471, 0.10124288499355316, 0.5203397870063782], [-0.03190067037940025, 0.14339806139469147, 0.11164967715740204, 0.2611982822418213], [-0.029032710939645767, -0.05312591418623924, 0.11687364429235458, 0.5869056582450867], [-0.030095228925347328, -0.24967403709888458, 0.128611758351326, 0.9139992594718933], [-0.035088710486888885, -0.056504279375076294, 0.1468917429447174, 0.6643454432487488], [-0.0362187959253788, 0.13630200922489166, 0.16017864644527435, 0.4212816059589386], [-0.03349275514483452, 0.3288350999355316, 0.1686042845249176, 0.1830703467130661], [-0.026916053146123886, 0.5211937427520752, 0.1722656935453415, -0.05204097926616669], [-0.016492178663611412, 0.7134807705879211, 0.17122487723827362, -0.28580644726753235], [-0.0022225631400942802, 0.9057998657226562, 0.16550874710083008, -0.5199720859527588], [0.01589343324303627, 1.098252534866333, 0.15510930120944977, -0.7562684416770935], [0.03785848245024681, 0.9013715982437134, 0.13998393714427948, -0.4190730154514313], [0.0558859147131443, 0.7045724391937256, 0.1316024661064148, -0.08574084937572479], [0.06997736543416977, 0.897586464881897, 0.129887655377388, -0.3341788649559021], [0.08792909234762192, 0.7008782029151917, 0.1232040748000145, -0.0035222333390265703], [0.10194665938615799, 0.8940376043319702, 0.12313362956047058, -0.2549346685409546], [0.11982740461826324, 1.0872060060501099, 0.11803493648767471, -0.5063835382461548], [0.1415715217590332, 0.8906358480453491, 0.1079072654247284, -0.1789582073688507], [0.15938425064086914, 1.0840613842010498, 0.10432810336351395, -0.43574586510658264], [0.18106546998023987, 1.2775636911392212, 0.09561318159103394, -0.6938042640686035], [0.20661674439907074, 1.0812546014785767, 0.08173710107803345, -0.3726181387901306], [0.22824184596538544, 1.2751260995864868, 0.07428473979234695, -0.6384504437446594], [0.25374436378479004, 1.0790512561798096, 0.06151572987437248, -0.3233296275138855], [0.27532538771629333, 0.8831097483634949, 0.05504913628101349, -0.01189910527318716], [0.292987585067749, 1.077400803565979, 0.054811153560876846, -0.28671789169311523], [0.31453558802604675, 1.2716999053955078, 0.04907679557800293, -0.5616225600242615], [0.33996960520744324, 1.4661000967025757, 0.03784434497356415, -0.8384488821029663], [0.36929160356521606, 1.2704823017120361, 0.02107536606490612, -0.5341087579727173], [0.3947012424468994, 1.4653016328811646, 0.010393191128969193, -0.8200771808624268], [0.42400726675987244, 1.6602798700332642, -0.0060083516873419285, -1.1094731092453003], [0.4572128653526306, 1.4652373790740967, -0.028197813779115677, -0.8186811208724976], [0.48651760816574097, 1.660733699798584, -0.04457143694162369, -1.1200981140136719], [0.5197322964668274, 1.8564109802246094, -0.06697339564561844, -1.4264222383499146], [0.5568605065345764, 2.052293539047241, -0.0955018401145935, -1.7392628192901611], [0.5979064106941223, 1.8583805561065674, -0.13028709590435028, -1.4777536392211914], [0.6350740194320679, 1.6650680303573608, -0.15984217822551727, -1.2284384965896606], [0.6683753728866577, 1.8618444204330444, -0.1844109445810318, -1.566634178161621], [0.7056122422218323, 1.6693421602249146, -0.21574363112449646, -1.3366868495941162], [0.041528284549713135, -0.23174233734607697, -0.03607798367738724, 0.25096845626831055], [0.036893438547849655, -0.03612427040934563, -0.031058616936206818, -0.052872344851493835], [0.03617095202207565, -0.23078742623329163, -0.03211606293916702, 0.22985181212425232], [0.03155520558357239, -0.03522161394357681, -0.027519026771187782, -0.07278614491224289], [0.03085077367722988, -0.22993846237659454, -0.028974749147892, 0.21108895540237427], [0.026252003386616707, -0.4246343970298767, -0.024752970784902573, 0.49449291825294495], [0.01775931566953659, -0.6193986535072327, -0.014863112010061741, 0.7792732119560242], [0.005371341947466135, -0.8143131732940674, 0.0007223517168313265, 1.067242980003357], [-0.010914920829236507, -0.6192007660865784, 0.02206721156835556, 0.7747868895530701], [-0.02329893596470356, -0.42438921332359314, 0.03756295144557953, 0.4891279339790344], [-0.0317867211997509, -0.6200203895568848, 0.04734550788998604, 0.7934086322784424], [-0.04418712854385376, -0.8157591819763184, 0.06321368366479874, 1.100602149963379], [-0.0605023130774498, -1.0116534233093262, 0.08522572368383408, 1.4124290943145752], [-0.08073538541793823, -0.8176850080490112, 0.11347430944442749, 1.147558569908142], [-0.09708908200263977, -0.6242125630378723, 0.13642548024654388, 0.8925061821937561], [-0.10957333445549011, -0.8208949565887451, 0.15427561104297638, 1.2247734069824219], [-0.12599124014377594, -1.0176297426223755, 0.17877106368541718, 1.561547875404358], [-0.14634382724761963, -0.8250399231910706, 0.21000203490257263, 1.329546332359314]], "action_prob": [0.4999801516532898, 0.49932199716567993, 0.49887412786483765, 0.49864256381988525, 0.4985332787036896, 0.49847251176834106, 0.49842506647109985, 0.4983794093132019, 0.5016655921936035, 0.5000140070915222, 0.49937090277671814, 0.49892789125442505, 0.5013095140457153, 0.4988618493080139, 0.4986289143562317, 0.5014815926551819, 0.5014591813087463, 0.49867406487464905, 0.5015282034873962, 0.4985791742801666, 0.5016003251075745, 0.49847927689552307, 0.5016753673553467, 0.4983772933483124, 0.49994853138923645, 0.49929726123809814, 0.5011382699012756, 0.5007641911506653, 0.5001639127731323, 0.4995121359825134, 0.49902600049972534, 0.5012492537498474, 0.4989806115627289, 0.49870023131370544, 0.4985659718513489, 0.4984979033470154, 0.5015487670898438, 0.4983974099159241, 0.4983605444431305, 0.498325377702713, 0.5017112493515015, 0.4998922049999237, 0.5007473230361938, 0.49986815452575684, 0.5007718801498413, 0.5001630783081055, 0.4995030164718628, 0.5009828805923462, 0.49947991967201233, 0.5010125041007996, 0.4994471073150635, 0.49895256757736206, 0.49868375062942505, 0.49855613708496094, 0.5015105605125427, 0.5015373229980469, 0.5015110373497009, 0.5013688802719116, 0.5010342001914978, 0.5004934072494507, 0.49987655878067017, 0.4993675649166107, 0.49903830885887146, 0.5011491775512695, 0.49899986386299133, 0.5012039542198181, 0.49896204471588135, 0.5012558698654175, 0.5010768175125122, 0.5006517171859741, 0.5000069737434387, 0.4993737041950226, 0.4989182651042938, 0.49866917729377747, 0.5014491677284241, 0.5013987421989441, 0.4988105893135071, 0.5014447569847107, 0.5012416839599609, 0.4992024898529053, 0.4987247586250305, 0.5015173554420471, 0.501336932182312, 0.49907395243644714, 0.5013805627822876, 0.49900779128074646, 0.5014276504516602, 0.4989342987537384, 0.501478374004364, 0.4988531172275543, 0.4984675347805023, 0.5016907453536987, 0.5016134977340698, 0.5013612508773804, 0.4991067051887512, 0.501443088054657, 0.4989791810512543, 0.5015251040458679, 0.5011538863182068, 0.5006083250045776, 0.49996671080589294, 0.4992719888687134, 0.5013459920883179, 0.5008737444877625, 0.49970343708992004, 0.49900126457214355, 0.4984785318374634, 0.5017843246459961, 0.499968558549881, 0.5006929636001587, 0.5000637769699097, 0.5005826950073242, 0.49992814660072327, 0.500724732875824, 0.4998944103717804, 0.4992440938949585, 0.4988144636154175, 0.5014029145240784, 0.5012654066085815, 0.4990708529949188, 0.4986719489097595, 0.5015164017677307, 0.501420795917511, 0.49884113669395447, 0.4985053241252899, 0.5016425251960754, 0.5015944838523865, 0.49857789278030396, 0.49991437792778015, 0.4992731213569641, 0.5011543035507202, 0.4992237985134125, 0.5012005567550659, 0.4991627037525177, 0.5012527108192444, 0.5009104013442993, 0.49966126680374146, 0.49903255701065063, 0.5013478398323059, 0.5010576248168945, 0.5005418062210083, 0.4999048411846161, 0.500645101070404, 0.49996307492256165, 0.5006116628646851, 0.5000210404396057, 0.49942609667778015, 0.5009829998016357, 0.5005591511726379, 0.499892920255661, 0.49922168254852295, 0.5012339949607849, 0.5008756518363953, 0.4996825158596039, 0.4990420341491699, 0.5013617277145386, 0.5010718107223511, 0.500591516494751, 0.49999338388442993, 0.49943873286247253, 0.499039888381958, 0.49879753589630127, 0.5013415217399597, 0.5012556910514832, 0.49902912974357605, 0.5012771487236023, 0.4990476071834564, 0.49871131777763367, 0.5014764666557312, 0.4986879825592041, 0.4984816312789917, 0.501623272895813, 0.4984276294708252, 0.5016821026802063, 0.5016205310821533, 0.4986078143119812, 0.49835458397865295, 0.49823513627052307, 0.5018129348754883, 0.4981738328933716, 0.49813181161880493, 0.5018783211708069, 0.4980676770210266, 0.4980703294277191, 0.4980802834033966, 0.501912534236908, 0.5019704103469849, 0.49796321988105774, 0.5019953846931458, 0.5000811815261841, 0.5005584359169006, 0.5000984072685242, 0.5005475878715515, 0.500113844871521, 0.49946269392967224, 0.4989929795265198, 0.498734712600708, 0.501392126083374, 0.5013434886932373, 0.4988473355770111, 0.4985983669757843, 0.49848783016204834, 0.5015671253204346, 0.5016034841537476, 0.49840325117111206, 0.49832555651664734, 0.5017101168632507], "advantages": [8.648519515991211, 7.72294282913208, 6.788635730743408, 5.845653533935547, 4.893752098083496, 3.9326441287994385, 2.9620838165283203, 1.9818716049194336, 0.9918429255485535, 13.993938446044922, 13.122499465942383, 12.242868423461914, 11.355063438415527, 10.461101531982422, 9.555256843566895, 8.640854835510254, 7.718809127807617, 6.787916660308838, 5.845004558563232, 4.895033359527588, 3.9331023693084717, 2.9636433124542236, 1.982347011566162, 0.9929925203323364, 15.705570220947266, 14.851314544677734, 13.98908805847168, 13.122345924377441, 12.247405052185059, 11.36369514465332, 10.47058391571045, 9.56778621673584, 8.652568817138672, 7.731499671936035, 6.800514221191406, 5.859684944152832, 4.909059524536133, 3.948280096054077, 2.9783432483673096, 1.9984102249145508, 1.0084619522094727, 49.001861572265625, 48.48945617675781, 47.9664306640625, 47.44358444213867, 46.91002655029297, 46.371009826660156, 45.82706069946289, 45.28225326538086, 44.72724914550781, 44.17131423950195, 43.60504913330078, 43.033809661865234, 42.457427978515625, 41.875667572021484, 41.28904342651367, 40.69683074951172, 40.099090576171875, 39.495853424072266, 38.886985778808594, 38.272098541259766, 37.65069580078125, 37.022499084472656, 36.38745880126953, 35.743255615234375, 35.09547805786133, 34.438114166259766, 33.777313232421875, 33.106563568115234, 32.428321838378906, 31.742839813232422, 31.056041717529297, 30.361953735351562, 29.660259246826172, 28.950923919677734, 28.231895446777344, 27.50498390197754, 26.774621963500977, 26.03302001953125, 25.283374786376953, 24.53124237060547, 23.770877838134766, 22.999025344848633, 22.218843460083008, 21.435771942138672, 20.639860153198242, 19.84081268310547, 19.028865814208984, 18.213512420654297, 17.385217666625977, 16.553213119506836, 15.712056159973145, 14.859273910522461, 13.997381210327148, 13.12636661529541, 12.251795768737793, 11.363261222839355, 10.470768928527832, 9.564393997192383, 8.6485595703125, 7.723521709442139, 6.7946882247924805, 5.8562774658203125, 4.903168678283691, 3.9402384757995605, 2.973237991333008, 1.9958440065383911, 1.007615327835083, 18.209089279174805, 17.385759353637695, 16.548545837402344, 15.702919006347656, 14.854290962219238, 13.997038841247559, 13.125618934631348, 12.250905990600586, 11.366693496704102, 10.47278881072998, 9.567177772521973, 8.65180778503418, 7.731203556060791, 6.8004913330078125, 5.858030796051025, 4.905531406402588, 3.9468743801116943, 2.977715492248535, 1.9969664812088013, 1.0059221982955933, 45.83167266845703, 45.287261962890625, 44.73672103881836, 44.17637634277344, 43.61464309692383, 43.04302978515625, 42.469852447509766, 41.88676452636719, 41.297237396240234, 40.707088470458984, 40.11021041870117, 39.503517150878906, 38.8901252746582, 38.270286560058594, 37.64443588256836, 37.017513275146484, 36.37890625, 35.739261627197266, 35.08766555786133, 34.42997741699219, 33.770179748535156, 33.10421371459961, 32.431278228759766, 31.75074005126953, 31.0596866607666, 30.361085891723633, 29.660297393798828, 28.951520919799805, 28.232540130615234, 27.505762100219727, 26.771259307861328, 26.029325485229492, 25.280214309692383, 24.523971557617188, 23.760494232177734, 22.9921817779541, 22.216773986816406, 21.42923927307129, 20.638132095336914, 19.834545135498047, 19.02326202392578, 18.207448959350586, 17.37960433959961, 16.54379653930664, 15.70252799987793, 14.849654197692871, 13.991321563720703, 13.124791145324707, 12.245301246643066, 11.35733413696289, 10.460773468017578, 9.557733535766602, 8.642905235290527, 7.7191643714904785, 6.788023948669434, 5.8454813957214355, 4.893698692321777, 3.93251633644104, 2.962491512298584, 1.9828112125396729, 0.9919887781143188, 16.54834747314453, 15.708078384399414, 14.853743553161621, 13.99638843536377, 13.12475872039795, 12.249963760375977, 11.365828514099121, 10.472071647644043, 9.568703651428223, 8.654216766357422, 7.729912757873535, 6.799540996551514, 5.859119892120361, 4.908743858337402, 3.9477710723876953, 2.9767868518829346, 1.997663974761963, 1.0081859827041626], "value_targets": [8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 472100448, 961862410, 961862410, 961862410, 961862410, 961862410, 961862410, 961862410, 961862410, 961862410, 961862410, 961862410, 961862410, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 473094516, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 758920220, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 1461294973, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819, 39834819], "obs": [[0.048017196357250214, -0.03546358644962311, 0.014227733947336674, -0.031366147100925446], [0.047307927161455154, -0.23078665137290955, 0.013600410893559456, 0.2657715976238251], [0.042692191898822784, -0.4261000454425812, 0.018915843218564987, 0.5627130270004272], [0.03417019173502922, -0.23124857246875763, 0.030170103535056114, 0.2760489881038666], [0.029545219615101814, -0.036569755524396896, 0.03569108247756958, -0.006967657711356878], [0.02881382592022419, 0.15802264213562012, 0.035551730543375015, -0.2881793975830078], [0.03197427839040756, -0.037587784230709076, 0.029788142070174217, 0.015500825829803944], [0.031222522258758545, 0.1570945829153061, 0.03009815886616707, -0.2676367461681366], [0.03436441347002983, 0.35177433490753174, 0.02474542334675789, -0.5506766438484192], [0.04139989987015724, 0.1563137322664261, 0.01373189128935337, -0.2503010332584381], [0.044526174664497375, -0.039001598954200745, 0.00872587040066719, 0.046681374311447144], [0.04374614357948303, -0.2342475801706314, 0.009659497998654842, 0.34210458397865295], [0.03906119242310524, -0.03926437720656395, 0.016501588746905327, 0.05248326063156128], [0.03827590495347977, -0.23461900651454926, 0.017551254481077194, 0.3503265678882599], [0.03358352556824684, -0.4299861192703247, 0.02455778606235981, 0.6484918594360352], [0.024983802810311317, -0.2352147251367569, 0.037527624517679214, 0.363642156124115], [0.02027950808405876, -0.04064567759633064, 0.044800467789173126, 0.08302460610866547], [0.019466593861579895, -0.23638024926185608, 0.04646096006035805, 0.3894988000392914], [0.014738989062607288, -0.43212980031967163, 0.05425093322992325, 0.6964608430862427], [0.006096393335610628, -0.2378004938364029, 0.068180151283741, 0.42133772373199463], [0.0013403831981122494, -0.04370743781328201, 0.07660690695047379, 0.15090399980545044], [0.00046623448724858463, 0.1502387374639511, 0.07962498813867569, -0.11666161566972733], [0.003471009200438857, 0.3441348671913147, 0.07729175686836243, -0.3831992745399475], [0.010353706777095795, 0.5380792021751404, 0.06962776929140091, -0.6505460739135742], [0.021115290001034737, 0.7321658134460449, 0.05661684647202492, -0.9205165505409241], [0.0357586070895195, 0.9264787435531616, 0.038206517696380615, -1.1948825120925903], [0.05428818240761757, 1.1210857629776, 0.014308866113424301, -1.4753499031066895], [0.07670989632606506, 0.9257919192314148, -0.015198132954537868, -1.1782325506210327], [0.0952257364988327, 1.1211079359054565, -0.038762785494327545, -1.4756407737731934], [0.11764789372682571, 1.3166813850402832, -0.06827560067176819, -1.7801740169525146], [0.14398151636123657, 1.512501835823059, -0.10387907922267914, -2.093277931213379], [0.17423155903816223, 1.708505392074585, -0.14574463665485382, -2.4161839485168457], [0.2084016650915146, 1.5149158239364624, -0.1940683126449585, -2.1715755462646484], [-0.008759675547480583, -0.003872330766171217, 0.03771994635462761, -0.02510867267847061], [-0.008837121538817883, -0.19951434433460236, 0.037217773497104645, 0.2792326509952545], [-0.012827408500015736, -0.004942541476339102, 0.04280242696404457, -0.0014834540197625756], [-0.012926260009407997, -0.2006513774394989, 0.04277275875210762, 0.3043909966945648], [-0.01693928800523281, -0.3963559567928314, 0.0488605760037899, 0.61025071144104], [-0.024866405874490738, -0.201949805021286, 0.061065591871738434, 0.33334881067276], [-0.02890540286898613, -0.39788535237312317, 0.0677325651049614, 0.6446464657783508], [-0.03686311095952988, -0.5938825607299805, 0.0806254968047142, 0.9578663110733032], [-0.04874075949192047, -0.7899906635284424, 0.09978282451629639, 1.27475106716156], [-0.0645405724644661, -0.9862337112426758, 0.12527784705162048, 1.596938967704773], [-0.08426524698734283, -1.182598352432251, 0.1572166234254837, 1.9259129762649536], [-0.10791721940040588, -1.3790191411972046, 0.1957348883152008, 2.26294207572937], [0.03172638639807701, -8.883396367309615e-05, -0.04820443317294121, 0.016638141125440598], [0.031724609434604645, -0.19448751211166382, -0.0478716716170311, 0.29373082518577576], [0.027834860607981682, 0.0012831023195758462, -0.04199705645442009, -0.013657578267157078], [0.027860522270202637, -0.19321218132972717, -0.04227020591497421, 0.26548460125923157], [0.023996278643608093, -0.38770613074302673, -0.03696051612496376, 0.5445411801338196], [0.01624215580523014, -0.5822897553443909, -0.02606969140470028, 0.8253533244132996], [0.004596360959112644, -0.38682112097740173, -0.009562624618411064, 0.5245864391326904], [-0.003140061628073454, -0.5818071961402893, 0.0009291042806580663, 0.8142408132553101], [-0.014776205644011497, -0.7769418954849243, 0.017213920131325722, 1.1072158813476562], [-0.030315043404698372, -0.972285807132721, 0.0393582358956337, 1.405248999595642], [-0.04976075887680054, -0.7776739597320557, 0.067463219165802, 1.1251256465911865], [-0.06531424075365067, -0.9736121296882629, 0.08996573090553284, 1.4381834268569946], [-0.08478648215532303, -1.16972017288208, 0.11872939765453339, 1.7575701475143433], [-0.10818088799715042, -1.365970492362976, 0.15388080477714539, 2.084697723388672], [-0.13550029695034027, -1.5622773170471191, 0.19557476043701172, 2.420741081237793], [-0.0011163880117237568, -0.0018233839655295014, -0.005074701737612486, -0.013971924781799316], [-0.0011528556933626533, 0.19337098300457, -0.0053541399538517, -0.30825164914131165], [0.002714563859626651, 0.38856881856918335, -0.01151917316019535, -0.6026183366775513], [0.010485939681529999, 0.19360984861850739, -0.023571539670228958, -0.3135858476161957], [0.014358136802911758, 0.38905951380729675, -0.029843255877494812, -0.6136083006858826], [0.022139327600598335, 0.5845855474472046, -0.04211542382836342, -0.9155393242835999], [0.03383103758096695, 0.39005765318870544, -0.06042620912194252, -0.6363845467567444], [0.041632190346717834, 0.1958281546831131, -0.07315389811992645, -0.3633265197277069], [0.045548755675554276, 0.0018180259503424168, -0.08042042702436447, -0.09457771480083466], [0.045585114508867264, -0.19206468760967255, -0.08231198042631149, 0.1716882884502411], [0.041743822395801544, 0.004132997710257769, -0.07887821644544601, -0.14578424394130707], [0.04182647913694382, 0.2002907395362854, -0.0817939043045044, -0.46227213740348816], [0.04583229497075081, 0.3964676558971405, -0.09103934466838837, -0.7795743346214294], [0.05376164987683296, 0.5927154421806335, -0.1066308319568634, -1.0994555950164795], [0.06561595946550369, 0.7890668511390686, -0.1286199390888214, -1.4235999584197998], [0.08139729499816895, 0.985522985458374, -0.15709194540977478, -1.7535600662231445], [0.10110775381326675, 1.182039737701416, -0.1921631395816803, -2.09070086479187], [0.013265336863696575, -0.0025884569622576237, -0.03135821223258972, -0.042323049157857895], [0.013213567435741425, 0.19296880066394806, -0.032204676419496536, -0.34473252296447754], [0.017072943970561028, 0.38853371143341064, -0.039099324494600296, -0.6473943591117859], [0.024843618273735046, 0.5841779708862305, -0.052047211676836014, -0.9521287083625793], [0.036527179181575775, 0.38979360461235046, -0.07108978927135468, -0.676241934299469], [0.04432304948568344, 0.19572770595550537, -0.08461462706327438, -0.40676116943359375], [0.04823760315775871, 0.0019011285621672869, -0.09274984896183014, -0.14190851151943207], [0.048275627195835114, -0.1917785257101059, -0.09558802098035812, 0.12013289332389832], [0.04444005712866783, 0.00457374332472682, -0.09318536520004272, -0.2011110633611679], [0.044531531631946564, -0.1891004890203476, -0.09720758348703384, 0.06078299507498741], [0.04074952006340027, 0.007271100301295519, -0.09599192440509796, -0.2609178423881531], [0.040894944220781326, -0.18635883927345276, -0.10121028125286102, 1.1650725355139002e-05], [0.03716776520013809, -0.3798946142196655, -0.10121005028486252, 0.25912466645240784], [0.029569873586297035, -0.5734370350837708, -0.09602755308151245, 0.518247663974762], [0.018101133406162262, -0.767085075378418, -0.0856626033782959, 0.7791928052902222], [0.0027594321873039007, -0.9609313607215881, -0.07007874548435211, 1.043742060661316], [-0.01645919494330883, -1.155056357383728, -0.04920390620827675, 1.3136284351348877], [-0.03956032171845436, -0.9593473076820374, -0.022931335493922234, 1.0059601068496704], [-0.058747269213199615, -0.7639268040657043, -0.002812132937833667, 0.7061651349067688], [-0.07402580231428146, -0.9590096473693848, 0.01131116971373558, 0.9979615211486816], [-0.0932059958577156, -0.7640407681465149, 0.03127039968967438, 0.7088522911071777], [-0.10848681628704071, -0.5693655610084534, 0.045447446405887604, 0.42617425322532654], [-0.11987412720918655, -0.37491580843925476, 0.053970932960510254, 0.1481577605009079], [-0.12737244367599487, -0.5707674622535706, 0.056934088468551636, 0.4573671817779541], [-0.13878779113292694, -0.3764946460723877, 0.06608142703771591, 0.1831597536802292], [-0.14631767570972443, -0.182377427816391, 0.06974462419748306, -0.08796676993370056], [-0.14996522665023804, 0.011679098010063171, 0.06798528879880905, -0.35785558819770813], [-0.14973165094852448, -0.18434017896652222, 0.060828179121017456, -0.044533610343933105], [-0.15341845154762268, 0.009859159588813782, 0.059937506914138794, -0.31742140650749207], [-0.1532212644815445, 0.20407846570014954, 0.05358907952904701, -0.5906161665916443], [-0.14913970232009888, 0.008248785510659218, 0.04177675396203995, -0.2815456688404083], [-0.1489747315645218, -0.18744340538978577, 0.03614583984017372, 0.024015285074710846], [-0.15272359549999237, -0.3830645680427551, 0.036626145243644714, 0.327879935503006], [-0.1603848785161972, -0.18848267197608948, 0.043183743953704834, 0.04696851968765259], [-0.1641545444726944, 0.00599429989233613, 0.04412311688065529, -0.2317829132080078], [-0.1640346497297287, 0.20045891404151917, 0.039487458765506744, -0.5102279186248779], [-0.1600254774093628, 0.004803576972335577, 0.02928289957344532, -0.20536741614341736], [-0.15992939472198486, 0.19949480891227722, 0.02517555095255375, -0.48867112398147583], [-0.1559395045042038, 0.3942526876926422, 0.015402127988636494, -0.7733145356178284], [-0.14805445075035095, 0.589159369468689, -6.416278483811766e-05, -1.0611118078231812], [-0.13627126812934875, 0.39403828978538513, -0.02128640003502369, -0.768449068069458], [-0.12839050590991974, 0.19921571016311646, -0.03665538132190704, -0.4825391471385956], [-0.12440618127584457, 0.004629781004041433, -0.04630616307258606, -0.2016305923461914], [-0.124313585460186, -0.18980036675930023, -0.05033877491950989, 0.07609286904335022], [-0.12810958921909332, 0.006005731876939535, -0.04881691932678223, -0.23203758895397186], [-0.1279894858598709, -0.18838591873645782, -0.05345766991376877, 0.04485603794455528], [-0.1317571997642517, 0.007460216525942087, -0.05256054922938347, -0.2642025649547577], [-0.1316079944372177, -0.186873659491539, -0.057844601571559906, 0.011449986137449741], [-0.1353454738855362, -0.38112038373947144, -0.057615600526332855, 0.2853359282016754], [-0.14296787977218628, -0.18522606790065765, -0.051908884197473526, -0.02494758926331997], [-0.14667239785194397, -0.37956666946411133, -0.05240783467888832, 0.2509162724018097], [-0.15426373481750488, -0.5739026069641113, -0.04738951101899147, 0.5266190767288208], [-0.16574178636074066, -0.3781469762325287, -0.03685712814331055, 0.21938802301883698], [-0.1733047217130661, -0.18251807987689972, -0.03246936947107315, -0.08468957245349884], [-0.17695508897304535, -0.3771599233150482, -0.034163158386945724, 0.19757498800754547], [-0.18449828028678894, -0.18156640231609344, -0.030211659148335457, -0.10568612068891525], [-0.18812960386276245, 0.01397518627345562, -0.0323253832757473, -0.40774551033973694], [-0.18785010278224945, -0.18067385256290436, -0.040480293333530426, -0.1254265010356903], [-0.19146358966827393, -0.37519320845603943, -0.04298882186412811, 0.15421554446220398], [-0.19896744191646576, -0.17948293685913086, -0.03990451246500015, -0.15171346068382263], [-0.20255710184574127, -0.37401145696640015, -0.042938780039548874, 0.12811820209026337], [-0.21003733575344086, -0.17830152809619904, -0.040376417338848114, -0.17779622972011566], [-0.21360336244106293, 0.017374278977513313, -0.043932341039180756, -0.48293814063072205], [-0.2132558822631836, -0.17710097134113312, -0.053591106086969376, -0.20441868901252747], [-0.21679790318012238, 0.018744779750704765, -0.05767947807908058, -0.5135138034820557], [-0.21642300486564636, 0.2146296501159668, -0.06794975697994232, -0.8238008618354797], [-0.21213041245937347, 0.4106120467185974, -0.08442576974630356, -1.137057900428772], [-0.20391817390918732, 0.21668966114521027, -0.10716693103313446, -0.8720020651817322], [-0.19958437979221344, 0.41309303045272827, -0.12460696697235107, -1.1963638067245483], [-0.19132252037525177, 0.21978463232517242, -0.14853425323963165, -0.9451891183853149], [-0.18692682683467865, 0.4165612757205963, -0.16743803024291992, -1.2806127071380615], [-0.17859560251235962, 0.6133732795715332, -0.19305028021335602, -1.620699167251587], [-0.020621823146939278, 0.04559939727187157, 0.04592999070882797, 0.023670557886362076], [-0.019709834828972816, 0.2400336116552353, 0.04640340059995651, -0.25417450070381165], [-0.014909162186086178, 0.04428086057305336, 0.04131991043686867, 0.052776236087083817], [-0.014023545198142529, 0.2387867271900177, 0.042375434190034866, -0.22658893465995789], [-0.009247810579836369, 0.04308559373021126, 0.03784365579485893, 0.0791538879275322], [-0.00838609877973795, 0.23764517903327942, 0.039426736533641815, -0.20135316252708435], [-0.003633194835856557, 0.04198218509554863, 0.0353996716439724, 0.10350171476602554], [-0.0027935511898249388, 0.23657940328121185, 0.03746970742940903, -0.17780593037605286], [0.0019380369922146201, 0.43114566802978516, 0.03391358628869057, -0.4584369361400604], [0.010560950264334679, 0.23556113243103027, 0.024744849652051926, -0.1552601456642151], [0.015272173099219799, 0.04009378328919411, 0.021639645099639893, 0.1451253592967987], [0.01607404835522175, 0.23489925265312195, 0.024542152881622314, -0.1406528800725937], [0.02077203430235386, 0.42966127395629883, 0.02172909490764141, -0.4254932403564453], [0.029365258291363716, 0.6244688034057617, 0.013219230808317661, -0.7112477421760559], [0.04185463488101959, 0.429166316986084, -0.0010057240724563599, -0.41443324089050293], [0.050437960773706436, 0.23405863344669342, -0.009294388815760612, -0.12206754833459854], [0.05511913448572159, 0.42931249737739563, -0.01173574011772871, -0.4176682233810425], [0.06370538473129272, 0.2343588024377823, -0.020089104771614075, -0.12870803475379944], [0.0683925598859787, 0.03953031077980995, -0.022663265466690063, 0.15756992995738983], [0.06918316334486008, 0.23496928811073303, -0.019511865451931953, -0.14217567443847656], [0.07388255000114441, 0.040132131427526474, -0.022355379536747932, 0.1442883014678955], [0.07468519359827042, 0.23556698858737946, -0.0194696132093668, -0.15536266565322876], [0.07939653098583221, 0.4309622049331665, -0.022576866671442986, -0.4541236460208893], [0.08801577985286713, 0.6263960003852844, -0.031659338623285294, -0.7538366913795471], [0.10054370015859604, 0.43172451853752136, -0.04673607274889946, -0.47128206491470337], [0.10917818546295166, 0.6274743676185608, -0.05616171285510063, -0.7783216238021851], [0.12172767519950867, 0.43316778540611267, -0.07172814756631851, -0.5038241744041443], [0.13039103150367737, 0.23912617564201355, -0.08180463314056396, -0.2345801591873169], [0.13517355918884277, 0.04526252672076225, -0.08649623394012451, 0.0312191154807806], [0.13607880473136902, -0.1485193818807602, -0.0858718529343605, 0.29540711641311646], [0.13310842216014862, 0.04771512746810913, -0.07996370643377304, -0.02307535707950592], [0.134062722325325, -0.14617443084716797, -0.0804252177476883, 0.24334536492824554], [0.13113923370838165, -0.3400610089302063, -0.07555831223726273, 0.5096156597137451], [0.12433801591396332, -0.14396044611930847, -0.0653659924864769, 0.19411104917526245], [0.12145880609750748, 0.05203269049525261, -0.061483774334192276, -0.11845473945140839], [0.12249945849180222, 0.24797920882701874, -0.06385286897420883, -0.42988401651382446], [0.12745903432369232, 0.053816862404346466, -0.07245054841041565, -0.15799398720264435], [0.12853537499904633, -0.1401970535516739, -0.07561042904853821, 0.11098158359527588], [0.1257314383983612, -0.33415868878364563, -0.07339079678058624, 0.378884494304657], [0.11904826760292053, -0.5281658172607422, -0.0658131092786789, 0.647554337978363], [0.10848494619131088, -0.7223120927810669, -0.0528620220720768, 0.9188081622123718], [0.0940387025475502, -0.5265169739723206, -0.03448585793375969, 0.6099915504455566], [0.08350836485624313, -0.33093035221099854, -0.022286027669906616, 0.30664920806884766], [0.0768897607922554, -0.5257277488708496, -0.016153043136000633, 0.592221200466156], [0.06637520343065262, -0.7206199169158936, -0.004308619070798159, 0.8797724843025208], [0.051962804049253464, -0.9156830310821533, 0.013286830857396126, 1.171097755432129], [0.03364914283156395, -1.1109752655029297, 0.03670878708362579, 1.4679163694381714], [0.011429638601839542, -0.9163212776184082, 0.06606711447238922, 1.1869221925735474], [-0.0068967873230576515, -1.1122348308563232, 0.08980555832386017, 1.499560832977295], [-0.029141483828425407, -1.3083256483078003, 0.11979677528142929, 1.8188791275024414], [-0.05530799552798271, -1.5045584440231323, 0.15617436170578003, 2.146254777908325], [-0.08539916574954987, -1.7008373737335205, 0.19909945130348206, 2.482819080352783]], "actions": [0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[0.047307927161455154, -0.23078665137290955, 0.013600410893559456, 0.2657715976238251], [0.042692191898822784, -0.4261000454425812, 0.018915843218564987, 0.5627130270004272], [0.03417019173502922, -0.23124857246875763, 0.030170103535056114, 0.2760489881038666], [0.029545219615101814, -0.036569755524396896, 0.03569108247756958, -0.006967657711356878], [0.02881382592022419, 0.15802264213562012, 0.035551730543375015, -0.2881793975830078], [0.03197427839040756, -0.037587784230709076, 0.029788142070174217, 0.015500825829803944], [0.031222522258758545, 0.1570945829153061, 0.03009815886616707, -0.2676367461681366], [0.03436441347002983, 0.35177433490753174, 0.02474542334675789, -0.5506766438484192], [0.04139989987015724, 0.1563137322664261, 0.01373189128935337, -0.2503010332584381], [0.044526174664497375, -0.039001598954200745, 0.00872587040066719, 0.046681374311447144], [0.04374614357948303, -0.2342475801706314, 0.009659497998654842, 0.34210458397865295], [0.03906119242310524, -0.03926437720656395, 0.016501588746905327, 0.05248326063156128], [0.03827590495347977, -0.23461900651454926, 0.017551254481077194, 0.3503265678882599], [0.03358352556824684, -0.4299861192703247, 0.02455778606235981, 0.6484918594360352], [0.024983802810311317, -0.2352147251367569, 0.037527624517679214, 0.363642156124115], [0.02027950808405876, -0.04064567759633064, 0.044800467789173126, 0.08302460610866547], [0.019466593861579895, -0.23638024926185608, 0.04646096006035805, 0.3894988000392914], [0.014738989062607288, -0.43212980031967163, 0.05425093322992325, 0.6964608430862427], [0.006096393335610628, -0.2378004938364029, 0.068180151283741, 0.42133772373199463], [0.0013403831981122494, -0.04370743781328201, 0.07660690695047379, 0.15090399980545044], [0.00046623448724858463, 0.1502387374639511, 0.07962498813867569, -0.11666161566972733], [0.003471009200438857, 0.3441348671913147, 0.07729175686836243, -0.3831992745399475], [0.010353706777095795, 0.5380792021751404, 0.06962776929140091, -0.6505460739135742], [0.021115290001034737, 0.7321658134460449, 0.05661684647202492, -0.9205165505409241], [0.0357586070895195, 0.9264787435531616, 0.038206517696380615, -1.1948825120925903], [0.05428818240761757, 1.1210857629776, 0.014308866113424301, -1.4753499031066895], [0.07670989632606506, 0.9257919192314148, -0.015198132954537868, -1.1782325506210327], [0.0952257364988327, 1.1211079359054565, -0.038762785494327545, -1.4756407737731934], [0.11764789372682571, 1.3166813850402832, -0.06827560067176819, -1.7801740169525146], [0.14398151636123657, 1.512501835823059, -0.10387907922267914, -2.093277931213379], [0.17423155903816223, 1.708505392074585, -0.14574463665485382, -2.4161839485168457], [0.2084016650915146, 1.5149158239364624, -0.1940683126449585, -2.1715755462646484], [0.2386999875307083, 1.3221451044082642, -0.23749981820583344, -1.944546103477478], [-0.008837121538817883, -0.19951434433460236, 0.037217773497104645, 0.2792326509952545], [-0.012827408500015736, -0.004942541476339102, 0.04280242696404457, -0.0014834540197625756], [-0.012926260009407997, -0.2006513774394989, 0.04277275875210762, 0.3043909966945648], [-0.01693928800523281, -0.3963559567928314, 0.0488605760037899, 0.61025071144104], [-0.024866405874490738, -0.201949805021286, 0.061065591871738434, 0.33334881067276], [-0.02890540286898613, -0.39788535237312317, 0.0677325651049614, 0.6446464657783508], [-0.03686311095952988, -0.5938825607299805, 0.0806254968047142, 0.9578663110733032], [-0.04874075949192047, -0.7899906635284424, 0.09978282451629639, 1.27475106716156], [-0.0645405724644661, -0.9862337112426758, 0.12527784705162048, 1.596938967704773], [-0.08426524698734283, -1.182598352432251, 0.1572166234254837, 1.9259129762649536], [-0.10791721940040588, -1.3790191411972046, 0.1957348883152008, 2.26294207572937], [-0.13549759984016418, -1.1861952543258667, 0.24099372327327728, 2.0364084243774414], [0.031724609434604645, -0.19448751211166382, -0.0478716716170311, 0.29373082518577576], [0.027834860607981682, 0.0012831023195758462, -0.04199705645442009, -0.013657578267157078], [0.027860522270202637, -0.19321218132972717, -0.04227020591497421, 0.26548460125923157], [0.023996278643608093, -0.38770613074302673, -0.03696051612496376, 0.5445411801338196], [0.01624215580523014, -0.5822897553443909, -0.02606969140470028, 0.8253533244132996], [0.004596360959112644, -0.38682112097740173, -0.009562624618411064, 0.5245864391326904], [-0.003140061628073454, -0.5818071961402893, 0.0009291042806580663, 0.8142408132553101], [-0.014776205644011497, -0.7769418954849243, 0.017213920131325722, 1.1072158813476562], [-0.030315043404698372, -0.972285807132721, 0.0393582358956337, 1.405248999595642], [-0.04976075887680054, -0.7776739597320557, 0.067463219165802, 1.1251256465911865], [-0.06531424075365067, -0.9736121296882629, 0.08996573090553284, 1.4381834268569946], [-0.08478648215532303, -1.16972017288208, 0.11872939765453339, 1.7575701475143433], [-0.10818088799715042, -1.365970492362976, 0.15388080477714539, 2.084697723388672], [-0.13550029695034027, -1.5622773170471191, 0.19557476043701172, 2.420741081237793], [-0.1667458415031433, -1.3693114519119263, 0.24398957192897797, 2.193943500518799], [-0.0011528556933626533, 0.19337098300457, -0.0053541399538517, -0.30825164914131165], [0.002714563859626651, 0.38856881856918335, -0.01151917316019535, -0.6026183366775513], [0.010485939681529999, 0.19360984861850739, -0.023571539670228958, -0.3135858476161957], [0.014358136802911758, 0.38905951380729675, -0.029843255877494812, -0.6136083006858826], [0.022139327600598335, 0.5845855474472046, -0.04211542382836342, -0.9155393242835999], [0.03383103758096695, 0.39005765318870544, -0.06042620912194252, -0.6363845467567444], [0.041632190346717834, 0.1958281546831131, -0.07315389811992645, -0.3633265197277069], [0.045548755675554276, 0.0018180259503424168, -0.08042042702436447, -0.09457771480083466], [0.045585114508867264, -0.19206468760967255, -0.08231198042631149, 0.1716882884502411], [0.041743822395801544, 0.004132997710257769, -0.07887821644544601, -0.14578424394130707], [0.04182647913694382, 0.2002907395362854, -0.0817939043045044, -0.46227213740348816], [0.04583229497075081, 0.3964676558971405, -0.09103934466838837, -0.7795743346214294], [0.05376164987683296, 0.5927154421806335, -0.1066308319568634, -1.0994555950164795], [0.06561595946550369, 0.7890668511390686, -0.1286199390888214, -1.4235999584197998], [0.08139729499816895, 0.985522985458374, -0.15709194540977478, -1.7535600662231445], [0.10110775381326675, 1.182039737701416, -0.1921631395816803, -2.09070086479187], [0.12474855035543442, 0.9893062710762024, -0.23397715389728546, -1.8630708456039429], [0.013213567435741425, 0.19296880066394806, -0.032204676419496536, -0.34473252296447754], [0.017072943970561028, 0.38853371143341064, -0.039099324494600296, -0.6473943591117859], [0.024843618273735046, 0.5841779708862305, -0.052047211676836014, -0.9521287083625793], [0.036527179181575775, 0.38979360461235046, -0.07108978927135468, -0.676241934299469], [0.04432304948568344, 0.19572770595550537, -0.08461462706327438, -0.40676116943359375], [0.04823760315775871, 0.0019011285621672869, -0.09274984896183014, -0.14190851151943207], [0.048275627195835114, -0.1917785257101059, -0.09558802098035812, 0.12013289332389832], [0.04444005712866783, 0.00457374332472682, -0.09318536520004272, -0.2011110633611679], [0.044531531631946564, -0.1891004890203476, -0.09720758348703384, 0.06078299507498741], [0.04074952006340027, 0.007271100301295519, -0.09599192440509796, -0.2609178423881531], [0.040894944220781326, -0.18635883927345276, -0.10121028125286102, 1.1650725355139002e-05], [0.03716776520013809, -0.3798946142196655, -0.10121005028486252, 0.25912466645240784], [0.029569873586297035, -0.5734370350837708, -0.09602755308151245, 0.518247663974762], [0.018101133406162262, -0.767085075378418, -0.0856626033782959, 0.7791928052902222], [0.0027594321873039007, -0.9609313607215881, -0.07007874548435211, 1.043742060661316], [-0.01645919494330883, -1.155056357383728, -0.04920390620827675, 1.3136284351348877], [-0.03956032171845436, -0.9593473076820374, -0.022931335493922234, 1.0059601068496704], [-0.058747269213199615, -0.7639268040657043, -0.002812132937833667, 0.7061651349067688], [-0.07402580231428146, -0.9590096473693848, 0.01131116971373558, 0.9979615211486816], [-0.0932059958577156, -0.7640407681465149, 0.03127039968967438, 0.7088522911071777], [-0.10848681628704071, -0.5693655610084534, 0.045447446405887604, 0.42617425322532654], [-0.11987412720918655, -0.37491580843925476, 0.053970932960510254, 0.1481577605009079], [-0.12737244367599487, -0.5707674622535706, 0.056934088468551636, 0.4573671817779541], [-0.13878779113292694, -0.3764946460723877, 0.06608142703771591, 0.1831597536802292], [-0.14631767570972443, -0.182377427816391, 0.06974462419748306, -0.08796676993370056], [-0.14996522665023804, 0.011679098010063171, 0.06798528879880905, -0.35785558819770813], [-0.14973165094852448, -0.18434017896652222, 0.060828179121017456, -0.044533610343933105], [-0.15341845154762268, 0.009859159588813782, 0.059937506914138794, -0.31742140650749207], [-0.1532212644815445, 0.20407846570014954, 0.05358907952904701, -0.5906161665916443], [-0.14913970232009888, 0.008248785510659218, 0.04177675396203995, -0.2815456688404083], [-0.1489747315645218, -0.18744340538978577, 0.03614583984017372, 0.024015285074710846], [-0.15272359549999237, -0.3830645680427551, 0.036626145243644714, 0.327879935503006], [-0.1603848785161972, -0.18848267197608948, 0.043183743953704834, 0.04696851968765259], [-0.1641545444726944, 0.00599429989233613, 0.04412311688065529, -0.2317829132080078], [-0.1640346497297287, 0.20045891404151917, 0.039487458765506744, -0.5102279186248779], [-0.1600254774093628, 0.004803576972335577, 0.02928289957344532, -0.20536741614341736], [-0.15992939472198486, 0.19949480891227722, 0.02517555095255375, -0.48867112398147583], [-0.1559395045042038, 0.3942526876926422, 0.015402127988636494, -0.7733145356178284], [-0.14805445075035095, 0.589159369468689, -6.416278483811766e-05, -1.0611118078231812], [-0.13627126812934875, 0.39403828978538513, -0.02128640003502369, -0.768449068069458], [-0.12839050590991974, 0.19921571016311646, -0.03665538132190704, -0.4825391471385956], [-0.12440618127584457, 0.004629781004041433, -0.04630616307258606, -0.2016305923461914], [-0.124313585460186, -0.18980036675930023, -0.05033877491950989, 0.07609286904335022], [-0.12810958921909332, 0.006005731876939535, -0.04881691932678223, -0.23203758895397186], [-0.1279894858598709, -0.18838591873645782, -0.05345766991376877, 0.04485603794455528], [-0.1317571997642517, 0.007460216525942087, -0.05256054922938347, -0.2642025649547577], [-0.1316079944372177, -0.186873659491539, -0.057844601571559906, 0.011449986137449741], [-0.1353454738855362, -0.38112038373947144, -0.057615600526332855, 0.2853359282016754], [-0.14296787977218628, -0.18522606790065765, -0.051908884197473526, -0.02494758926331997], [-0.14667239785194397, -0.37956666946411133, -0.05240783467888832, 0.2509162724018097], [-0.15426373481750488, -0.5739026069641113, -0.04738951101899147, 0.5266190767288208], [-0.16574178636074066, -0.3781469762325287, -0.03685712814331055, 0.21938802301883698], [-0.1733047217130661, -0.18251807987689972, -0.03246936947107315, -0.08468957245349884], [-0.17695508897304535, -0.3771599233150482, -0.034163158386945724, 0.19757498800754547], [-0.18449828028678894, -0.18156640231609344, -0.030211659148335457, -0.10568612068891525], [-0.18812960386276245, 0.01397518627345562, -0.0323253832757473, -0.40774551033973694], [-0.18785010278224945, -0.18067385256290436, -0.040480293333530426, -0.1254265010356903], [-0.19146358966827393, -0.37519320845603943, -0.04298882186412811, 0.15421554446220398], [-0.19896744191646576, -0.17948293685913086, -0.03990451246500015, -0.15171346068382263], [-0.20255710184574127, -0.37401145696640015, -0.042938780039548874, 0.12811820209026337], [-0.21003733575344086, -0.17830152809619904, -0.040376417338848114, -0.17779622972011566], [-0.21360336244106293, 0.017374278977513313, -0.043932341039180756, -0.48293814063072205], [-0.2132558822631836, -0.17710097134113312, -0.053591106086969376, -0.20441868901252747], [-0.21679790318012238, 0.018744779750704765, -0.05767947807908058, -0.5135138034820557], [-0.21642300486564636, 0.2146296501159668, -0.06794975697994232, -0.8238008618354797], [-0.21213041245937347, 0.4106120467185974, -0.08442576974630356, -1.137057900428772], [-0.20391817390918732, 0.21668966114521027, -0.10716693103313446, -0.8720020651817322], [-0.19958437979221344, 0.41309303045272827, -0.12460696697235107, -1.1963638067245483], [-0.19132252037525177, 0.21978463232517242, -0.14853425323963165, -0.9451891183853149], [-0.18692682683467865, 0.4165612757205963, -0.16743803024291992, -1.2806127071380615], [-0.17859560251235962, 0.6133732795715332, -0.19305028021335602, -1.620699167251587], [-0.16632813215255737, 0.4209781885147095, -0.22546426951885223, -1.3938724994659424], [-0.019709834828972816, 0.2400336116552353, 0.04640340059995651, -0.25417450070381165], [-0.014909162186086178, 0.04428086057305336, 0.04131991043686867, 0.052776236087083817], [-0.014023545198142529, 0.2387867271900177, 0.042375434190034866, -0.22658893465995789], [-0.009247810579836369, 0.04308559373021126, 0.03784365579485893, 0.0791538879275322], [-0.00838609877973795, 0.23764517903327942, 0.039426736533641815, -0.20135316252708435], [-0.003633194835856557, 0.04198218509554863, 0.0353996716439724, 0.10350171476602554], [-0.0027935511898249388, 0.23657940328121185, 0.03746970742940903, -0.17780593037605286], [0.0019380369922146201, 0.43114566802978516, 0.03391358628869057, -0.4584369361400604], [0.010560950264334679, 0.23556113243103027, 0.024744849652051926, -0.1552601456642151], [0.015272173099219799, 0.04009378328919411, 0.021639645099639893, 0.1451253592967987], [0.01607404835522175, 0.23489925265312195, 0.024542152881622314, -0.1406528800725937], [0.02077203430235386, 0.42966127395629883, 0.02172909490764141, -0.4254932403564453], [0.029365258291363716, 0.6244688034057617, 0.013219230808317661, -0.7112477421760559], [0.04185463488101959, 0.429166316986084, -0.0010057240724563599, -0.41443324089050293], [0.050437960773706436, 0.23405863344669342, -0.009294388815760612, -0.12206754833459854], [0.05511913448572159, 0.42931249737739563, -0.01173574011772871, -0.4176682233810425], [0.06370538473129272, 0.2343588024377823, -0.020089104771614075, -0.12870803475379944], [0.0683925598859787, 0.03953031077980995, -0.022663265466690063, 0.15756992995738983], [0.06918316334486008, 0.23496928811073303, -0.019511865451931953, -0.14217567443847656], [0.07388255000114441, 0.040132131427526474, -0.022355379536747932, 0.1442883014678955], [0.07468519359827042, 0.23556698858737946, -0.0194696132093668, -0.15536266565322876], [0.07939653098583221, 0.4309622049331665, -0.022576866671442986, -0.4541236460208893], [0.08801577985286713, 0.6263960003852844, -0.031659338623285294, -0.7538366913795471], [0.10054370015859604, 0.43172451853752136, -0.04673607274889946, -0.47128206491470337], [0.10917818546295166, 0.6274743676185608, -0.05616171285510063, -0.7783216238021851], [0.12172767519950867, 0.43316778540611267, -0.07172814756631851, -0.5038241744041443], [0.13039103150367737, 0.23912617564201355, -0.08180463314056396, -0.2345801591873169], [0.13517355918884277, 0.04526252672076225, -0.08649623394012451, 0.0312191154807806], [0.13607880473136902, -0.1485193818807602, -0.0858718529343605, 0.29540711641311646], [0.13310842216014862, 0.04771512746810913, -0.07996370643377304, -0.02307535707950592], [0.134062722325325, -0.14617443084716797, -0.0804252177476883, 0.24334536492824554], [0.13113923370838165, -0.3400610089302063, -0.07555831223726273, 0.5096156597137451], [0.12433801591396332, -0.14396044611930847, -0.0653659924864769, 0.19411104917526245], [0.12145880609750748, 0.05203269049525261, -0.061483774334192276, -0.11845473945140839], [0.12249945849180222, 0.24797920882701874, -0.06385286897420883, -0.42988401651382446], [0.12745903432369232, 0.053816862404346466, -0.07245054841041565, -0.15799398720264435], [0.12853537499904633, -0.1401970535516739, -0.07561042904853821, 0.11098158359527588], [0.1257314383983612, -0.33415868878364563, -0.07339079678058624, 0.378884494304657], [0.11904826760292053, -0.5281658172607422, -0.0658131092786789, 0.647554337978363], [0.10848494619131088, -0.7223120927810669, -0.0528620220720768, 0.9188081622123718], [0.0940387025475502, -0.5265169739723206, -0.03448585793375969, 0.6099915504455566], [0.08350836485624313, -0.33093035221099854, -0.022286027669906616, 0.30664920806884766], [0.0768897607922554, -0.5257277488708496, -0.016153043136000633, 0.592221200466156], [0.06637520343065262, -0.7206199169158936, -0.004308619070798159, 0.8797724843025208], [0.051962804049253464, -0.9156830310821533, 0.013286830857396126, 1.171097755432129], [0.03364914283156395, -1.1109752655029297, 0.03670878708362579, 1.4679163694381714], [0.011429638601839542, -0.9163212776184082, 0.06606711447238922, 1.1869221925735474], [-0.0068967873230576515, -1.1122348308563232, 0.08980555832386017, 1.499560832977295], [-0.029141483828425407, -1.3083256483078003, 0.11979677528142929, 1.8188791275024414], [-0.05530799552798271, -1.5045584440231323, 0.15617436170578003, 2.146254777908325], [-0.08539916574954987, -1.7008373737335205, 0.19909945130348206, 2.482819080352783], [-0.11941590905189514, -1.8969889879226685, 0.2487558275461197, 2.829383134841919]], "action_prob": [0.49999067187309265, 0.4993383586406708, 0.5011053681373596, 0.5007149577140808, 0.5001000165939331, 0.5005508661270142, 0.5001165866851807, 0.499459832906723, 0.5010227560997009, 0.5005602240562439, 0.4998936653137207, 0.5007344484329224, 0.49986594915390015, 0.49923813343048096, 0.5011649131774902, 0.5008230209350586, 0.499753475189209, 0.4991319179534912, 0.5012504458427429, 0.5009472370147705, 0.5004135966300964, 0.4997638463973999, 0.4992187023162842, 0.49887973070144653, 0.49870261549949646, 0.4986109435558319, 0.5014473795890808, 0.4985139071941376, 0.4984658360481262, 0.49842557311058044, 0.49838486313819885, 0.5016563534736633, 0.5017217397689819, 0.4999430477619171, 0.5007241368293762, 0.4998975992202759, 0.4992355704307556, 0.5012052655220032, 0.49916186928749084, 0.4987366199493408, 0.49852868914604187, 0.49843457341194153, 0.49838221073150635, 0.49834010004997253, 0.501701295375824, 0.5001004934310913, 0.5005354881286621, 0.5001260042190552, 0.4994814693927765, 0.49901729822158813, 0.5012413263320923, 0.49896565079689026, 0.49870437383651733, 0.49857795238494873, 0.5014897584915161, 0.49848437309265137, 0.4984268546104431, 0.4983852505683899, 0.4983453154563904, 0.5016950368881226, 0.49997591972351074, 0.49932441115379333, 0.5011202692985535, 0.4992746412754059, 0.49883317947387695, 0.5013934969902039, 0.5012456178665161, 0.5008938312530518, 0.5003198981285095, 0.5003230571746826, 0.4996190369129181, 0.4990009069442749, 0.49863386154174805, 0.49845990538597107, 0.4983774423599243, 0.4983264207839966, 0.5017172694206238, 0.49987685680389404, 0.49922695755958557, 0.49879980087280273, 0.5014164447784424, 0.5012827515602112, 0.5009552836418152, 0.500404953956604, 0.5002359747886658, 0.5004782676696777, 0.5001621842384338, 0.500554084777832, 0.49991950392723083, 0.49935200810432434, 0.4989761412143707, 0.4987695813179016, 0.49866026639938354, 0.501407265663147, 0.5014331936836243, 0.49859803915023804, 0.501501202583313, 0.5014767050743103, 0.5013239979743958, 0.4990483522415161, 0.5013704895973206, 0.5010216236114502, 0.5004468560218811, 0.5001968145370483, 0.5004885792732239, 0.4998384416103363, 0.5006900429725647, 0.5001569390296936, 0.4994719624519348, 0.5011049509048462, 0.5005794167518616, 0.4999222159385681, 0.5006399750709534, 0.49992311000823975, 0.4993487596511841, 0.49897870421409607, 0.501226544380188, 0.5010965466499329, 0.5007877349853516, 0.5002509951591492, 0.5004051923751831, 0.5002910494804382, 0.5003622770309448, 0.5003349184989929, 0.49968641996383667, 0.5008848309516907, 0.49971315264701843, 0.49912819266319275, 0.5012461543083191, 0.5008848905563354, 0.49972954392433167, 0.5008769631385803, 0.5002559423446655, 0.5004128813743591, 0.4997873902320862, 0.5008277297019958, 0.49981194734573364, 0.5008087158203125, 0.50016188621521, 0.5004905462265015, 0.5001044273376465, 0.49945706129074097, 0.4990064203739166, 0.5012562870979309, 0.49890831112861633, 0.5013388991355896, 0.49880170822143555, 0.4985734224319458, 0.5015607476234436, 0.5000620484352112, 0.5005718469619751, 0.5000874400138855, 0.5005543828010559, 0.5001114010810852, 0.5005367994308472, 0.5001346468925476, 0.4994814097881317, 0.5009998679161072, 0.50052809715271, 0.5001473426818848, 0.49948403239250183, 0.49898460507392883, 0.5012931823730469, 0.5010649561882019, 0.4994131326675415, 0.5010963678359985, 0.5006259679794312, 0.5000332593917847, 0.5006448030471802, 0.5000119209289551, 0.49933576583862305, 0.498842716217041, 0.5014151930809021, 0.49877434968948364, 0.5014722347259521, 0.5013028383255005, 0.5009133219718933, 0.5003160834312439, 0.5003097057342529, 0.5003743767738342, 0.4997379183769226, 0.5007544755935669, 0.5002409815788269, 0.4995455741882324, 0.5010590553283691, 0.5005311965942383, 0.499885231256485, 0.49933820962905884, 0.4989895224571228, 0.5012015700340271, 0.5010684132575989, 0.49926984310150146, 0.49889394640922546, 0.49869877099990845, 0.4985992908477783, 0.5014633536338806, 0.498503178358078, 0.4984516203403473, 0.49840790033340454, 0.4983645975589752, 0.49832236766815186], "advantages": [28.226797103881836, 27.50461196899414, 26.774511337280273, 26.032718658447266, 25.282896041870117, 24.52549171447754, 23.766029357910156, 22.993268966674805, 22.213214874267578, 21.429885864257812, 20.63912010192871, 19.840187072753906, 19.027828216552734, 18.212631225585938, 17.388498306274414, 16.552085876464844, 15.706623077392578, 14.857897758483887, 13.999839782714844, 13.12937068939209, 12.249510765075684, 11.360509872436523, 10.462811470031738, 9.556635856628418, 8.641887664794922, 7.718348979949951, 6.785796165466309, 5.844742298126221, 4.893216133117676, 3.932319402694702, 2.9618701934814453, 1.9817135334014893, 0.9915434718132019, 11.361373901367188, 10.468911170959473, 9.56187915802002, 8.651228904724121, 7.730713844299316, 6.796685695648193, 5.857405662536621, 4.907834053039551, 3.948063611984253, 2.9782025814056396, 1.9983046054840088, 1.0083720684051514, 13.994232177734375, 13.128104209899902, 12.247697830200195, 11.363974571228027, 10.470788955688477, 9.567902565002441, 8.652809143066406, 7.731640338897705, 6.800568580627441, 5.859672546386719, 4.908247947692871, 3.94824481010437, 2.978254556655884, 1.9982908964157104, 1.0083284378051758, 15.70553970336914, 14.851319313049316, 13.989097595214844, 13.12243938446045, 12.242731094360352, 11.354898452758789, 10.4608154296875, 9.55832290649414, 8.647256851196289, 7.727108955383301, 6.791981220245361, 5.847748279571533, 4.894810199737549, 3.933030128479004, 2.9620816707611084, 1.9816659688949585, 0.9915438890457153, 51.50041198730469, 51.00772476196289, 50.51074981689453, 50.009525299072266, 49.505802154541016, 48.997596740722656, 48.48481369018555, 47.967041015625, 47.4383430480957, 46.909996032714844, 46.37063980102539, 45.831478118896484, 45.28672790527344, 44.73596954345703, 44.179080963134766, 43.61610412597656, 43.04710388183594, 42.47110366821289, 41.88882827758789, 41.302940368652344, 40.70889663696289, 40.10829544067383, 39.501041412353516, 38.89240264892578, 38.272945404052734, 37.6468505859375, 37.014522552490234, 36.38120651245117, 35.736026763916016, 35.0848503112793, 34.4315185546875, 33.77211380004883, 33.10590744018555, 32.42762756347656, 31.74239158630371, 31.05068016052246, 30.35672378540039, 29.650938034057617, 28.93874168395996, 28.220001220703125, 27.495996475219727, 26.765304565429688, 26.02789306640625, 25.283390045166016, 24.52573585510254, 23.766035079956055, 22.993070602416992, 22.217853546142578, 21.434709548950195, 20.63823699951172, 19.839181900024414, 19.031579971313477, 18.2113037109375, 17.382287979125977, 16.550432205200195, 15.704642295837402, 14.850502967834473, 13.992928504943848, 13.126821517944336, 12.246426582336426, 11.362680435180664, 10.464472770690918, 9.557518005371094, 8.646320343017578, 7.721031188964844, 6.787205219268799, 5.844715595245361, 4.894494533538818, 3.9329543113708496, 2.9632861614227295, 1.982345700263977, 0.9919753074645996, 40.703617095947266, 40.102020263671875, 39.49991989135742, 38.88612365722656, 38.271751403808594, 37.64552307128906, 37.01862335205078, 36.37971878051758, 35.734806060791016, 35.08818817138672, 34.435428619384766, 33.770381927490234, 33.09901428222656, 32.42153549194336, 31.740774154663086, 31.05379867553711, 30.354875564575195, 29.65386962890625, 28.94609260559082, 28.225473403930664, 27.50326919555664, 26.76807975769043, 26.025888442993164, 25.276926040649414, 24.523836135864258, 23.759693145751953, 22.991178512573242, 22.215492248535156, 21.4323673248291, 20.641246795654297, 19.836637496948242, 19.029470443725586, 18.213665008544922, 17.38500213623047, 16.5474796295166, 15.701756477355957, 14.852697372436523, 13.995277404785156, 13.128868103027344, 12.253085136413574, 11.367856979370117, 10.471203804016113, 9.56477165222168, 8.653230667114258, 7.731805324554443, 6.800554275512695, 5.859546184539795, 4.908216953277588, 3.9481070041656494, 2.9780585765838623, 1.9980684518814087, 1.0080984830856323], "value_targets": [28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 1827651813, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 501702207, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1561588942, 1621042211, 1621042211, 1621042211, 1621042211, 1621042211, 1621042211, 1621042211, 1621042211, 1621042211, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 313712563, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 1989371953, 518074159, 518074159, 518074159, 518074159, 518074159, 518074159, 518074159, 518074159, 518074159, 518074159, 518074159, 518074159, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 977698926, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 570428624, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265, 973191265], "obs": [[-0.0407908596098423, 0.04736078903079033, 0.014863060787320137, 0.005399354267865419], [-0.039843641221523285, -0.14797113835811615, 0.014971047639846802, 0.30273446440696716], [-0.04280306398868561, 0.04693428799510002, 0.02102573588490486, 0.014810409396886826], [-0.04186438024044037, -0.1484827846288681, 0.021321944892406464, 0.3140523433685303], [-0.044834036380052567, 0.046329036355018616, 0.027602991089224815, 0.02816920354962349], [-0.04390745609998703, -0.1491776555776596, 0.028166376054286957, 0.32943177223205566], [-0.04689100757241249, -0.3446890115737915, 0.03475501015782356, 0.630862295627594], [-0.05378478765487671, -0.5402782559394836, 0.04737225919961929, 0.9342848658561707], [-0.06459034979343414, -0.7360061407089233, 0.0660579577088356, 1.2414696216583252], [-0.07931047677993774, -0.9319109916687012, 0.09088734537363052, 1.5540928840637207], [-0.09794869273900986, -0.7379883527755737, 0.12196920067071915, 1.2910935878753662], [-0.11270846426486969, -0.5446099042892456, 0.1477910727262497, 1.0389509201049805], [-0.12360066175460815, -0.741353452205658, 0.16857010126113892, 1.3741416931152344], [-0.138427734375, -0.5486912131309509, 0.1960529237985611, 1.138569951057434], [-0.016268353909254074, -0.0450003556907177, -0.005877231247723103, -0.023368779569864273], [-0.017168361693620682, -0.24003753066062927, -0.006344606634229422, 0.26745402812957764], [-0.021969111636281013, -0.43506836891174316, -0.0009955259738489985, 0.558129072189331], [-0.03067047894001007, -0.23993244767189026, 0.010167055763304234, 0.26513269543647766], [-0.03546912968158722, -0.04495707526803017, 0.015469709411263466, -0.024326197803020477], [-0.036368269473314285, -0.24029742181301117, 0.014983185566961765, 0.2731971740722656], [-0.04117421805858612, -0.04539242759346962, 0.020447129383683205, -0.014722607098519802], [-0.04208206757903099, 0.14943040907382965, 0.020152676850557327, -0.3008847236633301], [-0.03909345716238022, 0.3442594110965729, 0.014134982600808144, -0.5871444344520569], [-0.03220827132463455, 0.14894238114356995, 0.0023920941166579723, -0.29004257917404175], [-0.0292294230312109, -0.046213600784540176, -0.0034087577369064093, 0.0033938216511160135], [-0.03015369549393654, 0.14895707368850708, -0.0033408813178539276, -0.2903626561164856], [-0.027174552902579308, 0.34412649273872375, -0.009148133918642998, -0.5840973854064941], [-0.020292023196816444, 0.14913389086723328, -0.020830081775784492, -0.29431021213531494], [-0.017309345304965973, 0.34454652667045593, -0.026716286316514015, -0.5934891700744629], [-0.010418415069580078, 0.14980852603912354, -0.03858606889843941, -0.30934008955955505], [-0.007422244641929865, -0.04474300891160965, -0.04477287083864212, -0.029071496799588203], [-0.008317104540765285, 0.15099146962165833, -0.04535430297255516, -0.33553779125213623], [-0.005297275260090828, 0.3467285633087158, -0.052065059542655945, -0.6421710848808289], [0.0016372955869883299, 0.15236951410770416, -0.0649084821343422, -0.36632782220840454], [0.004684686195105314, 0.3483509123325348, -0.07223503291606903, -0.6787505745887756], [0.011651704087853432, 0.15430283546447754, -0.08581005036830902, -0.4096561670303345], [0.014737761579453945, -0.03950436785817146, -0.09400317072868347, -0.14521218836307526], [0.013947674073278904, -0.23316319286823273, -0.09690741449594498, 0.11639726907014847], [0.009284409694373608, -0.42677268385887146, -0.09457947313785553, 0.3770027160644531], [0.0007489563431590796, -0.23044361174106598, -0.08703941851854324, 0.05606038495898247], [-0.003859916003420949, -0.42421671748161316, -0.08591821044683456, 0.32006242871284485], [-0.012344250455498695, -0.22798293828964233, -0.07951696217060089, 0.0015686507103964686], [-0.016903908923268318, -0.42187976837158203, -0.07948558777570724, 0.2681415379047394], [-0.02534150518476963, -0.22571875154972076, -0.07412275671958923, -0.04851515591144562], [-0.02985587902367115, -0.419703871011734, -0.07509306073188782, 0.21989144384860992], [-0.03824995830655098, -0.2235933393239975, -0.07069522887468338, -0.09550198912620544], [-0.04272182285785675, -0.4176345765590668, -0.07260526716709137, 0.1740657389163971], [-0.05107451602816582, -0.6116463541984558, -0.06912395358085632, 0.4429894983768463], [-0.06330744177103043, -0.805725634098053, -0.060264162719249725, 0.7131068706512451], [-0.07942195236682892, -0.6098233461380005, -0.04600202664732933, 0.4020799994468689], [-0.09161841869354248, -0.8042636513710022, -0.03796042501926422, 0.6799120903015137], [-0.10770369321107864, -0.6086355447769165, -0.02436218410730362, 0.3755236566066742], [-0.11987640708684921, -0.41317617893218994, -0.01685171201825142, 0.07525982707738876], [-0.128139927983284, -0.21781675517559052, -0.015346514992415905, -0.2226918786764145], [-0.13249626755714417, -0.02247885800898075, -0.019800351932644844, -0.5201759338378906], [-0.13294583559036255, 0.17291615903377533, -0.030203871428966522, -0.8190318942070007], [-0.1294875144958496, 0.368438184261322, -0.04658450931310654, -1.121059775352478], [-0.1221187561750412, 0.17395713925361633, -0.06900570541620255, -0.843345582485199], [-0.11863961070775986, 0.3699495494365692, -0.08587262034416199, -1.1569061279296875], [-0.11124061793088913, 0.5660794377326965, -0.1090107411146164, -1.475232481956482], [-0.09991902858018875, 0.7623514533042908, -0.1385153830051422, -1.7998785972595215], [-0.0846720039844513, 0.9587242603302002, -0.17451296746730804, -2.1322100162506104], [-0.0454050675034523, 0.029701290652155876, -0.005388908088207245, 0.04887032136321068], [-0.04481104016304016, -0.16534297168254852, -0.004411501344293356, 0.339848130941391], [-0.048117902129888535, 0.02984146773815155, 0.002385461237281561, 0.045777346938848495], [-0.04752106964588165, -0.16531461477279663, 0.003301008138805628, 0.33921194076538086], [-0.05082736164331436, -0.3604833781719208, 0.010085247457027435, 0.6329339742660522], [-0.058037031441926956, -0.5557445287704468, 0.02274392731487751, 0.9287759065628052], [-0.06915192306041718, -0.3609369099140167, 0.04131944477558136, 0.6433261036872864], [-0.07637065649032593, -0.5566096305847168, 0.05418596789240837, 0.9487292170524597], [-0.0875028520822525, -0.7524176239967346, 0.0731605514883995, 1.2579329013824463], [-0.10255120694637299, -0.5583041906356812, 0.09831921011209488, 0.9890317320823669], [-0.11371728777885437, -0.7545950412750244, 0.11809984594583511, 1.3109053373336792], [-0.12880918383598328, -0.561150074005127, 0.14431795477867126, 1.0573997497558594], [-0.14003218710422516, -0.7578585743904114, 0.16546595096588135, 1.3916774988174438], [-0.1551893651485443, -0.5651379227638245, 0.19329950213432312, 1.1549701690673828], [-0.04489262029528618, -0.009710580110549927, 0.020327888429164886, 0.023386100307106972], [-0.045086830854415894, -0.2051180601119995, 0.020795609802007675, 0.32241275906562805], [-0.049189191311597824, -0.4005298912525177, 0.02724386565387249, 0.6215805411338806], [-0.05719979107379913, -0.5960214734077454, 0.039675477892160416, 0.9227178692817688], [-0.06912022083997726, -0.7916563749313354, 0.05812983214855194, 1.2276008129119873], [-0.08495334535837173, -0.9874763488769531, 0.08268184959888458, 1.5379151105880737], [-0.10470287501811981, -1.18349027633667, 0.1134401485323906, 1.8552123308181763], [-0.1283726841211319, -1.379661202430725, 0.1505444049835205, 2.1808574199676514], [-0.1559658944606781, -1.1862881183624268, 0.1941615492105484, 1.9381715059280396], [0.022797144949436188, 0.04794376716017723, 0.008106382563710213, 0.03411654755473137], [0.02375601977109909, 0.2429485321044922, 0.00878871325403452, -0.25599774718284607], [0.028614990413188934, 0.4379439055919647, 0.00366875808686018, -0.5458956360816956], [0.037373870611190796, 0.6330141425132751, -0.007249155081808567, -0.8374204039573669], [0.05003415048122406, 0.4379919171333313, -0.023997563868761063, -0.5470260381698608], [0.058793988078832626, 0.6334426403045654, -0.034938082098960876, -0.8471723198890686], [0.07146283984184265, 0.43881428241729736, -0.05188152939081192, -0.5656776428222656], [0.08023913204669952, 0.6346242427825928, -0.06319507956504822, -0.8742436766624451], [0.09293161332607269, 0.8305458426475525, -0.08067995309829712, -1.1861064434051514], [0.10954252630472183, 0.6365575194358826, -0.1044020876288414, -0.9197646379470825], [0.12227368354797363, 0.8329238295555115, -0.12279737740755081, -1.2433488368988037], [0.13893215358257294, 0.6395728588104248, -0.14766435325145721, -0.9915180206298828], [0.15172360837459564, 0.44670233130455017, -0.16749471426010132, -0.7486163973808289], [0.16065765917301178, 0.2542380690574646, -0.1824670433998108, -0.5129736661911011], [0.165742427110672, 0.4513975977897644, -0.1927265077829361, -0.8571515083312988], [0.007080171722918749, 0.004242399707436562, -0.008040770888328552, -0.03617843613028526], [0.007165019866079092, -0.19076332449913025, -0.008764339610934258, 0.25395673513412476], [0.0033497530966997147, 0.004482661373913288, -0.0036852045450359583, -0.04147768393158913], [0.0034394063986837864, 0.19965726137161255, -0.004514758009463549, -0.3353210389614105], [0.007432551588863134, 0.0045998552814126015, -0.01122117880731821, -0.04406524822115898], [0.007524548564106226, -0.19035941362380981, -0.01210248377174139, 0.24505627155303955], [0.0037173605524003506, -0.3853064179420471, -0.007201358675956726, 0.533897340297699], [-0.003988767974078655, -0.19008395075798035, 0.0034765885211527348, 0.23895403742790222], [-0.007790446747094393, -0.3852553963661194, 0.0082556689158082, 0.5327315330505371], [-0.01549555454403162, -0.5804924964904785, 0.018910299986600876, 0.8280043601989746], [-0.027105404064059258, -0.3856341242790222, 0.0354703851044178, 0.5413283705711365], [-0.03481808677315712, -0.1910281926393509, 0.04629695415496826, 0.2600291967391968], [-0.0386386513710022, -0.38677942752838135, 0.05149753764271736, 0.566947877407074], [-0.04637423902750015, -0.1924162656068802, 0.06283649802207947, 0.29092320799827576], [-0.05022256448864937, 0.001756044919602573, 0.06865496188402176, 0.018701329827308655], [-0.05018744245171547, -0.19427989423274994, 0.06902898848056793, 0.33223122358322144], [-0.054073043167591095, -0.0002049142640316859, 0.07567360997200012, 0.0620904415845871], [-0.0540771409869194, -0.19632568955421448, 0.07691542059183121, 0.3776565194129944], [-0.05800365284085274, -0.3924509584903717, 0.0844685509800911, 0.6935654878616333], [-0.06585267186164856, -0.5886367559432983, 0.09833985567092896, 1.0115991830825806], [-0.07762540876865387, -0.7849235534667969, 0.11857184022665024, 1.3334721326828003], [-0.09332387894392014, -0.981323778629303, 0.14524129033088684, 1.6607824563980103], [-0.11295035481452942, -0.7881622314453125, 0.17845693230628967, 1.4166418313980103], [-0.12871359288692474, -0.9849881529808044, 0.2067897766828537, 1.7593803405761719], [0.03961664438247681, 0.030456971377134323, 0.02276303805410862, 0.0033254690933972597], [0.040225785225629807, -0.16498391330242157, 0.02282954752445221, 0.30310261249542236], [0.03692610561847687, 0.029805360361933708, 0.02889159880578518, 0.01770613342523575], [0.03752221539616585, -0.16571876406669617, 0.02924572303891182, 0.3193628787994385], [0.03420783951878548, -0.3612447679042816, 0.03563297912478447, 0.6211234331130981], [0.026982944458723068, -0.5568457245826721, 0.04805544763803482, 0.9248125553131104], [0.015846028923988342, -0.36240464448928833, 0.06655170023441315, 0.6476104855537415], [0.008597936481237411, -0.5583875775337219, 0.07950390875339508, 0.9604859352111816], [-0.0025698160752654076, -0.7544829845428467, 0.09871362894773483, 1.2770494222640991], [-0.017659476026892662, -0.950715184211731, 0.12425461411476135, 1.5989394187927246], [-0.03667378053069115, -0.7572652101516724, 0.15623340010643005, 1.3474385738372803], [-0.0518190823495388, -0.9539674520492554, 0.18318217992782593, 1.6846442222595215], [-0.026335202157497406, 0.004156477749347687, -0.018988970667123795, -0.02679370902478695], [-0.02625207230448723, 0.19954553246498108, -0.019524844363331795, -0.32540684938430786], [-0.022261161357164383, 0.39493995904922485, -0.026032982394099236, -0.6241825819015503], [-0.014362362213432789, 0.2001909464597702, -0.038516633212566376, -0.33981087803840637], [-0.010358543135225773, 0.3958391845226288, -0.045312851667404175, -0.6443866491317749], [-0.0024417599197477102, 0.2013770341873169, -0.05820058286190033, -0.3663102686405182], [0.001585780642926693, 0.007128350902348757, -0.06552679091691971, -0.09253191202878952], [0.0017283476190641522, -0.18699617683887482, -0.06737742573022842, 0.17877887189388275], [-0.0020115759689360857, 0.00902202446013689, -0.0638018473982811, -0.13437525928020477], [-0.001831135479733348, -0.185130774974823, -0.06648935377597809, 0.1375163495540619], [-0.005533750634640455, -0.3792405128479004, -0.06373903155326843, 0.4085041284561157], [-0.013118560425937176, -0.18327546119689941, -0.05556894466280937, 0.09642687439918518], [-0.016784070059657097, -0.37755876779556274, -0.05364040657877922, 0.3710731267929077], [-0.024335244670510292, -0.5718792080879211, -0.04621894657611847, 0.6463719010353088], [-0.03577283024787903, -0.7663277387619019, -0.03329150751233101, 0.9241496324539185], [-0.05109938606619835, -0.5707722902297974, -0.014808515086770058, 0.6211931109428406], [-0.06251483410596848, -0.7656843662261963, -0.0023846530821174383, 0.9091755747795105], [-0.07782851904630661, -0.5705301761627197, 0.015798859298229218, 0.6157441139221191], [-0.08923912048339844, -0.7658692598342896, 0.02811374142765999, 0.9133608341217041], [-0.10455650836229324, -0.5711386799812317, 0.04638095572590828, 0.6296446919441223], [-0.11597927659749985, -0.7668761014938354, 0.058973852545022964, 0.9365662336349487], [-0.13131679594516754, -0.5725969076156616, 0.07770517468452454, 0.6629823446273804], [-0.1427687406539917, -0.3786371350288391, 0.09096482396125793, 0.39574292302131653], [-0.1503414809703827, -0.5749240517616272, 0.09887968003749847, 0.7156628370285034], [-0.16183996200561523, -0.7712655663490295, 0.11319293826818466, 1.0377596616744995], [-0.17726527154445648, -0.9676949977874756, 0.13394813239574432, 1.363726019859314], [-0.1966191828250885, -1.1642162799835205, 0.1612226516008377, 1.695130467414856], [-0.21990349888801575, -1.3607898950576782, 0.1951252669095993, 2.0333614349365234], [-0.014469180256128311, -0.013824628666043282, -0.018114551901817322, -0.009178923442959785], [-0.014745672233402729, 0.18155236542224884, -0.018298130482435226, -0.3075217306613922], [-0.011114625260233879, 0.37693020701408386, -0.024448566138744354, -0.6059187650680542], [-0.0035760209430009127, 0.572385311126709, -0.03656693920493126, -0.9062010049819946], [0.007871685549616814, 0.377777099609375, -0.05469096079468727, -0.6252320408821106], [0.01542722713202238, 0.1834595650434494, -0.0671956017613411, -0.35026270151138306], [0.01909641921520233, 0.3794696033000946, -0.07420085370540619, -0.6633548736572266], [0.0266858097165823, 0.1854540854692459, -0.08746795356273651, -0.394927442073822], [0.030394893139600754, 0.38170120120048523, -0.09536650031805038, -0.7138555645942688], [0.038028914481401443, 0.5780049562454224, -0.1096436157822609, -1.0349684953689575], [0.049589015543460846, 0.38449808955192566, -0.1303429901599884, -0.7786218523979187], [0.05727897956967354, 0.1913861781358719, -0.1459154188632965, -0.5296235084533691], [0.06110670045018196, 0.3882269263267517, -0.15650789439678192, -0.8644940257072449], [0.06887123733758926, 0.5850933194160461, -0.17379777133464813, -1.2020100355148315], [0.08057310432195663, 0.7819833755493164, -0.1978379786014557, -1.5437356233596802], [0.02451103739440441, 0.01933724246919155, -0.015418538823723793, -0.035470884293317795], [0.024897782132029533, 0.2146768718957901, -0.01612795703113079, -0.33297836780548096], [0.02919132076203823, 0.019788138568401337, -0.02278752438724041, -0.045424703508615494], [0.02958708256483078, 0.2152293175458908, -0.023696018382906914, -0.3452093005180359], [0.033891670405864716, 0.020452314987778664, -0.030600203201174736, -0.060091808438301086], [0.03430071473121643, 0.21599934995174408, -0.031802039593458176, -0.3622700870037079], [0.03862070292234421, 0.4115585386753082, -0.03904744237661362, -0.6648087501525879], [0.04685187339782715, 0.21700087189674377, -0.052343618124723434, -0.38467177748680115], [0.05119188874959946, 0.022659609094262123, -0.06003705412149429, -0.10894113034009933], [0.051645081490278244, -0.17155292630195618, -0.06221587583422661, 0.16421250998973846], [0.04821402579545975, -0.3657316267490387, -0.0589316263794899, 0.43663734197616577], [0.04089939221739769, -0.16982713341712952, -0.05019887909293175, 0.1259748786687851], [0.037502847611904144, 0.02597668021917343, -0.04767937958240509, -0.1821131408214569], [0.03802238404750824, 0.22174730896949768, -0.051321644335985184, -0.48944777250289917], [0.042457327246665955, 0.4175542891025543, -0.06111059710383415, -0.7978534698486328], [0.050808414816856384, 0.22332166135311127, -0.07706766575574875, -0.5250037312507629], [0.055274847894907, 0.029364027082920074, -0.08756774663925171, -0.25756630301475525], [0.05586212873458862, 0.22561992704868317, -0.09271907061338425, -0.5765342116355896], [0.06037452816963196, 0.4219108521938324, -0.1042497530579567, -0.8969262838363647], [0.06881274282932281, 0.6182798147201538, -0.1221882775425911, -1.2204744815826416], [0.08117833733558655, 0.814746081829071, -0.14659777283668518, -1.5488107204437256], [0.09747326374053955, 1.011291742324829, -0.17757397890090942, -1.883412480354309]], "actions": [0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.039843641221523285, -0.14797113835811615, 0.014971047639846802, 0.30273446440696716], [-0.04280306398868561, 0.04693428799510002, 0.02102573588490486, 0.014810409396886826], [-0.04186438024044037, -0.1484827846288681, 0.021321944892406464, 0.3140523433685303], [-0.044834036380052567, 0.046329036355018616, 0.027602991089224815, 0.02816920354962349], [-0.04390745609998703, -0.1491776555776596, 0.028166376054286957, 0.32943177223205566], [-0.04689100757241249, -0.3446890115737915, 0.03475501015782356, 0.630862295627594], [-0.05378478765487671, -0.5402782559394836, 0.04737225919961929, 0.9342848658561707], [-0.06459034979343414, -0.7360061407089233, 0.0660579577088356, 1.2414696216583252], [-0.07931047677993774, -0.9319109916687012, 0.09088734537363052, 1.5540928840637207], [-0.09794869273900986, -0.7379883527755737, 0.12196920067071915, 1.2910935878753662], [-0.11270846426486969, -0.5446099042892456, 0.1477910727262497, 1.0389509201049805], [-0.12360066175460815, -0.741353452205658, 0.16857010126113892, 1.3741416931152344], [-0.138427734375, -0.5486912131309509, 0.1960529237985611, 1.138569951057434], [-0.14940154552459717, -0.7457597851753235, 0.2188243269920349, 1.485780954360962], [-0.017168361693620682, -0.24003753066062927, -0.006344606634229422, 0.26745402812957764], [-0.021969111636281013, -0.43506836891174316, -0.0009955259738489985, 0.558129072189331], [-0.03067047894001007, -0.23993244767189026, 0.010167055763304234, 0.26513269543647766], [-0.03546912968158722, -0.04495707526803017, 0.015469709411263466, -0.024326197803020477], [-0.036368269473314285, -0.24029742181301117, 0.014983185566961765, 0.2731971740722656], [-0.04117421805858612, -0.04539242759346962, 0.020447129383683205, -0.014722607098519802], [-0.04208206757903099, 0.14943040907382965, 0.020152676850557327, -0.3008847236633301], [-0.03909345716238022, 0.3442594110965729, 0.014134982600808144, -0.5871444344520569], [-0.03220827132463455, 0.14894238114356995, 0.0023920941166579723, -0.29004257917404175], [-0.0292294230312109, -0.046213600784540176, -0.0034087577369064093, 0.0033938216511160135], [-0.03015369549393654, 0.14895707368850708, -0.0033408813178539276, -0.2903626561164856], [-0.027174552902579308, 0.34412649273872375, -0.009148133918642998, -0.5840973854064941], [-0.020292023196816444, 0.14913389086723328, -0.020830081775784492, -0.29431021213531494], [-0.017309345304965973, 0.34454652667045593, -0.026716286316514015, -0.5934891700744629], [-0.010418415069580078, 0.14980852603912354, -0.03858606889843941, -0.30934008955955505], [-0.007422244641929865, -0.04474300891160965, -0.04477287083864212, -0.029071496799588203], [-0.008317104540765285, 0.15099146962165833, -0.04535430297255516, -0.33553779125213623], [-0.005297275260090828, 0.3467285633087158, -0.052065059542655945, -0.6421710848808289], [0.0016372955869883299, 0.15236951410770416, -0.0649084821343422, -0.36632782220840454], [0.004684686195105314, 0.3483509123325348, -0.07223503291606903, -0.6787505745887756], [0.011651704087853432, 0.15430283546447754, -0.08581005036830902, -0.4096561670303345], [0.014737761579453945, -0.03950436785817146, -0.09400317072868347, -0.14521218836307526], [0.013947674073278904, -0.23316319286823273, -0.09690741449594498, 0.11639726907014847], [0.009284409694373608, -0.42677268385887146, -0.09457947313785553, 0.3770027160644531], [0.0007489563431590796, -0.23044361174106598, -0.08703941851854324, 0.05606038495898247], [-0.003859916003420949, -0.42421671748161316, -0.08591821044683456, 0.32006242871284485], [-0.012344250455498695, -0.22798293828964233, -0.07951696217060089, 0.0015686507103964686], [-0.016903908923268318, -0.42187976837158203, -0.07948558777570724, 0.2681415379047394], [-0.02534150518476963, -0.22571875154972076, -0.07412275671958923, -0.04851515591144562], [-0.02985587902367115, -0.419703871011734, -0.07509306073188782, 0.21989144384860992], [-0.03824995830655098, -0.2235933393239975, -0.07069522887468338, -0.09550198912620544], [-0.04272182285785675, -0.4176345765590668, -0.07260526716709137, 0.1740657389163971], [-0.05107451602816582, -0.6116463541984558, -0.06912395358085632, 0.4429894983768463], [-0.06330744177103043, -0.805725634098053, -0.060264162719249725, 0.7131068706512451], [-0.07942195236682892, -0.6098233461380005, -0.04600202664732933, 0.4020799994468689], [-0.09161841869354248, -0.8042636513710022, -0.03796042501926422, 0.6799120903015137], [-0.10770369321107864, -0.6086355447769165, -0.02436218410730362, 0.3755236566066742], [-0.11987640708684921, -0.41317617893218994, -0.01685171201825142, 0.07525982707738876], [-0.128139927983284, -0.21781675517559052, -0.015346514992415905, -0.2226918786764145], [-0.13249626755714417, -0.02247885800898075, -0.019800351932644844, -0.5201759338378906], [-0.13294583559036255, 0.17291615903377533, -0.030203871428966522, -0.8190318942070007], [-0.1294875144958496, 0.368438184261322, -0.04658450931310654, -1.121059775352478], [-0.1221187561750412, 0.17395713925361633, -0.06900570541620255, -0.843345582485199], [-0.11863961070775986, 0.3699495494365692, -0.08587262034416199, -1.1569061279296875], [-0.11124061793088913, 0.5660794377326965, -0.1090107411146164, -1.475232481956482], [-0.09991902858018875, 0.7623514533042908, -0.1385153830051422, -1.7998785972595215], [-0.0846720039844513, 0.9587242603302002, -0.17451296746730804, -2.1322100162506104], [-0.0654975175857544, 0.7657102346420288, -0.21715715527534485, -1.8981331586837769], [-0.04481104016304016, -0.16534297168254852, -0.004411501344293356, 0.339848130941391], [-0.048117902129888535, 0.02984146773815155, 0.002385461237281561, 0.045777346938848495], [-0.04752106964588165, -0.16531461477279663, 0.003301008138805628, 0.33921194076538086], [-0.05082736164331436, -0.3604833781719208, 0.010085247457027435, 0.6329339742660522], [-0.058037031441926956, -0.5557445287704468, 0.02274392731487751, 0.9287759065628052], [-0.06915192306041718, -0.3609369099140167, 0.04131944477558136, 0.6433261036872864], [-0.07637065649032593, -0.5566096305847168, 0.05418596789240837, 0.9487292170524597], [-0.0875028520822525, -0.7524176239967346, 0.0731605514883995, 1.2579329013824463], [-0.10255120694637299, -0.5583041906356812, 0.09831921011209488, 0.9890317320823669], [-0.11371728777885437, -0.7545950412750244, 0.11809984594583511, 1.3109053373336792], [-0.12880918383598328, -0.561150074005127, 0.14431795477867126, 1.0573997497558594], [-0.14003218710422516, -0.7578585743904114, 0.16546595096588135, 1.3916774988174438], [-0.1551893651485443, -0.5651379227638245, 0.19329950213432312, 1.1549701690673828], [-0.16649211943149567, -0.7621814608573914, 0.21639889478683472, 1.5015076398849487], [-0.045086830854415894, -0.2051180601119995, 0.020795609802007675, 0.32241275906562805], [-0.049189191311597824, -0.4005298912525177, 0.02724386565387249, 0.6215805411338806], [-0.05719979107379913, -0.5960214734077454, 0.039675477892160416, 0.9227178692817688], [-0.06912022083997726, -0.7916563749313354, 0.05812983214855194, 1.2276008129119873], [-0.08495334535837173, -0.9874763488769531, 0.08268184959888458, 1.5379151105880737], [-0.10470287501811981, -1.18349027633667, 0.1134401485323906, 1.8552123308181763], [-0.1283726841211319, -1.379661202430725, 0.1505444049835205, 2.1808574199676514], [-0.1559658944606781, -1.1862881183624268, 0.1941615492105484, 1.9381715059280396], [-0.17969165742397308, -1.3828824758529663, 0.23292498290538788, 2.284247636795044], [0.02375601977109909, 0.2429485321044922, 0.00878871325403452, -0.25599774718284607], [0.028614990413188934, 0.4379439055919647, 0.00366875808686018, -0.5458956360816956], [0.037373870611190796, 0.6330141425132751, -0.007249155081808567, -0.8374204039573669], [0.05003415048122406, 0.4379919171333313, -0.023997563868761063, -0.5470260381698608], [0.058793988078832626, 0.6334426403045654, -0.034938082098960876, -0.8471723198890686], [0.07146283984184265, 0.43881428241729736, -0.05188152939081192, -0.5656776428222656], [0.08023913204669952, 0.6346242427825928, -0.06319507956504822, -0.8742436766624451], [0.09293161332607269, 0.8305458426475525, -0.08067995309829712, -1.1861064434051514], [0.10954252630472183, 0.6365575194358826, -0.1044020876288414, -0.9197646379470825], [0.12227368354797363, 0.8329238295555115, -0.12279737740755081, -1.2433488368988037], [0.13893215358257294, 0.6395728588104248, -0.14766435325145721, -0.9915180206298828], [0.15172360837459564, 0.44670233130455017, -0.16749471426010132, -0.7486163973808289], [0.16065765917301178, 0.2542380690574646, -0.1824670433998108, -0.5129736661911011], [0.165742427110672, 0.4513975977897644, -0.1927265077829361, -0.8571515083312988], [0.17477037012577057, 0.25934991240501404, -0.20986954867839813, -0.6307249069213867], [0.007165019866079092, -0.19076332449913025, -0.008764339610934258, 0.25395673513412476], [0.0033497530966997147, 0.004482661373913288, -0.0036852045450359583, -0.04147768393158913], [0.0034394063986837864, 0.19965726137161255, -0.004514758009463549, -0.3353210389614105], [0.007432551588863134, 0.0045998552814126015, -0.01122117880731821, -0.04406524822115898], [0.007524548564106226, -0.19035941362380981, -0.01210248377174139, 0.24505627155303955], [0.0037173605524003506, -0.3853064179420471, -0.007201358675956726, 0.533897340297699], [-0.003988767974078655, -0.19008395075798035, 0.0034765885211527348, 0.23895403742790222], [-0.007790446747094393, -0.3852553963661194, 0.0082556689158082, 0.5327315330505371], [-0.01549555454403162, -0.5804924964904785, 0.018910299986600876, 0.8280043601989746], [-0.027105404064059258, -0.3856341242790222, 0.0354703851044178, 0.5413283705711365], [-0.03481808677315712, -0.1910281926393509, 0.04629695415496826, 0.2600291967391968], [-0.0386386513710022, -0.38677942752838135, 0.05149753764271736, 0.566947877407074], [-0.04637423902750015, -0.1924162656068802, 0.06283649802207947, 0.29092320799827576], [-0.05022256448864937, 0.001756044919602573, 0.06865496188402176, 0.018701329827308655], [-0.05018744245171547, -0.19427989423274994, 0.06902898848056793, 0.33223122358322144], [-0.054073043167591095, -0.0002049142640316859, 0.07567360997200012, 0.0620904415845871], [-0.0540771409869194, -0.19632568955421448, 0.07691542059183121, 0.3776565194129944], [-0.05800365284085274, -0.3924509584903717, 0.0844685509800911, 0.6935654878616333], [-0.06585267186164856, -0.5886367559432983, 0.09833985567092896, 1.0115991830825806], [-0.07762540876865387, -0.7849235534667969, 0.11857184022665024, 1.3334721326828003], [-0.09332387894392014, -0.981323778629303, 0.14524129033088684, 1.6607824563980103], [-0.11295035481452942, -0.7881622314453125, 0.17845693230628967, 1.4166418313980103], [-0.12871359288692474, -0.9849881529808044, 0.2067897766828537, 1.7593803405761719], [-0.14841336011886597, -1.1817649602890015, 0.24197737872600555, 2.1086208820343018], [0.040225785225629807, -0.16498391330242157, 0.02282954752445221, 0.30310261249542236], [0.03692610561847687, 0.029805360361933708, 0.02889159880578518, 0.01770613342523575], [0.03752221539616585, -0.16571876406669617, 0.02924572303891182, 0.3193628787994385], [0.03420783951878548, -0.3612447679042816, 0.03563297912478447, 0.6211234331130981], [0.026982944458723068, -0.5568457245826721, 0.04805544763803482, 0.9248125553131104], [0.015846028923988342, -0.36240464448928833, 0.06655170023441315, 0.6476104855537415], [0.008597936481237411, -0.5583875775337219, 0.07950390875339508, 0.9604859352111816], [-0.0025698160752654076, -0.7544829845428467, 0.09871362894773483, 1.2770494222640991], [-0.017659476026892662, -0.950715184211731, 0.12425461411476135, 1.5989394187927246], [-0.03667378053069115, -0.7572652101516724, 0.15623340010643005, 1.3474385738372803], [-0.0518190823495388, -0.9539674520492554, 0.18318217992782593, 1.6846442222595215], [-0.07089842855930328, -0.7613774538040161, 0.21687506139278412, 1.454147458076477], [-0.02625207230448723, 0.19954553246498108, -0.019524844363331795, -0.32540684938430786], [-0.022261161357164383, 0.39493995904922485, -0.026032982394099236, -0.6241825819015503], [-0.014362362213432789, 0.2001909464597702, -0.038516633212566376, -0.33981087803840637], [-0.010358543135225773, 0.3958391845226288, -0.045312851667404175, -0.6443866491317749], [-0.0024417599197477102, 0.2013770341873169, -0.05820058286190033, -0.3663102686405182], [0.001585780642926693, 0.007128350902348757, -0.06552679091691971, -0.09253191202878952], [0.0017283476190641522, -0.18699617683887482, -0.06737742573022842, 0.17877887189388275], [-0.0020115759689360857, 0.00902202446013689, -0.0638018473982811, -0.13437525928020477], [-0.001831135479733348, -0.185130774974823, -0.06648935377597809, 0.1375163495540619], [-0.005533750634640455, -0.3792405128479004, -0.06373903155326843, 0.4085041284561157], [-0.013118560425937176, -0.18327546119689941, -0.05556894466280937, 0.09642687439918518], [-0.016784070059657097, -0.37755876779556274, -0.05364040657877922, 0.3710731267929077], [-0.024335244670510292, -0.5718792080879211, -0.04621894657611847, 0.6463719010353088], [-0.03577283024787903, -0.7663277387619019, -0.03329150751233101, 0.9241496324539185], [-0.05109938606619835, -0.5707722902297974, -0.014808515086770058, 0.6211931109428406], [-0.06251483410596848, -0.7656843662261963, -0.0023846530821174383, 0.9091755747795105], [-0.07782851904630661, -0.5705301761627197, 0.015798859298229218, 0.6157441139221191], [-0.08923912048339844, -0.7658692598342896, 0.02811374142765999, 0.9133608341217041], [-0.10455650836229324, -0.5711386799812317, 0.04638095572590828, 0.6296446919441223], [-0.11597927659749985, -0.7668761014938354, 0.058973852545022964, 0.9365662336349487], [-0.13131679594516754, -0.5725969076156616, 0.07770517468452454, 0.6629823446273804], [-0.1427687406539917, -0.3786371350288391, 0.09096482396125793, 0.39574292302131653], [-0.1503414809703827, -0.5749240517616272, 0.09887968003749847, 0.7156628370285034], [-0.16183996200561523, -0.7712655663490295, 0.11319293826818466, 1.0377596616744995], [-0.17726527154445648, -0.9676949977874756, 0.13394813239574432, 1.363726019859314], [-0.1966191828250885, -1.1642162799835205, 0.1612226516008377, 1.695130467414856], [-0.21990349888801575, -1.3607898950576782, 0.1951252669095993, 2.0333614349365234], [-0.24711929261684418, -1.5573170185089111, 0.23579248785972595, 2.37956166267395], [-0.014745672233402729, 0.18155236542224884, -0.018298130482435226, -0.3075217306613922], [-0.011114625260233879, 0.37693020701408386, -0.024448566138744354, -0.6059187650680542], [-0.0035760209430009127, 0.572385311126709, -0.03656693920493126, -0.9062010049819946], [0.007871685549616814, 0.377777099609375, -0.05469096079468727, -0.6252320408821106], [0.01542722713202238, 0.1834595650434494, -0.0671956017613411, -0.35026270151138306], [0.01909641921520233, 0.3794696033000946, -0.07420085370540619, -0.6633548736572266], [0.0266858097165823, 0.1854540854692459, -0.08746795356273651, -0.394927442073822], [0.030394893139600754, 0.38170120120048523, -0.09536650031805038, -0.7138555645942688], [0.038028914481401443, 0.5780049562454224, -0.1096436157822609, -1.0349684953689575], [0.049589015543460846, 0.38449808955192566, -0.1303429901599884, -0.7786218523979187], [0.05727897956967354, 0.1913861781358719, -0.1459154188632965, -0.5296235084533691], [0.06110670045018196, 0.3882269263267517, -0.15650789439678192, -0.8644940257072449], [0.06887123733758926, 0.5850933194160461, -0.17379777133464813, -1.2020100355148315], [0.08057310432195663, 0.7819833755493164, -0.1978379786014557, -1.5437356233596802], [0.09621277451515198, 0.5897117257118225, -0.22871269285678864, -1.318739652633667], [0.024897782132029533, 0.2146768718957901, -0.01612795703113079, -0.33297836780548096], [0.02919132076203823, 0.019788138568401337, -0.02278752438724041, -0.045424703508615494], [0.02958708256483078, 0.2152293175458908, -0.023696018382906914, -0.3452093005180359], [0.033891670405864716, 0.020452314987778664, -0.030600203201174736, -0.060091808438301086], [0.03430071473121643, 0.21599934995174408, -0.031802039593458176, -0.3622700870037079], [0.03862070292234421, 0.4115585386753082, -0.03904744237661362, -0.6648087501525879], [0.04685187339782715, 0.21700087189674377, -0.052343618124723434, -0.38467177748680115], [0.05119188874959946, 0.022659609094262123, -0.06003705412149429, -0.10894113034009933], [0.051645081490278244, -0.17155292630195618, -0.06221587583422661, 0.16421250998973846], [0.04821402579545975, -0.3657316267490387, -0.0589316263794899, 0.43663734197616577], [0.04089939221739769, -0.16982713341712952, -0.05019887909293175, 0.1259748786687851], [0.037502847611904144, 0.02597668021917343, -0.04767937958240509, -0.1821131408214569], [0.03802238404750824, 0.22174730896949768, -0.051321644335985184, -0.48944777250289917], [0.042457327246665955, 0.4175542891025543, -0.06111059710383415, -0.7978534698486328], [0.050808414816856384, 0.22332166135311127, -0.07706766575574875, -0.5250037312507629], [0.055274847894907, 0.029364027082920074, -0.08756774663925171, -0.25756630301475525], [0.05586212873458862, 0.22561992704868317, -0.09271907061338425, -0.5765342116355896], [0.06037452816963196, 0.4219108521938324, -0.1042497530579567, -0.8969262838363647], [0.06881274282932281, 0.6182798147201538, -0.1221882775425911, -1.2204744815826416], [0.08117833733558655, 0.814746081829071, -0.14659777283668518, -1.5488107204437256], [0.09747326374053955, 1.011291742324829, -0.17757397890090942, -1.883412480354309], [0.11769909411668777, 0.8184921145439148, -0.21524223685264587, -1.6506935358047485]], "action_prob": [0.5000100135803223, 0.500657856464386, 0.49998340010643005, 0.5006839632987976, 0.49995067715644836, 0.4992848038673401, 0.4988258481025696, 0.4985869824886322, 0.49847471714019775, 0.5015859603881836, 0.5016244053840637, 0.498379647731781, 0.5017053484916687, 0.49828311800956726, 0.4999530613422394, 0.49930837750434875, 0.5011299848556519, 0.5007315278053284, 0.49989625811576843, 0.50075364112854, 0.5001312494277954, 0.4994763731956482, 0.500995397567749, 0.5005540251731873, 0.5000984072685242, 0.49943283200263977, 0.5010440945625305, 0.49938657879829407, 0.5010883808135986, 0.5006720423698425, 0.49995437264442444, 0.49928539991378784, 0.5011690258979797, 0.49920862913131714, 0.5012298822402954, 0.5008807182312012, 0.5003154873847961, 0.49967753887176514, 0.5008283853530884, 0.49972090125083923, 0.5008116960525513, 0.4997633993625641, 0.5007919073104858, 0.49980559945106506, 0.5007688403129578, 0.4998483657836914, 0.4992578327655792, 0.49886491894721985, 0.5013427734375, 0.49882373213768005, 0.5013925433158875, 0.5012201070785522, 0.5008058547973633, 0.5001656413078308, 0.49951109290122986, 0.49903517961502075, 0.5012499094009399, 0.4989491105079651, 0.49867406487464905, 0.4985167980194092, 0.49841663241386414, 0.5016590356826782, 0.49996182322502136, 0.500686526298523, 0.49994826316833496, 0.4992973506450653, 0.4988510310649872, 0.5013833045959473, 0.4987780749797821, 0.4985520541667938, 0.5015519261360168, 0.49846112728118896, 0.5016310214996338, 0.4983671307563782, 0.5017122030258179, 0.4982711374759674, 0.49987712502479553, 0.49922803044319153, 0.49879711866378784, 0.4985792636871338, 0.49847882986068726, 0.49842414259910583, 0.49838152527809143, 0.501660168170929, 0.49826866388320923, 0.4999610483646393, 0.499315083026886, 0.4988729655742645, 0.50135737657547, 0.4988080859184265, 0.5014165639877319, 0.49873462319374084, 0.498521625995636, 0.5015690922737122, 0.4984346628189087, 0.5016424059867859, 0.5016542077064514, 0.5015841722488403, 0.49863725900650024, 0.5016602873802185, 0.500075101852417, 0.5005845427513123, 0.49992942810058594, 0.5007125735282898, 0.5000924468040466, 0.49943211674690247, 0.5010431408882141, 0.49939945340156555, 0.4989211857318878, 0.5013351440429688, 0.5011467933654785, 0.4992688000202179, 0.5011981725692749, 0.5008050799369812, 0.4998015761375427, 0.500862181186676, 0.49972623586654663, 0.49907585978507996, 0.49866941571235657, 0.4984758496284485, 0.49838903546333313, 0.501660168170929, 0.49828797578811646, 0.4982461929321289, 0.5000330209732056, 0.500632107257843, 0.49999913573265076, 0.49933600425720215, 0.49888184666633606, 0.501356840133667, 0.4988001883029938, 0.4985748827457428, 0.4984682500362396, 0.5015923380851746, 0.4983668625354767, 0.5016850829124451, 0.4999419152736664, 0.49929317831993103, 0.5011399984359741, 0.49923276901245117, 0.5011923909187317, 0.5008400678634644, 0.500261664390564, 0.5003881454467773, 0.5003105998039246, 0.49965718388557434, 0.5008652806282043, 0.4996775984764099, 0.49913617968559265, 0.4988100528717041, 0.501353919506073, 0.4987470805644989, 0.5014162063598633, 0.4986792206764221, 0.5014784336090088, 0.49860599637031555, 0.5015408992767334, 0.5014726519584656, 0.4987614154815674, 0.49846774339675903, 0.49835261702537537, 0.49831050634384155, 0.49828651547431946, 0.498261958360672, 0.49998679757118225, 0.4993278384208679, 0.498876690864563, 0.5013596415519714, 0.5012004971504211, 0.4991665482521057, 0.5012610554695129, 0.4990767240524292, 0.4986724853515625, 0.5015209317207336, 0.5014238357543945, 0.498835027217865, 0.49849894642829895, 0.4983469247817993, 0.5017261505126953, 0.49987179040908813, 0.5007697343826294, 0.4998398423194885, 0.5007998943328857, 0.4998007118701935, 0.4991644620895386, 0.5012416839599609, 0.5009049773216248, 0.5003365874290466, 0.4996830224990845, 0.500834047794342, 0.5003024339675903, 0.49960386753082275, 0.49901333451271057, 0.5013343095779419, 0.5010706782341003, 0.49941888451576233, 0.49886074662208557, 0.49855291843414307, 0.4984089136123657, 0.49833613634109497, 0.5017135739326477], "advantages": [13.125404357910156, 12.250706672668457, 11.36159896850586, 10.469091415405273, 9.562016487121582, 8.65133285522461, 7.730805397033691, 6.800206661224365, 5.859601974487305, 4.909091472625732, 3.9482438564300537, 2.9774303436279297, 1.998110055923462, 1.0077422857284546, 38.270782470703125, 37.65000915527344, 37.02239227294922, 36.38400650024414, 35.7386589050293, 35.09236526489258, 34.433990478515625, 33.769004821777344, 33.09789276123047, 32.42435836791992, 31.744571685791016, 31.05234146118164, 30.35371971130371, 29.652414321899414, 28.93963050842285, 28.223974227905273, 27.501619338989258, 26.76646614074707, 26.024580001831055, 25.279312133789062, 24.522445678710938, 23.761877059936523, 22.994182586669922, 22.218915939331055, 21.435501098632812, 20.639095306396484, 19.83983039855957, 19.02724838256836, 18.2117862701416, 17.382720947265625, 16.550708770751953, 15.70483684539795, 14.855917930603027, 13.997980117797852, 13.130800247192383, 12.251453399658203, 11.366754531860352, 10.469561576843262, 9.562685012817383, 8.64635944366455, 7.721105098724365, 6.787254810333252, 5.844706058502197, 4.894623279571533, 3.9329798221588135, 2.9621500968933105, 1.9818251132965088, 0.9917629957199097, 13.125761985778809, 12.250967979431152, 11.361844062805176, 10.469256401062012, 9.56702709197998, 8.654949188232422, 7.730889797210693, 6.800281524658203, 5.859670162200928, 4.908054828643799, 3.948296070098877, 2.9774961471557617, 1.9981575012207031, 1.007799744606018, 8.648493766784668, 7.728548526763916, 6.798666000366211, 5.858639717102051, 4.908530235290527, 3.9484264850616455, 2.978374481201172, 1.9983742237091064, 1.0084971189498901, 13.994478225708008, 13.122976303100586, 12.243228912353516, 11.355305671691895, 10.46144962310791, 9.555488586425781, 8.643380165100098, 7.719051837921143, 6.786016464233398, 5.845231533050537, 4.893308162689209, 3.933274507522583, 2.9639058113098145, 1.9851990938186646, 0.9932188987731934, 21.431838989257812, 20.640995025634766, 19.836551666259766, 19.02409553527832, 18.208877563476562, 17.385478973388672, 16.55322265625, 15.707995414733887, 14.858841896057129, 14.000370979309082, 13.130142211914062, 12.25046443939209, 11.366430282592773, 10.469029426574707, 9.562077522277832, 8.651479721069336, 7.7262282371521, 6.797046184539795, 5.857715129852295, 4.908082962036133, 3.9482603073120117, 2.978358745574951, 1.9981402158737183, 1.0084782838821411, 11.36162281036377, 10.469096183776855, 9.562047958374023, 8.651341438293457, 7.730762958526611, 6.800109386444092, 5.857425689697266, 4.907827377319336, 3.948028564453125, 2.9781436920166016, 1.9978781938552856, 1.0082449913024902, 24.52773666381836, 23.76262664794922, 22.99045753479004, 22.21461296081543, 21.426807403564453, 20.63507652282715, 19.835920333862305, 19.028833389282227, 18.20790672302246, 17.38439178466797, 16.552217483520508, 15.70658016204834, 14.857549667358398, 13.9993314743042, 13.131839752197266, 12.252973556518555, 11.36793327331543, 10.471271514892578, 9.568290710449219, 8.653509140014648, 7.732186317443848, 6.798952102661133, 5.855734348297119, 4.906819820404053, 3.947556734085083, 2.9780404567718506, 1.99836003780365, 1.0085536241531372, 13.994028091430664, 13.12248420715332, 12.242781639099121, 11.354951858520508, 10.460887908935547, 9.558425903320312, 8.642733573913574, 7.72177791595459, 6.787607669830322, 5.844823837280273, 4.894741535186768, 3.935561418533325, 2.9634037017822266, 1.9822415113449097, 0.9917032122612, 19.83658790588379, 19.02409553527832, 18.20884895324707, 17.37990951538086, 16.548017501831055, 15.702301025390625, 14.848745346069336, 13.990571022033691, 13.124308586120605, 12.249452590942383, 11.365361213684082, 10.467408180236816, 9.560039520263672, 8.643903732299805, 7.71931791305542, 6.788796424865723, 5.849488735198975, 4.895953178405762, 3.9336626529693604, 2.9623782634735107, 1.9817637205123901, 0.9915335178375244], "value_targets": [13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1483372751, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931, 1732281931], "obs": [[0.0409204363822937, -0.0018227597465738654, 0.03385833650827408, 0.028363829478621483], [0.04088398069143295, 0.1927976906299591, 0.03442561626434326, -0.2534470856189728], [0.04473993554711342, -0.0027984711341559887, 0.02935667335987091, 0.04989245906472206], [0.04468396306037903, 0.19189050793647766, 0.030354522168636322, -0.23338554799556732], [0.048521775752305984, -0.003651717910543084, 0.02568681165575981, 0.06871552020311356], [0.04844874143600464, 0.19109272956848145, 0.02706112153828144, -0.2157536894083023], [0.052270594984292984, 0.3858175575733185, 0.022746047005057335, -0.49977901577949524], [0.05998694524168968, 0.1903824657201767, 0.012750467285513878, -0.20001541078090668], [0.06379459798336029, -0.004919512663036585, 0.008750159293413162, 0.0966622605919838], [0.06369620561599731, -0.2001657783985138, 0.01068340428173542, 0.3920929431915283], [0.05969288945198059, -0.005197052378207445, 0.0185252632945776, 0.10279742628335953], [0.059588950127363205, 0.18965457379817963, 0.020581211894750595, -0.18398375809192657], [0.06338203698396683, -0.00575571833178401, 0.016901537775993347, 0.1151200607419014], [0.06326692551374435, 0.18912002444267273, 0.01920393854379654, -0.17218299210071564], [0.06704932451248169, -0.006271436810493469, 0.015760278329253197, 0.12649577856063843], [0.06692389398813248, 0.18862122297286987, 0.018290193751454353, -0.16117358207702637], [0.07069632411003113, 0.3834766149520874, 0.01506672240793705, -0.4480307698249817], [0.07836585491895676, 0.5783822536468506, 0.00610610656440258, -0.7359265685081482], [0.08993349969387054, 0.7734193205833435, -0.008612425066530704, -1.0266815423965454], [0.1054018884897232, 0.5784130692481995, -0.02914605662226677, -0.7367150783538818], [0.11697014421224594, 0.3837055563926697, -0.04388035833835602, -0.45334553718566895], [0.12464425712823868, 0.5794196724891663, -0.0529472678899765, -0.759530782699585], [0.1362326592206955, 0.7752296328544617, -0.06813788414001465, -1.068393349647522], [0.151737242937088, 0.5810718536376953, -0.08950575441122055, -0.7978495955467224], [0.1633586883544922, 0.7773004174232483, -0.10546274483203888, -1.1172937154769897], [0.1789046972990036, 0.5837085247039795, -0.1278086155653, -0.8594678640365601], [0.1905788630247116, 0.39053741097450256, -0.1449979692697525, -0.6095480918884277], [0.19838960468769073, 0.1977081000804901, -0.15718893706798553, -0.3658196032047272], [0.20234377682209015, 0.39467379450798035, -0.16450533270835876, -0.70364910364151], [0.21023724973201752, 0.20216742157936096, -0.17857831716537476, -0.4669346809387207], [0.21428059041500092, 0.3993034362792969, -0.18791700899600983, -0.8101595640182495], [0.22226665914058685, 0.20718444883823395, -0.2041201889514923, -0.581977367401123], [-0.0383063405752182, -0.038008976727724075, -0.01880093663930893, 0.03184643015265465], [-0.03906651958823204, -0.23285633325576782, -0.018164008855819702, 0.3185386657714844], [-0.04372364655137062, -0.03748046234250069, -0.011793235316872597, 0.020183268934488297], [-0.044473256915807724, 0.15780861675739288, -0.01138957031071186, -0.2761971056461334], [-0.041317086666822433, -0.03714900463819504, -0.016913512721657753, 0.012871895916759968], [-0.042060066014528275, -0.23202435672283173, -0.016656074672937393, 0.30017077922821045], [-0.046700552105903625, -0.036669012159109116, -0.01065265852957964, 0.002281747991219163], [-0.04743393138051033, 0.15860408544540405, -0.010607023723423481, -0.2937431037425995], [-0.04426185041666031, -0.036365047097206116, -0.016481885686516762, -0.004424257203936577], [-0.04498915374279022, -0.23124679923057556, -0.01657037064433098, 0.2830131947994232], [-0.049614086747169495, -0.035892464220523834, -0.01091010682284832, -0.014849530532956123], [-0.05033193901181221, -0.2308562695980072, -0.011207097209990025, 0.27437126636505127], [-0.054949063807725906, -0.035576216876506805, -0.005719671957194805, -0.021825233474373817], [-0.055660586804151535, -0.23061567544937134, -0.006156176328659058, 0.2690475881099701], [-0.06027290225028992, -0.03540641814470291, -0.0007752245874144137, -0.02557065151631832], [-0.06098102778196335, 0.15972664952278137, -0.0012866376200690866, -0.31849807500839233], [-0.0577864944934845, 0.3548668920993805, -0.0076565989293158054, -0.6115864515304565], [-0.05068915709853172, 0.1598527878522873, -0.01988832838833332, -0.3213249146938324], [-0.04749210178852081, -0.034980375319719315, -0.02631482668220997, -0.034979745745658875], [-0.04819171130657196, 0.16050885617733002, -0.027014421299099922, -0.33584773540496826], [-0.04498153179883957, -0.034218430519104004, -0.0337313748896122, -0.05180465430021286], [-0.04566590115427971, 0.16137054562568665, -0.03476747125387192, -0.3549363613128662], [-0.04243848845362663, -0.03324025496840477, -0.04186619818210602, -0.07341615855693817], [-0.04310329630970955, -0.22773776948451996, -0.04333452135324478, 0.2057694047689438], [-0.047658052295446396, -0.4222141206264496, -0.03921913355588913, 0.48447367548942566], [-0.05610233172774315, -0.2265612632036209, -0.02952965907752514, 0.17969262599945068], [-0.06063355877995491, -0.031029460951685905, -0.025935806334018707, -0.12215767055749893], [-0.061254147440195084, -0.22577041387557983, -0.028378959745168686, 0.16223125159740448], [-0.06576955318450928, -0.4204748570919037, -0.025134334340691566, 0.44582802057266235], [-0.07417905330657959, -0.22500649094581604, -0.016217773780226707, 0.14532937109470367], [-0.07867918163537979, -0.41989248991012573, -0.01331118680536747, 0.4328520894050598], [-0.08707702904939651, -0.22458460927009583, -0.0046541448682546616, 0.13600286841392517], [-0.091568723320961, -0.029396312311291695, -0.0019340873695909977, -0.1581447273492813], [-0.09215664863586426, 0.16575327515602112, -0.005096981767565012, -0.45143717527389526], [-0.08884158730506897, -0.02929621934890747, -0.014125725254416466, -0.1603652387857437], [-0.08942750841379166, -0.2242131233215332, -0.017333030700683594, 0.12782812118530273], [-0.09391177445650101, -0.028847211971879005, -0.014776468276977539, -0.17027238011360168], [-0.0944887176156044, -0.22375458478927612, -0.01818191632628441, 0.11771263182163239], [-0.09896380454301834, -0.028376903384923935, -0.015827663242816925, -0.18065063655376434], [-0.09953134506940842, 0.16696791350841522, -0.019440675154328346, -0.4782842993736267], [-0.09619198739528656, -0.02787424810230732, -0.029006361961364746, -0.19179148972034454], [-0.09674946963787079, 0.16765038669109344, -0.03284219279885292, -0.49348175525665283], [-0.09339646250009537, -0.026993339881300926, -0.04271182790398598, -0.211327463388443], [-0.09393633157014847, -0.2214794009923935, -0.046938374638557434, 0.06758211553096771], [-0.098365917801857, -0.41589805483818054, -0.045586735010147095, 0.34509408473968506], [-0.1066838800907135, -0.22015827894210815, -0.03868485242128372, 0.038391582667827606], [-0.11108704656362534, -0.024503551423549652, -0.03791702166199684, -0.2662414312362671], [-0.1115771159529686, -0.219064399600029, -0.043241847306489944, 0.014245135709643364], [-0.11595840752124786, -0.023349842056632042, -0.042956944555044174, -0.2917614281177521], [-0.11642540246248245, -0.21783380210399628, -0.04879217594861984, -0.012930049560964108], [-0.12078207731246948, -0.02204730175435543, -0.04905077442526817, -0.3205994963645935], [-0.12122302502393723, -0.21643763780593872, -0.05546276643872261, -0.04377984628081322], [-0.12555177509784698, -0.4107222259044647, -0.0563383623957634, 0.23090121150016785], [-0.13376621901988983, -0.6049957871437073, -0.05172033980488777, 0.5052944421768188], [-0.14586614072322845, -0.7993521690368652, -0.04161445051431656, 0.7812402248382568], [-0.16185317933559418, -0.9938781261444092, -0.02598964422941208, 1.0605454444885254], [-0.1817307472229004, -0.7984218001365662, -0.004778735805302858, 0.7598198652267456], [-0.197699174284935, -0.6032343506813049, 0.01041766069829464, 0.4656370282173157], [-0.20976386964321136, -0.7985019087791443, 0.019730402156710625, 0.7615852952003479], [-0.2257339060306549, -0.6036572456359863, 0.03496210649609566, 0.47517549991607666], [-0.23780705034732819, -0.4090459942817688, 0.04446561634540558, 0.19371378421783447], [-0.24598796665668488, -0.21458739042282104, 0.04833989217877388, -0.08461721986532211], [-0.2502797245979309, -0.4103677272796631, 0.04664754867553711, 0.2229166477918625], [-0.2584870755672455, -0.21594248712062836, 0.05110588297247887, -0.054694581776857376], [-0.26280590891838074, -0.41175854206085205, 0.05001198872923851, 0.25366461277008057], [-0.2710410952568054, -0.21738505363464355, 0.055085282772779465, -0.022833678871393204], [-0.27538880705833435, -0.023094577714800835, 0.054628610610961914, -0.29764047265052795], [-0.27585068345069885, -0.21895098686218262, 0.04867579787969589, 0.011758710257709026], [-0.28022971749305725, -0.02455967664718628, 0.04891097545623779, -0.265177845954895], [-0.28072088956832886, -0.22034436464309692, 0.04360741749405861, 0.04252207279205322], [-0.28512778878211975, -0.025873983278870583, 0.04445786029100418, -0.23608967661857605], [-0.2856452763080597, -0.22160197794437408, 0.0397360660135746, 0.07027853280305862], [-0.2900772988796234, -0.027071572840213776, 0.04114163666963577, -0.20960740745067596], [-0.29061874747276306, 0.16743870079517365, 0.036949485540390015, -0.48903369903564453], [-0.2872699499130249, -0.028184527531266212, 0.027168814092874527, -0.1849384754896164], [-0.28783366084098816, -0.22368445992469788, 0.023470044136047363, 0.1161898598074913], [-0.2923073470592499, -0.4191347062587738, 0.02579384110867977, 0.41618403792381287], [-0.30069002509117126, -0.22438763082027435, 0.034117523580789566, 0.1317431479692459], [-0.3051777780056, -0.029770584776997566, 0.03675238415598869, -0.14998392760753632], [-0.30577319860458374, 0.1648063361644745, 0.03375270590186119, -0.43084946274757385], [-0.30247706174850464, -0.030776895582675934, 0.025135716423392296, -0.12772028148174286], [-0.3030925989151001, 0.16397611796855927, 0.02258131094276905, -0.41236841678619385], [-0.29981309175491333, -0.031458530575037, 0.014333942905068398, -0.11265283077955246], [-0.30044224858283997, -0.2267829030752182, 0.012080886401236057, 0.18451768159866333], [-0.3049779236316681, -0.031835880130529404, 0.01577123999595642, -0.10432983934879303], [-0.3056146204471588, -0.22718025743961334, 0.013684643432497978, 0.19328683614730835], [-0.31015825271606445, -0.032256707549095154, 0.017550379037857056, -0.09504794329404831], [-0.3108033835887909, 0.16260935366153717, 0.015649421140551567, -0.38214248418807983], [-0.30755117535591125, -0.03273126110434532, 0.008006570860743523, -0.08456669002771378], [-0.30820581316947937, 0.1622750163078308, 0.0063152373768389225, -0.37471282482147217], [-0.30496031045913696, 0.35730668902397156, -0.0011790188727900386, -0.6653978228569031], [-0.29781419038772583, 0.5524449944496155, -0.014486975967884064, -0.9584517478942871], [-0.28676527738571167, 0.7477587461471558, -0.03365601226687431, -1.2556506395339966], [-0.2718101143836975, 0.5530834794044495, -0.058769021183252335, -0.9736960530281067], [-0.2607484459877014, 0.3587971031665802, -0.0782429426908493, -0.7000378370285034], [-0.2535724937915802, 0.16484203934669495, -0.09224370121955872, -0.43297526240348816], [-0.2502756416797638, -0.02886107936501503, -0.10090320557355881, -0.17073705792427063], [-0.25085288286209106, -0.22240489721298218, -0.10431794822216034, 0.08848678320646286], [-0.25530096888542175, -0.025954362004995346, -0.10254821181297302, -0.23520098626613617], [-0.25582006573677063, 0.17047184705734253, -0.10725223273038864, -0.5583887696266174], [-0.2524106204509735, -0.022994063794612885, -0.11842000484466553, -0.3013291358947754], [-0.25287050008773804, -0.2162466198205948, -0.12444659322500229, -0.0482146255671978], [-0.25719544291496277, -0.40938475728034973, -0.12541088461875916, 0.20275917649269104], [-0.26538312435150146, -0.6025108695030212, -0.12135569751262665, 0.45339900255203247], [-0.2774333357810974, -0.40590062737464905, -0.1122877225279808, 0.12506155669689178], [-0.28555136919021606, -0.20936407148838043, -0.1097864881157875, -0.20082995295524597], [-0.28973865509033203, -0.40275856852531433, -0.11380308866500854, 0.05530289560556412], [-0.29779380559921265, -0.5960804224014282, -0.11269702762365341, 0.3100239336490631], [-0.3097154200077057, -0.7894313931465149, -0.10649655014276505, 0.5651477575302124], [-0.32550403475761414, -0.5929892063140869, -0.09519359469413757, 0.24090297520160675], [-0.3373638391494751, -0.7866315245628357, -0.09037553519010544, 0.5021067261695862], [-0.35309645533561707, -0.9803711175918579, -0.0803333967924118, 0.7649959325790405], [-0.37270388007164, -0.7842402458190918, -0.06503348052501678, 0.4481557607650757], [-0.3883886933326721, -0.9783849120140076, -0.05607036501169205, 0.7196507453918457], [-0.40795639157295227, -1.1726881265640259, -0.04167735204100609, 0.9941714406013489], [-0.43141016364097595, -0.9770341515541077, -0.021793924272060394, 0.6886957287788391], [-0.45095083117485046, -1.1718469858169556, -0.008020007982850075, 0.9744386672973633], [-0.4743877649307251, -0.9766182899475098, 0.011468765325844288, 0.6792473196983337], [-0.49392014741897583, -0.7816575169563293, 0.025053711608052254, 0.39019712805747986], [-0.5095533132553101, -0.586899995803833, 0.03285765275359154, 0.10551746189594269], [-0.5212913155555725, -0.39226391911506653, 0.03496800363063812, -0.17662061750888824], [-0.5291365385055542, -0.5878683924674988, 0.031435590237379074, 0.12688523530960083], [-0.5408939123153687, -0.3932105600833893, 0.033973295241594315, -0.15571673214435577], [-0.5487581491470337, -0.5888020396232605, 0.03085896000266075, 0.14748743176460266], [-0.5605341792106628, -0.3941352665424347, 0.03380870819091797, -0.1353025883436203], [-0.5684168934822083, -0.1995134949684143, 0.031102657318115234, -0.41713058948516846], [-0.5724071860313416, -0.0048458087258040905, 0.022760044783353806, -0.6998481750488281], [-0.5725041031837463, -0.20027577877044678, 0.008763082325458527, -0.40008828043937683], [-0.5765095949172974, -0.3955209255218506, 0.0007613165653310716, -0.10465546697378159], [-0.5844200253486633, -0.2004099041223526, -0.001331792795099318, -0.3970980942249298], [-0.5884281992912292, -0.3955129384994507, -0.009273755364120007, -0.10483536869287491], [-0.5963384509086609, -0.5905007719993591, -0.011370462365448475, 0.18490736186504364], [-0.608148455619812, -0.39521798491477966, -0.007672314997762442, -0.1113407164812088], [-0.6160528659820557, -0.19998693466186523, -0.009899129159748554, -0.4064342975616455], [-0.6200525760650635, -0.39496713876724243, -0.018027815967798233, -0.11688864976167679], [-0.6279519200325012, -0.19959157705307007, -0.02036558836698532, -0.415204256772995], [-0.6319437623023987, -0.3944190442562103, -0.028669673949480057, -0.12901070713996887], [-0.6398321390151978, -0.19889837503433228, -0.031249888241291046, -0.4305989146232605], [-0.6438100934028625, -0.3935641944408417, -0.03986186534166336, -0.14792872965335846], [-0.6516813635826111, -0.5880933403968811, -0.042820438742637634, 0.13191688060760498], [-0.6634432673454285, -0.7825765609741211, -0.04018210247159004, 0.41078898310661316], [-0.6790947914123535, -0.5869086980819702, -0.031966324895620346, 0.10571370273828506], [-0.6908329725265503, -0.7815582752227783, -0.02985204942524433, 0.388142466545105], [-0.7064641118049622, -0.586025595664978, -0.022089200094342232, 0.08619891852140427], [-0.7181846499443054, -0.7808240652084351, -0.020365221425890923, 0.37183162569999695], [-0.7338011264801025, -0.5854188203811646, -0.01292858924716711, 0.07279756665229797], [-0.7455095052719116, -0.3901139199733734, -0.011472637765109539, -0.22393618524074554], [-0.7533117532730103, -0.19482991099357605, -0.015951361507177353, -0.5202158093452454], [-0.7572083473205566, 0.0005129263736307621, -0.026355678215622902, -0.8178822994232178], [-0.7571980953216553, -0.19423852860927582, -0.04271332547068596, -0.5336042642593384], [-0.7610828876495361, -0.3887345492839813, -0.0533854104578495, -0.25468018651008606], [-0.7688575983047485, -0.5830552577972412, -0.05847901478409767, 0.02069769985973835], [-0.780518651008606, -0.3871455192565918, -0.058065060526132584, -0.28984758257865906], [-0.7882615923881531, -0.5813934803009033, -0.06386201083660126, -0.016028210520744324], [-0.7998894453048706, -0.38541656732559204, -0.0641825720667839, -0.3281570076942444], [-0.807597815990448, -0.18944239616394043, -0.07074571400880814, -0.640369713306427], [-0.8113866448402405, 0.006590821780264378, -0.08355311304330826, -0.954465925693512], [-0.8112547993659973, -0.18731378018856049, -0.10264242440462112, -0.6891596913337708], [-0.8150010704994202, -0.38087278604507446, -0.11642561852931976, -0.4304731786251068], [-0.8226185441017151, -0.18431125581264496, -0.1250350922346115, -0.7574713230133057], [-0.8263047933578491, 0.012291714549064636, -0.14018450677394867, -1.086738109588623], [-0.8260589241981506, -0.18073126673698425, -0.16191928088665009, -0.8411233425140381], [-0.8296735882759094, -0.3733164668083191, -0.17874173820018768, -0.6034206748008728], [-0.837139904499054, -0.5655478239059448, -0.1908101588487625, -0.3719382584095001], [-0.8484508395195007, -0.757519543170929, -0.19824892282485962, -0.14496520161628723], [-0.8636012673377991, -0.9493318796157837, -0.20114822685718536, 0.07921355962753296], [-0.8825879096984863, -1.1410874128341675, -0.19956395030021667, 0.30230793356895447], [-0.9054096341133118, -0.9437638521194458, -0.1935177892446518, -0.046086084097623825], [-0.9242849349975586, -1.1356604099273682, -0.19443951547145844, 0.1798458993434906], [-0.946998119354248, -0.9383646249771118, -0.19084259867668152, -0.16732662916183472], [-0.9657654166221619, -1.1303154230117798, -0.1941891312599182, 0.059604424983263016], [-0.988371729850769, -1.3221997022628784, -0.1929970383644104, 0.2852875888347626], [-1.0148156881332397, -1.5141206979751587, -0.18729129433631897, 0.5114346146583557], [-1.0450981855392456, -1.316922903060913, -0.17706260085105896, 0.16606837511062622], [-1.0714366436004639, -1.5091266632080078, -0.17374123632907867, 0.3980816602706909], [-1.1016191244125366, -1.7014130353927612, -0.16577959060668945, 0.6313455104827881], [-1.1356474161148071, -1.8938814401626587, -0.1531526893377304, 0.8675737977027893], [-1.1735249757766724, -2.08662486076355, -0.13580121099948883, 1.1084538698196411], [-1.2152575254440308, -1.8900052309036255, -0.11363213509321213, 0.7764367461204529], [-1.253057599067688, -2.0833961963653564, -0.09810339659452438, 1.0313165187835693], [-1.2947255373001099, -1.8871158361434937, -0.07747706770896912, 0.7095152735710144], [-1.332467794418335, -1.6910110712051392, -0.06328675895929337, 0.39348524808883667], [-1.3662880659103394, -1.4950509071350098, -0.05541705712676048, 0.08153942972421646], [-1.3961890935897827, -1.2991801500320435, -0.0537862703204155, -0.22809995710849762], [-1.4221726655960083, -1.1033324003219604, -0.058348268270492554, -0.5372521877288818], [-1.4442393779754639, -1.297587513923645, -0.06909330934286118, -0.2635100185871124], [-1.4701911211013794, -1.1015509366989136, -0.07436351478099823, -0.577160656452179], [-1.4922220706939697, -0.9054697155952454, -0.0859067291021347, -0.8923122882843018], [-1.5103315114974976, -1.0993279218673706, -0.1037529706954956, -0.6278228759765625], [-1.532318115234375, -1.292860507965088, -0.11630942672491074, -0.3695337474346161], [-1.5581753253936768, -1.4861544370651245, -0.1237001046538353, -0.11566976457834244], [-1.5878983736038208, -1.6793067455291748, -0.12601350247859955, 0.13556984066963196], [-1.6214845180511475, -1.8724197149276733, -0.12330210208892822, 0.38599228858947754], [-1.6589329242706299, -1.6757827997207642, -0.11558225750923157, 0.057117242366075516], [-1.6924484968185425, -1.8690741062164307, -0.11443991214036942, 0.3112141191959381], [-1.729830026626587, -1.6725234985351562, -0.10821563005447388, -0.015255188569426537], [-1.7632805109024048, -1.476029396057129, -0.10852073132991791, -0.34002554416656494], [-1.7928011417388916, -1.2795442342758179, -0.11532124131917953, -0.6648621559143066], [-1.8183919191360474, -1.4728891849517822, -0.12861847877502441, -0.41060030460357666], [-1.847849726676941, -1.6659754514694214, -0.13683049380779266, -0.16107283532619476]], "actions": [1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[0.04088398069143295, 0.1927976906299591, 0.03442561626434326, -0.2534470856189728], [0.04473993554711342, -0.0027984711341559887, 0.02935667335987091, 0.04989245906472206], [0.04468396306037903, 0.19189050793647766, 0.030354522168636322, -0.23338554799556732], [0.048521775752305984, -0.003651717910543084, 0.02568681165575981, 0.06871552020311356], [0.04844874143600464, 0.19109272956848145, 0.02706112153828144, -0.2157536894083023], [0.052270594984292984, 0.3858175575733185, 0.022746047005057335, -0.49977901577949524], [0.05998694524168968, 0.1903824657201767, 0.012750467285513878, -0.20001541078090668], [0.06379459798336029, -0.004919512663036585, 0.008750159293413162, 0.0966622605919838], [0.06369620561599731, -0.2001657783985138, 0.01068340428173542, 0.3920929431915283], [0.05969288945198059, -0.005197052378207445, 0.0185252632945776, 0.10279742628335953], [0.059588950127363205, 0.18965457379817963, 0.020581211894750595, -0.18398375809192657], [0.06338203698396683, -0.00575571833178401, 0.016901537775993347, 0.1151200607419014], [0.06326692551374435, 0.18912002444267273, 0.01920393854379654, -0.17218299210071564], [0.06704932451248169, -0.006271436810493469, 0.015760278329253197, 0.12649577856063843], [0.06692389398813248, 0.18862122297286987, 0.018290193751454353, -0.16117358207702637], [0.07069632411003113, 0.3834766149520874, 0.01506672240793705, -0.4480307698249817], [0.07836585491895676, 0.5783822536468506, 0.00610610656440258, -0.7359265685081482], [0.08993349969387054, 0.7734193205833435, -0.008612425066530704, -1.0266815423965454], [0.1054018884897232, 0.5784130692481995, -0.02914605662226677, -0.7367150783538818], [0.11697014421224594, 0.3837055563926697, -0.04388035833835602, -0.45334553718566895], [0.12464425712823868, 0.5794196724891663, -0.0529472678899765, -0.759530782699585], [0.1362326592206955, 0.7752296328544617, -0.06813788414001465, -1.068393349647522], [0.151737242937088, 0.5810718536376953, -0.08950575441122055, -0.7978495955467224], [0.1633586883544922, 0.7773004174232483, -0.10546274483203888, -1.1172937154769897], [0.1789046972990036, 0.5837085247039795, -0.1278086155653, -0.8594678640365601], [0.1905788630247116, 0.39053741097450256, -0.1449979692697525, -0.6095480918884277], [0.19838960468769073, 0.1977081000804901, -0.15718893706798553, -0.3658196032047272], [0.20234377682209015, 0.39467379450798035, -0.16450533270835876, -0.70364910364151], [0.21023724973201752, 0.20216742157936096, -0.17857831716537476, -0.4669346809387207], [0.21428059041500092, 0.3993034362792969, -0.18791700899600983, -0.8101595640182495], [0.22226665914058685, 0.20718444883823395, -0.2041201889514923, -0.581977367401123], [0.22641035914421082, 0.015418819151818752, -0.215759739279747, -0.35989606380462646], [-0.03906651958823204, -0.23285633325576782, -0.018164008855819702, 0.3185386657714844], [-0.04372364655137062, -0.03748046234250069, -0.011793235316872597, 0.020183268934488297], [-0.044473256915807724, 0.15780861675739288, -0.01138957031071186, -0.2761971056461334], [-0.041317086666822433, -0.03714900463819504, -0.016913512721657753, 0.012871895916759968], [-0.042060066014528275, -0.23202435672283173, -0.016656074672937393, 0.30017077922821045], [-0.046700552105903625, -0.036669012159109116, -0.01065265852957964, 0.002281747991219163], [-0.04743393138051033, 0.15860408544540405, -0.010607023723423481, -0.2937431037425995], [-0.04426185041666031, -0.036365047097206116, -0.016481885686516762, -0.004424257203936577], [-0.04498915374279022, -0.23124679923057556, -0.01657037064433098, 0.2830131947994232], [-0.049614086747169495, -0.035892464220523834, -0.01091010682284832, -0.014849530532956123], [-0.05033193901181221, -0.2308562695980072, -0.011207097209990025, 0.27437126636505127], [-0.054949063807725906, -0.035576216876506805, -0.005719671957194805, -0.021825233474373817], [-0.055660586804151535, -0.23061567544937134, -0.006156176328659058, 0.2690475881099701], [-0.06027290225028992, -0.03540641814470291, -0.0007752245874144137, -0.02557065151631832], [-0.06098102778196335, 0.15972664952278137, -0.0012866376200690866, -0.31849807500839233], [-0.0577864944934845, 0.3548668920993805, -0.0076565989293158054, -0.6115864515304565], [-0.05068915709853172, 0.1598527878522873, -0.01988832838833332, -0.3213249146938324], [-0.04749210178852081, -0.034980375319719315, -0.02631482668220997, -0.034979745745658875], [-0.04819171130657196, 0.16050885617733002, -0.027014421299099922, -0.33584773540496826], [-0.04498153179883957, -0.034218430519104004, -0.0337313748896122, -0.05180465430021286], [-0.04566590115427971, 0.16137054562568665, -0.03476747125387192, -0.3549363613128662], [-0.04243848845362663, -0.03324025496840477, -0.04186619818210602, -0.07341615855693817], [-0.04310329630970955, -0.22773776948451996, -0.04333452135324478, 0.2057694047689438], [-0.047658052295446396, -0.4222141206264496, -0.03921913355588913, 0.48447367548942566], [-0.05610233172774315, -0.2265612632036209, -0.02952965907752514, 0.17969262599945068], [-0.06063355877995491, -0.031029460951685905, -0.025935806334018707, -0.12215767055749893], [-0.061254147440195084, -0.22577041387557983, -0.028378959745168686, 0.16223125159740448], [-0.06576955318450928, -0.4204748570919037, -0.025134334340691566, 0.44582802057266235], [-0.07417905330657959, -0.22500649094581604, -0.016217773780226707, 0.14532937109470367], [-0.07867918163537979, -0.41989248991012573, -0.01331118680536747, 0.4328520894050598], [-0.08707702904939651, -0.22458460927009583, -0.0046541448682546616, 0.13600286841392517], [-0.091568723320961, -0.029396312311291695, -0.0019340873695909977, -0.1581447273492813], [-0.09215664863586426, 0.16575327515602112, -0.005096981767565012, -0.45143717527389526], [-0.08884158730506897, -0.02929621934890747, -0.014125725254416466, -0.1603652387857437], [-0.08942750841379166, -0.2242131233215332, -0.017333030700683594, 0.12782812118530273], [-0.09391177445650101, -0.028847211971879005, -0.014776468276977539, -0.17027238011360168], [-0.0944887176156044, -0.22375458478927612, -0.01818191632628441, 0.11771263182163239], [-0.09896380454301834, -0.028376903384923935, -0.015827663242816925, -0.18065063655376434], [-0.09953134506940842, 0.16696791350841522, -0.019440675154328346, -0.4782842993736267], [-0.09619198739528656, -0.02787424810230732, -0.029006361961364746, -0.19179148972034454], [-0.09674946963787079, 0.16765038669109344, -0.03284219279885292, -0.49348175525665283], [-0.09339646250009537, -0.026993339881300926, -0.04271182790398598, -0.211327463388443], [-0.09393633157014847, -0.2214794009923935, -0.046938374638557434, 0.06758211553096771], [-0.098365917801857, -0.41589805483818054, -0.045586735010147095, 0.34509408473968506], [-0.1066838800907135, -0.22015827894210815, -0.03868485242128372, 0.038391582667827606], [-0.11108704656362534, -0.024503551423549652, -0.03791702166199684, -0.2662414312362671], [-0.1115771159529686, -0.219064399600029, -0.043241847306489944, 0.014245135709643364], [-0.11595840752124786, -0.023349842056632042, -0.042956944555044174, -0.2917614281177521], [-0.11642540246248245, -0.21783380210399628, -0.04879217594861984, -0.012930049560964108], [-0.12078207731246948, -0.02204730175435543, -0.04905077442526817, -0.3205994963645935], [-0.12122302502393723, -0.21643763780593872, -0.05546276643872261, -0.04377984628081322], [-0.12555177509784698, -0.4107222259044647, -0.0563383623957634, 0.23090121150016785], [-0.13376621901988983, -0.6049957871437073, -0.05172033980488777, 0.5052944421768188], [-0.14586614072322845, -0.7993521690368652, -0.04161445051431656, 0.7812402248382568], [-0.16185317933559418, -0.9938781261444092, -0.02598964422941208, 1.0605454444885254], [-0.1817307472229004, -0.7984218001365662, -0.004778735805302858, 0.7598198652267456], [-0.197699174284935, -0.6032343506813049, 0.01041766069829464, 0.4656370282173157], [-0.20976386964321136, -0.7985019087791443, 0.019730402156710625, 0.7615852952003479], [-0.2257339060306549, -0.6036572456359863, 0.03496210649609566, 0.47517549991607666], [-0.23780705034732819, -0.4090459942817688, 0.04446561634540558, 0.19371378421783447], [-0.24598796665668488, -0.21458739042282104, 0.04833989217877388, -0.08461721986532211], [-0.2502797245979309, -0.4103677272796631, 0.04664754867553711, 0.2229166477918625], [-0.2584870755672455, -0.21594248712062836, 0.05110588297247887, -0.054694581776857376], [-0.26280590891838074, -0.41175854206085205, 0.05001198872923851, 0.25366461277008057], [-0.2710410952568054, -0.21738505363464355, 0.055085282772779465, -0.022833678871393204], [-0.27538880705833435, -0.023094577714800835, 0.054628610610961914, -0.29764047265052795], [-0.27585068345069885, -0.21895098686218262, 0.04867579787969589, 0.011758710257709026], [-0.28022971749305725, -0.02455967664718628, 0.04891097545623779, -0.265177845954895], [-0.28072088956832886, -0.22034436464309692, 0.04360741749405861, 0.04252207279205322], [-0.28512778878211975, -0.025873983278870583, 0.04445786029100418, -0.23608967661857605], [-0.2856452763080597, -0.22160197794437408, 0.0397360660135746, 0.07027853280305862], [-0.2900772988796234, -0.027071572840213776, 0.04114163666963577, -0.20960740745067596], [-0.29061874747276306, 0.16743870079517365, 0.036949485540390015, -0.48903369903564453], [-0.2872699499130249, -0.028184527531266212, 0.027168814092874527, -0.1849384754896164], [-0.28783366084098816, -0.22368445992469788, 0.023470044136047363, 0.1161898598074913], [-0.2923073470592499, -0.4191347062587738, 0.02579384110867977, 0.41618403792381287], [-0.30069002509117126, -0.22438763082027435, 0.034117523580789566, 0.1317431479692459], [-0.3051777780056, -0.029770584776997566, 0.03675238415598869, -0.14998392760753632], [-0.30577319860458374, 0.1648063361644745, 0.03375270590186119, -0.43084946274757385], [-0.30247706174850464, -0.030776895582675934, 0.025135716423392296, -0.12772028148174286], [-0.3030925989151001, 0.16397611796855927, 0.02258131094276905, -0.41236841678619385], [-0.29981309175491333, -0.031458530575037, 0.014333942905068398, -0.11265283077955246], [-0.30044224858283997, -0.2267829030752182, 0.012080886401236057, 0.18451768159866333], [-0.3049779236316681, -0.031835880130529404, 0.01577123999595642, -0.10432983934879303], [-0.3056146204471588, -0.22718025743961334, 0.013684643432497978, 0.19328683614730835], [-0.31015825271606445, -0.032256707549095154, 0.017550379037857056, -0.09504794329404831], [-0.3108033835887909, 0.16260935366153717, 0.015649421140551567, -0.38214248418807983], [-0.30755117535591125, -0.03273126110434532, 0.008006570860743523, -0.08456669002771378], [-0.30820581316947937, 0.1622750163078308, 0.0063152373768389225, -0.37471282482147217], [-0.30496031045913696, 0.35730668902397156, -0.0011790188727900386, -0.6653978228569031], [-0.29781419038772583, 0.5524449944496155, -0.014486975967884064, -0.9584517478942871], [-0.28676527738571167, 0.7477587461471558, -0.03365601226687431, -1.2556506395339966], [-0.2718101143836975, 0.5530834794044495, -0.058769021183252335, -0.9736960530281067], [-0.2607484459877014, 0.3587971031665802, -0.0782429426908493, -0.7000378370285034], [-0.2535724937915802, 0.16484203934669495, -0.09224370121955872, -0.43297526240348816], [-0.2502756416797638, -0.02886107936501503, -0.10090320557355881, -0.17073705792427063], [-0.25085288286209106, -0.22240489721298218, -0.10431794822216034, 0.08848678320646286], [-0.25530096888542175, -0.025954362004995346, -0.10254821181297302, -0.23520098626613617], [-0.25582006573677063, 0.17047184705734253, -0.10725223273038864, -0.5583887696266174], [-0.2524106204509735, -0.022994063794612885, -0.11842000484466553, -0.3013291358947754], [-0.25287050008773804, -0.2162466198205948, -0.12444659322500229, -0.0482146255671978], [-0.25719544291496277, -0.40938475728034973, -0.12541088461875916, 0.20275917649269104], [-0.26538312435150146, -0.6025108695030212, -0.12135569751262665, 0.45339900255203247], [-0.2774333357810974, -0.40590062737464905, -0.1122877225279808, 0.12506155669689178], [-0.28555136919021606, -0.20936407148838043, -0.1097864881157875, -0.20082995295524597], [-0.28973865509033203, -0.40275856852531433, -0.11380308866500854, 0.05530289560556412], [-0.29779380559921265, -0.5960804224014282, -0.11269702762365341, 0.3100239336490631], [-0.3097154200077057, -0.7894313931465149, -0.10649655014276505, 0.5651477575302124], [-0.32550403475761414, -0.5929892063140869, -0.09519359469413757, 0.24090297520160675], [-0.3373638391494751, -0.7866315245628357, -0.09037553519010544, 0.5021067261695862], [-0.35309645533561707, -0.9803711175918579, -0.0803333967924118, 0.7649959325790405], [-0.37270388007164, -0.7842402458190918, -0.06503348052501678, 0.4481557607650757], [-0.3883886933326721, -0.9783849120140076, -0.05607036501169205, 0.7196507453918457], [-0.40795639157295227, -1.1726881265640259, -0.04167735204100609, 0.9941714406013489], [-0.43141016364097595, -0.9770341515541077, -0.021793924272060394, 0.6886957287788391], [-0.45095083117485046, -1.1718469858169556, -0.008020007982850075, 0.9744386672973633], [-0.4743877649307251, -0.9766182899475098, 0.011468765325844288, 0.6792473196983337], [-0.49392014741897583, -0.7816575169563293, 0.025053711608052254, 0.39019712805747986], [-0.5095533132553101, -0.586899995803833, 0.03285765275359154, 0.10551746189594269], [-0.5212913155555725, -0.39226391911506653, 0.03496800363063812, -0.17662061750888824], [-0.5291365385055542, -0.5878683924674988, 0.031435590237379074, 0.12688523530960083], [-0.5408939123153687, -0.3932105600833893, 0.033973295241594315, -0.15571673214435577], [-0.5487581491470337, -0.5888020396232605, 0.03085896000266075, 0.14748743176460266], [-0.5605341792106628, -0.3941352665424347, 0.03380870819091797, -0.1353025883436203], [-0.5684168934822083, -0.1995134949684143, 0.031102657318115234, -0.41713058948516846], [-0.5724071860313416, -0.0048458087258040905, 0.022760044783353806, -0.6998481750488281], [-0.5725041031837463, -0.20027577877044678, 0.008763082325458527, -0.40008828043937683], [-0.5765095949172974, -0.3955209255218506, 0.0007613165653310716, -0.10465546697378159], [-0.5844200253486633, -0.2004099041223526, -0.001331792795099318, -0.3970980942249298], [-0.5884281992912292, -0.3955129384994507, -0.009273755364120007, -0.10483536869287491], [-0.5963384509086609, -0.5905007719993591, -0.011370462365448475, 0.18490736186504364], [-0.608148455619812, -0.39521798491477966, -0.007672314997762442, -0.1113407164812088], [-0.6160528659820557, -0.19998693466186523, -0.009899129159748554, -0.4064342975616455], [-0.6200525760650635, -0.39496713876724243, -0.018027815967798233, -0.11688864976167679], [-0.6279519200325012, -0.19959157705307007, -0.02036558836698532, -0.415204256772995], [-0.6319437623023987, -0.3944190442562103, -0.028669673949480057, -0.12901070713996887], [-0.6398321390151978, -0.19889837503433228, -0.031249888241291046, -0.4305989146232605], [-0.6438100934028625, -0.3935641944408417, -0.03986186534166336, -0.14792872965335846], [-0.6516813635826111, -0.5880933403968811, -0.042820438742637634, 0.13191688060760498], [-0.6634432673454285, -0.7825765609741211, -0.04018210247159004, 0.41078898310661316], [-0.6790947914123535, -0.5869086980819702, -0.031966324895620346, 0.10571370273828506], [-0.6908329725265503, -0.7815582752227783, -0.02985204942524433, 0.388142466545105], [-0.7064641118049622, -0.586025595664978, -0.022089200094342232, 0.08619891852140427], [-0.7181846499443054, -0.7808240652084351, -0.020365221425890923, 0.37183162569999695], [-0.7338011264801025, -0.5854188203811646, -0.01292858924716711, 0.07279756665229797], [-0.7455095052719116, -0.3901139199733734, -0.011472637765109539, -0.22393618524074554], [-0.7533117532730103, -0.19482991099357605, -0.015951361507177353, -0.5202158093452454], [-0.7572083473205566, 0.0005129263736307621, -0.026355678215622902, -0.8178822994232178], [-0.7571980953216553, -0.19423852860927582, -0.04271332547068596, -0.5336042642593384], [-0.7610828876495361, -0.3887345492839813, -0.0533854104578495, -0.25468018651008606], [-0.7688575983047485, -0.5830552577972412, -0.05847901478409767, 0.02069769985973835], [-0.780518651008606, -0.3871455192565918, -0.058065060526132584, -0.28984758257865906], [-0.7882615923881531, -0.5813934803009033, -0.06386201083660126, -0.016028210520744324], [-0.7998894453048706, -0.38541656732559204, -0.0641825720667839, -0.3281570076942444], [-0.807597815990448, -0.18944239616394043, -0.07074571400880814, -0.640369713306427], [-0.8113866448402405, 0.006590821780264378, -0.08355311304330826, -0.954465925693512], [-0.8112547993659973, -0.18731378018856049, -0.10264242440462112, -0.6891596913337708], [-0.8150010704994202, -0.38087278604507446, -0.11642561852931976, -0.4304731786251068], [-0.8226185441017151, -0.18431125581264496, -0.1250350922346115, -0.7574713230133057], [-0.8263047933578491, 0.012291714549064636, -0.14018450677394867, -1.086738109588623], [-0.8260589241981506, -0.18073126673698425, -0.16191928088665009, -0.8411233425140381], [-0.8296735882759094, -0.3733164668083191, -0.17874173820018768, -0.6034206748008728], [-0.837139904499054, -0.5655478239059448, -0.1908101588487625, -0.3719382584095001], [-0.8484508395195007, -0.757519543170929, -0.19824892282485962, -0.14496520161628723], [-0.8636012673377991, -0.9493318796157837, -0.20114822685718536, 0.07921355962753296], [-0.8825879096984863, -1.1410874128341675, -0.19956395030021667, 0.30230793356895447], [-0.9054096341133118, -0.9437638521194458, -0.1935177892446518, -0.046086084097623825], [-0.9242849349975586, -1.1356604099273682, -0.19443951547145844, 0.1798458993434906], [-0.946998119354248, -0.9383646249771118, -0.19084259867668152, -0.16732662916183472], [-0.9657654166221619, -1.1303154230117798, -0.1941891312599182, 0.059604424983263016], [-0.988371729850769, -1.3221997022628784, -0.1929970383644104, 0.2852875888347626], [-1.0148156881332397, -1.5141206979751587, -0.18729129433631897, 0.5114346146583557], [-1.0450981855392456, -1.316922903060913, -0.17706260085105896, 0.16606837511062622], [-1.0714366436004639, -1.5091266632080078, -0.17374123632907867, 0.3980816602706909], [-1.1016191244125366, -1.7014130353927612, -0.16577959060668945, 0.6313455104827881], [-1.1356474161148071, -1.8938814401626587, -0.1531526893377304, 0.8675737977027893], [-1.1735249757766724, -2.08662486076355, -0.13580121099948883, 1.1084538698196411], [-1.2152575254440308, -1.8900052309036255, -0.11363213509321213, 0.7764367461204529], [-1.253057599067688, -2.0833961963653564, -0.09810339659452438, 1.0313165187835693], [-1.2947255373001099, -1.8871158361434937, -0.07747706770896912, 0.7095152735710144], [-1.332467794418335, -1.6910110712051392, -0.06328675895929337, 0.39348524808883667], [-1.3662880659103394, -1.4950509071350098, -0.05541705712676048, 0.08153942972421646], [-1.3961890935897827, -1.2991801500320435, -0.0537862703204155, -0.22809995710849762], [-1.4221726655960083, -1.1033324003219604, -0.058348268270492554, -0.5372521877288818], [-1.4442393779754639, -1.297587513923645, -0.06909330934286118, -0.2635100185871124], [-1.4701911211013794, -1.1015509366989136, -0.07436351478099823, -0.577160656452179], [-1.4922220706939697, -0.9054697155952454, -0.0859067291021347, -0.8923122882843018], [-1.5103315114974976, -1.0993279218673706, -0.1037529706954956, -0.6278228759765625], [-1.532318115234375, -1.292860507965088, -0.11630942672491074, -0.3695337474346161], [-1.5581753253936768, -1.4861544370651245, -0.1237001046538353, -0.11566976457834244], [-1.5878983736038208, -1.6793067455291748, -0.12601350247859955, 0.13556984066963196], [-1.6214845180511475, -1.8724197149276733, -0.12330210208892822, 0.38599228858947754], [-1.6589329242706299, -1.6757827997207642, -0.11558225750923157, 0.057117242366075516], [-1.6924484968185425, -1.8690741062164307, -0.11443991214036942, 0.3112141191959381], [-1.729830026626587, -1.6725234985351562, -0.10821563005447388, -0.015255188569426537], [-1.7632805109024048, -1.476029396057129, -0.10852073132991791, -0.34002554416656494], [-1.7928011417388916, -1.2795442342758179, -0.11532124131917953, -0.6648621559143066], [-1.8183919191360474, -1.4728891849517822, -0.12861847877502441, -0.41060030460357666], [-1.847849726676941, -1.6659754514694214, -0.13683049380779266, -0.16107283532619476], [-1.881169319152832, -1.8589003086090088, -0.1400519460439682, 0.08550680428743362]], "action_prob": [0.5177308320999146, 0.6059285998344421, 0.5276751518249512, 0.6002064347267151, 0.5362385511398315, 0.4052051901817322, 0.6486473679542542, 0.5938112139701843, 0.45689311623573303, 0.6356320381164551, 0.5504201650619507, 0.5848744511604309, 0.5557374954223633, 0.5805760025978088, 0.5606170892715454, 0.42365679144859314, 0.3551313281059265, 0.3457290530204773, 0.6455402970314026, 0.6555899977684021, 0.3464338481426239, 0.3442193865776062, 0.6430991291999817, 0.34476572275161743, 0.6399617195129395, 0.6528055667877197, 0.6643920540809631, 0.33346298336982727, 0.6616783738136292, 0.3283398449420929, 0.6564430594444275, 0.6709957122802734, 0.4923938810825348, 0.6198424100875854, 0.5043643116950989, 0.618409276008606, 0.5021719932556152, 0.6152946949005127, 0.4949074983596802, 0.6229000091552734, 0.511547863483429, 0.6103963851928711, 0.5146256685256958, 0.6093990206718445, 0.5158643126487732, 0.6093705892562866, 0.4846543073654175, 0.373685747385025, 0.653768002986908, 0.6312455534934998, 0.46782007813453674, 0.6357793807983398, 0.4554419219493866, 0.640785813331604, 0.559269368648529, 0.42647451162338257, 0.6398541331291199, 0.5675047636032104, 0.5756706595420837, 0.4398319721221924, 0.6372051239013672, 0.44244325160980225, 0.6375174522399902, 0.558463990688324, 0.41922298073768616, 0.6479678750038147, 0.585835874080658, 0.5503063201904297, 0.5896809101104736, 0.545434296131134, 0.40628886222839355, 0.6516945362091064, 0.39791253209114075, 0.6541577577590942, 0.6129452586174011, 0.49268049001693726, 0.6148814558982849, 0.4956834614276886, 0.6269478797912598, 0.4809664487838745, 0.6339980363845825, 0.46441179513931274, 0.6409512758255005, 0.5539318919181824, 0.42530667781829834, 0.3611997663974762, 0.34797006845474243, 0.6476631164550781, 0.6539032459259033, 0.35609865188598633, 0.6551510691642761, 0.648737370967865, 0.5992806553840637, 0.520849347114563, 0.6110298037528992, 0.5013834834098816, 0.621987521648407, 0.5196601748466492, 0.5990896224975586, 0.536941647529602, 0.5879343152046204, 0.5520455837249756, 0.5765991806983948, 0.5653102993965149, 0.43489447236061096, 0.6368758678436279, 0.5583069920539856, 0.4181416928768158, 0.6506889462471008, 0.5929985046386719, 0.4651937186717987, 0.6261563301086426, 0.472526878118515, 0.6243382096290588, 0.5236034393310547, 0.6073064804077148, 0.5177822709083557, 0.611217737197876, 0.48873937129974365, 0.6178523302078247, 0.49065637588500977, 0.38198959827423096, 0.35158151388168335, 0.3549509644508362, 0.6330907344818115, 0.6445930004119873, 0.6533032059669495, 0.6472517848014832, 0.5955482721328735, 0.5198643803596497, 0.38190165162086487, 0.6572458744049072, 0.6384754180908203, 0.5613241195678711, 0.44448062777519226, 0.6276627779006958, 0.5234818458557129, 0.616958737373352, 0.5128519535064697, 0.40717729926109314, 0.6416295170783997, 0.4262494146823883, 0.36385002732276917, 0.6543287038803101, 0.36778056621551514, 0.34500086307525635, 0.6561247110366821, 0.3432336747646332, 0.6576043963432312, 0.659195065498352, 0.6405047178268433, 0.5716096758842468, 0.5492894053459167, 0.5819385051727295, 0.5369550585746765, 0.5915307402610779, 0.4757031202316284, 0.3791806101799011, 0.6512988805770874, 0.6204092502593994, 0.4822430908679962, 0.6204453706741333, 0.5195757746696472, 0.5983441472053528, 0.4803374111652374, 0.6213908195495605, 0.4758020341396332, 0.6242722868919373, 0.4680655598640442, 0.6285125613212585, 0.5428386330604553, 0.42544233798980713, 0.6423110365867615, 0.43073463439941406, 0.6409804821014404, 0.4336116909980774, 0.6405318975448608, 0.5658502578735352, 0.4448621869087219, 0.3656919598579407, 0.6535541415214539, 0.6397045850753784, 0.5770489573478699, 0.5330035090446472, 0.5887373089790344, 0.5166076421737671, 0.3993963897228241, 0.3480628430843353, 0.6555357575416565, 0.6575068831443787, 0.36548760533332825, 0.3388320207595825, 0.6539703011512756, 0.6638072729110718, 0.6623800992965698, 0.6376395225524902, 0.5792825818061829, 0.49806922674179077, 0.5749199390411377, 0.5422942638397217, 0.5369571447372437, 0.5811440944671631, 0.5046187043190002, 0.4342181980609894, 0.6143181920051575, 0.46566715836524963, 0.40624895691871643, 0.36899903416633606, 0.34845736622810364, 0.6616938710212708, 0.3519008159637451, 0.6613684296607971, 0.6459681391716003, 0.6103748083114624, 0.5454503893852234, 0.45938530564308167, 0.6153106689453125, 0.4500129520893097, 0.37852388620376587, 0.6587561964988708, 0.6308808326721191, 0.5797420144081116, 0.5134040713310242, 0.4487534165382385, 0.6010680794715881, 0.46368351578712463, 0.589996874332428, 0.5224655866622925, 0.4435650110244751, 0.620995283126831, 0.572413444519043, 0.5135853290557861], "advantages": [16.8153018951416, 16.08376693725586, 15.236452102661133, 14.484068870544434, 13.644913673400879, 12.871164321899414, 12.409887313842773, 11.362844467163086, 10.548711776733398, 9.980155944824219, 8.822973251342773, 7.9918622970581055, 7.141995906829834, 6.288285255432129, 5.43198299407959, 4.555024147033691, 3.9851555824279785, 3.700629234313965, 3.6662073135375977, 2.4138131141662598, 1.270835518836975, 1.208585262298584, 1.4131032228469849, 0.39334285259246826, 0.7542328238487244, -0.02605907805263996, -0.6824354529380798, -1.1758549213409424, -0.850268542766571, -1.1243308782577515, -0.7373318672180176, -0.7274096012115479, 76.39590454101562, 76.54303741455078, 76.13410949707031, 76.11520385742188, 75.9753189086914, 76.10285186767578, 75.70099639892578, 75.69377136230469, 75.53556823730469, 75.64729309082031, 75.2554931640625, 75.3444595336914, 74.94269561767578, 75.01179504394531, 74.59770202636719, 74.57467651367188, 74.92082977294922, 74.52130889892578, 74.35821533203125, 74.43809509277344, 74.2860107421875, 74.41649627685547, 74.27812957763672, 74.40652465820312, 74.77114868164062, 74.09799194335938, 73.83911895751953, 73.88331604003906, 74.17611694335938, 73.4902572631836, 73.7353744506836, 73.02095031738281, 72.70840454101562, 72.81431579589844, 72.50904083251953, 72.47879028320312, 72.2165298461914, 72.1785888671875, 71.92792510986328, 72.10999298095703, 71.83570098876953, 72.08980560302734, 71.86274719238281, 71.89083099365234, 72.16070556640625, 71.63977813720703, 71.56941223144531, 71.5447998046875, 71.5261001586914, 71.50858306884766, 71.55142974853516, 71.54796600341797, 71.7677001953125, 72.12239074707031, 72.47885131835938, 72.7291259765625, 71.55310821533203, 70.40770721435547, 70.59049987792969, 69.3442611694336, 68.28203582763672, 67.53401947021484, 67.36480712890625, 66.5807876586914, 66.4351577758789, 65.61344146728516, 65.14875030517578, 64.77725219726562, 64.30272674560547, 63.97257995605469, 63.485111236572266, 63.18836212158203, 62.685665130615234, 62.526588439941406, 62.02827453613281, 61.804359436035156, 61.845314025878906, 60.964019775390625, 60.41402816772461, 60.19400405883789, 59.735755920410156, 59.527259826660156, 59.100337982177734, 58.93549346923828, 58.38496398925781, 58.21684646606445, 57.64940643310547, 57.41193771362305, 57.00452423095703, 56.779964447021484, 56.87293243408203, 57.250911712646484, 57.861473083496094, 57.31090545654297, 56.848358154296875, 56.52627944946289, 56.402488708496094, 56.514060974121094, 56.460487365722656, 56.891883850097656, 56.85274887084961, 57.0250358581543, 57.387088775634766, 57.842491149902344, 57.36628341674805, 57.31421661376953, 57.5459098815918, 57.856929779052734, 58.128623962402344, 57.571266174316406, 57.720916748046875, 57.75039291381836, 56.994449615478516, 56.90576934814453, 56.67658233642578, 55.690711975097656, 55.37318801879883, 54.2305908203125, 53.07597732543945, 52.023597717285156, 51.1836051940918, 50.730857849121094, 49.866798400878906, 49.433197021484375, 48.541900634765625, 47.931644439697266, 47.61442184448242, 47.01749038696289, 46.56621170043945, 46.06650924682617, 45.647186279296875, 45.36742401123047, 44.592063903808594, 44.11302185058594, 43.70807647705078, 43.270816802978516, 42.89474868774414, 42.5067138671875, 42.160438537597656, 41.91938781738281, 41.73004913330078, 40.84308624267578, 40.59381103515625, 39.67547607421875, 39.37530517578125, 38.42173385620117, 37.69032287597656, 37.21800231933594, 36.99829864501953, 36.551883697509766, 36.179359436035156, 35.872711181640625, 35.36118698120117, 35.04701614379883, 34.57892990112305, 34.35118865966797, 34.324951171875, 34.16121292114258, 34.013587951660156, 34.00716018676758, 34.11477279663086, 34.259300231933594, 34.37340545654297, 34.41956329345703, 34.36500930786133, 34.181434631347656, 33.84870529174805, 33.66436767578125, 33.25724792480469, 33.0439338684082, 32.58868408203125, 32.00311279296875, 31.290464401245117, 30.927396774291992, 30.159408569335938, 29.284727096557617, 28.310998916625977, 27.24687957763672, 26.59670639038086, 25.466510772705078, 24.684572219848633, 23.878677368164062, 23.089889526367188, 22.333293914794922, 21.60093879699707, 20.667890548706055, 19.94930648803711, 19.241167068481445, 18.483835220336914, 17.624975204467773, 16.680532455444336, 15.667489051818848, 14.5980224609375, 13.773224830627441, 12.677483558654785, 11.824146270751953, 11.019350051879883, 10.2417631149292, 9.2701997756958, 8.228387832641602], "value_targets": [27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 86.60203552246094, 86.4666976928711, 86.33000183105469, 86.1919174194336, 86.05244445800781, 85.91156005859375, 85.76924896240234, 85.62550354003906, 85.48030853271484, 85.33364868164062, 85.18550109863281, 85.03585815429688, 84.88470458984375, 84.73202514648438, 84.57780456542969, 84.42202758789062, 84.2646713256836, 84.10572814941406, 83.94518280029297, 83.78301239013672, 83.61920166015625, 83.45374298095703, 83.28660583496094, 83.11778259277344, 82.94725799560547, 82.77500915527344, 82.60102081298828, 82.4252700805664, 82.24774932861328, 82.06842803955078, 81.8873062133789, 81.704345703125, 81.51954650878906, 81.33287048339844, 81.14431762695312, 80.953857421875, 80.76146697998047, 80.567138671875, 80.370849609375, 80.17257690429688, 79.97229766845703, 79.7699966430664, 79.5656509399414, 79.35924530029297, 79.1507568359375, 78.94015502929688, 78.72743225097656, 78.51255798339844, 78.2955093383789, 78.0762710571289, 77.85482025146484, 77.63113403320312, 77.40518188476562, 77.17695617675781, 76.94641876220703, 76.71355438232422, 76.47834014892578, 76.2407455444336, 76.0007553100586, 75.75833892822266, 75.51347351074219, 75.26612854003906, 75.01629638671875, 74.76393127441406, 74.50902557373047, 74.25154113769531, 73.991455078125, 73.72874450683594, 73.46337127685547, 73.19532775878906, 72.92457580566406, 72.65108489990234, 72.37483215332031, 72.09579467773438, 71.81392669677734, 71.52922058105469, 71.24163818359375, 70.9511489868164, 70.65773010253906, 70.36134338378906, 70.06195831298828, 69.75955963134766, 69.45409393310547, 69.14555358886719, 68.83389282226562, 68.51908111572266, 68.20109558105469, 67.87989044189453, 67.55545043945312, 67.22772216796875, 66.89669036865234, 66.56231689453125, 66.22456359863281, 65.88339233398438, 65.53878021240234, 65.19068908691406, 64.83908081054688, 64.48391723632812, 64.12516784667969, 63.76279830932617, 63.396766662597656, 63.027034759521484, 62.65357208251953, 62.276336669921875, 61.895286560058594, 61.51039123535156, 61.12160873413086, 60.72889709472656, 60.332218170166016, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 367682493, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 1897553340, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 310836068, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783, 1031060783], "obs": [[-0.0018584993667900562, 0.013001116923987865, -0.04821237549185753, 0.03883606567978859], [-0.0015984770143404603, 0.20878009498119354, -0.04743565246462822, -0.2686600983142853], [0.002577124862000346, 0.40454578399658203, -0.05280885472893715, -0.5759191513061523], [0.010668040253221989, 0.21020230650901794, -0.06432723999023438, -0.30032894015312195], [0.014872086234390736, 0.4061793386936188, -0.0703338161110878, -0.6125856637954712], [0.02299567312002182, 0.21210716664791107, -0.08258552849292755, -0.342858225107193], [0.027237815782427788, 0.01825129985809326, -0.08944269269704819, -0.07731804996728897], [0.027602842077612877, -0.1754821538925171, -0.09098906069993973, 0.18585941195487976], [0.024093199521303177, -0.3691924214363098, -0.08727186918258667, 0.44850894808769226], [0.016709351912140846, -0.5629785060882568, -0.07830169051885605, 0.7124564051628113], [0.005449781194329262, -0.36686471104621887, -0.06405255943536758, 0.3961898982524872], [-0.0018875130917876959, -0.17089521884918213, -0.056128762662410736, 0.08401988446712494], [-0.005305417347699404, 0.02498452551662922, -0.05444836616516113, -0.22583019733428955], [-0.004805726930499077, -0.16931870579719543, -0.05896496772766113, 0.04919280484318733], [-0.008192100562155247, -0.36354774236679077, -0.05798111483454704, 0.32270437479019165], [-0.015463056042790413, -0.5577982068061829, -0.051527027040719986, 0.5965535044670105], [-0.026619018986821175, -0.3619944453239441, -0.03959595412015915, 0.28809547424316406], [-0.03385891020298004, -0.16633087396621704, -0.03383404389023781, -0.01680801250040531], [-0.03718552738428116, 0.02925954759120941, -0.034170206636190414, -0.3199710547924042], [-0.03660033643245697, -0.1653595268726349, -0.04056962579488754, -0.0382569395005703], [-0.03990752622485161, -0.35987693071365356, -0.041334766894578934, 0.24135488271713257], [-0.04710506275296211, -0.5543848276138306, -0.03650766611099243, 0.520718514919281], [-0.05819275975227356, -0.3587684631347656, -0.026093296706676483, 0.21675866842269897], [-0.06536813080310822, -0.16328340768814087, -0.021758124232292175, -0.08403967320919037], [-0.0686337947845459, -0.35808682441711426, -0.023438917472958565, 0.201699897646904], [-0.07579553127288818, -0.1626376211643219, -0.01940491981804371, -0.09828377515077591], [-0.0790482833981514, 0.0327569916844368, -0.021370595321059227, -0.3970251977443695], [-0.07839314639568329, -0.1620553433895111, -0.029311098158359528, -0.11115589737892151], [-0.08163425326347351, -0.35674530267715454, -0.03153421729803085, 0.17213734984397888], [-0.08876916021108627, -0.16118653118610382, -0.028091469779610634, -0.13032448291778564], [-0.09199289232492447, -0.3558950424194336, -0.030697960406541824, 0.15336525440216064], [-0.09911078959703445, -0.16034729778766632, -0.027630655094981194, -0.1488419473171234], [-0.10231773555278778, -0.35506290197372437, -0.030607493594288826, 0.13499760627746582], [-0.10941899567842484, -0.5497334003448486, -0.027907541021704674, 0.41786935925483704], [-0.12041366100311279, -0.7444489598274231, -0.019550153985619545, 0.7016252279281616], [-0.13530264794826508, -0.5490615367889404, -0.005517648998647928, 0.40285277366638184], [-0.14628387987613678, -0.74410480260849, 0.002539406530559063, 0.6937910318374634], [-0.1611659675836563, -0.9392619132995605, 0.016415227204561234, 0.987272322177887], [-0.17995120584964752, -0.74436354637146, 0.0361606739461422, 0.6997900009155273], [-0.1948384791612625, -0.5497611165046692, 0.050156474113464355, 0.4187060594558716], [-0.20583370327949524, -0.3553844392299652, 0.058530595153570175, 0.14224755764007568], [-0.21294139325618744, -0.16114746034145355, 0.06137554720044136, -0.13141080737113953], [-0.21616433560848236, 0.033044058829545975, 0.05874732881784439, -0.40411654114723206], [-0.21550345420837402, -0.162859708070755, 0.0506649985909462, -0.09350604563951492], [-0.2187606543302536, -0.35866984724998474, 0.04879487678408623, 0.2147214114665985], [-0.22593404352664948, -0.16427822411060333, 0.05308930575847626, -0.062178969383239746], [-0.22921961545944214, 0.030043942853808403, 0.0518457256257534, -0.3376506268978119], [-0.22861874103546143, -0.16577596962451935, 0.04509271681308746, -0.029079606756567955], [-0.23193424940109253, 0.028671281412243843, 0.04451112449169159, -0.30720123648643494], [-0.23136082291603088, -0.16705572605133057, 0.038367096334695816, -0.0008195670670829713], [-0.2347019463777542, 0.027495577931404114, 0.038350705057382584, -0.281154602766037], [-0.23415203392505646, -0.1681518405675888, 0.03272761404514313, 0.0233730748295784], [-0.23751506209373474, 0.026485854759812355, 0.033195074647665024, -0.25880691409111023], [-0.23698535561561584, -0.16909387707710266, 0.02801893837749958, 0.04415862262248993], [-0.24036723375320435, -0.36460617184638977, 0.02890210971236229, 0.34554845094680786], [-0.2476593554019928, -0.16990701854228973, 0.03581307828426361, 0.062117721885442734], [-0.251057505607605, 0.024683639407157898, 0.03705543279647827, -0.21905431151390076], [-0.2505638301372528, -0.1709478795528412, 0.03267434611916542, 0.08508332073688507], [-0.2539827823638916, 0.02369084395468235, 0.03437601402401924, -0.19711437821388245], [-0.25350895524024963, 0.21830466389656067, 0.03043372556567192, -0.4787580668926239], [-0.2491428703069687, 0.02276656962931156, 0.020858565345406532, -0.17664062976837158], [-0.2486875355243683, -0.17264758050441742, 0.0173257514834404, 0.12254881113767624], [-0.25214049220085144, 0.022221915423870087, 0.019776728004217148, -0.16461804509162903], [-0.25169605016708374, -0.17317748069763184, 0.016484366729855537, 0.13423770666122437], [-0.2551595866680145, 0.021704524755477905, 0.019169121980667114, -0.15319938957691193], [-0.25472551584243774, -0.17368657886981964, 0.016105134040117264, 0.1454687863588333], [-0.2581992447376251, -0.36903542280197144, 0.0190145093947649, 0.44318875670433044], [-0.2655799388885498, -0.5644211769104004, 0.027878284454345703, 0.7418043613433838], [-0.27686837315559387, -0.36969494819641113, 0.04271437227725983, 0.45802366733551025], [-0.2842622697353363, -0.17520205676555634, 0.05187484622001648, 0.17910462617874146], [-0.28776630759239197, 0.019140657037496567, 0.05545693635940552, -0.0967729389667511], [-0.287383496761322, 0.21342574059963226, 0.05352148041129112, -0.3714565634727478], [-0.2831149995326996, 0.017585882917046547, 0.04609234631061554, -0.06238961219787598], [-0.28276327252388, 0.2120177149772644, 0.04484455659985542, -0.34018126130104065], [-0.27852290868759155, 0.406473845243454, 0.03804093226790428, -0.6183923482894897], [-0.270393431186676, 0.21084176003932953, 0.02567308396100998, -0.31397515535354614], [-0.26617661118507385, 0.015363674610853195, 0.01939358003437519, -0.013307605870068073], [-0.2658693194389343, 0.2102022022008896, 0.01912742853164673, -0.2998090982437134], [-0.2616652846336365, 0.014812912791967392, 0.013131246902048588, -0.0011556398821994662], [-0.2613690197467804, -0.18049487471580505, 0.013108134269714355, 0.2956412732601166], [-0.26497891545295715, 0.014437776058912277, 0.019020959734916687, 0.007121084723621607], [-0.2646901607513428, 0.20928184688091278, 0.019163381308317184, -0.2795003354549408], [-0.2605045437812805, 0.40412527322769165, 0.013573373667895794, -0.5660781264305115], [-0.252422034740448, 0.599054217338562, 0.002251812256872654, -0.8544541001319885], [-0.24044093489646912, 0.403901606798172, -0.01483726967126131, -0.5610639452934265], [-0.23236291110515594, 0.20899100601673126, -0.02605854906141758, -0.27309221029281616], [-0.2281830906867981, 0.4044749140739441, -0.03152039274573326, -0.5738788843154907], [-0.22009359300136566, 0.20980872213840485, -0.042997971177101135, -0.2912901043891907], [-0.21589741110801697, 0.40551653504371643, -0.048823773860931396, -0.5972180366516113], [-0.20778708159923553, 0.21111059188842773, -0.06076813116669655, -0.3203050494194031], [-0.2035648673772812, 0.4070429503917694, -0.06717423349618912, -0.6315159201622009], [-0.19542402029037476, 0.21291935443878174, -0.07980455458164215, -0.3607216477394104], [-0.19116562604904175, 0.019017115235328674, -0.08701898902654648, -0.09423163533210754], [-0.19078528881072998, 0.21527153253555298, -0.08890362083911896, -0.41305071115493774], [-0.186479851603508, 0.02151486836373806, -0.09716463088989258, -0.14966675639152527], [-0.18604955077171326, -0.17209115624427795, -0.1001579686999321, 0.11085100471973419], [-0.1894913762807846, 0.024312743917107582, -0.09794094413518906, -0.21167561411857605], [-0.18900512158870697, 0.22068868577480316, -0.10217446088790894, -0.533576488494873], [-0.1845913529396057, 0.41708794236183167, -0.11284598708152771, -0.856626033782959], [-0.17624959349632263, 0.22366951406002045, -0.1299785077571869, -0.6014500260353088], [-0.1717762053012848, 0.030582325533032417, -0.142007514834404, -0.35236856341362], [-0.17116455733776093, -0.16226479411125183, -0.1490548849105835, -0.1076197475194931], [-0.17440985143184662, 0.034643881022930145, -0.15120728313922882, -0.44336777925491333], [-0.1737169772386551, 0.23154567182064056, -0.1600746363401413, -0.7796362042427063], [-0.1690860539674759, 0.038943927735090256, -0.17566736042499542, -0.5412883162498474], [-0.16830718517303467, -0.153330460190773, -0.1864931285381317, -0.30869632959365845], [-0.17137378454208374, -0.34537357091903687, -0.19266705214977264, -0.08013828843832016], [-0.1782812625169754, -0.148086816072464, -0.1942698210477829, -0.4268871545791626], [-0.18124300241470337, -0.34000322222709656, -0.20280756056308746, -0.20118454098701477], [-0.18804305791854858, -0.5317344665527344, -0.20683124661445618, 0.021300548687577248], [-0.19867774844169617, -0.7233827710151672, -0.20640523731708527, 0.24227015674114227], [-0.2131454050540924, -0.9150506258010864, -0.20155984163284302, 0.4634162187576294], [-0.23144641518592834, -0.7177362442016602, -0.1922915130853653, 0.11457832157611847], [-0.2458011507987976, -0.9096574783325195, -0.18999993801116943, 0.3409682512283325], [-0.2639943063259125, -0.7124119400978088, -0.18318058550357819, -0.005100148729979992], [-0.2782425284385681, -0.515200138092041, -0.18328258395195007, -0.34952306747436523], [-0.28854653239250183, -0.7073068022727966, -0.19027304649353027, -0.11977343261241913], [-0.3026926815509796, -0.5100404024124146, -0.19266851246356964, -0.46593618392944336], [-0.31289348006248474, -0.7019926905632019, -0.20198723673820496, -0.23963013291358948], [-0.3269333243370056, -0.8937425017356873, -0.2067798376083374, -0.016834061592817307], [-0.3448081910610199, -1.0853917598724365, -0.2071165144443512, 0.20415474474430084], [-0.36651602387428284, -0.8880027532577515, -0.2030334323644638, -0.14605861902236938], [-0.38427606225013733, -1.0797260999679565, -0.20595459640026093, 0.07633663713932037], [-0.40587058663368225, -0.8823384642601013, -0.20442786812782288, -0.2736109793186188], [0.01962619088590145, 0.010136101394891739, 0.04045342281460762, 0.04268602281808853], [0.019828911870718002, -0.18554188311100006, 0.04130714014172554, 0.3478529453277588], [0.01611807569861412, 0.00896893534809351, 0.04826420173048973, 0.06847642362117767], [0.01629745401442051, 0.20336689054965973, 0.049633730202913284, -0.20859678089618683], [0.02036479115486145, 0.007571661379188299, 0.04546179249882698, 0.09932070970535278], [0.020516224205493927, 0.20201358199119568, 0.047448206692934036, -0.17867964506149292], [0.024556497111916542, 0.006245869677513838, 0.04387461394071579, 0.12858594954013824], [0.024681413546204567, 0.20071274042129517, 0.046446334570646286, -0.14993862807750702], [0.028695669025182724, 0.004957529716193676, 0.04344756156206131, 0.15702782571315765], [0.028794819489121437, -0.19075867533683777, 0.046588119119405746, 0.46309465169906616], [0.024979645386338234, -0.3865070044994354, 0.055850010365247726, 0.7700905203819275], [0.01724950596690178, -0.19219635426998138, 0.07125181704759598, 0.4954903721809387], [0.013405578210949898, 0.0018522836035117507, 0.08116162568330765, 0.22608627378940582], [0.013442624360322952, 0.1957261711359024, 0.08568335324525833, -0.03993193432688713], [0.017357148230075836, -0.0005133108352310956, 0.08488471806049347, 0.2785075008869171], [0.017346881330013275, 0.19330158829689026, 0.09045486152172089, 0.013758056797087193], [0.02121291309595108, -0.002993339905515313, 0.09073002636432648, 0.3335541784763336], [0.021153045818209648, -0.19928161799907684, 0.09740111231803894, 0.6534135937690735], [0.017167413607239723, -0.005641214083880186, 0.11046937853097916, 0.3929203450679779], [0.017054589465260506, -0.20214323699474335, 0.1183277890086174, 0.7182887196540833], [0.013011724688112736, -0.39868655800819397, 0.1326935589313507, 1.0457494258880615], [0.005037993658334017, -0.5952962636947632, 0.1536085456609726, 1.3769689798355103], [-0.00686793215572834, -0.4023902118206024, 0.18114793300628662, 1.1360005140304565], [-0.014915736392140388, -0.21003973484039307, 0.20386794209480286, 0.9051624536514282], [0.0285808015614748, -0.028731025755405426, 0.02119120955467224, 0.04043162241578102], [0.028006181120872498, -0.22415034472942352, 0.021999841555953026, 0.3397245407104492], [0.023523174226284027, -0.02934822253882885, 0.02879433147609234, 0.05405949428677559], [0.02293621003627777, 0.16534927487373352, 0.02987552247941494, -0.2294013351202011], [0.026243194937705994, -0.030186578631401062, 0.02528749592602253, 0.07255366444587708], [0.02563946321606636, -0.2256617546081543, 0.026738569140434265, 0.3731064200401306], [0.02112622931599617, -0.030929649248719215, 0.034200698137283325, 0.08897287398576736], [0.020507635548710823, 0.16368581354618073, 0.03598015382885933, -0.19272655248641968], [0.02378135174512863, 0.35827508568763733, 0.032125622034072876, -0.4738456606864929], [0.030946852639317513, 0.16271451115608215, 0.022648710757493973, -0.17121286690235138], [0.03420114517211914, -0.03272416070103645, 0.01922445371747017, 0.12852810323238373], [0.03354666009545326, 0.16211719810962677, 0.021795015782117844, -0.1580282747745514], [0.036789003759622574, -0.03330991044640541, 0.018634449690580368, 0.14144998788833618], [0.03612280637025833, 0.16154026985168457, 0.02146345004439354, -0.14529633522033691], [0.039353612810373306, 0.3563483655452728, 0.01855752244591713, -0.43113142251968384], [0.04648057743906975, 0.5512027144432068, 0.009934894740581512, -0.7179069519042969], [0.05750463157892227, 0.3559446930885315, -0.00442324485629797, -0.4221135973930359], [0.06462352722883224, 0.16088567674160004, -0.012865517288446426, -0.1308283805847168], [0.06784123927354813, -0.034049633890390396, -0.015482084825634956, 0.15776804089546204], [0.06716024875640869, -0.2289465367794037, -0.012326723895967007, 0.4455268085002899], [0.06258131563663483, -0.03365238755941391, -0.003416187595576048, 0.14898386597633362], [0.06190826743841171, -0.22872525453567505, -0.0004365102213341743, 0.4405871033668518], [0.05733376368880272, -0.033597126603126526, 0.008375232107937336, 0.1477666050195694], [0.05666182190179825, 0.16140389442443848, 0.011330563575029373, -0.14226238429546356], [0.05988990142941475, -0.03387847915291786, 0.008485316298902035, 0.15397348999977112], [0.0592123307287693, -0.2291208952665329, 0.011564786545932293, 0.4493212401866913], [0.05462991073727608, -0.424404501914978, 0.020551210269331932, 0.7456269860267639], [0.04614182189106941, -0.22957207262516022, 0.03546375036239624, 0.45948171615600586], [0.04155037924647331, -0.034968893975019455, 0.04465338587760925, 0.1781846582889557], [0.04085100442171097, -0.23070046305656433, 0.04821707680821419, 0.4846130907535553], [0.036236993968486786, -0.42646852135658264, 0.05790933966636658, 0.7920942306518555], [0.027707623317837715, -0.62233567237854, 0.07375122606754303, 1.102418303489685], [0.015260908752679825, -0.4282573461532593, 0.09579958766698837, 0.833755373954773], [0.006695762276649475, -0.23456571996212006, 0.1124747022986412, 0.5726721286773682], [0.0020044478587806225, -0.43107011914253235, 0.12392814457416534, 0.8985641598701477], [-0.006616954226046801, -0.23782600462436676, 0.14189942181110382, 0.6472627520561218], [-0.011373474262654781, -0.04493637755513191, 0.15484468638896942, 0.4024149179458618], [-0.012272202409803867, 0.1476893126964569, 0.16289298236370087, 0.162276029586792], [-0.009318416006863117, 0.34015005826950073, 0.16613849997520447, -0.07491441816091537], [-0.0025154149625450373, 0.14308428764343262, 0.16464020311832428, 0.2652343511581421], [0.00034627088462002575, 0.33552050590515137, 0.1699448972940445, 0.028669238090515137], [0.007056680973619223, 0.5278494358062744, 0.17051827907562256, -0.20594452321529388], [0.017613669857382774, 0.7201748490333557, 0.16639938950538635, -0.44035887718200684], [0.032017167657613754, 0.5231371521949768, 0.15759220719337463, -0.1001887246966362], [0.04247990995645523, 0.3261488676071167, 0.15558843314647675, 0.2377726435661316], [0.049002885818481445, 0.1291860193014145, 0.16034388542175293, 0.5752067565917969], [0.051586609333753586, -0.06777738034725189, 0.17184802889823914, 0.913801372051239], [0.05023105815052986, 0.1246558204293251, 0.190124049782753, 0.6796783208847046], [0.05272417515516281, 0.31669968366622925, 0.20371761918067932, 0.4523635804653168], [-0.011494453065097332, 0.010360819287598133, -0.0031320429407060146, -0.031702857464551926], [-0.011287236586213112, 0.20552754402160645, -0.0037661001551896334, -0.3253723382949829], [-0.007176685146987438, 0.40070292353630066, -0.010273546911776066, -0.6192405223846436], [0.0008373729651793838, 0.5959668159484863, -0.02265835739672184, -0.9151413440704346], [0.012756709940731525, 0.7913877964019775, -0.04096118360757828, -1.2148585319519043], [0.028584465384483337, 0.987013578414917, -0.06525835394859314, -1.5200902223587036], [0.04832473769783974, 0.7927383184432983, -0.09566015750169754, -1.2484699487686157], [0.06417950242757797, 0.5989639759063721, -0.12062955647706985, -0.9872186779975891], [0.0761587843298912, 0.7954765558242798, -0.14037393033504486, -1.3152246475219727], [0.09206831455230713, 0.6023819446563721, -0.16667842864990234, -1.0695661306381226], [0.10411595553159714, 0.40980905294418335, -0.18806974589824677, -0.8334869146347046], [0.11231213063001633, 0.606934130191803, -0.20473948121070862, -1.1789277791976929]], "actions": [1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.0015984770143404603, 0.20878009498119354, -0.04743565246462822, -0.2686600983142853], [0.002577124862000346, 0.40454578399658203, -0.05280885472893715, -0.5759191513061523], [0.010668040253221989, 0.21020230650901794, -0.06432723999023438, -0.30032894015312195], [0.014872086234390736, 0.4061793386936188, -0.0703338161110878, -0.6125856637954712], [0.02299567312002182, 0.21210716664791107, -0.08258552849292755, -0.342858225107193], [0.027237815782427788, 0.01825129985809326, -0.08944269269704819, -0.07731804996728897], [0.027602842077612877, -0.1754821538925171, -0.09098906069993973, 0.18585941195487976], [0.024093199521303177, -0.3691924214363098, -0.08727186918258667, 0.44850894808769226], [0.016709351912140846, -0.5629785060882568, -0.07830169051885605, 0.7124564051628113], [0.005449781194329262, -0.36686471104621887, -0.06405255943536758, 0.3961898982524872], [-0.0018875130917876959, -0.17089521884918213, -0.056128762662410736, 0.08401988446712494], [-0.005305417347699404, 0.02498452551662922, -0.05444836616516113, -0.22583019733428955], [-0.004805726930499077, -0.16931870579719543, -0.05896496772766113, 0.04919280484318733], [-0.008192100562155247, -0.36354774236679077, -0.05798111483454704, 0.32270437479019165], [-0.015463056042790413, -0.5577982068061829, -0.051527027040719986, 0.5965535044670105], [-0.026619018986821175, -0.3619944453239441, -0.03959595412015915, 0.28809547424316406], [-0.03385891020298004, -0.16633087396621704, -0.03383404389023781, -0.01680801250040531], [-0.03718552738428116, 0.02925954759120941, -0.034170206636190414, -0.3199710547924042], [-0.03660033643245697, -0.1653595268726349, -0.04056962579488754, -0.0382569395005703], [-0.03990752622485161, -0.35987693071365356, -0.041334766894578934, 0.24135488271713257], [-0.04710506275296211, -0.5543848276138306, -0.03650766611099243, 0.520718514919281], [-0.05819275975227356, -0.3587684631347656, -0.026093296706676483, 0.21675866842269897], [-0.06536813080310822, -0.16328340768814087, -0.021758124232292175, -0.08403967320919037], [-0.0686337947845459, -0.35808682441711426, -0.023438917472958565, 0.201699897646904], [-0.07579553127288818, -0.1626376211643219, -0.01940491981804371, -0.09828377515077591], [-0.0790482833981514, 0.0327569916844368, -0.021370595321059227, -0.3970251977443695], [-0.07839314639568329, -0.1620553433895111, -0.029311098158359528, -0.11115589737892151], [-0.08163425326347351, -0.35674530267715454, -0.03153421729803085, 0.17213734984397888], [-0.08876916021108627, -0.16118653118610382, -0.028091469779610634, -0.13032448291778564], [-0.09199289232492447, -0.3558950424194336, -0.030697960406541824, 0.15336525440216064], [-0.09911078959703445, -0.16034729778766632, -0.027630655094981194, -0.1488419473171234], [-0.10231773555278778, -0.35506290197372437, -0.030607493594288826, 0.13499760627746582], [-0.10941899567842484, -0.5497334003448486, -0.027907541021704674, 0.41786935925483704], [-0.12041366100311279, -0.7444489598274231, -0.019550153985619545, 0.7016252279281616], [-0.13530264794826508, -0.5490615367889404, -0.005517648998647928, 0.40285277366638184], [-0.14628387987613678, -0.74410480260849, 0.002539406530559063, 0.6937910318374634], [-0.1611659675836563, -0.9392619132995605, 0.016415227204561234, 0.987272322177887], [-0.17995120584964752, -0.74436354637146, 0.0361606739461422, 0.6997900009155273], [-0.1948384791612625, -0.5497611165046692, 0.050156474113464355, 0.4187060594558716], [-0.20583370327949524, -0.3553844392299652, 0.058530595153570175, 0.14224755764007568], [-0.21294139325618744, -0.16114746034145355, 0.06137554720044136, -0.13141080737113953], [-0.21616433560848236, 0.033044058829545975, 0.05874732881784439, -0.40411654114723206], [-0.21550345420837402, -0.162859708070755, 0.0506649985909462, -0.09350604563951492], [-0.2187606543302536, -0.35866984724998474, 0.04879487678408623, 0.2147214114665985], [-0.22593404352664948, -0.16427822411060333, 0.05308930575847626, -0.062178969383239746], [-0.22921961545944214, 0.030043942853808403, 0.0518457256257534, -0.3376506268978119], [-0.22861874103546143, -0.16577596962451935, 0.04509271681308746, -0.029079606756567955], [-0.23193424940109253, 0.028671281412243843, 0.04451112449169159, -0.30720123648643494], [-0.23136082291603088, -0.16705572605133057, 0.038367096334695816, -0.0008195670670829713], [-0.2347019463777542, 0.027495577931404114, 0.038350705057382584, -0.281154602766037], [-0.23415203392505646, -0.1681518405675888, 0.03272761404514313, 0.0233730748295784], [-0.23751506209373474, 0.026485854759812355, 0.033195074647665024, -0.25880691409111023], [-0.23698535561561584, -0.16909387707710266, 0.02801893837749958, 0.04415862262248993], [-0.24036723375320435, -0.36460617184638977, 0.02890210971236229, 0.34554845094680786], [-0.2476593554019928, -0.16990701854228973, 0.03581307828426361, 0.062117721885442734], [-0.251057505607605, 0.024683639407157898, 0.03705543279647827, -0.21905431151390076], [-0.2505638301372528, -0.1709478795528412, 0.03267434611916542, 0.08508332073688507], [-0.2539827823638916, 0.02369084395468235, 0.03437601402401924, -0.19711437821388245], [-0.25350895524024963, 0.21830466389656067, 0.03043372556567192, -0.4787580668926239], [-0.2491428703069687, 0.02276656962931156, 0.020858565345406532, -0.17664062976837158], [-0.2486875355243683, -0.17264758050441742, 0.0173257514834404, 0.12254881113767624], [-0.25214049220085144, 0.022221915423870087, 0.019776728004217148, -0.16461804509162903], [-0.25169605016708374, -0.17317748069763184, 0.016484366729855537, 0.13423770666122437], [-0.2551595866680145, 0.021704524755477905, 0.019169121980667114, -0.15319938957691193], [-0.25472551584243774, -0.17368657886981964, 0.016105134040117264, 0.1454687863588333], [-0.2581992447376251, -0.36903542280197144, 0.0190145093947649, 0.44318875670433044], [-0.2655799388885498, -0.5644211769104004, 0.027878284454345703, 0.7418043613433838], [-0.27686837315559387, -0.36969494819641113, 0.04271437227725983, 0.45802366733551025], [-0.2842622697353363, -0.17520205676555634, 0.05187484622001648, 0.17910462617874146], [-0.28776630759239197, 0.019140657037496567, 0.05545693635940552, -0.0967729389667511], [-0.287383496761322, 0.21342574059963226, 0.05352148041129112, -0.3714565634727478], [-0.2831149995326996, 0.017585882917046547, 0.04609234631061554, -0.06238961219787598], [-0.28276327252388, 0.2120177149772644, 0.04484455659985542, -0.34018126130104065], [-0.27852290868759155, 0.406473845243454, 0.03804093226790428, -0.6183923482894897], [-0.270393431186676, 0.21084176003932953, 0.02567308396100998, -0.31397515535354614], [-0.26617661118507385, 0.015363674610853195, 0.01939358003437519, -0.013307605870068073], [-0.2658693194389343, 0.2102022022008896, 0.01912742853164673, -0.2998090982437134], [-0.2616652846336365, 0.014812912791967392, 0.013131246902048588, -0.0011556398821994662], [-0.2613690197467804, -0.18049487471580505, 0.013108134269714355, 0.2956412732601166], [-0.26497891545295715, 0.014437776058912277, 0.019020959734916687, 0.007121084723621607], [-0.2646901607513428, 0.20928184688091278, 0.019163381308317184, -0.2795003354549408], [-0.2605045437812805, 0.40412527322769165, 0.013573373667895794, -0.5660781264305115], [-0.252422034740448, 0.599054217338562, 0.002251812256872654, -0.8544541001319885], [-0.24044093489646912, 0.403901606798172, -0.01483726967126131, -0.5610639452934265], [-0.23236291110515594, 0.20899100601673126, -0.02605854906141758, -0.27309221029281616], [-0.2281830906867981, 0.4044749140739441, -0.03152039274573326, -0.5738788843154907], [-0.22009359300136566, 0.20980872213840485, -0.042997971177101135, -0.2912901043891907], [-0.21589741110801697, 0.40551653504371643, -0.048823773860931396, -0.5972180366516113], [-0.20778708159923553, 0.21111059188842773, -0.06076813116669655, -0.3203050494194031], [-0.2035648673772812, 0.4070429503917694, -0.06717423349618912, -0.6315159201622009], [-0.19542402029037476, 0.21291935443878174, -0.07980455458164215, -0.3607216477394104], [-0.19116562604904175, 0.019017115235328674, -0.08701898902654648, -0.09423163533210754], [-0.19078528881072998, 0.21527153253555298, -0.08890362083911896, -0.41305071115493774], [-0.186479851603508, 0.02151486836373806, -0.09716463088989258, -0.14966675639152527], [-0.18604955077171326, -0.17209115624427795, -0.1001579686999321, 0.11085100471973419], [-0.1894913762807846, 0.024312743917107582, -0.09794094413518906, -0.21167561411857605], [-0.18900512158870697, 0.22068868577480316, -0.10217446088790894, -0.533576488494873], [-0.1845913529396057, 0.41708794236183167, -0.11284598708152771, -0.856626033782959], [-0.17624959349632263, 0.22366951406002045, -0.1299785077571869, -0.6014500260353088], [-0.1717762053012848, 0.030582325533032417, -0.142007514834404, -0.35236856341362], [-0.17116455733776093, -0.16226479411125183, -0.1490548849105835, -0.1076197475194931], [-0.17440985143184662, 0.034643881022930145, -0.15120728313922882, -0.44336777925491333], [-0.1737169772386551, 0.23154567182064056, -0.1600746363401413, -0.7796362042427063], [-0.1690860539674759, 0.038943927735090256, -0.17566736042499542, -0.5412883162498474], [-0.16830718517303467, -0.153330460190773, -0.1864931285381317, -0.30869632959365845], [-0.17137378454208374, -0.34537357091903687, -0.19266705214977264, -0.08013828843832016], [-0.1782812625169754, -0.148086816072464, -0.1942698210477829, -0.4268871545791626], [-0.18124300241470337, -0.34000322222709656, -0.20280756056308746, -0.20118454098701477], [-0.18804305791854858, -0.5317344665527344, -0.20683124661445618, 0.021300548687577248], [-0.19867774844169617, -0.7233827710151672, -0.20640523731708527, 0.24227015674114227], [-0.2131454050540924, -0.9150506258010864, -0.20155984163284302, 0.4634162187576294], [-0.23144641518592834, -0.7177362442016602, -0.1922915130853653, 0.11457832157611847], [-0.2458011507987976, -0.9096574783325195, -0.18999993801116943, 0.3409682512283325], [-0.2639943063259125, -0.7124119400978088, -0.18318058550357819, -0.005100148729979992], [-0.2782425284385681, -0.515200138092041, -0.18328258395195007, -0.34952306747436523], [-0.28854653239250183, -0.7073068022727966, -0.19027304649353027, -0.11977343261241913], [-0.3026926815509796, -0.5100404024124146, -0.19266851246356964, -0.46593618392944336], [-0.31289348006248474, -0.7019926905632019, -0.20198723673820496, -0.23963013291358948], [-0.3269333243370056, -0.8937425017356873, -0.2067798376083374, -0.016834061592817307], [-0.3448081910610199, -1.0853917598724365, -0.2071165144443512, 0.20415474474430084], [-0.36651602387428284, -0.8880027532577515, -0.2030334323644638, -0.14605861902236938], [-0.38427606225013733, -1.0797260999679565, -0.20595459640026093, 0.07633663713932037], [-0.40587058663368225, -0.8823384642601013, -0.20442786812782288, -0.2736109793186188], [-0.4235173761844635, -0.6849756836891174, -0.20990008115768433, -0.6231747269630432], [0.019828911870718002, -0.18554188311100006, 0.04130714014172554, 0.3478529453277588], [0.01611807569861412, 0.00896893534809351, 0.04826420173048973, 0.06847642362117767], [0.01629745401442051, 0.20336689054965973, 0.049633730202913284, -0.20859678089618683], [0.02036479115486145, 0.007571661379188299, 0.04546179249882698, 0.09932070970535278], [0.020516224205493927, 0.20201358199119568, 0.047448206692934036, -0.17867964506149292], [0.024556497111916542, 0.006245869677513838, 0.04387461394071579, 0.12858594954013824], [0.024681413546204567, 0.20071274042129517, 0.046446334570646286, -0.14993862807750702], [0.028695669025182724, 0.004957529716193676, 0.04344756156206131, 0.15702782571315765], [0.028794819489121437, -0.19075867533683777, 0.046588119119405746, 0.46309465169906616], [0.024979645386338234, -0.3865070044994354, 0.055850010365247726, 0.7700905203819275], [0.01724950596690178, -0.19219635426998138, 0.07125181704759598, 0.4954903721809387], [0.013405578210949898, 0.0018522836035117507, 0.08116162568330765, 0.22608627378940582], [0.013442624360322952, 0.1957261711359024, 0.08568335324525833, -0.03993193432688713], [0.017357148230075836, -0.0005133108352310956, 0.08488471806049347, 0.2785075008869171], [0.017346881330013275, 0.19330158829689026, 0.09045486152172089, 0.013758056797087193], [0.02121291309595108, -0.002993339905515313, 0.09073002636432648, 0.3335541784763336], [0.021153045818209648, -0.19928161799907684, 0.09740111231803894, 0.6534135937690735], [0.017167413607239723, -0.005641214083880186, 0.11046937853097916, 0.3929203450679779], [0.017054589465260506, -0.20214323699474335, 0.1183277890086174, 0.7182887196540833], [0.013011724688112736, -0.39868655800819397, 0.1326935589313507, 1.0457494258880615], [0.005037993658334017, -0.5952962636947632, 0.1536085456609726, 1.3769689798355103], [-0.00686793215572834, -0.4023902118206024, 0.18114793300628662, 1.1360005140304565], [-0.014915736392140388, -0.21003973484039307, 0.20386794209480286, 0.9051624536514282], [-0.019116532057523727, -0.01817481964826584, 0.22197118401527405, 0.6828479766845703], [0.028006181120872498, -0.22415034472942352, 0.021999841555953026, 0.3397245407104492], [0.023523174226284027, -0.02934822253882885, 0.02879433147609234, 0.05405949428677559], [0.02293621003627777, 0.16534927487373352, 0.02987552247941494, -0.2294013351202011], [0.026243194937705994, -0.030186578631401062, 0.02528749592602253, 0.07255366444587708], [0.02563946321606636, -0.2256617546081543, 0.026738569140434265, 0.3731064200401306], [0.02112622931599617, -0.030929649248719215, 0.034200698137283325, 0.08897287398576736], [0.020507635548710823, 0.16368581354618073, 0.03598015382885933, -0.19272655248641968], [0.02378135174512863, 0.35827508568763733, 0.032125622034072876, -0.4738456606864929], [0.030946852639317513, 0.16271451115608215, 0.022648710757493973, -0.17121286690235138], [0.03420114517211914, -0.03272416070103645, 0.01922445371747017, 0.12852810323238373], [0.03354666009545326, 0.16211719810962677, 0.021795015782117844, -0.1580282747745514], [0.036789003759622574, -0.03330991044640541, 0.018634449690580368, 0.14144998788833618], [0.03612280637025833, 0.16154026985168457, 0.02146345004439354, -0.14529633522033691], [0.039353612810373306, 0.3563483655452728, 0.01855752244591713, -0.43113142251968384], [0.04648057743906975, 0.5512027144432068, 0.009934894740581512, -0.7179069519042969], [0.05750463157892227, 0.3559446930885315, -0.00442324485629797, -0.4221135973930359], [0.06462352722883224, 0.16088567674160004, -0.012865517288446426, -0.1308283805847168], [0.06784123927354813, -0.034049633890390396, -0.015482084825634956, 0.15776804089546204], [0.06716024875640869, -0.2289465367794037, -0.012326723895967007, 0.4455268085002899], [0.06258131563663483, -0.03365238755941391, -0.003416187595576048, 0.14898386597633362], [0.06190826743841171, -0.22872525453567505, -0.0004365102213341743, 0.4405871033668518], [0.05733376368880272, -0.033597126603126526, 0.008375232107937336, 0.1477666050195694], [0.05666182190179825, 0.16140389442443848, 0.011330563575029373, -0.14226238429546356], [0.05988990142941475, -0.03387847915291786, 0.008485316298902035, 0.15397348999977112], [0.0592123307287693, -0.2291208952665329, 0.011564786545932293, 0.4493212401866913], [0.05462991073727608, -0.424404501914978, 0.020551210269331932, 0.7456269860267639], [0.04614182189106941, -0.22957207262516022, 0.03546375036239624, 0.45948171615600586], [0.04155037924647331, -0.034968893975019455, 0.04465338587760925, 0.1781846582889557], [0.04085100442171097, -0.23070046305656433, 0.04821707680821419, 0.4846130907535553], [0.036236993968486786, -0.42646852135658264, 0.05790933966636658, 0.7920942306518555], [0.027707623317837715, -0.62233567237854, 0.07375122606754303, 1.102418303489685], [0.015260908752679825, -0.4282573461532593, 0.09579958766698837, 0.833755373954773], [0.006695762276649475, -0.23456571996212006, 0.1124747022986412, 0.5726721286773682], [0.0020044478587806225, -0.43107011914253235, 0.12392814457416534, 0.8985641598701477], [-0.006616954226046801, -0.23782600462436676, 0.14189942181110382, 0.6472627520561218], [-0.011373474262654781, -0.04493637755513191, 0.15484468638896942, 0.4024149179458618], [-0.012272202409803867, 0.1476893126964569, 0.16289298236370087, 0.162276029586792], [-0.009318416006863117, 0.34015005826950073, 0.16613849997520447, -0.07491441816091537], [-0.0025154149625450373, 0.14308428764343262, 0.16464020311832428, 0.2652343511581421], [0.00034627088462002575, 0.33552050590515137, 0.1699448972940445, 0.028669238090515137], [0.007056680973619223, 0.5278494358062744, 0.17051827907562256, -0.20594452321529388], [0.017613669857382774, 0.7201748490333557, 0.16639938950538635, -0.44035887718200684], [0.032017167657613754, 0.5231371521949768, 0.15759220719337463, -0.1001887246966362], [0.04247990995645523, 0.3261488676071167, 0.15558843314647675, 0.2377726435661316], [0.049002885818481445, 0.1291860193014145, 0.16034388542175293, 0.5752067565917969], [0.051586609333753586, -0.06777738034725189, 0.17184802889823914, 0.913801372051239], [0.05023105815052986, 0.1246558204293251, 0.190124049782753, 0.6796783208847046], [0.05272417515516281, 0.31669968366622925, 0.20371761918067932, 0.4523635804653168], [0.05905817076563835, 0.11936765164136887, 0.2127648890018463, 0.8017203211784363], [-0.011287236586213112, 0.20552754402160645, -0.0037661001551896334, -0.3253723382949829], [-0.007176685146987438, 0.40070292353630066, -0.010273546911776066, -0.6192405223846436], [0.0008373729651793838, 0.5959668159484863, -0.02265835739672184, -0.9151413440704346], [0.012756709940731525, 0.7913877964019775, -0.04096118360757828, -1.2148585319519043], [0.028584465384483337, 0.987013578414917, -0.06525835394859314, -1.5200902223587036], [0.04832473769783974, 0.7927383184432983, -0.09566015750169754, -1.2484699487686157], [0.06417950242757797, 0.5989639759063721, -0.12062955647706985, -0.9872186779975891], [0.0761587843298912, 0.7954765558242798, -0.14037393033504486, -1.3152246475219727], [0.09206831455230713, 0.6023819446563721, -0.16667842864990234, -1.0695661306381226], [0.10411595553159714, 0.40980905294418335, -0.18806974589824677, -0.8334869146347046], [0.11231213063001633, 0.606934130191803, -0.20473948121070862, -1.1789277791976929], [0.12445081770420074, 0.4149719774723053, -0.22831803560256958, -0.9567723274230957]], "action_prob": [0.5002281069755554, 0.3757462799549103, 0.656010627746582, 0.3640094995498657, 0.6576133370399475, 0.6472514867782593, 0.5814530849456787, 0.4562465250492096, 0.37465140223503113, 0.6471850872039795, 0.6192896962165833, 0.5048933029174805, 0.6251847147941589, 0.5156940221786499, 0.39904704689979553, 0.6444008946418762, 0.5954406261444092, 0.460654616355896, 0.6416015028953552, 0.5530345439910889, 0.4217703938484192, 0.6400404572486877, 0.5742996335029602, 0.5662726759910583, 0.5696461200714111, 0.4288467764854431, 0.6496936082839966, 0.5801631212234497, 0.5547298192977905, 0.5871953368186951, 0.5469850897789001, 0.5938063263893127, 0.4610746204853058, 0.37133607268333435, 0.6516311764717102, 0.36916008591651917, 0.3469003736972809, 0.649616003036499, 0.6552542448043823, 0.64424729347229, 0.583619236946106, 0.4585525691509247, 0.6301906108856201, 0.5244782567024231, 0.6098766326904297, 0.49543526768684387, 0.613892138004303, 0.5115198493003845, 0.6059083342552185, 0.5252520442008972, 0.5982089042663574, 0.5368890762329102, 0.5909147262573242, 0.4532613158226013, 0.6405285596847534, 0.5600965619087219, 0.5714625716209412, 0.5707225799560547, 0.4382241666316986, 0.6361805200576782, 0.5569897890090942, 0.582994818687439, 0.5509675145149231, 0.5881652235984802, 0.5449367165565491, 0.4069112539291382, 0.3468663692474365, 0.6568717360496521, 0.6572035551071167, 0.6176112294197083, 0.5036683082580566, 0.6060689091682434, 0.5188369750976562, 0.40127086639404297, 0.6429276466369629, 0.5958595871925354, 0.5339517593383789, 0.5930008292198181, 0.46227607131004333, 0.6391919255256653, 0.5448004007339478, 0.4144742488861084, 0.3585345149040222, 0.6479291319847107, 0.6444877982139587, 0.40137407183647156, 0.6472750902175903, 0.3900865912437439, 0.6501611471176147, 0.3771383762359619, 0.6526119112968445, 0.6359414458274841, 0.43985825777053833, 0.6456641554832458, 0.5895959734916687, 0.5296134352684021, 0.38715875148773193, 0.3435004651546478, 0.6499144434928894, 0.6595808863639832, 0.6533762812614441, 0.3974989950656891, 0.3374825119972229, 0.6560871601104736, 0.6670969724655151, 0.6611931920051575, 0.3856998682022095, 0.6717017292976379, 0.6509827971458435, 0.5835831761360168, 0.48473668098449707, 0.5931963920593262, 0.5395475625991821, 0.5554931163787842, 0.41225889325141907, 0.6711191534996033, 0.37183094024658203, 0.6802102327346802, 0.6575329303741455, 0.5975621342658997, 0.48882395029067993, 0.6340986490249634, 0.4390694499015808, 0.34070611000061035, 0.46734920144081116, 0.6357464790344238, 0.5500560998916626, 0.5807037949562073, 0.5644313097000122, 0.5683937072753906, 0.5774888396263123, 0.5552527904510498, 0.41048750281333923, 0.34854474663734436, 0.6521111130714417, 0.6561735272407532, 0.6252639889717102, 0.4784442186355591, 0.6388840675354004, 0.44757235050201416, 0.3503064811229706, 0.6591807007789612, 0.34061846137046814, 0.3420429825782776, 0.36148715019226074, 0.6185347437858582, 0.6327099800109863, 0.6496976017951965, 0.4810437858104706, 0.628071129322052, 0.5302377939224243, 0.5986358523368835, 0.46121835708618164, 0.635817289352417, 0.5515031218528748, 0.4182555079460144, 0.6446731090545654, 0.5775406360626221, 0.5647422671318054, 0.572062075138092, 0.5704732537269592, 0.43357062339782715, 0.35837140679359436, 0.6538089513778687, 0.6442266702651978, 0.57425457239151, 0.43692222237586975, 0.6394822001457214, 0.43650227785110474, 0.6406037211418152, 0.5674971342086792, 0.5708653330802917, 0.4298318028450012, 0.35664668679237366, 0.6512136459350586, 0.6477658152580261, 0.40597230195999146, 0.348602294921875, 0.3490029275417328, 0.6364803910255432, 0.6499803066253662, 0.3402079939842224, 0.6469824910163879, 0.6602568030357361, 0.6638116240501404, 0.6349578499794006, 0.45279625058174133, 0.6571599841117859, 0.5979532599449158, 0.49043604731559753, 0.5975401401519775, 0.4610905051231384, 0.34458842873573303, 0.3271649181842804, 0.6526799201965332, 0.6712837219238281, 0.3193589448928833, 0.47770318388938904, 0.3703869879245758, 0.3454503118991852, 0.3520021438598633, 0.365538626909256, 0.6207409501075745, 0.6315907835960388, 0.3556399643421173, 0.6267839074134827, 0.6391270756721497, 0.34658825397491455, 0.6318305134773254], "advantages": [60.72389221191406, 60.66328048706055, 60.99504089355469, 60.598114013671875, 61.051025390625, 60.71316909790039, 60.5842170715332, 60.7015380859375, 61.042335510253906, 61.511417388916016, 60.54703140258789, 59.94383239746094, 59.80701446533203, 59.72380447387695, 59.88307189941406, 60.196651458740234, 59.246788024902344, 58.671844482421875, 58.55543518066406, 58.330509185791016, 58.3529167175293, 58.54679870605469, 57.60700225830078, 57.04682540893555, 56.95479965209961, 56.394615173339844, 56.27852249145508, 55.940738677978516, 55.84644317626953, 55.3497314453125, 55.231201171875, 54.74821090698242, 54.6088981628418, 54.65179443359375, 54.75383758544922, 53.533843994140625, 53.56486892700195, 53.56072998046875, 52.04449462890625, 50.589813232421875, 49.35211944580078, 48.4455680847168, 47.909271240234375, 47.229610443115234, 46.852577209472656, 45.91050338745117, 45.332603454589844, 44.72040939331055, 44.13453674316406, 43.56056213378906, 42.96404266357422, 42.419761657714844, 41.81092071533203, 41.289268493652344, 41.04732894897461, 40.03212356567383, 39.360198974609375, 38.84665298461914, 38.15516662597656, 37.79296875, 37.06317901611328, 36.59542465209961, 35.89445495605469, 35.42726516723633, 34.707916259765625, 34.2393798828125, 34.02328109741211, 33.99623107910156, 32.569759368896484, 31.416717529296875, 30.55734634399414, 29.974000930786133, 29.233243942260742, 28.63656234741211, 28.291940689086914, 27.397480010986328, 26.711599349975586, 26.116724014282227, 25.43666648864746, 24.982627868652344, 24.0703182220459, 23.43453598022461, 23.05953025817871, 22.934560775756836, 21.94058609008789, 21.099855422973633, 20.841651916503906, 20.01386070251465, 19.831546783447266, 19.02243995666504, 18.94411849975586, 18.16777992248535, 17.585559844970703, 17.344776153564453, 16.773778915405273, 16.436988830566406, 15.941475868225098, 15.92793083190918, 16.30059051513672, 15.775496482849121, 15.421213150024414, 15.271303176879883, 15.365471839904785, 15.821749687194824, 15.808418273925781, 15.938702583312988, 16.164302825927734, 16.30706214904785, 16.560752868652344, 16.75804901123047, 16.79305648803711, 16.58841896057129, 16.340988159179688, 15.987200736999512, 15.708213806152344, 15.404845237731934, 15.10168170928955, 14.719586372375488, 14.382893562316895, 13.857146263122559, 13.140963554382324, 12.691981315612793, 11.93160629272461, 11.38129711151123, 10.350178718566895, 9.692676544189453, 8.52286434173584, 7.651627540588379, 6.743772029876709, 5.841731071472168, 4.942955017089844, 4.00895881652832, 3.1150107383728027, 2.447056770324707, 1.9748774766921997, 0.39810141921043396, -0.9176886677742004, -2.0013623237609863, -2.9144132137298584, -4.032312393188477, -4.9383134841918945, -5.6704277992248535, -7.041413307189941, -7.7955098152160645, -8.412930488586426, -8.929671287536621, -10.702926635742188, -12.246440887451172, 28.483442306518555, 28.050106048583984, 27.051427841186523, 26.39740753173828, 25.687114715576172, 25.240577697753906, 24.189550399780273, 23.466089248657227, 23.051008224487305, 22.11627960205078, 21.423154830932617, 20.6787166595459, 19.98235511779785, 19.215211868286133, 18.75811767578125, 18.589101791381836, 17.51765251159668, 16.632566452026367, 15.974979400634766, 15.552529335021973, 14.433459281921387, 13.967504501342773, 12.814848899841309, 11.995081901550293, 11.236915588378906, 10.71856689453125, 10.399914741516113, 8.846254348754883, 7.585697174072266, 6.985454082489014, 6.5823163986206055, 6.301540374755859, 4.438974380493164, 2.8218579292297363, 2.322993278503418, 0.7169943451881409, -0.6469044089317322, -1.8167709112167358, -2.8455872535705566, -3.8108346462249756, -4.862460136413574, -5.825263023376465, -6.719231128692627, -7.8245439529418945, -8.832175254821777, -9.75698471069336, -10.603126525878906, -11.814775466918945, -12.936944007873535, 1.0639883279800415, 0.33925291895866394, -0.03392111510038376, -0.10779488831758499, 0.03385394066572189, 0.2862401604652405, -0.5855574011802673, -1.3702924251556396, -0.9170553088188171, -1.3283065557479858, -1.5711567401885986, -1.0936250686645508], "value_targets": [71.24163818359375, 70.9511489868164, 70.65773010253906, 70.36134338378906, 70.06195831298828, 69.75955963134766, 69.45409393310547, 69.14555358886719, 68.83389282226562, 68.51908111572266, 68.20109558105469, 67.87989044189453, 67.55545043945312, 67.22772216796875, 66.89669036865234, 66.56231689453125, 66.22456359863281, 65.88339233398438, 65.53878021240234, 65.19068908691406, 64.83908081054688, 64.48391723632812, 64.12516784667969, 63.76279830932617, 63.396766662597656, 63.027034759521484, 62.65357208251953, 62.276336669921875, 61.895286560058594, 61.51039123535156, 61.12160873413086, 60.72889709472656, 60.332218170166016, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 1455381298, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 647576592, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842, 1135918842], "obs": [[-0.0022034686990082264, 0.04372185468673706, 0.04442373663187027, 0.019768986850976944], [-0.001329031540080905, -0.15200810134410858, 0.04481911659240723, 0.32613053917884827], [-0.004369193688035011, 0.042448028922080994, 0.05134172737598419, 0.04791167750954628], [-0.00352023309096694, 0.23679761588573456, 0.05229995772242546, -0.228140726685524], [0.001215719268657267, 0.04096879065036774, 0.04773714393377304, 0.0805700495839119], [0.0020350951235741377, 0.2353750765323639, 0.04934854432940483, -0.1966777890920639], [0.006742596626281738, 0.03958325833082199, 0.045414991676807404, 0.11115498840808868], [0.007534261792898178, 0.2340260148048401, 0.04763808846473694, -0.16686099767684937], [0.01221478171646595, 0.03825566917657852, 0.0443008691072464, 0.14046166837215424], [0.012979894876480103, -0.15747185051441193, 0.04711010307073593, 0.4467850923538208], [0.009830458089709282, 0.036953095346689224, 0.05604580417275429, 0.16931650042533875], [0.01056952029466629, 0.23122991621494293, 0.05943213403224945, -0.10517232120037079], [0.015194118022918701, 0.035308837890625, 0.057328689843416214, 0.20565317571163177], [0.015900295227766037, 0.22956611216068268, 0.061441753059625626, -0.06840862333774567], [0.020491616800427437, 0.03361955285072327, 0.06007358059287071, 0.24300912022590637], [0.02116400934755802, -0.1623067408800125, 0.06493376195430756, 0.5540194511413574], [0.017917873337864876, 0.03184619918465614, 0.07601415365934372, 0.2824808955192566], [0.018554797396063805, 0.22580625116825104, 0.08166376501321793, 0.014707585796713829], [0.0230709221214056, 0.02961386740207672, 0.08195792138576508, 0.3319978713989258], [0.023663200438022614, -0.16657321155071259, 0.08859787881374359, 0.6493593454360962], [0.020331736654043198, 0.027210144326090813, 0.10158506780862808, 0.385838121175766], [0.02087593823671341, 0.22075431048870087, 0.10930182784795761, 0.1268332302570343], [0.025291025638580322, 0.02425006963312626, 0.11183848977088928, 0.4519014060497284], [0.025776026770472527, 0.2176274210214615, 0.12087652087211609, 0.19645956158638], [0.03012857399880886, 0.021002497524023056, 0.12480571120977402, 0.5246961116790771], [0.03054862469434738, 0.2141675055027008, 0.13529963791370392, 0.27379998564720154], [0.034831974655389786, 0.01740056835114956, 0.1407756358385086, 0.6059098243713379], [0.0351799875497818, 0.21030253171920776, 0.1528938263654709, 0.360670804977417], [0.03938603773713112, 0.40295812487602234, 0.16010724008083344, 0.11983439326286316], [0.04744520038366318, 0.5954671502113342, 0.1625039279460907, -0.11836525797843933], [0.059354543685913086, 0.7879329919815063, 0.1601366251707077, -0.3556942641735077], [0.0751131996512413, 0.5909396409988403, 0.15302273631095886, -0.01710572838783264], [0.0869319960474968, 0.7835736870765686, 0.1526806354522705, -0.2578670382499695], [0.1026034727692604, 0.9762236475944519, 0.14752328395843506, -0.4987664222717285], [0.1221279427409172, 1.1689914464950562, 0.13754795491695404, -0.7415626049041748], [0.14550776779651642, 0.9722657799720764, 0.12271670997142792, -0.40894952416419983], [0.1649530827999115, 0.7756370902061462, 0.11453771591186523, -0.0802362710237503], [0.18046583235263824, 0.5790753960609436, 0.11293299496173859, 0.24627487361431122], [0.1920473426580429, 0.7724184393882751, 0.11785849183797836, -0.008760517463088036], [0.20749570429325104, 0.9656702280044556, 0.1176832765340805, -0.26205700635910034], [0.22680911421775818, 1.1589329242706299, 0.11244213581085205, -0.5154268145561218], [0.24998776614665985, 1.3523067235946655, 0.1021336019039154, -0.770667552947998], [0.27703389525413513, 1.1559386253356934, 0.08672025054693222, -0.4476752281188965], [0.3001526892185211, 1.3497337102890015, 0.07776674628257751, -0.7118116021156311], [0.32714736461639404, 1.1536259651184082, 0.06353051215410233, -0.3956986665725708], [0.35021987557411194, 0.9576628804206848, 0.05561654269695282, -0.08368155360221863], [0.3693731129169464, 0.7617895603179932, 0.05394291132688522, 0.22601689398288727], [0.3846089243888855, 0.9561007618904114, 0.05846324935555458, -0.04917440935969353], [0.40373092889785767, 1.150337815284729, 0.05747976154088974, -0.32285377383232117], [0.4267376959323883, 0.9544464945793152, 0.05102268606424332, -0.012612294405698776], [0.44582661986351013, 1.1488009691238403, 0.050770439207553864, -0.28877049684524536], [0.46880263090133667, 1.3431636095046997, 0.0449950285255909, -0.5650185942649841], [0.49566590785980225, 1.1474401950836182, 0.03369465842843056, -0.25850656628608704], [0.5186147093772888, 0.9518537521362305, 0.028524525463581085, 0.044610824435949326], [0.537651777267456, 1.1465553045272827, 0.02941674180328846, -0.2389376312494278], [0.5605828762054443, 1.3412449359893799, 0.024637989699840546, -0.5221984386444092], [0.5874077677726746, 1.5360115766525269, 0.014194021001458168, -0.807016909122467], [0.6181280016899109, 1.340698003768921, -0.0019463177304714918, -0.5099031329154968], [0.6449419856071472, 1.1456035375595093, -0.012144381180405617, -0.2178342193365097], [0.6678540706634521, 0.950657308101654, -0.016501065343618393, 0.07099325209856033], [0.6868671774864197, 0.7557757496833801, -0.015081199817359447, 0.35842466354370117], [0.7019827365875244, 0.560871422290802, -0.007912706583738327, 0.646314263343811], [0.7132001519203186, 0.7561027407646179, 0.005013578105717897, 0.35115012526512146], [0.7283222079277039, 0.9511529803276062, 0.012036580592393875, 0.060052357614040375], [0.7473452687263489, 0.7558605670928955, 0.013237628154456615, 0.3565084636211395], [0.7624624967575073, 0.9507918357849121, 0.02036779746413231, 0.06802893429994583], [0.7814782857894897, 0.7553839087486267, 0.021728375926613808, 0.36706778407096863], [0.7965859770774841, 0.5599600076675415, 0.02906973287463188, 0.6665220260620117], [0.8077852129936218, 0.36444607377052307, 0.04240017384290695, 0.9682143330574036], [0.81507408618927, 0.5589738488197327, 0.06176446005702019, 0.6891468167304993], [0.8262535929679871, 0.3630515933036804, 0.07554739713668823, 1.0006170272827148], [0.8335146307945251, 0.5570870637893677, 0.0955597385764122, 0.7325838208198547], [0.8446563482284546, 0.7507678270339966, 0.11021140962839127, 0.47144001722335815], [0.8596717119216919, 0.944174587726593, 0.11964021623134613, 0.21542657911777496], [0.8785552382469177, 0.7475634813308716, 0.12394874542951584, 0.5433254241943359], [0.8935064673423767, 0.9407455325126648, 0.1348152458667755, 0.29212313890457153], [0.9123213887214661, 1.1337134838104248, 0.1406577229499817, 0.044813357293605804], [0.9349956512451172, 1.3265676498413086, 0.14155398309230804, -0.20039376616477966], [0.9615269899368286, 1.5194112062454224, 0.137546107172966, -0.445287823677063], [0.991915225982666, 1.7123464345932007, 0.12864035367965698, -0.6916462182998657], [1.0261621475219727, 1.5156965255737305, 0.11480742692947388, -0.36139267683029175], [1.05647611618042, 1.7090153694152832, 0.10757957398891449, -0.6157826781272888], [1.0906563997268677, 1.9024828672409058, 0.09526392072439194, -0.8727388381958008], [1.1287060976028442, 2.096189260482788, 0.07780914008617401, -1.1340157985687256], [1.170629858970642, 1.9001401662826538, 0.055128827691078186, -0.8179789781570435], [1.2086327075958252, 2.094465970993042, 0.03876924887299538, -1.0928250551223755], [1.2505220174789429, 1.8988550901412964, 0.01691274531185627, -0.7882341146469116], [1.288499116897583, 2.093740701675415, 0.0011480634566396475, -1.0755486488342285], [1.3303738832473755, 1.8986036777496338, -0.020362909883260727, -0.7825056314468384], [1.3683459758758545, 1.7037674188613892, -0.03601302206516266, -0.4962981343269348], [1.4024213552474976, 1.8993781805038452, -0.04593898355960846, -0.8001096248626709], [1.4404088258743286, 2.0950992107391357, -0.061941176652908325, -1.1068826913833618], [1.4823108911514282, 1.9008437395095825, -0.0840788334608078, -0.8342573642730713], [1.5203276872634888, 1.7069649696350098, -0.10076397657394409, -0.5691565871238708], [1.5544670820236206, 1.903344988822937, -0.11214710772037506, -0.8918070793151855], [1.5925339460372925, 1.709908366203308, -0.12998324632644653, -0.6363770365715027], [1.6267321109771729, 1.5168159008026123, -0.14271079003810883, -0.3872891068458557], [1.6570683717727661, 1.3239774703979492, -0.15045657753944397, -0.1427868753671646], [1.6835479736328125, 1.1312947273254395, -0.1533123105764389, 0.09890465438365936], [1.7061738967895508, 0.938664436340332, -0.15133421123027802, 0.3395634591579437], [1.7249470949172974, 0.7459833025932312, -0.14454294741153717, 0.5809592008590698], [1.739866852760315, 0.5531508922576904, -0.13292376697063446, 0.8248437643051147], [1.750929832458496, 0.7498160600662231, -0.11642688512802124, 0.49348366260528564], [1.7659261226654053, 0.5565120577812195, -0.1065572127699852, 0.7473244667053223], [1.777056336402893, 0.7529301047325134, -0.09161072969436646, 0.4230998456478119], [1.7921149730682373, 0.9492223858833313, -0.08314872533082962, 0.10300023853778839], [1.8110994100570679, 0.7553843855857849, -0.08108872175216675, 0.36833512783050537], [1.826207160949707, 0.5615026354789734, -0.07372201979160309, 0.6343882083892822], [1.8374371528625488, 0.3674822449684143, -0.06103425845503807, 0.9029736518859863], [1.8447868824005127, 0.5633754730224609, -0.04297478497028351, 0.5917479395866394], [1.8560543060302734, 0.7590718865394592, -0.031139826402068138, 0.2858436703681946], [1.871235728263855, 0.5644075870513916, -0.025422953069210052, 0.5685449838638306], [1.8825238943099976, 0.7598767280578613, -0.014052052982151508, 0.2679624557495117], [1.8977214097976685, 0.5649580955505371, -0.008692803792655468, 0.5561803579330444], [1.9090206623077393, 0.7602009773254395, 0.0024308033753186464, 0.26077139377593994], [1.924224615097046, 0.9552881717681885, 0.007646231446415186, -0.031143825501203537], [1.9433304071426392, 1.1502996683120728, 0.00702335499227047, -0.32140451669692993], [1.9663363695144653, 0.9550783634185791, 0.0005952647770754993, -0.026514990255236626], [1.9854379892349243, 0.7599478960037231, 6.496493006125093e-05, 0.2663556933403015], [2.0006368160247803, 0.5648249983787537, 0.005392078775912523, 0.5590590834617615], [2.0119333267211914, 0.7598708868026733, 0.016573261469602585, 0.26807984709739685], [2.0271308422088623, 0.5645163655281067, 0.021934857591986656, 0.5659436583518982], [2.038421154022217, 0.7593238353729248, 0.033253733068704605, 0.28025108575820923], [2.053607702255249, 0.9539560079574585, 0.03885875269770622, -0.0017610073555260897], [2.0726866722106934, 1.1484997272491455, 0.038823533803224564, -0.2819347083568573], [2.0956568717956543, 1.343047022819519, 0.03318483754992485, -0.562124490737915], [2.1225175857543945, 1.1474754810333252, 0.021942349150776863, -0.2591741681098938], [2.1454672813415527, 0.9520472884178162, 0.016758864745497704, 0.04034813120961189], [2.164508104324341, 0.7566890716552734, 0.017565827816724777, 0.3382711708545685], [2.1796419620513916, 0.5613216161727905, 0.02433125115931034, 0.6364412307739258], [2.190868377685547, 0.7560959458351135, 0.037060074508190155, 0.3515188992023468], [2.2059903144836426, 0.5604671239852905, 0.044090453535318375, 0.6556538343429565], [2.2171995639801025, 0.36475998163223267, 0.05720353126525879, 0.9618876576423645], [2.2244949340820312, 0.5590684413909912, 0.07644128799438477, 0.6877103447914124], [2.2356762886047363, 0.7530508637428284, 0.09019549190998077, 0.4200383126735687], [2.250737190246582, 0.556774377822876, 0.09859625995159149, 0.7397377490997314], [2.2618727684020996, 0.7504067420959473, 0.11339101195335388, 0.4796402156352997], [2.2768807411193848, 0.9437606930732727, 0.12298382073640823, 0.22473743557929993], [2.2957561016082764, 0.7471152544021606, 0.12747856974601746, 0.5535438060760498], [2.3106982707977295, 0.940238356590271, 0.13854944705963135, 0.3035871088504791], [2.329503059387207, 1.1331418752670288, 0.14462117850780487, 0.05760801210999489], [2.352165937423706, 1.3259259462356567, 0.14577335119247437, -0.18617881834506989], [2.3786845207214355, 1.1290518045425415, 0.14204977452754974, 0.1487061083316803], [-0.0033146331552416086, 0.011205780319869518, 0.020949525758624077, 0.018929600715637207], [-0.003090517595410347, 0.20602113008499146, 0.021328117698431015, -0.26707059144973755], [0.0010299049317836761, 0.010601377114653587, 0.01598670706152916, 0.03226236253976822], [0.001241932506673038, 0.20549046993255615, 0.016631953418254852, -0.2553340196609497], [0.005351741798222065, 0.01013504434376955, 0.011525273323059082, 0.04254814609885216], [0.005554442759603262, -0.18515026569366455, 0.01237623579800129, 0.33884501457214355], [0.0018514374969527125, 0.009793414734303951, 0.019153136759996414, 0.05009040981531143], [0.0020473056938499212, -0.18559786677360535, 0.02015494368970394, 0.34875425696372986], [-0.0016646514413878322, -0.3810005784034729, 0.02713003009557724, 0.6477239727973938], [-0.009284663014113903, -0.1862669140100479, 0.04008450731635094, 0.36370617151260376], [-0.013010001741349697, 0.008263098075985909, 0.04735863208770752, 0.08392725139856339], [-0.012844739481806755, 0.20267531275749207, 0.04903717711567879, -0.19344587624073029], [-0.008791233412921429, 0.006887437310069799, 0.045168258249759674, 0.11429406702518463], [-0.008653484284877777, -0.18885163962841034, 0.047454141080379486, 0.42087817192077637], [-0.012430517002940178, 0.005566961131989956, 0.05587170273065567, 0.14352485537528992], [-0.012319178320467472, 0.199846088886261, 0.05874220281839371, -0.13102136552333832], [-0.008322256617248058, 0.3940795361995697, 0.05612177401781082, -0.40460872650146484], [-0.0004406656080391258, 0.5883625149726868, 0.04802960157394409, -0.6790832281112671], [0.011326584964990616, 0.3926074504852295, 0.03444793447852135, -0.37167397141456604], [0.019178733229637146, 0.1970134675502777, 0.02701445482671261, -0.06833136826753616], [0.0231190025806427, 0.3917379081249237, 0.025647828355431557, -0.35237017273902893], [0.03095376119017601, 0.19626079499721527, 0.018600424751639366, -0.051711320877075195], [0.03487897664308548, 0.0008771469001658261, 0.017566198483109474, 0.24678167700767517], [0.03489651903510094, 0.1957438737154007, 0.022501831874251366, -0.0403091199696064], [0.038811396807432175, 0.00030659293406642973, 0.02169564925134182, 0.2593875527381897], [0.03881752863526344, 0.1951122134923935, 0.026883400976657867, -0.026374073699116707], [0.042719773948192596, -0.00038474873872473836, 0.026355918496847153, 0.2746681571006775], [0.042712077498435974, 0.1943514347076416, 0.03184928372502327, -0.009586920030415058], [0.04659910872578621, -0.0012124553322792053, 0.031657543033361435, 0.29297226667404175], [0.04657485708594322, 0.193444162607193, 0.037516988813877106, 0.010439393110573292], [0.05044374242424965, 0.3880085349082947, 0.0377257764339447, -0.27017441391944885], [0.058203913271427155, 0.19236911833286285, 0.03232228755950928, 0.034164682030677795], [0.06205129623413086, -0.00320107932202518, 0.03300558403134346, 0.3368678390979767], [0.06198727339506149, 0.1914360076189041, 0.03974293917417526, 0.05477309972047806], [0.0658159926533699, -0.004232592880725861, 0.04083840176463127, 0.35972559452056885], [0.06573133915662766, 0.19028575718402863, 0.048032913357019424, 0.08019449561834335], [0.06953705847263336, -0.005490671377629042, 0.049636803567409515, 0.3876366913318634], [0.0694272443652153, -0.20128077268600464, 0.05738953500986099, 0.695547342300415], [0.06540162861347198, -0.0069997659884393215, 0.07130048424005508, 0.4214688837528229], [0.06526163220405579, -0.20305564999580383, 0.07972986251115799, 0.7357500791549683], [0.061200518161058426, -0.39918312430381775, 0.09444486349821091, 1.0524224042892456], [0.053216855973005295, -0.2054317742586136, 0.11549331247806549, 0.7908161878585815], [0.049108222126960754, -0.012069055810570717, 0.1313096433877945, 0.5365839600563049], [0.048866841942071915, -0.2087690830230713, 0.14204131066799164, 0.867588222026825], [0.044691458344459534, -0.01583588309586048, 0.1593930721282959, 0.6227227449417114], [0.0443747416138649, -0.21278215944766998, 0.17184753715991974, 0.9610607624053955], [0.040119096636772156, -0.02033420465886593, 0.19106875360012054, 0.726915717124939], [0.039712414145469666, 0.17170487344264984, 0.205607071518898, 0.49993225932121277], [-0.02935086376965046, 0.0488850474357605, -0.038113657385110855, 0.04754052311182022], [-0.02837316319346428, -0.14567023515701294, -0.03716284781694412, 0.3279588222503662], [-0.0312865674495697, 0.049960531294345856, -0.030603671446442604, 0.023791905492544174], [-0.030287357047200203, 0.24550770223140717, -0.030127832666039467, -0.27838757634162903], [-0.02537720277905464, 0.05082820728421211, -0.03569558262825012, 0.004642899613827467], [-0.024360639974474907, 0.24644342064857483, -0.03560272604227066, -0.2990852892398834], [-0.019431771710515022, 0.44205430150032043, -0.04158443212509155, -0.6027806401252747], [-0.010590685531497002, 0.24753789603710175, -0.05364004522562027, -0.3234805762767792], [-0.0056399269960820675, 0.05321914702653885, -0.06010965630412102, -0.04818429797887802], [-0.004575544036924839, -0.140991672873497, -0.061073340475559235, 0.22494420409202576], [-0.00739537738263607, 0.054947562515735626, -0.05657445639371872, -0.08636108785867691], [-0.006296426057815552, 0.2508329153060913, -0.05830167979001999, -0.39634302258491516], [-0.0012797681847587228, 0.056584522128105164, -0.06622853875160217, -0.12259648740291595], [-0.00014807774277869612, -0.1375291496515274, -0.06868047267198563, 0.14847873151302338], [-0.002898660721257329, -0.3316038250923157, -0.0657108947634697, 0.41872820258140564], [-0.009530737064778805, -0.1356152445077896, -0.05733633041381836, 0.1060747355222702], [-0.012243041768670082, 0.0602794885635376, -0.055214837193489075, -0.20413215458393097], [-0.011037452146410942, 0.25614580512046814, -0.059297479689121246, -0.5137088298797607], [-0.0059145363047719, 0.061906926333904266, -0.06957165896892548, -0.24028582870960236], [-0.004676397889852524, 0.25795018672943115, -0.07437737286090851, -0.5540769100189209], [0.00048260579933412373, 0.06394711136817932, -0.0854589119553566, -0.28572362661361694], [0.0017615481046959758, -0.12985867261886597, -0.09117338061332703, -0.021170208230614662], [-0.0008356254547834396, 0.06644449383020401, -0.09159678965806961, -0.3411698341369629], [0.0004932644660584629, 0.26274219155311584, -0.09842018038034439, -0.6612738370895386], [0.0057481080293655396, 0.4590858817100525, -0.1116456612944603, -0.983253002166748], [0.014929826371371746, 0.6555122137069702, -0.13131071627140045, -1.3088138103485107], [0.028040070086717606, 0.8520304560661316, -0.15748699009418488, -1.6395479440689087], [0.04508068040013313, 1.0486087799072266, -0.19027794897556305, -1.9768762588500977]], "actions": [0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.001329031540080905, -0.15200810134410858, 0.04481911659240723, 0.32613053917884827], [-0.004369193688035011, 0.042448028922080994, 0.05134172737598419, 0.04791167750954628], [-0.00352023309096694, 0.23679761588573456, 0.05229995772242546, -0.228140726685524], [0.001215719268657267, 0.04096879065036774, 0.04773714393377304, 0.0805700495839119], [0.0020350951235741377, 0.2353750765323639, 0.04934854432940483, -0.1966777890920639], [0.006742596626281738, 0.03958325833082199, 0.045414991676807404, 0.11115498840808868], [0.007534261792898178, 0.2340260148048401, 0.04763808846473694, -0.16686099767684937], [0.01221478171646595, 0.03825566917657852, 0.0443008691072464, 0.14046166837215424], [0.012979894876480103, -0.15747185051441193, 0.04711010307073593, 0.4467850923538208], [0.009830458089709282, 0.036953095346689224, 0.05604580417275429, 0.16931650042533875], [0.01056952029466629, 0.23122991621494293, 0.05943213403224945, -0.10517232120037079], [0.015194118022918701, 0.035308837890625, 0.057328689843416214, 0.20565317571163177], [0.015900295227766037, 0.22956611216068268, 0.061441753059625626, -0.06840862333774567], [0.020491616800427437, 0.03361955285072327, 0.06007358059287071, 0.24300912022590637], [0.02116400934755802, -0.1623067408800125, 0.06493376195430756, 0.5540194511413574], [0.017917873337864876, 0.03184619918465614, 0.07601415365934372, 0.2824808955192566], [0.018554797396063805, 0.22580625116825104, 0.08166376501321793, 0.014707585796713829], [0.0230709221214056, 0.02961386740207672, 0.08195792138576508, 0.3319978713989258], [0.023663200438022614, -0.16657321155071259, 0.08859787881374359, 0.6493593454360962], [0.020331736654043198, 0.027210144326090813, 0.10158506780862808, 0.385838121175766], [0.02087593823671341, 0.22075431048870087, 0.10930182784795761, 0.1268332302570343], [0.025291025638580322, 0.02425006963312626, 0.11183848977088928, 0.4519014060497284], [0.025776026770472527, 0.2176274210214615, 0.12087652087211609, 0.19645956158638], [0.03012857399880886, 0.021002497524023056, 0.12480571120977402, 0.5246961116790771], [0.03054862469434738, 0.2141675055027008, 0.13529963791370392, 0.27379998564720154], [0.034831974655389786, 0.01740056835114956, 0.1407756358385086, 0.6059098243713379], [0.0351799875497818, 0.21030253171920776, 0.1528938263654709, 0.360670804977417], [0.03938603773713112, 0.40295812487602234, 0.16010724008083344, 0.11983439326286316], [0.04744520038366318, 0.5954671502113342, 0.1625039279460907, -0.11836525797843933], [0.059354543685913086, 0.7879329919815063, 0.1601366251707077, -0.3556942641735077], [0.0751131996512413, 0.5909396409988403, 0.15302273631095886, -0.01710572838783264], [0.0869319960474968, 0.7835736870765686, 0.1526806354522705, -0.2578670382499695], [0.1026034727692604, 0.9762236475944519, 0.14752328395843506, -0.4987664222717285], [0.1221279427409172, 1.1689914464950562, 0.13754795491695404, -0.7415626049041748], [0.14550776779651642, 0.9722657799720764, 0.12271670997142792, -0.40894952416419983], [0.1649530827999115, 0.7756370902061462, 0.11453771591186523, -0.0802362710237503], [0.18046583235263824, 0.5790753960609436, 0.11293299496173859, 0.24627487361431122], [0.1920473426580429, 0.7724184393882751, 0.11785849183797836, -0.008760517463088036], [0.20749570429325104, 0.9656702280044556, 0.1176832765340805, -0.26205700635910034], [0.22680911421775818, 1.1589329242706299, 0.11244213581085205, -0.5154268145561218], [0.24998776614665985, 1.3523067235946655, 0.1021336019039154, -0.770667552947998], [0.27703389525413513, 1.1559386253356934, 0.08672025054693222, -0.4476752281188965], [0.3001526892185211, 1.3497337102890015, 0.07776674628257751, -0.7118116021156311], [0.32714736461639404, 1.1536259651184082, 0.06353051215410233, -0.3956986665725708], [0.35021987557411194, 0.9576628804206848, 0.05561654269695282, -0.08368155360221863], [0.3693731129169464, 0.7617895603179932, 0.05394291132688522, 0.22601689398288727], [0.3846089243888855, 0.9561007618904114, 0.05846324935555458, -0.04917440935969353], [0.40373092889785767, 1.150337815284729, 0.05747976154088974, -0.32285377383232117], [0.4267376959323883, 0.9544464945793152, 0.05102268606424332, -0.012612294405698776], [0.44582661986351013, 1.1488009691238403, 0.050770439207553864, -0.28877049684524536], [0.46880263090133667, 1.3431636095046997, 0.0449950285255909, -0.5650185942649841], [0.49566590785980225, 1.1474401950836182, 0.03369465842843056, -0.25850656628608704], [0.5186147093772888, 0.9518537521362305, 0.028524525463581085, 0.044610824435949326], [0.537651777267456, 1.1465553045272827, 0.02941674180328846, -0.2389376312494278], [0.5605828762054443, 1.3412449359893799, 0.024637989699840546, -0.5221984386444092], [0.5874077677726746, 1.5360115766525269, 0.014194021001458168, -0.807016909122467], [0.6181280016899109, 1.340698003768921, -0.0019463177304714918, -0.5099031329154968], [0.6449419856071472, 1.1456035375595093, -0.012144381180405617, -0.2178342193365097], [0.6678540706634521, 0.950657308101654, -0.016501065343618393, 0.07099325209856033], [0.6868671774864197, 0.7557757496833801, -0.015081199817359447, 0.35842466354370117], [0.7019827365875244, 0.560871422290802, -0.007912706583738327, 0.646314263343811], [0.7132001519203186, 0.7561027407646179, 0.005013578105717897, 0.35115012526512146], [0.7283222079277039, 0.9511529803276062, 0.012036580592393875, 0.060052357614040375], [0.7473452687263489, 0.7558605670928955, 0.013237628154456615, 0.3565084636211395], [0.7624624967575073, 0.9507918357849121, 0.02036779746413231, 0.06802893429994583], [0.7814782857894897, 0.7553839087486267, 0.021728375926613808, 0.36706778407096863], [0.7965859770774841, 0.5599600076675415, 0.02906973287463188, 0.6665220260620117], [0.8077852129936218, 0.36444607377052307, 0.04240017384290695, 0.9682143330574036], [0.81507408618927, 0.5589738488197327, 0.06176446005702019, 0.6891468167304993], [0.8262535929679871, 0.3630515933036804, 0.07554739713668823, 1.0006170272827148], [0.8335146307945251, 0.5570870637893677, 0.0955597385764122, 0.7325838208198547], [0.8446563482284546, 0.7507678270339966, 0.11021140962839127, 0.47144001722335815], [0.8596717119216919, 0.944174587726593, 0.11964021623134613, 0.21542657911777496], [0.8785552382469177, 0.7475634813308716, 0.12394874542951584, 0.5433254241943359], [0.8935064673423767, 0.9407455325126648, 0.1348152458667755, 0.29212313890457153], [0.9123213887214661, 1.1337134838104248, 0.1406577229499817, 0.044813357293605804], [0.9349956512451172, 1.3265676498413086, 0.14155398309230804, -0.20039376616477966], [0.9615269899368286, 1.5194112062454224, 0.137546107172966, -0.445287823677063], [0.991915225982666, 1.7123464345932007, 0.12864035367965698, -0.6916462182998657], [1.0261621475219727, 1.5156965255737305, 0.11480742692947388, -0.36139267683029175], [1.05647611618042, 1.7090153694152832, 0.10757957398891449, -0.6157826781272888], [1.0906563997268677, 1.9024828672409058, 0.09526392072439194, -0.8727388381958008], [1.1287060976028442, 2.096189260482788, 0.07780914008617401, -1.1340157985687256], [1.170629858970642, 1.9001401662826538, 0.055128827691078186, -0.8179789781570435], [1.2086327075958252, 2.094465970993042, 0.03876924887299538, -1.0928250551223755], [1.2505220174789429, 1.8988550901412964, 0.01691274531185627, -0.7882341146469116], [1.288499116897583, 2.093740701675415, 0.0011480634566396475, -1.0755486488342285], [1.3303738832473755, 1.8986036777496338, -0.020362909883260727, -0.7825056314468384], [1.3683459758758545, 1.7037674188613892, -0.03601302206516266, -0.4962981343269348], [1.4024213552474976, 1.8993781805038452, -0.04593898355960846, -0.8001096248626709], [1.4404088258743286, 2.0950992107391357, -0.061941176652908325, -1.1068826913833618], [1.4823108911514282, 1.9008437395095825, -0.0840788334608078, -0.8342573642730713], [1.5203276872634888, 1.7069649696350098, -0.10076397657394409, -0.5691565871238708], [1.5544670820236206, 1.903344988822937, -0.11214710772037506, -0.8918070793151855], [1.5925339460372925, 1.709908366203308, -0.12998324632644653, -0.6363770365715027], [1.6267321109771729, 1.5168159008026123, -0.14271079003810883, -0.3872891068458557], [1.6570683717727661, 1.3239774703979492, -0.15045657753944397, -0.1427868753671646], [1.6835479736328125, 1.1312947273254395, -0.1533123105764389, 0.09890465438365936], [1.7061738967895508, 0.938664436340332, -0.15133421123027802, 0.3395634591579437], [1.7249470949172974, 0.7459833025932312, -0.14454294741153717, 0.5809592008590698], [1.739866852760315, 0.5531508922576904, -0.13292376697063446, 0.8248437643051147], [1.750929832458496, 0.7498160600662231, -0.11642688512802124, 0.49348366260528564], [1.7659261226654053, 0.5565120577812195, -0.1065572127699852, 0.7473244667053223], [1.777056336402893, 0.7529301047325134, -0.09161072969436646, 0.4230998456478119], [1.7921149730682373, 0.9492223858833313, -0.08314872533082962, 0.10300023853778839], [1.8110994100570679, 0.7553843855857849, -0.08108872175216675, 0.36833512783050537], [1.826207160949707, 0.5615026354789734, -0.07372201979160309, 0.6343882083892822], [1.8374371528625488, 0.3674822449684143, -0.06103425845503807, 0.9029736518859863], [1.8447868824005127, 0.5633754730224609, -0.04297478497028351, 0.5917479395866394], [1.8560543060302734, 0.7590718865394592, -0.031139826402068138, 0.2858436703681946], [1.871235728263855, 0.5644075870513916, -0.025422953069210052, 0.5685449838638306], [1.8825238943099976, 0.7598767280578613, -0.014052052982151508, 0.2679624557495117], [1.8977214097976685, 0.5649580955505371, -0.008692803792655468, 0.5561803579330444], [1.9090206623077393, 0.7602009773254395, 0.0024308033753186464, 0.26077139377593994], [1.924224615097046, 0.9552881717681885, 0.007646231446415186, -0.031143825501203537], [1.9433304071426392, 1.1502996683120728, 0.00702335499227047, -0.32140451669692993], [1.9663363695144653, 0.9550783634185791, 0.0005952647770754993, -0.026514990255236626], [1.9854379892349243, 0.7599478960037231, 6.496493006125093e-05, 0.2663556933403015], [2.0006368160247803, 0.5648249983787537, 0.005392078775912523, 0.5590590834617615], [2.0119333267211914, 0.7598708868026733, 0.016573261469602585, 0.26807984709739685], [2.0271308422088623, 0.5645163655281067, 0.021934857591986656, 0.5659436583518982], [2.038421154022217, 0.7593238353729248, 0.033253733068704605, 0.28025108575820923], [2.053607702255249, 0.9539560079574585, 0.03885875269770622, -0.0017610073555260897], [2.0726866722106934, 1.1484997272491455, 0.038823533803224564, -0.2819347083568573], [2.0956568717956543, 1.343047022819519, 0.03318483754992485, -0.562124490737915], [2.1225175857543945, 1.1474754810333252, 0.021942349150776863, -0.2591741681098938], [2.1454672813415527, 0.9520472884178162, 0.016758864745497704, 0.04034813120961189], [2.164508104324341, 0.7566890716552734, 0.017565827816724777, 0.3382711708545685], [2.1796419620513916, 0.5613216161727905, 0.02433125115931034, 0.6364412307739258], [2.190868377685547, 0.7560959458351135, 0.037060074508190155, 0.3515188992023468], [2.2059903144836426, 0.5604671239852905, 0.044090453535318375, 0.6556538343429565], [2.2171995639801025, 0.36475998163223267, 0.05720353126525879, 0.9618876576423645], [2.2244949340820312, 0.5590684413909912, 0.07644128799438477, 0.6877103447914124], [2.2356762886047363, 0.7530508637428284, 0.09019549190998077, 0.4200383126735687], [2.250737190246582, 0.556774377822876, 0.09859625995159149, 0.7397377490997314], [2.2618727684020996, 0.7504067420959473, 0.11339101195335388, 0.4796402156352997], [2.2768807411193848, 0.9437606930732727, 0.12298382073640823, 0.22473743557929993], [2.2957561016082764, 0.7471152544021606, 0.12747856974601746, 0.5535438060760498], [2.3106982707977295, 0.940238356590271, 0.13854944705963135, 0.3035871088504791], [2.329503059387207, 1.1331418752670288, 0.14462117850780487, 0.05760801210999489], [2.352165937423706, 1.3259259462356567, 0.14577335119247437, -0.18617881834506989], [2.3786845207214355, 1.1290518045425415, 0.14204977452754974, 0.1487061083316803], [2.4012656211853027, 1.321884036064148, 0.1450238972902298, -0.09600666910409927], [-0.003090517595410347, 0.20602113008499146, 0.021328117698431015, -0.26707059144973755], [0.0010299049317836761, 0.010601377114653587, 0.01598670706152916, 0.03226236253976822], [0.001241932506673038, 0.20549046993255615, 0.016631953418254852, -0.2553340196609497], [0.005351741798222065, 0.01013504434376955, 0.011525273323059082, 0.04254814609885216], [0.005554442759603262, -0.18515026569366455, 0.01237623579800129, 0.33884501457214355], [0.0018514374969527125, 0.009793414734303951, 0.019153136759996414, 0.05009040981531143], [0.0020473056938499212, -0.18559786677360535, 0.02015494368970394, 0.34875425696372986], [-0.0016646514413878322, -0.3810005784034729, 0.02713003009557724, 0.6477239727973938], [-0.009284663014113903, -0.1862669140100479, 0.04008450731635094, 0.36370617151260376], [-0.013010001741349697, 0.008263098075985909, 0.04735863208770752, 0.08392725139856339], [-0.012844739481806755, 0.20267531275749207, 0.04903717711567879, -0.19344587624073029], [-0.008791233412921429, 0.006887437310069799, 0.045168258249759674, 0.11429406702518463], [-0.008653484284877777, -0.18885163962841034, 0.047454141080379486, 0.42087817192077637], [-0.012430517002940178, 0.005566961131989956, 0.05587170273065567, 0.14352485537528992], [-0.012319178320467472, 0.199846088886261, 0.05874220281839371, -0.13102136552333832], [-0.008322256617248058, 0.3940795361995697, 0.05612177401781082, -0.40460872650146484], [-0.0004406656080391258, 0.5883625149726868, 0.04802960157394409, -0.6790832281112671], [0.011326584964990616, 0.3926074504852295, 0.03444793447852135, -0.37167397141456604], [0.019178733229637146, 0.1970134675502777, 0.02701445482671261, -0.06833136826753616], [0.0231190025806427, 0.3917379081249237, 0.025647828355431557, -0.35237017273902893], [0.03095376119017601, 0.19626079499721527, 0.018600424751639366, -0.051711320877075195], [0.03487897664308548, 0.0008771469001658261, 0.017566198483109474, 0.24678167700767517], [0.03489651903510094, 0.1957438737154007, 0.022501831874251366, -0.0403091199696064], [0.038811396807432175, 0.00030659293406642973, 0.02169564925134182, 0.2593875527381897], [0.03881752863526344, 0.1951122134923935, 0.026883400976657867, -0.026374073699116707], [0.042719773948192596, -0.00038474873872473836, 0.026355918496847153, 0.2746681571006775], [0.042712077498435974, 0.1943514347076416, 0.03184928372502327, -0.009586920030415058], [0.04659910872578621, -0.0012124553322792053, 0.031657543033361435, 0.29297226667404175], [0.04657485708594322, 0.193444162607193, 0.037516988813877106, 0.010439393110573292], [0.05044374242424965, 0.3880085349082947, 0.0377257764339447, -0.27017441391944885], [0.058203913271427155, 0.19236911833286285, 0.03232228755950928, 0.034164682030677795], [0.06205129623413086, -0.00320107932202518, 0.03300558403134346, 0.3368678390979767], [0.06198727339506149, 0.1914360076189041, 0.03974293917417526, 0.05477309972047806], [0.0658159926533699, -0.004232592880725861, 0.04083840176463127, 0.35972559452056885], [0.06573133915662766, 0.19028575718402863, 0.048032913357019424, 0.08019449561834335], [0.06953705847263336, -0.005490671377629042, 0.049636803567409515, 0.3876366913318634], [0.0694272443652153, -0.20128077268600464, 0.05738953500986099, 0.695547342300415], [0.06540162861347198, -0.0069997659884393215, 0.07130048424005508, 0.4214688837528229], [0.06526163220405579, -0.20305564999580383, 0.07972986251115799, 0.7357500791549683], [0.061200518161058426, -0.39918312430381775, 0.09444486349821091, 1.0524224042892456], [0.053216855973005295, -0.2054317742586136, 0.11549331247806549, 0.7908161878585815], [0.049108222126960754, -0.012069055810570717, 0.1313096433877945, 0.5365839600563049], [0.048866841942071915, -0.2087690830230713, 0.14204131066799164, 0.867588222026825], [0.044691458344459534, -0.01583588309586048, 0.1593930721282959, 0.6227227449417114], [0.0443747416138649, -0.21278215944766998, 0.17184753715991974, 0.9610607624053955], [0.040119096636772156, -0.02033420465886593, 0.19106875360012054, 0.726915717124939], [0.039712414145469666, 0.17170487344264984, 0.205607071518898, 0.49993225932121277], [0.04314650967717171, 0.3634255826473236, 0.2156057059764862, 0.2784319519996643], [-0.02837316319346428, -0.14567023515701294, -0.03716284781694412, 0.3279588222503662], [-0.0312865674495697, 0.049960531294345856, -0.030603671446442604, 0.023791905492544174], [-0.030287357047200203, 0.24550770223140717, -0.030127832666039467, -0.27838757634162903], [-0.02537720277905464, 0.05082820728421211, -0.03569558262825012, 0.004642899613827467], [-0.024360639974474907, 0.24644342064857483, -0.03560272604227066, -0.2990852892398834], [-0.019431771710515022, 0.44205430150032043, -0.04158443212509155, -0.6027806401252747], [-0.010590685531497002, 0.24753789603710175, -0.05364004522562027, -0.3234805762767792], [-0.0056399269960820675, 0.05321914702653885, -0.06010965630412102, -0.04818429797887802], [-0.004575544036924839, -0.140991672873497, -0.061073340475559235, 0.22494420409202576], [-0.00739537738263607, 0.054947562515735626, -0.05657445639371872, -0.08636108785867691], [-0.006296426057815552, 0.2508329153060913, -0.05830167979001999, -0.39634302258491516], [-0.0012797681847587228, 0.056584522128105164, -0.06622853875160217, -0.12259648740291595], [-0.00014807774277869612, -0.1375291496515274, -0.06868047267198563, 0.14847873151302338], [-0.002898660721257329, -0.3316038250923157, -0.0657108947634697, 0.41872820258140564], [-0.009530737064778805, -0.1356152445077896, -0.05733633041381836, 0.1060747355222702], [-0.012243041768670082, 0.0602794885635376, -0.055214837193489075, -0.20413215458393097], [-0.011037452146410942, 0.25614580512046814, -0.059297479689121246, -0.5137088298797607], [-0.0059145363047719, 0.061906926333904266, -0.06957165896892548, -0.24028582870960236], [-0.004676397889852524, 0.25795018672943115, -0.07437737286090851, -0.5540769100189209], [0.00048260579933412373, 0.06394711136817932, -0.0854589119553566, -0.28572362661361694], [0.0017615481046959758, -0.12985867261886597, -0.09117338061332703, -0.021170208230614662], [-0.0008356254547834396, 0.06644449383020401, -0.09159678965806961, -0.3411698341369629], [0.0004932644660584629, 0.26274219155311584, -0.09842018038034439, -0.6612738370895386], [0.0057481080293655396, 0.4590858817100525, -0.1116456612944603, -0.983253002166748], [0.014929826371371746, 0.6555122137069702, -0.13131071627140045, -1.3088138103485107], [0.028040070086717606, 0.8520304560661316, -0.15748699009418488, -1.6395479440689087], [0.04508068040013313, 1.0486087799072266, -0.19027794897556305, -1.9768762588500977], [0.06605285406112671, 0.855933427810669, -0.22981548309326172, -1.748684287071228]], "action_prob": [0.4723632037639618, 0.6351969838142395, 0.5460831522941589, 0.5832164883613586, 0.5612407326698303, 0.5709869265556335, 0.5748412013053894, 0.5580494403839111, 0.4127912223339081, 0.6520339846611023, 0.6027085185050964, 0.521735668182373, 0.6154993772506714, 0.5010378956794739, 0.37298789620399475, 0.6587495803833008, 0.6399539113044739, 0.44751864671707153, 0.35029515624046326, 0.659753143787384, 0.6590400338172913, 0.3879968822002411, 0.6645906567573547, 0.3635292053222656, 0.6674755811691284, 0.3445037007331848, 0.667815089225769, 0.6685023307800293, 0.6291855573654175, 0.5340645909309387, 0.5682979226112366, 0.5775604844093323, 0.46898579597473145, 0.39152219891548157, 0.6429081559181213, 0.591163694858551, 0.46568137407302856, 0.6477007269859314, 0.565762996673584, 0.4572979509830475, 0.38413435220718384, 0.6476184725761414, 0.3929481506347656, 0.6458510756492615, 0.6007054448127747, 0.49644142389297485, 0.6190630793571472, 0.5163291692733765, 0.5851329565048218, 0.5258129239082336, 0.42151132225990295, 0.6366031169891357, 0.5759875774383545, 0.533943235874176, 0.42652997374534607, 0.3642174303531647, 0.6592666506767273, 0.6392163038253784, 0.584062397480011, 0.4845924973487854, 0.38734760880470276, 0.6583918929100037, 0.6120096445083618, 0.4880313575267792, 0.6117571592330933, 0.48611196875572205, 0.38706183433532715, 0.341325044631958, 0.6634369492530823, 0.3379417359828949, 0.6639531254768372, 0.6660692691802979, 0.6439681649208069, 0.41555407643318176, 0.6538194417953491, 0.6072337031364441, 0.529593825340271, 0.44820863008499146, 0.38960617780685425, 0.6435197591781616, 0.4023102819919586, 0.3623509407043457, 0.3422364592552185, 0.6662643551826477, 0.3421262502670288, 0.667574405670166, 0.340496689081192, 0.6693598031997681, 0.6626163721084595, 0.3557242155075073, 0.3339027464389801, 0.67343670129776, 0.6706463098526001, 0.3393453061580658, 0.6746542453765869, 0.6687813997268677, 0.6541685461997986, 0.6256585717201233, 0.57830810546875, 0.5143845677375793, 0.4486374258995056, 0.602365255355835, 0.4706666171550751, 0.5888004899024963, 0.5106500387191772, 0.5792945623397827, 0.5070555210113525, 0.43700385093688965, 0.6123780012130737, 0.5559247136116028, 0.5260270833969116, 0.550796627998352, 0.5298709869384766, 0.548393964767456, 0.4695501923561096, 0.3959745764732361, 0.6515814065933228, 0.6054122447967529, 0.5338832139968872, 0.5436763763427734, 0.5317106246948242, 0.5463668704032898, 0.47356706857681274, 0.4039778709411621, 0.355827659368515, 0.6704288721084595, 0.6433002352714539, 0.5923920273780823, 0.5199998617172241, 0.5530160069465637, 0.5142295956611633, 0.4412986934185028, 0.6105658411979675, 0.5692937970161438, 0.4886610209941864, 0.5811513066291809, 0.5291419625282288, 0.5317866802215576, 0.5472249984741211, 0.49016353487968445, 0.43354588747024536, 0.6120694875717163, 0.4535965025424957, 0.5151715874671936, 0.6085749268531799, 0.5202736258506775, 0.6062118411064148, 0.47619765996932983, 0.6300301551818848, 0.4685876667499542, 0.36629244685173035, 0.6536722779273987, 0.6403294205665588, 0.5617313981056213, 0.5706326961517334, 0.42461931705474854, 0.6491867303848267, 0.5922091603279114, 0.4639412760734558, 0.37334245443344116, 0.6505885124206543, 0.6245748996734619, 0.4823974370956421, 0.6224923133850098, 0.5130597949028015, 0.615327000617981, 0.5056641101837158, 0.6197729706764221, 0.49660417437553406, 0.6247851848602295, 0.4856965243816376, 0.6302732825279236, 0.5272124409675598, 0.5975145697593689, 0.4631737172603607, 0.6390262246131897, 0.44987958669662476, 0.6441152691841125, 0.4344097375869751, 0.3507157266139984, 0.6563475131988525, 0.3441726863384247, 0.34406718611717224, 0.6382798552513123, 0.6545614004135132, 0.3337666094303131, 0.651075541973114, 0.33323153853416443, 0.6459333300590515, 0.6640292406082153, 0.676774263381958, 0.4832248389720917, 0.6230059862136841, 0.5063025951385498, 0.6185481548309326, 0.49244174361228943, 0.3742775321006775, 0.6547563672065735, 0.6355392932891846, 0.5491436123847961, 0.5794298648834229, 0.43256399035453796, 0.6483248472213745, 0.5882549285888672, 0.4607120752334595, 0.6265320777893066, 0.5215944647789001, 0.3844974637031555, 0.6575271487236023, 0.3699864447116852, 0.6597497463226318, 0.6438102126121521, 0.43620678782463074, 0.3463273346424103, 0.33987167477607727, 0.35638538002967834, 0.3752128779888153, 0.3916023075580597, 0.595160961151123], "advantages": [64.84490203857422, 64.71284484863281, 64.14674377441406, 63.865203857421875, 63.51496124267578, 63.214962005615234, 62.88627624511719, 62.56707000732422, 62.25556945800781, 62.16477966308594, 61.54140853881836, 61.164730072021484, 60.87002944946289, 60.47111511230469, 60.19000244140625, 60.10108184814453, 59.43913650512695, 58.987030029296875, 58.721004486083984, 58.62296676635742, 57.947792053222656, 57.45457458496094, 57.20442581176758, 56.6989860534668, 56.45758056640625, 55.94404602050781, 55.70805740356445, 55.19084548950195, 54.774635314941406, 54.42910385131836, 54.139556884765625, 53.70503616333008, 53.39686584472656, 53.13609313964844, 52.92827606201172, 52.41539001464844, 51.97401809692383, 51.58984375, 51.24139404296875, 50.932838439941406, 50.66815948486328, 50.45836639404297, 49.94350814819336, 49.731727600097656, 49.223941802978516, 48.76679229736328, 48.35213851928711, 48.00836181640625, 47.71449661254883, 47.25185012817383, 46.950740814208984, 46.71387481689453, 46.20087432861328, 45.731300354003906, 45.426025390625, 45.19355392456055, 45.05412673950195, 44.486297607421875, 43.96163558959961, 43.477256774902344, 43.031673431396484, 42.62512969970703, 42.17341232299805, 41.79716873168945, 41.319862365722656, 40.93339920043945, 40.44351577758789, 39.996315002441406, 39.59089279174805, 39.0028190612793, 38.57741165161133, 37.97120666503906, 37.42877197265625, 36.93925094604492, 36.40180206298828, 35.88822937011719, 35.41721725463867, 34.987266540527344, 34.60107421875, 34.264862060546875, 33.58443069458008, 33.24182891845703, 32.958526611328125, 32.74341583251953, 32.038787841796875, 31.85050392150879, 31.17923355102539, 31.02617073059082, 30.39495849609375, 29.790023803710938, 29.633928298950195, 29.562223434448242, 29.033935546875, 28.533327102661133, 28.487018585205078, 28.060007095336914, 27.645177841186523, 27.227628707885742, 26.806650161743164, 26.393571853637695, 26.000730514526367, 25.6281681060791, 25.130084991455078, 24.70235824584961, 24.18958282470703, 23.817686080932617, 23.297523498535156, 22.790098190307617, 22.28687858581543, 21.54834747314453, 20.94267463684082, 20.309919357299805, 19.662033081054688, 18.98196029663086, 18.28911781311035, 17.690929412841797, 17.152719497680664, 16.451162338256836, 15.719514846801758, 14.97555923461914, 14.194173812866211, 13.401199340820312, 12.570222854614258, 11.822554588317871, 11.128707885742188, 10.471596717834473, 9.72433853149414, 8.927382469177246, 8.09390640258789, 7.240878582000732, 6.305838108062744, 5.395290374755859, 4.464844703674316, 3.3060200214385986, 2.2409489154815674, 1.1867326498031616, 0.062367986887693405, -0.9830955862998962, -2.1201775074005127, -3.2094810009002686, -4.241089344024658, -5.235578536987305, -6.379737377166748, 27.39055633544922, 26.81203842163086, 26.097572326660156, 25.508033752441406, 24.79776954650879, 24.339340209960938, 23.372467041015625, 22.890867233276367, 22.633014678955078, 21.283353805541992, 20.233224868774414, 19.47222900390625, 18.705425262451172, 18.175020217895508, 17.071298599243164, 16.23222541809082, 15.6312837600708, 15.251936912536621, 14.146563529968262, 13.224324226379395, 12.619599342346191, 11.70429801940918, 10.986968994140625, 10.093547821044922, 9.360922813415527, 8.439271926879883, 7.691827297210693, 6.740492820739746, 5.978725910186768, 4.996460914611816, 4.234776496887207, 3.2765777111053467, 2.4990172386169434, 1.464330792427063, 0.670138418674469, -0.3967107832431793, -1.2065738439559937, -1.8517956733703613, -3.187420606613159, -3.8666279315948486, -4.409441947937012, -5.979111194610596, -7.335955619812012, -8.08370304107666, -9.438187599182129, -10.214499473571777, -11.559478759765625, -12.767827033996582, 13.329021453857422, 12.83576488494873, 11.8917818069458, 11.297660827636719, 10.522195816040039, 9.953763008117676, 9.742029190063477, 8.775078773498535, 8.007563591003418, 7.47698974609375, 6.6447296142578125, 6.241382598876953, 5.432535648345947, 4.8652753829956055, 4.534222602844238, 3.360339641571045, 2.6336629390716553, 2.357266902923584, 1.4826537370681763, 1.3107703924179077, 0.4970335364341736, -0.09460966289043427, -0.511314332485199, -0.49263548851013184, -0.23266570270061493, 0.057067468762397766, 0.23568974435329437, 0.2485407590866089], "value_targets": [76.2407455444336, 76.0007553100586, 75.75833892822266, 75.51347351074219, 75.26612854003906, 75.01629638671875, 74.76393127441406, 74.50902557373047, 74.25154113769531, 73.991455078125, 73.72874450683594, 73.46337127685547, 73.19532775878906, 72.92457580566406, 72.65108489990234, 72.37483215332031, 72.09579467773438, 71.81392669677734, 71.52922058105469, 71.24163818359375, 70.9511489868164, 70.65773010253906, 70.36134338378906, 70.06195831298828, 69.75955963134766, 69.45409393310547, 69.14555358886719, 68.83389282226562, 68.51908111572266, 68.20109558105469, 67.87989044189453, 67.55545043945312, 67.22772216796875, 66.89669036865234, 66.56231689453125, 66.22456359863281, 65.88339233398438, 65.53878021240234, 65.19068908691406, 64.83908081054688, 64.48391723632812, 64.12516784667969, 63.76279830932617, 63.396766662597656, 63.027034759521484, 62.65357208251953, 62.276336669921875, 61.895286560058594, 61.51039123535156, 61.12160873413086, 60.72889709472656, 60.332218170166016, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1820874006, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1461350891, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 1594200983, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630, 557438630], "obs": [[-0.013421892188489437, -0.02336839959025383, 0.02906772308051586, -0.01997542195022106], [-0.013889260590076447, -0.21889489889144897, 0.02866821549832821, 0.2817351222038269], [-0.018267158418893814, -0.41441377997398376, 0.03430291637778282, 0.5833202600479126], [-0.026555433869361877, -0.21978877484798431, 0.04596932232379913, 0.30163756012916565], [-0.030951209366321564, -0.02535112388432026, 0.05200207605957985, 0.023799419403076172], [-0.031458232551813126, -0.22117877006530762, 0.052478063851594925, 0.3324255347251892], [-0.035881806164979935, -0.026841524988412857, 0.05912657454609871, 0.056742433458566666], [-0.03641863912343979, 0.16738499701023102, 0.06026142090559006, -0.21671515703201294], [-0.03307093679904938, 0.361596018075943, 0.05592712014913559, -0.4897967576980591], [-0.02583901770412922, 0.1657315343618393, 0.046131182461977005, -0.1800253838300705], [-0.022524386644363403, 0.3601640462875366, 0.04253067448735237, -0.4578061103820801], [-0.015321106649935246, 0.1644674390554428, 0.03337455540895462, -0.15202642977237701], [-0.012031757272779942, 0.3590960204601288, 0.030334025621414185, -0.43399640917778015], [-0.00484983716160059, 0.1635580211877823, 0.021654097363352776, -0.13190752267837524], [-0.0015786768635734916, -0.03186731040477753, 0.019015947356820107, 0.16752757132053375], [-0.0022160231601446867, -0.22725622355937958, 0.022366497665643692, 0.4661482870578766], [-0.006761147640645504, -0.42268693447113037, 0.031689465045928955, 0.7657962441444397], [-0.015214886516332626, -0.22801533341407776, 0.047005388885736465, 0.48325058817863464], [-0.01977519318461418, -0.03358721733093262, 0.056670401245355606, 0.20574505627155304], [-0.020446937531232834, -0.2294718474149704, 0.06078530102968216, 0.5157524943351746], [-0.025036374107003212, -0.03525617718696594, 0.07110035419464111, 0.2428268939256668], [-0.025741497054696083, 0.158781960606575, 0.07595688849687576, -0.026609040796756744], [-0.02256585843861103, 0.35273709893226624, 0.07542470842599869, -0.29439303278923035], [-0.015511116944253445, 0.1566253900527954, 0.06953684985637665, 0.02109202928841114], [-0.01237860880792141, 0.3506847620010376, 0.06995868682861328, -0.24886620044708252], [-0.005364913959056139, 0.15463709831237793, 0.0649813637137413, 0.06503705680370331], [-0.002272171899676323, 0.3487701117992401, 0.06628210842609406, -0.20645679533481598], [0.00470323022454977, 0.5428847074508667, 0.06215297058224678, -0.47751665115356445], [0.01556092407554388, 0.34694281220436096, 0.05260263755917549, -0.16591010987758636], [0.022499781101942062, 0.5412738919258118, 0.0492844358086586, -0.44154542684555054], [0.033325258642435074, 0.34549039602279663, 0.04045352712273598, -0.1337430477142334], [0.040235064923763275, 0.5400102138519287, 0.037778664380311966, -0.4133940041065216], [0.05103527009487152, 0.3443737030029297, 0.02951078489422798, -0.10904433578252792], [0.05792274326086044, 0.5390605926513672, 0.02732989937067032, -0.39227262139320374], [0.06870395690202713, 0.34356170892715454, 0.019484445452690125, -0.09109976887702942], [0.07557518780231476, 0.5383990406990051, 0.017662450671195984, -0.377572238445282], [0.08634316921234131, 0.73326575756073, 0.01011100597679615, -0.6646342277526855], [0.10100848972797394, 0.9282456040382385, -0.0031816777773201466, -0.9541164636611938], [0.11957339942455292, 1.1234102249145508, -0.022264007478952408, -1.2477972507476807], [0.14204160869121552, 1.3188104629516602, -0.047219954431056976, -1.5473700761795044], [0.1684178113937378, 1.12428617477417, -0.07816735655069351, -1.2697863578796387], [0.19090352952480316, 0.9302443861961365, -0.1035630851984024, -1.002570390701294], [0.20950841903686523, 1.1265860795974731, -0.12361449003219604, -1.3258980512619019], [0.232040137052536, 0.9332225918769836, -0.1501324474811554, -1.074316143989563], [0.2507045865058899, 0.7403687834739685, -0.1716187745332718, -0.8322628736495972], [0.26551195979118347, 0.5479552745819092, -0.18826402723789215, -0.5980911254882812], [0.2764710783958435, 0.35589689016342163, -0.2002258598804474, -0.37011709809303284], [0.2835890054702759, 0.16409888863563538, -0.20762819051742554, -0.14664170145988464], [-0.03706119582056999, 0.012537594884634018, 0.003326627891510725, 0.0271906778216362], [-0.03681044280529022, 0.20761168003082275, 0.003870441345497966, -0.2644408047199249], [-0.03265821188688278, 0.012434701435267925, -0.0014183747116476297, 0.029460377991199493], [-0.03240951523184776, 0.2075769603252411, -0.0008291671401821077, -0.2636697292327881], [-0.028257977217435837, 0.012466858141124249, -0.0061025614850223064, 0.028751559555530548], [-0.028008639812469482, -0.1825670450925827, -0.0055275303311645985, 0.3195028305053711], [-0.03165998309850693, 0.012633186765015125, 0.0008625261834822595, 0.02508186548948288], [-0.03140731900930405, 0.20774275064468384, 0.0013641634723171592, -0.26732879877090454], [-0.02725246176123619, 0.012601364403963089, -0.003982412628829479, 0.02578408271074295], [-0.027000434696674347, -0.18246324360370636, -0.0034667309373617172, 0.31720784306526184], [-0.03064969927072525, -0.3775356411933899, 0.0028774263337254524, 0.6087954640388489], [-0.038200411945581436, -0.18245404958724976, 0.015053335577249527, 0.3170202374458313], [-0.041849493980407715, -0.37778714299201965, 0.02139374054968357, 0.6144121885299683], [-0.049405235797166824, -0.1829705536365509, 0.03368198499083519, 0.328543484210968], [-0.05306464806199074, 0.011656110174953938, 0.04025285318493843, 0.046669699251651764], [-0.05283152684569359, 0.2061784416437149, 0.041186247020959854, -0.233046293258667], [-0.048707958310842514, 0.40068843960762024, 0.03652532398700714, -0.5124585032463074], [-0.040694188326597214, 0.5952773690223694, 0.026276152580976486, -0.7934112548828125], [-0.028788641095161438, 0.790028989315033, 0.010407927446067333, -1.0777134895324707], [-0.012988060712814331, 0.9850119352340698, -0.011146342381834984, -1.367112159729004], [0.0067121777683496475, 0.7900312542915344, -0.038488585501909256, -1.0779362916946411], [0.022512802854180336, 0.9856398701667786, -0.06004730984568596, -1.3824447393417358], [0.04222559928894043, 1.1814574003219604, -0.08769620209932327, -1.6932849884033203], [0.0658547505736351, 0.9874505996704102, -0.12156190723180771, -1.429142713546753], [0.0856037586927414, 0.7940213680267334, -0.1501447558403015, -1.1767913103103638], [0.10148418694734573, 0.601134181022644, -0.17368058860301971, -0.9346925616264343], [0.11350686848163605, 0.40872642397880554, -0.19237443804740906, -0.701228678226471], [0.12168139964342117, 0.6059206128120422, -0.20639900863170624, -1.0477733612060547], [-0.015088296495378017, -0.008189859800040722, 0.04350156709551811, -0.04852038249373436], [-0.015252092853188515, -0.20390771329402924, 0.04253115877509117, 0.25756409764289856], [-0.01933024823665619, -0.3996102511882782, 0.047682441771030426, 0.5633528232574463], [-0.027322452515363693, -0.20518866181373596, 0.05894949659705162, 0.2860652208328247], [-0.03142622485756874, -0.010954804718494415, 0.06467080116271973, 0.012541643343865871], [-0.03164532035589218, 0.18318293988704681, 0.06492163240909576, -0.2590562701225281], [-0.02798166312277317, 0.37732088565826416, 0.05974050983786583, -0.5305761694908142], [-0.02043524570763111, 0.1814117133617401, 0.04912898689508438, -0.21968334913253784], [-0.016807010397315025, 0.37579822540283203, 0.044735319912433624, -0.49647319316864014], [-0.009291047230362892, 0.18007494509220123, 0.03480585664510727, -0.19003421068191528], [-0.00568954786285758, -0.015527207404375076, 0.031005172058939934, 0.11342218518257141], [-0.006000091787427664, -0.21107938885688782, 0.033273614943027496, 0.4157235324382782], [-0.01022167969495058, -0.016444433480501175, 0.041588086634874344, 0.13371333479881287], [-0.01055056881159544, -0.2121366560459137, 0.0442623533308506, 0.43922123312950134], [-0.014793301932513714, -0.017668193206191063, 0.053046777844429016, 0.1608131229877472], [-0.015146665275096893, 0.17665578424930573, 0.056263040751218796, -0.11467437446117401], [-0.011613549664616585, -0.01922531984746456, 0.05396955460309982, 0.19521495699882507], [-0.011998056434094906, 0.17508476972579956, 0.05787385255098343, -0.0799664556980133], [-0.0084963608533144, -0.02081701159477234, 0.056274522095918655, 0.23039965331554413], [-0.008912701159715652, 0.173457533121109, 0.06088251620531082, -0.04401487484574318], [-0.005443550646305084, 0.36765599250793457, 0.060002218931913376, -0.31688445806503296], [0.001909569138661027, 0.17173302173614502, 0.05366452783346176, -0.005898802075535059], [0.0053442297503352165, 0.36604592204093933, 0.05354655161499977, -0.281178742647171], [0.01266514789313078, 0.17020267248153687, 0.047922976315021515, 0.02790023759007454], [0.01606920175254345, -0.025572607293725014, 0.04848098382353783, 0.3353099524974823], [0.015557749196887016, 0.16882705688476562, 0.05518718063831329, 0.0583009198307991], [0.01893429085612297, 0.3631160855293274, 0.05635320022702217, -0.21647213399410248], [0.026196612045168877, 0.16723568737506866, 0.0520237572491169, 0.09344110637903214], [0.029541324824094772, 0.3615748882293701, 0.053892578929662704, -0.18238520622253418], [0.036772824823856354, 0.16572485864162445, 0.05024487525224686, 0.1268000602722168], [0.040087319910526276, 0.3600923418998718, 0.0527808777987957, -0.14961746335029602], [0.0472891665995121, 0.16425588726997375, 0.04978852719068527, 0.1592385321855545], [0.05057428404688835, 0.3586309850215912, 0.05297330021858215, -0.11733102053403854], [0.05774690583348274, 0.5529555082321167, 0.05062667652964592, -0.39284202456474304], [0.06880601495504379, 0.3571530282497406, 0.042769838124513626, -0.08463675528764725], [0.07594907283782959, 0.5516366362571716, 0.04107710346579552, -0.3635248839855194], [0.08698180317878723, 0.7461514472961426, 0.03380660340189934, -0.6429776549339294], [0.10190483182668686, 0.5505749583244324, 0.020947052165865898, -0.33984339237213135], [0.11291633546352386, 0.3551613390445709, 0.014150183647871017, -0.04062926396727562], [0.12001956254243851, 0.15983936190605164, 0.01333759818226099, 0.25648438930511475], [0.12321634590625763, -0.035470444709062576, 0.018467284739017487, 0.553344190120697], [0.12250693887472153, -0.23084679245948792, 0.029534168541431427, 0.851787805557251], [0.11789000779390335, -0.4263586699962616, 0.04656992480158806, 1.1536095142364502], [0.10936283320188522, -0.23187404870986938, 0.06964211910963058, 0.8758854866027832], [0.10472535341978073, -0.037764329463243484, 0.08715982735157013, 0.6058849096298218], [0.10397006571292877, 0.15603765845298767, 0.09927752614021301, 0.3418779969215393], [0.10709081590175629, -0.04034626856446266, 0.10611508041620255, 0.6641430854797363], [0.10628388822078705, 0.1531519740819931, 0.11939794570207596, 0.40666764974594116], [0.10934693366289139, 0.34639641642570496, 0.12753130495548248, 0.15388433635234833], [0.11627485603094101, 0.14970099925994873, 0.13060899078845978, 0.4839240312576294], [0.11926887929439545, 0.34276118874549866, 0.14028745889663696, 0.2350902110338211], [0.12612409889698029, 0.535629153251648, 0.1449892669916153, -0.010260186158120632], [0.1368366926908493, 0.7284063100814819, 0.14478406310081482, -0.2539142072200775], [0.15140481293201447, 0.5315457582473755, 0.13970577716827393, 0.08070496469736099], [0.16203573346138, 0.7244173288345337, 0.1413198858499527, -0.1648436337709427], [0.1765240728855133, 0.9172632098197937, 0.1380230039358139, -0.4098188579082489], [0.19486933946609497, 0.7204819321632385, 0.1298266351222992, -0.07700402289628983], [0.20927897095680237, 0.523760974407196, 0.12828655540943146, 0.2536560595035553], [0.2197542041540146, 0.7168400287628174, 0.13335967063903809, 0.004030297044664621], [0.23409099876880646, 0.5200825929641724, 0.1334402710199356, 0.3356374502182007], [0.24449265003204346, 0.7130781412124634, 0.14015302062034607, 0.08783286064863205], [0.2587542235851288, 0.9059419631958008, 0.14190968871116638, -0.15755601227283478], [0.27687305212020874, 1.0987770557403564, 0.1387585699558258, -0.4023195207118988], [0.29884859919548035, 0.9019879102706909, 0.13071216642856598, -0.06930866837501526], [0.31688836216926575, 1.0950171947479248, 0.1293260008096695, -0.31806254386901855], [0.3387886881828308, 1.2880828380584717, 0.12296474725008011, -0.5673266053199768], [0.3645503520965576, 1.0914700031280518, 0.11161822080612183, -0.23857365548610687], [0.38637974858283997, 0.8949452042579651, 0.10684674233198166, 0.08712687343358994], [0.4042786657810211, 0.6984668374061584, 0.1085892841219902, 0.411516934633255], [0.4182479977607727, 0.8918952941894531, 0.11681962013244629, 0.15494568645954132], [0.43608590960502625, 1.0851677656173706, 0.11991853266954422, -0.09872010350227356], [0.45778924226760864, 1.2783851623535156, 0.1179441288113594, -0.35129314661026], [0.48335695266723633, 1.4716495275497437, 0.11091826856136322, -0.6045805811882019], [0.5127899646759033, 1.6650599241256714, 0.09882665425539017, -0.8603700995445251], [0.5460911393165588, 1.858707070350647, 0.0816192552447319, -1.1204158067703247], [0.5832653045654297, 2.052669048309326, 0.059210941195487976, -1.3864209651947021], [0.6243186593055725, 1.8568611145019531, 0.0314825214445591, -1.075825810432434], [0.6614558696746826, 2.051553249359131, 0.009966002777218819, -1.3584650754928589], [0.7024869322776794, 2.246548891067505, -0.017203299328684807, -1.648013949394226], [0.7474179267883301, 2.4418675899505615, -0.05016357824206352, -1.9460062980651855], [0.7962552905082703, 2.637486696243286, -0.0890837013721466, -2.253807544708252], [0.8490050435066223, 2.4433071613311768, -0.1341598480939865, -1.9898490905761719], [0.8978711366653442, 2.2498228549957275, -0.17395684123039246, -1.7415554523468018], [0.942867636680603, 2.057055950164795, -0.2087879478931427, -1.5076549053192139], [0.0009936954593285918, 0.007597262971103191, -0.021887078881263733, -0.02805415354669094], [0.0011456407373771071, -0.18720409274101257, -0.022448161616921425, 0.25764361023902893], [-0.0025984409730881453, 0.008231038227677345, -0.017295289784669876, -0.04203443601727486], [-0.0024338201619684696, -0.18663868308067322, -0.018135977908968925, 0.2451418787240982], [-0.006166594102978706, 0.008737538941204548, -0.013233140110969543, -0.053205955773591995], [-0.0059918430633842945, 0.20404671132564545, -0.014297259971499443, -0.3500345051288605], [-0.0019109089625999331, 0.3993690609931946, -0.02129795029759407, -0.6471912860870361], [0.006076471880078316, 0.20455020666122437, -0.034241776913404465, -0.36129045486450195], [0.010167475789785385, 0.009931283071637154, -0.041467584669589996, -0.07959830015897751], [0.010366101749241352, 0.20562238991260529, -0.04305955022573471, -0.3850705921649933], [0.014478549361228943, 0.011137358844280243, -0.050760962069034576, -0.10626905411481857], [0.01470129657536745, 0.20694860816001892, -0.052886344492435455, -0.4145249128341675], [0.01884026825428009, 0.012614578008651733, -0.0611768402159214, -0.13897277414798737], [0.019092559814453125, 0.20855696499347687, -0.06395629793405533, -0.4503113031387329], [0.023263700306415558, 0.4045224189758301, -0.07296252250671387, -0.7624488472938538], [0.0313541479408741, 0.21047726273536682, -0.08821149915456772, -0.493587464094162], [0.035563692450523376, 0.016702942550182343, -0.0980832502245903, -0.22995667159557343], [0.03589775413274765, -0.176890566945076, -0.10268238186836243, 0.030247632414102554], [0.03235994279384613, 0.01954256370663643, -0.1020774319767952, -0.2929856777191162], [0.03275079280138016, -0.17398709058761597, -0.10793714225292206, -0.03416096791625023], [0.029271051287651062, -0.3674089312553406, -0.10862036049365997, 0.2226114124059677], [0.021922871470451355, -0.5608242750167847, -0.1041681319475174, 0.47915294766426086], [0.010706386528909206, -0.7543332576751709, -0.09458507597446442, 0.7372730374336243], [-0.004380278754979372, -0.9480304718017578, -0.07983961701393127, 0.998753547668457], [-0.02334088832139969, -0.7519372701644897, -0.05986454337835312, 0.6821027994155884], [-0.03837963193655014, -0.5560372471809387, -0.046222489327192307, 0.37118953466415405], [-0.04950037971138954, -0.36029016971588135, -0.03879869729280472, 0.06429789215326309], [-0.05670618265867233, -0.5548349618911743, -0.03751273825764656, 0.34449154138565063], [-0.06780288368463516, -0.35920003056526184, -0.03062290884554386, 0.04021940380334854], [-0.07498688250780106, -0.16365262866020203, -0.029818519949913025, -0.26196590065956116], [-0.07825993746519089, 0.03188199922442436, -0.03505783900618553, -0.5639027953147888], [-0.07762229442596436, -0.16273096203804016, -0.046335894614458084, -0.2824676036834717], [-0.0808769166469574, -0.3571624159812927, -0.0519852451980114, -0.004751332104206085], [-0.08802016079425812, -0.5515017509460449, -0.05208027362823486, 0.271087110042572], [-0.09905019402503967, -0.3556768298149109, -0.046658530831336975, -0.037556715309619904], [-0.10616373270750046, -0.5500997304916382, -0.04740966483950615, 0.24004758894443512], [-0.11716572940349579, -0.35433369874954224, -0.04260871186852455, -0.06720470637083054], [-0.12425240129232407, -0.5488196611404419, -0.043952807784080505, 0.21173632144927979], [-0.13522879779338837, -0.3530977666378021, -0.039718080312013626, -0.0944809839129448], [-0.14229075610637665, -0.5476285815238953, -0.041607700288295746, 0.18541109561920166], [-0.1532433182001114, -0.7421312928199768, -0.037899479269981384, 0.46468350291252136], [-0.1680859476327896, -0.5464948415756226, -0.028605807572603226, 0.16029980778694153], [-0.1790158450603485, -0.35097530484199524, -0.025399811565876007, -0.1412685066461563], [-0.18603534996509552, -0.15549896657466888, -0.028225181624293327, -0.44185519218444824], [-0.18914532661437988, 0.04001079127192497, -0.03706228733062744, -0.7433001399040222], [-0.18834511935710907, -0.15458054840564728, -0.051928289234638214, -0.46250736713409424], [-0.19143672287464142, 0.041235361248254776, -0.061178434640169144, -0.771095335483551], [-0.19061201810836792, -0.15299372375011444, -0.0766003429889679, -0.49827203154563904], [-0.19367189705371857, -0.3469568192958832, -0.0865657851099968, -0.2306790053844452], [-0.20061102509498596, -0.5407419800758362, -0.09117936342954636, 0.03349174186587334], [-0.21142587065696716, -0.3444388210773468, -0.09050952643156052, -0.2865094840526581], [-0.21831464767456055, -0.5381612181663513, -0.09623971581459045, -0.02368873916566372], [-0.22907787561416626, -0.3418003022670746, -0.09671349078416824, -0.34511798620224], [-0.23591387271881104, -0.14544515311717987, -0.10361585021018982, -0.6666637659072876], [-0.2388227880001068, 0.05095360055565834, -0.11694912612438202, -0.9900904893875122], [-0.23780371248722076, -0.1424253284931183, -0.1367509365081787, -0.736308217048645], [-0.24065221846103668, 0.05429386347532272, -0.15147709846496582, -1.068711757659912], [-0.23956634104251862, -0.13853563368320465, -0.1728513389825821, -0.8271437287330627], [-0.24233704805374146, -0.3309260904788971, -0.18939420580863953, -0.5934240221977234], [-0.24895557761192322, -0.5229629874229431, -0.2012626975774765, -0.3658691644668579], [-0.25941482186317444, -0.32563507556915283, -0.20858007669448853, -0.7146590352058411]], "actions": [0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.013889260590076447, -0.21889489889144897, 0.02866821549832821, 0.2817351222038269], [-0.018267158418893814, -0.41441377997398376, 0.03430291637778282, 0.5833202600479126], [-0.026555433869361877, -0.21978877484798431, 0.04596932232379913, 0.30163756012916565], [-0.030951209366321564, -0.02535112388432026, 0.05200207605957985, 0.023799419403076172], [-0.031458232551813126, -0.22117877006530762, 0.052478063851594925, 0.3324255347251892], [-0.035881806164979935, -0.026841524988412857, 0.05912657454609871, 0.056742433458566666], [-0.03641863912343979, 0.16738499701023102, 0.06026142090559006, -0.21671515703201294], [-0.03307093679904938, 0.361596018075943, 0.05592712014913559, -0.4897967576980591], [-0.02583901770412922, 0.1657315343618393, 0.046131182461977005, -0.1800253838300705], [-0.022524386644363403, 0.3601640462875366, 0.04253067448735237, -0.4578061103820801], [-0.015321106649935246, 0.1644674390554428, 0.03337455540895462, -0.15202642977237701], [-0.012031757272779942, 0.3590960204601288, 0.030334025621414185, -0.43399640917778015], [-0.00484983716160059, 0.1635580211877823, 0.021654097363352776, -0.13190752267837524], [-0.0015786768635734916, -0.03186731040477753, 0.019015947356820107, 0.16752757132053375], [-0.0022160231601446867, -0.22725622355937958, 0.022366497665643692, 0.4661482870578766], [-0.006761147640645504, -0.42268693447113037, 0.031689465045928955, 0.7657962441444397], [-0.015214886516332626, -0.22801533341407776, 0.047005388885736465, 0.48325058817863464], [-0.01977519318461418, -0.03358721733093262, 0.056670401245355606, 0.20574505627155304], [-0.020446937531232834, -0.2294718474149704, 0.06078530102968216, 0.5157524943351746], [-0.025036374107003212, -0.03525617718696594, 0.07110035419464111, 0.2428268939256668], [-0.025741497054696083, 0.158781960606575, 0.07595688849687576, -0.026609040796756744], [-0.02256585843861103, 0.35273709893226624, 0.07542470842599869, -0.29439303278923035], [-0.015511116944253445, 0.1566253900527954, 0.06953684985637665, 0.02109202928841114], [-0.01237860880792141, 0.3506847620010376, 0.06995868682861328, -0.24886620044708252], [-0.005364913959056139, 0.15463709831237793, 0.0649813637137413, 0.06503705680370331], [-0.002272171899676323, 0.3487701117992401, 0.06628210842609406, -0.20645679533481598], [0.00470323022454977, 0.5428847074508667, 0.06215297058224678, -0.47751665115356445], [0.01556092407554388, 0.34694281220436096, 0.05260263755917549, -0.16591010987758636], [0.022499781101942062, 0.5412738919258118, 0.0492844358086586, -0.44154542684555054], [0.033325258642435074, 0.34549039602279663, 0.04045352712273598, -0.1337430477142334], [0.040235064923763275, 0.5400102138519287, 0.037778664380311966, -0.4133940041065216], [0.05103527009487152, 0.3443737030029297, 0.02951078489422798, -0.10904433578252792], [0.05792274326086044, 0.5390605926513672, 0.02732989937067032, -0.39227262139320374], [0.06870395690202713, 0.34356170892715454, 0.019484445452690125, -0.09109976887702942], [0.07557518780231476, 0.5383990406990051, 0.017662450671195984, -0.377572238445282], [0.08634316921234131, 0.73326575756073, 0.01011100597679615, -0.6646342277526855], [0.10100848972797394, 0.9282456040382385, -0.0031816777773201466, -0.9541164636611938], [0.11957339942455292, 1.1234102249145508, -0.022264007478952408, -1.2477972507476807], [0.14204160869121552, 1.3188104629516602, -0.047219954431056976, -1.5473700761795044], [0.1684178113937378, 1.12428617477417, -0.07816735655069351, -1.2697863578796387], [0.19090352952480316, 0.9302443861961365, -0.1035630851984024, -1.002570390701294], [0.20950841903686523, 1.1265860795974731, -0.12361449003219604, -1.3258980512619019], [0.232040137052536, 0.9332225918769836, -0.1501324474811554, -1.074316143989563], [0.2507045865058899, 0.7403687834739685, -0.1716187745332718, -0.8322628736495972], [0.26551195979118347, 0.5479552745819092, -0.18826402723789215, -0.5980911254882812], [0.2764710783958435, 0.35589689016342163, -0.2002258598804474, -0.37011709809303284], [0.2835890054702759, 0.16409888863563538, -0.20762819051742554, -0.14664170145988464], [0.2868709862232208, -0.027538679540157318, -0.21056103706359863, 0.07403579354286194], [-0.03681044280529022, 0.20761168003082275, 0.003870441345497966, -0.2644408047199249], [-0.03265821188688278, 0.012434701435267925, -0.0014183747116476297, 0.029460377991199493], [-0.03240951523184776, 0.2075769603252411, -0.0008291671401821077, -0.2636697292327881], [-0.028257977217435837, 0.012466858141124249, -0.0061025614850223064, 0.028751559555530548], [-0.028008639812469482, -0.1825670450925827, -0.0055275303311645985, 0.3195028305053711], [-0.03165998309850693, 0.012633186765015125, 0.0008625261834822595, 0.02508186548948288], [-0.03140731900930405, 0.20774275064468384, 0.0013641634723171592, -0.26732879877090454], [-0.02725246176123619, 0.012601364403963089, -0.003982412628829479, 0.02578408271074295], [-0.027000434696674347, -0.18246324360370636, -0.0034667309373617172, 0.31720784306526184], [-0.03064969927072525, -0.3775356411933899, 0.0028774263337254524, 0.6087954640388489], [-0.038200411945581436, -0.18245404958724976, 0.015053335577249527, 0.3170202374458313], [-0.041849493980407715, -0.37778714299201965, 0.02139374054968357, 0.6144121885299683], [-0.049405235797166824, -0.1829705536365509, 0.03368198499083519, 0.328543484210968], [-0.05306464806199074, 0.011656110174953938, 0.04025285318493843, 0.046669699251651764], [-0.05283152684569359, 0.2061784416437149, 0.041186247020959854, -0.233046293258667], [-0.048707958310842514, 0.40068843960762024, 0.03652532398700714, -0.5124585032463074], [-0.040694188326597214, 0.5952773690223694, 0.026276152580976486, -0.7934112548828125], [-0.028788641095161438, 0.790028989315033, 0.010407927446067333, -1.0777134895324707], [-0.012988060712814331, 0.9850119352340698, -0.011146342381834984, -1.367112159729004], [0.0067121777683496475, 0.7900312542915344, -0.038488585501909256, -1.0779362916946411], [0.022512802854180336, 0.9856398701667786, -0.06004730984568596, -1.3824447393417358], [0.04222559928894043, 1.1814574003219604, -0.08769620209932327, -1.6932849884033203], [0.0658547505736351, 0.9874505996704102, -0.12156190723180771, -1.429142713546753], [0.0856037586927414, 0.7940213680267334, -0.1501447558403015, -1.1767913103103638], [0.10148418694734573, 0.601134181022644, -0.17368058860301971, -0.9346925616264343], [0.11350686848163605, 0.40872642397880554, -0.19237443804740906, -0.701228678226471], [0.12168139964342117, 0.6059206128120422, -0.20639900863170624, -1.0477733612060547], [0.13379980623722076, 0.414045512676239, -0.2273544818162918, -0.8263208866119385], [-0.015252092853188515, -0.20390771329402924, 0.04253115877509117, 0.25756409764289856], [-0.01933024823665619, -0.3996102511882782, 0.047682441771030426, 0.5633528232574463], [-0.027322452515363693, -0.20518866181373596, 0.05894949659705162, 0.2860652208328247], [-0.03142622485756874, -0.010954804718494415, 0.06467080116271973, 0.012541643343865871], [-0.03164532035589218, 0.18318293988704681, 0.06492163240909576, -0.2590562701225281], [-0.02798166312277317, 0.37732088565826416, 0.05974050983786583, -0.5305761694908142], [-0.02043524570763111, 0.1814117133617401, 0.04912898689508438, -0.21968334913253784], [-0.016807010397315025, 0.37579822540283203, 0.044735319912433624, -0.49647319316864014], [-0.009291047230362892, 0.18007494509220123, 0.03480585664510727, -0.19003421068191528], [-0.00568954786285758, -0.015527207404375076, 0.031005172058939934, 0.11342218518257141], [-0.006000091787427664, -0.21107938885688782, 0.033273614943027496, 0.4157235324382782], [-0.01022167969495058, -0.016444433480501175, 0.041588086634874344, 0.13371333479881287], [-0.01055056881159544, -0.2121366560459137, 0.0442623533308506, 0.43922123312950134], [-0.014793301932513714, -0.017668193206191063, 0.053046777844429016, 0.1608131229877472], [-0.015146665275096893, 0.17665578424930573, 0.056263040751218796, -0.11467437446117401], [-0.011613549664616585, -0.01922531984746456, 0.05396955460309982, 0.19521495699882507], [-0.011998056434094906, 0.17508476972579956, 0.05787385255098343, -0.0799664556980133], [-0.0084963608533144, -0.02081701159477234, 0.056274522095918655, 0.23039965331554413], [-0.008912701159715652, 0.173457533121109, 0.06088251620531082, -0.04401487484574318], [-0.005443550646305084, 0.36765599250793457, 0.060002218931913376, -0.31688445806503296], [0.001909569138661027, 0.17173302173614502, 0.05366452783346176, -0.005898802075535059], [0.0053442297503352165, 0.36604592204093933, 0.05354655161499977, -0.281178742647171], [0.01266514789313078, 0.17020267248153687, 0.047922976315021515, 0.02790023759007454], [0.01606920175254345, -0.025572607293725014, 0.04848098382353783, 0.3353099524974823], [0.015557749196887016, 0.16882705688476562, 0.05518718063831329, 0.0583009198307991], [0.01893429085612297, 0.3631160855293274, 0.05635320022702217, -0.21647213399410248], [0.026196612045168877, 0.16723568737506866, 0.0520237572491169, 0.09344110637903214], [0.029541324824094772, 0.3615748882293701, 0.053892578929662704, -0.18238520622253418], [0.036772824823856354, 0.16572485864162445, 0.05024487525224686, 0.1268000602722168], [0.040087319910526276, 0.3600923418998718, 0.0527808777987957, -0.14961746335029602], [0.0472891665995121, 0.16425588726997375, 0.04978852719068527, 0.1592385321855545], [0.05057428404688835, 0.3586309850215912, 0.05297330021858215, -0.11733102053403854], [0.05774690583348274, 0.5529555082321167, 0.05062667652964592, -0.39284202456474304], [0.06880601495504379, 0.3571530282497406, 0.042769838124513626, -0.08463675528764725], [0.07594907283782959, 0.5516366362571716, 0.04107710346579552, -0.3635248839855194], [0.08698180317878723, 0.7461514472961426, 0.03380660340189934, -0.6429776549339294], [0.10190483182668686, 0.5505749583244324, 0.020947052165865898, -0.33984339237213135], [0.11291633546352386, 0.3551613390445709, 0.014150183647871017, -0.04062926396727562], [0.12001956254243851, 0.15983936190605164, 0.01333759818226099, 0.25648438930511475], [0.12321634590625763, -0.035470444709062576, 0.018467284739017487, 0.553344190120697], [0.12250693887472153, -0.23084679245948792, 0.029534168541431427, 0.851787805557251], [0.11789000779390335, -0.4263586699962616, 0.04656992480158806, 1.1536095142364502], [0.10936283320188522, -0.23187404870986938, 0.06964211910963058, 0.8758854866027832], [0.10472535341978073, -0.037764329463243484, 0.08715982735157013, 0.6058849096298218], [0.10397006571292877, 0.15603765845298767, 0.09927752614021301, 0.3418779969215393], [0.10709081590175629, -0.04034626856446266, 0.10611508041620255, 0.6641430854797363], [0.10628388822078705, 0.1531519740819931, 0.11939794570207596, 0.40666764974594116], [0.10934693366289139, 0.34639641642570496, 0.12753130495548248, 0.15388433635234833], [0.11627485603094101, 0.14970099925994873, 0.13060899078845978, 0.4839240312576294], [0.11926887929439545, 0.34276118874549866, 0.14028745889663696, 0.2350902110338211], [0.12612409889698029, 0.535629153251648, 0.1449892669916153, -0.010260186158120632], [0.1368366926908493, 0.7284063100814819, 0.14478406310081482, -0.2539142072200775], [0.15140481293201447, 0.5315457582473755, 0.13970577716827393, 0.08070496469736099], [0.16203573346138, 0.7244173288345337, 0.1413198858499527, -0.1648436337709427], [0.1765240728855133, 0.9172632098197937, 0.1380230039358139, -0.4098188579082489], [0.19486933946609497, 0.7204819321632385, 0.1298266351222992, -0.07700402289628983], [0.20927897095680237, 0.523760974407196, 0.12828655540943146, 0.2536560595035553], [0.2197542041540146, 0.7168400287628174, 0.13335967063903809, 0.004030297044664621], [0.23409099876880646, 0.5200825929641724, 0.1334402710199356, 0.3356374502182007], [0.24449265003204346, 0.7130781412124634, 0.14015302062034607, 0.08783286064863205], [0.2587542235851288, 0.9059419631958008, 0.14190968871116638, -0.15755601227283478], [0.27687305212020874, 1.0987770557403564, 0.1387585699558258, -0.4023195207118988], [0.29884859919548035, 0.9019879102706909, 0.13071216642856598, -0.06930866837501526], [0.31688836216926575, 1.0950171947479248, 0.1293260008096695, -0.31806254386901855], [0.3387886881828308, 1.2880828380584717, 0.12296474725008011, -0.5673266053199768], [0.3645503520965576, 1.0914700031280518, 0.11161822080612183, -0.23857365548610687], [0.38637974858283997, 0.8949452042579651, 0.10684674233198166, 0.08712687343358994], [0.4042786657810211, 0.6984668374061584, 0.1085892841219902, 0.411516934633255], [0.4182479977607727, 0.8918952941894531, 0.11681962013244629, 0.15494568645954132], [0.43608590960502625, 1.0851677656173706, 0.11991853266954422, -0.09872010350227356], [0.45778924226760864, 1.2783851623535156, 0.1179441288113594, -0.35129314661026], [0.48335695266723633, 1.4716495275497437, 0.11091826856136322, -0.6045805811882019], [0.5127899646759033, 1.6650599241256714, 0.09882665425539017, -0.8603700995445251], [0.5460911393165588, 1.858707070350647, 0.0816192552447319, -1.1204158067703247], [0.5832653045654297, 2.052669048309326, 0.059210941195487976, -1.3864209651947021], [0.6243186593055725, 1.8568611145019531, 0.0314825214445591, -1.075825810432434], [0.6614558696746826, 2.051553249359131, 0.009966002777218819, -1.3584650754928589], [0.7024869322776794, 2.246548891067505, -0.017203299328684807, -1.648013949394226], [0.7474179267883301, 2.4418675899505615, -0.05016357824206352, -1.9460062980651855], [0.7962552905082703, 2.637486696243286, -0.0890837013721466, -2.253807544708252], [0.8490050435066223, 2.4433071613311768, -0.1341598480939865, -1.9898490905761719], [0.8978711366653442, 2.2498228549957275, -0.17395684123039246, -1.7415554523468018], [0.942867636680603, 2.057055950164795, -0.2087879478931427, -1.5076549053192139], [0.9840087294578552, 2.25400710105896, -0.2389410436153412, -1.8576046228408813], [0.0011456407373771071, -0.18720409274101257, -0.022448161616921425, 0.25764361023902893], [-0.0025984409730881453, 0.008231038227677345, -0.017295289784669876, -0.04203443601727486], [-0.0024338201619684696, -0.18663868308067322, -0.018135977908968925, 0.2451418787240982], [-0.006166594102978706, 0.008737538941204548, -0.013233140110969543, -0.053205955773591995], [-0.0059918430633842945, 0.20404671132564545, -0.014297259971499443, -0.3500345051288605], [-0.0019109089625999331, 0.3993690609931946, -0.02129795029759407, -0.6471912860870361], [0.006076471880078316, 0.20455020666122437, -0.034241776913404465, -0.36129045486450195], [0.010167475789785385, 0.009931283071637154, -0.041467584669589996, -0.07959830015897751], [0.010366101749241352, 0.20562238991260529, -0.04305955022573471, -0.3850705921649933], [0.014478549361228943, 0.011137358844280243, -0.050760962069034576, -0.10626905411481857], [0.01470129657536745, 0.20694860816001892, -0.052886344492435455, -0.4145249128341675], [0.01884026825428009, 0.012614578008651733, -0.0611768402159214, -0.13897277414798737], [0.019092559814453125, 0.20855696499347687, -0.06395629793405533, -0.4503113031387329], [0.023263700306415558, 0.4045224189758301, -0.07296252250671387, -0.7624488472938538], [0.0313541479408741, 0.21047726273536682, -0.08821149915456772, -0.493587464094162], [0.035563692450523376, 0.016702942550182343, -0.0980832502245903, -0.22995667159557343], [0.03589775413274765, -0.176890566945076, -0.10268238186836243, 0.030247632414102554], [0.03235994279384613, 0.01954256370663643, -0.1020774319767952, -0.2929856777191162], [0.03275079280138016, -0.17398709058761597, -0.10793714225292206, -0.03416096791625023], [0.029271051287651062, -0.3674089312553406, -0.10862036049365997, 0.2226114124059677], [0.021922871470451355, -0.5608242750167847, -0.1041681319475174, 0.47915294766426086], [0.010706386528909206, -0.7543332576751709, -0.09458507597446442, 0.7372730374336243], [-0.004380278754979372, -0.9480304718017578, -0.07983961701393127, 0.998753547668457], [-0.02334088832139969, -0.7519372701644897, -0.05986454337835312, 0.6821027994155884], [-0.03837963193655014, -0.5560372471809387, -0.046222489327192307, 0.37118953466415405], [-0.04950037971138954, -0.36029016971588135, -0.03879869729280472, 0.06429789215326309], [-0.05670618265867233, -0.5548349618911743, -0.03751273825764656, 0.34449154138565063], [-0.06780288368463516, -0.35920003056526184, -0.03062290884554386, 0.04021940380334854], [-0.07498688250780106, -0.16365262866020203, -0.029818519949913025, -0.26196590065956116], [-0.07825993746519089, 0.03188199922442436, -0.03505783900618553, -0.5639027953147888], [-0.07762229442596436, -0.16273096203804016, -0.046335894614458084, -0.2824676036834717], [-0.0808769166469574, -0.3571624159812927, -0.0519852451980114, -0.004751332104206085], [-0.08802016079425812, -0.5515017509460449, -0.05208027362823486, 0.271087110042572], [-0.09905019402503967, -0.3556768298149109, -0.046658530831336975, -0.037556715309619904], [-0.10616373270750046, -0.5500997304916382, -0.04740966483950615, 0.24004758894443512], [-0.11716572940349579, -0.35433369874954224, -0.04260871186852455, -0.06720470637083054], [-0.12425240129232407, -0.5488196611404419, -0.043952807784080505, 0.21173632144927979], [-0.13522879779338837, -0.3530977666378021, -0.039718080312013626, -0.0944809839129448], [-0.14229075610637665, -0.5476285815238953, -0.041607700288295746, 0.18541109561920166], [-0.1532433182001114, -0.7421312928199768, -0.037899479269981384, 0.46468350291252136], [-0.1680859476327896, -0.5464948415756226, -0.028605807572603226, 0.16029980778694153], [-0.1790158450603485, -0.35097530484199524, -0.025399811565876007, -0.1412685066461563], [-0.18603534996509552, -0.15549896657466888, -0.028225181624293327, -0.44185519218444824], [-0.18914532661437988, 0.04001079127192497, -0.03706228733062744, -0.7433001399040222], [-0.18834511935710907, -0.15458054840564728, -0.051928289234638214, -0.46250736713409424], [-0.19143672287464142, 0.041235361248254776, -0.061178434640169144, -0.771095335483551], [-0.19061201810836792, -0.15299372375011444, -0.0766003429889679, -0.49827203154563904], [-0.19367189705371857, -0.3469568192958832, -0.0865657851099968, -0.2306790053844452], [-0.20061102509498596, -0.5407419800758362, -0.09117936342954636, 0.03349174186587334], [-0.21142587065696716, -0.3444388210773468, -0.09050952643156052, -0.2865094840526581], [-0.21831464767456055, -0.5381612181663513, -0.09623971581459045, -0.02368873916566372], [-0.22907787561416626, -0.3418003022670746, -0.09671349078416824, -0.34511798620224], [-0.23591387271881104, -0.14544515311717987, -0.10361585021018982, -0.6666637659072876], [-0.2388227880001068, 0.05095360055565834, -0.11694912612438202, -0.9900904893875122], [-0.23780371248722076, -0.1424253284931183, -0.1367509365081787, -0.736308217048645], [-0.24065221846103668, 0.05429386347532272, -0.15147709846496582, -1.068711757659912], [-0.23956634104251862, -0.13853563368320465, -0.1728513389825821, -0.8271437287330627], [-0.24233704805374146, -0.3309260904788971, -0.18939420580863953, -0.5934240221977234], [-0.24895557761192322, -0.5229629874229431, -0.2012626975774765, -0.3658691644668579], [-0.25941482186317444, -0.32563507556915283, -0.20858007669448853, -0.7146590352058411], [-0.2659275233745575, -0.12833000719547272, -0.222873255610466, -1.0650808811187744]], "action_prob": [0.5063609480857849, 0.3818599283695221, 0.6526939272880554, 0.6278515458106995, 0.46997591853141785, 0.6360689997673035, 0.5513591766357422, 0.42212367057800293, 0.6409440636634827, 0.4331026077270508, 0.6388604640960693, 0.4411200284957886, 0.6374918818473816, 0.5541270971298218, 0.41267526149749756, 0.35058680176734924, 0.6519783735275269, 0.6535575985908508, 0.38600510358810425, 0.6565408706665039, 0.628821074962616, 0.52765291929245, 0.5918620824813843, 0.5502196550369263, 0.5764225721359253, 0.570029079914093, 0.44031888246536255, 0.6333813667297363, 0.45339807868003845, 0.6300325989723206, 0.4634620249271393, 0.6274592280387878, 0.4703291058540344, 0.625910222530365, 0.4740047752857208, 0.37446996569633484, 0.34707391262054443, 0.3484542965888977, 0.35783880949020386, 0.6311765909194946, 0.6403519511222839, 0.3497332036495209, 0.6365395188331604, 0.6463549733161926, 0.6568177938461304, 0.6658793091773987, 0.6676056385040283, 0.6472459435462952, 0.5182900428771973, 0.6085308194160461, 0.5171417593955994, 0.6098224520683289, 0.485690712928772, 0.6248102188110352, 0.5153582096099854, 0.6105807423591614, 0.48673123121261597, 0.3754425346851349, 0.6527715921401978, 0.3711114227771759, 0.65413898229599, 0.6354808211326599, 0.5452060699462891, 0.41461998224258423, 0.356448233127594, 0.34909409284591675, 0.3573046624660492, 0.6310365796089172, 0.35764080286026, 0.3708937168121338, 0.6165248155593872, 0.625083863735199, 0.6354995369911194, 0.6476777195930481, 0.339484840631485, 0.6405418515205383, 0.5155989527702332, 0.3849019706249237, 0.6531423926353455, 0.6273853778839111, 0.5298799276351929, 0.4066975712776184, 0.6447480916976929, 0.4167865812778473, 0.6432923674583435, 0.5759496688842773, 0.43206292390823364, 0.6458664536476135, 0.4185175597667694, 0.6499626636505127, 0.5970112681388855, 0.5298576951026917, 0.6099034547805786, 0.5102869868278503, 0.6216084361076355, 0.5109587907791138, 0.6041757464408875, 0.528354823589325, 0.5945714712142944, 0.4565376341342926, 0.6431039571762085, 0.561734676361084, 0.5688498616218567, 0.576673150062561, 0.5549179315567017, 0.5900166034698486, 0.5401468276977539, 0.6021005511283875, 0.47564879059791565, 0.6211658120155334, 0.4873230457305908, 0.3829750418663025, 0.6505891680717468, 0.6167297959327698, 0.5049490928649902, 0.3806118965148926, 0.34304776787757874, 0.3499479591846466, 0.6329740881919861, 0.6494153141975403, 0.662268877029419, 0.3455275595188141, 0.6623227000236511, 0.6639185547828674, 0.37623515725135803, 0.6689969897270203, 0.6475051641464233, 0.5689892172813416, 0.5418465733528137, 0.604149341583252, 0.49734818935394287, 0.5942908525466919, 0.4663656949996948, 0.6483849883079529, 0.4298340678215027, 0.6622262597084045, 0.6036136150360107, 0.5024672150611877, 0.5867772102355957, 0.5356977581977844, 0.43701693415641785, 0.623763382434845, 0.5408047437667847, 0.41448941826820374, 0.663095235824585, 0.6084469556808472, 0.5141101479530334, 0.4245453178882599, 0.371150404214859, 0.34705087542533875, 0.338711678981781, 0.6619061827659607, 0.3368293344974518, 0.33654162287712097, 0.34053531289100647, 0.3465937077999115, 0.6463339328765869, 0.6515306830406189, 0.65678870677948, 0.3379564881324768, 0.5293735265731812, 0.5990439653396606, 0.5349780321121216, 0.5959574580192566, 0.4608439803123474, 0.36286649107933044, 0.6554701924324036, 0.6429018974304199, 0.4346165060997009, 0.6478535532951355, 0.41812652349472046, 0.6526630520820618, 0.40033218264579773, 0.34303441643714905, 0.6549407243728638, 0.6614157557487488, 0.6389120817184448, 0.450863242149353, 0.6519824266433716, 0.5835159420967102, 0.4611318111419678, 0.38024577498435974, 0.35459813475608826, 0.6473135948181152, 0.6459556221961975, 0.6085754036903381, 0.5108354091644287, 0.6041291952133179, 0.48132339119911194, 0.3647897243499756, 0.6627327799797058, 0.6428666710853577, 0.5491099953651428, 0.5773723125457764, 0.5618240833282471, 0.5676777958869934, 0.5727627873420715, 0.5581372976303101, 0.5823429822921753, 0.45136016607284546, 0.6296370625495911, 0.5438072085380554, 0.4068174958229065, 0.3417210876941681, 0.6597369313240051, 0.3376992344856262, 0.659480631351471, 0.6664366126060486, 0.6366915106773376, 0.4601975083351135, 0.6488825082778931, 0.43239766359329224, 0.3412373960018158, 0.33100879192352295, 0.6504312753677368, 0.33155906200408936, 0.6463871598243713, 0.6658332943916321, 0.6795682907104492, 0.32379451394081116, 0.3219713568687439], "advantages": [28.048036575317383, 27.55583381652832, 27.31139373779297, 25.950210571289062, 24.912281036376953, 24.385784149169922, 23.311107635498047, 22.5430908203125, 22.055299758911133, 21.07729721069336, 20.586135864257812, 19.640344619750977, 19.147253036499023, 18.22370147705078, 17.529638290405273, 17.068321228027344, 16.804534912109375, 15.33533000946045, 14.144116401672363, 13.613990783691406, 12.394309043884277, 11.421401023864746, 10.6618070602417, 9.728776931762695, 8.939579963684082, 8.026018142700195, 7.206468105316162, 6.564455986022949, 5.51401948928833, 4.855637550354004, 3.8195912837982178, 3.1466281414031982, 2.117262363433838, 1.432149052619934, 0.4034739136695862, -0.2907947599887848, -0.7897732853889465, -1.0816311836242676, -1.1655539274215698, -1.0669852495193481, -2.2022342681884766, -3.289818286895752, -2.9723758697509766, -3.8448984622955322, -4.621053695678711, -5.27489709854126, -5.772811412811279, -6.077804088592529, 13.55277156829834, 12.869795799255371, 12.057090759277344, 11.37041187286377, 10.551521301269531, 9.978594779968262, 8.916670799255371, 8.196599960327148, 7.338379383087158, 6.727002143859863, 6.339681625366211, 4.871066093444824, 4.430931568145752, 2.922201156616211, 1.7170220613479614, 0.8068156838417053, 0.16963832080364227, -0.21424248814582825, -0.368463397026062, -0.33360111713409424, -1.5963412523269653, -1.3874458074569702, -1.0848034620285034, -1.8762567043304443, -2.5620973110198975, -3.117401599884033, -3.5133397579193115, -2.9096267223358154, 46.71133804321289, 46.353206634521484, 46.254615783691406, 45.09080505371094, 44.246917724609375, 43.714683532714844, 43.465728759765625, 42.66190719604492, 42.418670654296875, 41.657047271728516, 41.135093688964844, 40.85968017578125, 39.971092224121094, 39.67961502075195, 38.762027740478516, 38.120296478271484, 37.59489059448242, 36.92536544799805, 36.410282135009766, 35.712772369384766, 35.24113464355469, 34.549625396728516, 34.05733108520508, 33.38469314575195, 32.90352249145508, 32.14677810668945, 31.5942325592041, 30.93747329711914, 30.360742568969727, 29.71299934387207, 29.11168098449707, 28.469579696655273, 27.843244552612305, 27.38426399230957, 26.606067657470703, 26.133033752441406, 25.829694747924805, 24.93905258178711, 24.17987060546875, 23.559619903564453, 23.083147048950195, 22.74886703491211, 22.539365768432617, 21.202030181884766, 20.081600189208984, 19.14341163635254, 18.57965087890625, 17.628368377685547, 16.802467346191406, 16.11887550354004, 15.2731351852417, 14.507826805114746, 13.804015159606934, 12.976797103881836, 12.24531078338623, 11.563404083251953, 10.68970775604248, 9.880620956420898, 9.100123405456543, 8.290914535522461, 7.485498428344727, 6.714167594909668, 5.976471424102783, 5.0735883712768555, 4.310595989227295, 3.584794044494629, 2.636045217514038, 1.7306077480316162, 0.858249306678772, -0.003858497366309166, -0.8404263854026794, -1.6485360860824585, -2.419935464859009, -3.142042636871338, -3.7991998195648193, -4.374523162841797, -5.5004119873046875, -6.0299763679504395, -6.446266174316406, -6.74352502822876, -6.926023483276367, -7.881327152252197, -8.76781940460205, -9.579880714416504, 35.7668571472168, 35.45204544067383, 34.73023223876953, 34.385196685791016, 33.65235137939453, 33.316864013671875, 33.35161590576172, 32.54888916015625, 31.96193504333496, 31.75516128540039, 31.17825698852539, 31.04103660583496, 30.48287010192871, 30.43207359313965, 30.772785186767578, 30.18657112121582, 29.781259536743164, 29.600238800048828, 29.457120895385742, 29.288156509399414, 29.305940628051758, 29.40730857849121, 29.45095443725586, 29.328929901123047, 28.014890670776367, 26.771711349487305, 25.766613006591797, 25.445280075073242, 24.416528701782227, 23.755809783935547, 23.47420310974121, 22.869056701660156, 22.40880584716797, 22.052711486816406, 21.168441772460938, 20.753347396850586, 19.87044906616211, 19.404264450073242, 18.523849487304688, 18.013545989990234, 17.510353088378906, 16.333234786987305, 15.396865844726562, 14.774940490722656, 14.425771713256836, 13.801664352416992, 13.533952713012695, 13.065308570861816, 12.633467674255371, 12.2061128616333, 11.670463562011719, 11.231183052062988, 10.731736183166504, 10.370962142944336, 10.03287410736084, 9.968436241149902, 9.5765962600708, 9.675533294677734, 9.669419288635254, 9.50968074798584, 9.033143997192383], "value_targets": [38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 1164497969, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 388934695, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 241375232, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436, 268659436], "obs": [[-0.009633035399019718, 0.027575576677918434, -0.02855135127902031, 0.03614537790417671], [-0.00908152386546135, 0.22309507429599762, -0.02782844379544258, -0.2654072940349579], [-0.004619622603058815, 0.028381140902638435, -0.03313659131526947, 0.018370015546679497], [-0.004051999654620886, 0.22396224737167358, -0.03276918828487396, -0.2845809757709503], [0.0004272452206350863, 0.02932262234389782, -0.038460809737443924, -0.0024106898345053196], [0.0010136977070942521, -0.1652272492647171, -0.03850902244448662, 0.277893602848053], [-0.0022908472456038, 0.03042231872677803, -0.032951150089502335, -0.026682017371058464], [-0.0016824008198454976, 0.22600093483924866, -0.03348479047417641, -0.3295765817165375], [0.002837618114426732, 0.4215831756591797, -0.040076322853565216, -0.6326281428337097], [0.0112692816182971, 0.227042555809021, -0.05272888392210007, -0.35283082723617554], [0.015810132026672363, 0.4228731095790863, -0.05978550389409065, -0.6616635322570801], [0.024267595261335373, 0.22863174974918365, -0.07301877439022064, -0.3883885145187378], [0.028840230777859688, 0.03461809828877449, -0.08078654110431671, -0.11959194391965866], [0.029532592743635178, -0.15925903618335724, -0.08317837864160538, 0.14654985070228577], [0.026347411796450615, -0.35309740900993347, -0.08024738729000092, 0.4118759334087372], [0.01928546279668808, -0.15693503618240356, -0.0720098689198494, 0.09501183778047562], [0.016146762296557426, -0.35095497965812683, -0.07010962814092636, 0.36413490772247314], [0.00912766344845295, -0.15491029620170593, -0.06282693147659302, 0.050194963812828064], [0.0060294573195278645, -0.3490777313709259, -0.061823032796382904, 0.32241252064704895], [-0.0009520973544567823, -0.5432673096656799, -0.05537478253245354, 0.5949760675430298], [-0.011817444115877151, -0.34741586446762085, -0.043475259095430374, 0.28537726402282715], [-0.018765760585665703, -0.5418916940689087, -0.037767715752124786, 0.5640376806259155], [-0.029603594914078712, -0.3462607264518738, -0.026486961171030998, 0.25969940423965454], [-0.0365288071334362, -0.5409947633743286, -0.021292973309755325, 0.5439117550849915], [-0.04734870418906212, -0.345580130815506, -0.01041473913937807, 0.24459660053253174], [-0.05426030606031418, -0.5405517816543579, -0.005522807128727436, 0.5339763760566711], [-0.06507134437561035, -0.3453526198863983, 0.00515672005712986, 0.2395583540201187], [-0.07197839766740799, -0.15030470490455627, 0.009947887621819973, -0.05149354785680771], [-0.07498449087142944, 0.04467320814728737, 0.008918016217648983, -0.3410212993621826], [-0.07409102469682693, -0.1505744904279709, 0.0020975901279598475, -0.045539550483226776], [-0.07710251212120056, -0.34572646021842957, 0.0011867991415783763, 0.2478044480085373], [-0.08401704579591751, -0.5408653616905212, 0.006142888218164444, 0.5408614873886108], [-0.0948343500494957, -0.3458302617073059, 0.01696011796593666, 0.2501204013824463], [-0.10175095498561859, -0.15095455944538116, 0.021962525323033333, -0.0371650792658329], [-0.10477004945278168, 0.04384566843509674, 0.021219223737716675, -0.3228384852409363], [-0.10389313101768494, 0.23865912854671478, 0.014762453734874725, -0.6087549328804016], [-0.09911995381116867, 0.04333395138382912, 0.002587355440482497, -0.3114590644836426], [-0.0982532724738121, -0.15182477235794067, -0.0036418261006474495, -0.017961299046874046], [-0.101289764046669, 0.04334922507405281, -0.004001052118837833, -0.3117910325527191], [-0.10042278468608856, 0.23852795362472534, -0.010236873291432858, -0.6057330965995789], [-0.09565222263336182, 0.043550629168748856, -0.02235153503715992, -0.31629201769828796], [-0.09478121250867844, 0.23898370563983917, -0.028677374124526978, -0.615939199924469], [-0.09000153839588165, 0.04427390173077583, -0.040996160358190536, -0.3324245810508728], [-0.08911605924367905, -0.15024127066135406, -0.04764465242624283, -0.05294647440314293], [-0.09212088584899902, -0.3446488380432129, -0.04870358109474182, 0.22433170676231384], [-0.09901385754346848, -0.539042055606842, -0.04421694576740265, 0.5012626647949219], [-0.10979469865560532, -0.3433256447315216, -0.03419169411063194, 0.19497936964035034], [-0.11666121333837509, -0.5379422307014465, -0.030292106792330742, 0.47668322920799255], [-0.12742005288600922, -0.7326236963272095, -0.02075844071805477, 0.759666919708252], [-0.14207252860069275, -0.5372219681739807, -0.005565103143453598, 0.46052491664886475], [-0.15281696617603302, -0.34202176332473755, 0.0036453951615840197, 0.16609306633472443], [-0.15965740382671356, -0.5371957421302795, 0.006967256776988506, 0.45992377400398254], [-0.17040131986141205, -0.3421729505062103, 0.016165731474757195, 0.16944506764411926], [-0.17724478244781494, -0.5375224947929382, 0.019554633647203445, 0.4671836495399475], [-0.18799522519111633, -0.34268221259117126, 0.02889830619096756, 0.1807277798652649], [-0.19484888017177582, -0.14798544347286224, 0.032512862235307693, -0.10270050913095474], [-0.19780857861042023, -0.3435578942298889, 0.030458852648735046, 0.20006021857261658], [-0.20467974245548248, -0.5391019582748413, 0.03446005657315254, 0.5021937489509583], [-0.21546177566051483, -0.3444822430610657, 0.04450393095612526, 0.2205667644739151], [-0.22235143184661865, -0.15002374351024628, 0.04891526699066162, -0.0577523298561573], [-0.22535189986228943, 0.04436396807432175, 0.047760218381881714, -0.3346097767353058], [-0.22446462512016296, -0.1514040231704712, 0.041068024933338165, -0.02725646086037159], [-0.22749270498752594, 0.04310564696788788, 0.040522895753383636, -0.3067043721675873], [-0.2266305834054947, 0.23762743175029755, 0.03438880667090416, -0.5863370299339294], [-0.2218780368566513, 0.04204113408923149, 0.022662067785859108, -0.2830227315425873], [-0.22103720903396606, 0.2368326485157013, 0.01700161211192608, -0.5684728622436523], [-0.21630056202411652, 0.4317120611667633, 0.005632155109196901, -0.8557515144348145], [-0.2076663225889206, 0.23651380836963654, -0.011482874862849712, -0.5613029599189758], [-0.202936053276062, 0.04155487194657326, -0.022708933800458908, -0.2722597122192383], [-0.20210495591163635, -0.1532358080148697, -0.028154129162430763, 0.01317510660737753], [-0.2051696628332138, -0.34794291853904724, -0.027890626341104507, 0.2968437969684601], [-0.21212852001190186, -0.15243469178676605, -0.021953750401735306, -0.004503241740167141], [-0.21517722308635712, -0.3472350239753723, -0.02204381488263607, 0.2811729609966278], [-0.222121924161911, -0.15180569887161255, -0.016420355066657066, -0.01838018372654915], [-0.22515803575515747, 0.0435478501021862, -0.01678795926272869, -0.31619834899902344], [-0.22428707778453827, -0.15133100748062134, -0.023111926391720772, -0.028856704011559486], [-0.22731369733810425, -0.34611400961875916, -0.023689061403274536, 0.2564454972743988], [-0.2342359721660614, -0.5408898591995239, -0.018560150638222694, 0.5415633916854858], [-0.24505376815795898, -0.3455120623111725, -0.007728883530944586, 0.24309073388576508], [-0.2519640028476715, -0.15028056502342224, -0.0028670686297118664, -0.05202002450823784], [-0.25496962666511536, -0.34536129236221313, -0.003907469101250172, 0.23975694179534912], [-0.2618768513202667, -0.15018372237682343, 0.0008876697393134236, -0.054155945777893066], [-0.26488053798675537, -0.34531840682029724, -0.00019544913084246218, 0.23880691826343536], [-0.2717868983745575, -0.5404375791549683, 0.004580689128488302, 0.5314281582832336], [-0.2825956344604492, -0.34538033604621887, 0.015209252946078777, 0.24019214510917664], [-0.2895032465457916, -0.15047891438007355, 0.020013095811009407, -0.04765482619404793], [-0.29251283407211304, -0.34588202834129333, 0.01905999891459942, 0.25127461552619934], [-0.2994304597377777, -0.541270911693573, 0.02408549189567566, 0.5499079823493958], [-0.31025588512420654, -0.3464953899383545, 0.035083651542663574, 0.26490992307662964], [-0.31718578934669495, -0.1518913060426712, 0.04038184881210327, -0.016504114493727684], [-0.3202236294746399, 0.04262895509600639, 0.040051765739917755, -0.29617759585380554], [-0.3193710446357727, -0.15304040908813477, 0.03412821516394615, 0.008863129653036594], [-0.32243186235427856, 0.041575901210308075, 0.03430547937750816, -0.2728596031665802], [-0.3216003477573395, 0.236191987991333, 0.02884828671813011, -0.5545281171798706], [-0.31687650084495544, 0.04067709669470787, 0.017757723107933998, -0.25289759039878845], [-0.31606295704841614, 0.23554104566574097, 0.012699771672487259, -0.5399269461631775], [-0.3113521337509155, 0.4304821789264679, 0.001901233452372253, -0.8285814523696899], [-0.30274248123168945, 0.6255781054496765, -0.01467039529234171, -1.1206657886505127], [-0.290230929851532, 0.8208893537521362, -0.037083711475133896, -1.4179141521453857], [-0.2738131284713745, 0.6262456178665161, -0.06544199585914612, -1.1370493173599243], [-0.26128822565078735, 0.4320378005504608, -0.0881829783320427, -0.8655874133110046], [-0.2526474595069885, 0.23821960389614105, -0.10549473017454147, -0.6018819808959961], [-0.24788308143615723, 0.04471917077898979, -0.11753236502408981, -0.3442029058933258], [-0.2469886988401413, -0.14855177700519562, -0.12441642582416534, -0.09077156335115433], [-0.24995972216129303, -0.34169113636016846, -0.1262318640947342, 0.16021396219730377], [-0.2567935585975647, -0.5348011255264282, -0.12302757799625397, 0.4105604588985443], [-0.26748958230018616, -0.7279837131500244, -0.11481636762619019, 0.6620652079582214], [-0.2820492386817932, -0.5314672589302063, -0.10157506167888641, 0.335549533367157], [-0.2926785945892334, -0.33505749702453613, -0.09486407041549683, 0.012641659006476402], [-0.29937973618507385, -0.5286999940872192, -0.09461124241352081, 0.2739512026309967], [-0.3099537491798401, -0.33236438035964966, -0.08913221955299377, -0.04700933396816254], [-0.316601037979126, -0.1360848993062973, -0.090072400867939, -0.36643001437187195], [-0.31932273507118225, -0.3298191428184509, -0.09740100055932999, -0.1034521758556366], [-0.32591912150382996, -0.13344603776931763, -0.09947004914283752, -0.42520633339881897], [-0.3285880386829376, 0.06293384730815887, -0.10797417163848877, -0.7475160956382751], [-0.3273293673992157, 0.25936663150787354, -0.12292449921369553, -1.0721321105957031], [-0.3221420347690582, 0.06606503576040268, -0.14436714351177216, -0.8204164505004883], [-0.32082071900367737, -0.1268174946308136, -0.16077546775341034, -0.5763991475105286], [-0.32335707545280457, -0.3193640410900116, -0.1723034530878067, -0.338368684053421], [-0.3297443389892578, -0.12226273864507675, -0.1790708303451538, -0.6800497174263], [-0.3321896195411682, -0.3145051896572113, -0.19267182052135468, -0.44866296648979187], [-0.3384796977043152, -0.5064544677734375, -0.20164507627487183, -0.2223624587059021], [-0.3486087918281555, -0.3091072738170624, -0.20609232783317566, -0.5712681412696838], [-0.008780197240412235, 0.02821466699242592, 0.033755961805582047, -0.03580862656235695], [-0.00821590330451727, -0.16737468540668488, 0.03303978964686394, 0.2673306167125702], [-0.011563397012650967, 0.027260536327958107, 0.038386400789022446, -0.014750929549336433], [-0.011018186807632446, 0.22181154787540436, 0.03809138387441635, -0.29507964849472046], [-0.006581955589354038, 0.026167839765548706, 0.03218979015946388, 0.009369206614792347], [-0.00605859886854887, 0.22081370651721954, 0.032377175986766815, -0.27298617362976074], [-0.0016423244960606098, 0.025245098397135735, 0.02691745199263096, 0.029730219393968582], [-0.0011374225141480565, 0.21997089684009552, 0.02751205489039421, -0.25433990359306335], [0.0032619955018162727, 0.024467147886753082, 0.02242525853216648, 0.04689227417111397], [0.0037513384595513344, 0.21926048398017883, 0.023363104090094566, -0.23863178491592407], [0.008136548101902008, 0.023812690749764442, 0.018590467050671577, 0.06132802367210388], [0.008612802252173424, -0.1715708076953888, 0.01981702819466591, 0.35981789231300354], [0.0051813856698572636, -0.3669687807559967, 0.02701338566839695, 0.6586831212043762], [-0.0021579896565526724, -0.5624560713768005, 0.0401870496571064, 0.9597480893135071], [-0.013407111167907715, -0.7580945491790771, 0.059382010251283646, 1.2647806406021118], [-0.028569001704454422, -0.5637796521186829, 0.08467762172222137, 0.991270124912262], [-0.03984459489583969, -0.36988672614097595, 0.10450302809476852, 0.726338267326355], [-0.04724232852458954, -0.5662864446640015, 0.11902979016304016, 1.0499986410140991], [-0.05856806039810181, -0.7627689242362976, 0.14002977311611176, 1.377549171447754], [-0.07382343709468842, -0.9593343734741211, 0.1675807535648346, 1.7105457782745361], [-0.09301012754440308, -0.7664874792098999, 0.2017916589975357, 1.4743661880493164], [0.02498960867524147, -0.015323923900723457, 0.04494071006774902, 0.003153017722070217], [0.024683130905032158, 0.17912566661834717, 0.04500377178192139, -0.27501875162124634], [0.02826564386487007, -0.016608530655503273, 0.039503395557403564, 0.03151191398501396], [0.027933472767472267, 0.17792531847953796, 0.040133632719516754, -0.24845021963119507], [0.03149197995662689, 0.3724518120288849, 0.03516462817788124, -0.52820885181427], [0.03894101455807686, 0.1768532246351242, 0.024600451812148094, -0.2246561050415039], [0.042478080838918686, 0.37161508202552795, 0.02010732889175415, -0.509478747844696], [0.04991038143634796, 0.17621572315692902, 0.00991775467991829, -0.21052776277065277], [0.053434696048498154, -0.019046617671847343, 0.005707199685275555, 0.08526711910963058], [0.05305376276373863, -0.21424990892410278, 0.007412542123347521, 0.3797451853752136], [0.04876876622438431, -0.019234003499150276, 0.015007445588707924, 0.08940864354372025], [0.048384085297584534, 0.17566965520381927, 0.01679561845958233, -0.19850189983844757], [0.051897477358579636, 0.37054741382598877, 0.01282558124512434, -0.4858396053314209], [0.05930842459201813, 0.17524683475494385, 0.003108788514509797, -0.18914224207401276], [0.06281336396932602, -0.01991945132613182, -0.0006740562967024744, 0.10451975464820862], [0.062414973974227905, -0.21503174304962158, 0.0014163388404995203, 0.39698994159698486], [0.05811433866620064, -0.019929908215999603, 0.009356137365102768, 0.10475390404462814], [0.05771574005484581, -0.21518468856811523, 0.011451215483248234, 0.4003739058971405], [0.053412046283483505, -0.02022702246904373, 0.019458694383502007, 0.11132317781448364], [0.05300750583410263, -0.21562232077121735, 0.021685156971216202, 0.4100811183452606], [0.04869506135582924, -0.02081441506743431, 0.029886780306696892, 0.12431291490793228], [0.048278771340847015, 0.1738668978214264, 0.032373037189245224, -0.15879324078559875], [0.0517561100423336, -0.021703213453292847, 0.029197173193097115, 0.14392423629760742], [0.05132204666733742, -0.2172308713197708, 0.032075658440589905, 0.44567346572875977], [0.04697743058204651, -0.02257705293595791, 0.04098912701010704, 0.16327154636383057], [0.04652588814496994, -0.21826107800006866, 0.04425456002354622, 0.46859848499298096], [0.04216066747903824, -0.023791350424289703, 0.05362652614712715, 0.19018608331680298], [0.041684839874506, 0.17052403092384338, 0.05743024870753288, -0.08510934561491013], [0.04509532079100609, -0.025372110307216644, 0.055728062987327576, 0.22512564063072205], [0.0445878766477108, -0.22124440968036652, 0.06023057550191879, 0.5348535180091858], [0.040162988007068634, -0.02701886184513569, 0.07092764973640442, 0.2617405951023102], [0.03962261229753494, -0.22307781875133514, 0.07616245746612549, 0.5759248733520508], [0.035161055624485016, -0.41918015480041504, 0.08768095821142197, 0.891595721244812], [0.02677745185792446, -0.22535006701946259, 0.10551287233829498, 0.6277126669883728], [0.022270450368523598, -0.03184668347239494, 0.11806712299585342, 0.3700350821018219], [0.021633516997098923, -0.2284308820962906, 0.12546782195568085, 0.6974896192550659], [0.0170648992061615, -0.42504870891571045, 0.1394176185131073, 1.0268888473510742], [0.008563925512135029, -0.6217234134674072, 0.15995539724826813, 1.3598946332931519], [-0.0038705430924892426, -0.42892706394195557, 0.18715327978134155, 1.1212183237075806], [0.04365787282586098, -0.038822680711746216, 0.021257195621728897, 0.02996775694191456], [0.042881421744823456, 0.15598808228969574, 0.021856550127267838, -0.2559332251548767], [0.04600118100643158, -0.03943900018930435, 0.016737885773181915, 0.043562695384025574], [0.04521240293979645, 0.15543898940086365, 0.017609139904379845, -0.24379262328147888], [0.048321180045604706, 0.35030505061149597, 0.012733287177979946, -0.5308696031570435], [0.05532728135585785, 0.5452455878257751, 0.0021158955059945583, -0.819513201713562], [0.06623219698667526, 0.350094735622406, -0.01427436899393797, -0.5261655449867249], [0.07323408871889114, 0.5454146265983582, -0.024797679856419563, -0.823311984539032], [0.08414237946271896, 0.35064053535461426, -0.041263919323682785, -0.5385304689407349], [0.09115519374608994, 0.15612223744392395, -0.05203452706336975, -0.2591295540332794], [0.09427763521671295, -0.03821974992752075, -0.05721712112426758, 0.016697624698281288], [0.09351324290037155, -0.23247644305229187, -0.05688316747546196, 0.29079318046569824], [0.08886371552944183, -0.036591485142707825, -0.051067303866147995, -0.019273661077022552], [0.08813188225030899, -0.23094528913497925, -0.05145277827978134, 0.25686973333358765], [0.08351297676563263, -0.035127945244312286, -0.04631538316607475, -0.051588013768196106], [0.0828104168176651, 0.16062647104263306, -0.04734714329242706, -0.3585166037082672], [0.08602295070886612, -0.033791542053222656, -0.0545174740254879, -0.08113126456737518], [0.08534711599349976, -0.2280913144350052, -0.056140098720788956, 0.19386519491672516], [0.08078528940677643, -0.422367125749588, -0.052262794226408005, 0.468323290348053], [0.07233794778585434, -0.616713285446167, -0.0428963303565979, 0.7440862059593201], [0.06000368297100067, -0.42102640867233276, -0.02801460586488247, 0.43821823596954346], [0.05158315598964691, -0.2255193591117859, -0.019250240176916122, 0.13683752715587616], [0.047072768211364746, -0.030127044767141342, -0.016513491049408913, -0.16185584664344788], [0.04647022485733032, 0.16522736847400665, -0.019750608131289482, -0.4597022533416748], [0.04977477341890335, -0.029609913006424904, -0.028944652527570724, -0.17330963909626007], [0.049182575196027756, 0.16591408848762512, -0.032410845160484314, -0.4749813377857208], [0.05250085890293121, -0.02873554825782776, -0.04191047325730324, -0.19268734753131866], [0.0519261471927166, -0.2232336848974228, -0.045764219015836716, 0.0864855945110321], [0.04746147245168686, -0.4176707863807678, -0.044034507125616074, 0.3643859028816223], [0.03910805657505989, -0.6121401786804199, -0.0367467887699604, 0.6428652405738831], [0.02686525322496891, -0.41652581095695496, -0.023889483883976936, 0.33884066343307495], [0.018534738570451736, -0.6112998127937317, -0.017112670466303825, 0.6238954663276672], [0.0063087414018809795, -0.4159431755542755, -0.004634760785847902, 0.3258725702762604], [-0.0020101224072277546, -0.22075554728507996, 0.0018826901214197278, 0.03173163905739784], [-0.00642523355782032, -0.4159044623374939, 0.002517322776839137, 0.32500797510147095], [-0.014743322506546974, -0.6110621690750122, 0.00901748239994049, 0.6184837222099304], [-0.026964565739035606, -0.8063088655471802, 0.02138715609908104, 0.9139930009841919], [-0.04309074208140373, -0.6114826798439026, 0.03966701775789261, 0.6281078457832336], [-0.05532039701938629, -0.41693612933158875, 0.052229173481464386, 0.34817662835121155], [-0.06365911662578583, -0.22259443998336792, 0.059192705899477005, 0.07241000235080719], [-0.06811100989580154, -0.41851285099983215, 0.06064090505242348, 0.3831654191017151], [-0.07648126780986786, -0.22430194914340973, 0.06830421090126038, 0.11020205169916153], [-0.08096730709075928, -0.030221879482269287, 0.07050825655460358, -0.16017338633537292], [-0.08157174289226532, -0.22627870738506317, 0.06730479001998901, 0.15389341115951538], [-0.08609731495380402, -0.03218178078532219, 0.07038265466690063, -0.11682012677192688], [-0.08674094825983047, 0.16186483204364777, 0.06804625689983368, -0.386493980884552], [-0.08350365608930588, -0.0341537781059742, 0.06031637266278267, -0.07315635681152344], [-0.08418673276901245, 0.16005392372608185, 0.05885324627161026, -0.3462159037590027], [-0.0809856504201889, -0.03585365042090416, 0.05192892998456955, -0.035570450127124786], [-0.08170272409915924, -0.23168033361434937, 0.051217518746852875, 0.27303385734558105], [-0.08633632957935333, -0.0373251810669899, 0.05667819827795029, -0.0030652107670903206], [-0.08708283305168152, -0.23321224749088287, 0.0566168911755085, 0.3069480359554291], [-0.09174708276987076, -0.03894084319472313, 0.06275585293769836, 0.032644327729940414], [-0.0925258994102478, 0.1552276462316513, 0.0634087398648262, -0.23959696292877197], [-0.089421346783638, -0.04074012115597725, 0.05861680209636688, 0.07239362597465515], [-0.09023614972829819, -0.23665130138397217, 0.06006467342376709, 0.382979154586792], [-0.09496917575597763, -0.042431317269802094, 0.06772425770759583, 0.10982294380664825], [-0.09581779688596725, -0.23845508694648743, 0.06992071866989136, 0.4230802655220032], [-0.100586898624897, -0.044389739632606506, 0.07838232070207596, 0.15323346853256226], [-0.10147469490766525, -0.24054141342639923, 0.08144699037075043, 0.46957844495773315], [-0.10628551989793777, -0.046658776700496674, 0.09083855897188187, 0.20363749563694], [-0.10721869766712189, 0.14705459773540497, 0.09491130709648132, -0.05906473845243454], [-0.104277603328228, 0.3406966030597687, 0.09373001009225845, -0.32035842537879944], [-0.09746367484331131, 0.5343674421310425, 0.08732284605503082, -0.5820732116699219], [-0.08677632361650467, 0.33813753724098206, 0.07568138092756271, -0.26320958137512207], [-0.08001357316970825, 0.14202149212360382, 0.07041718810796738, 0.05235152319073677], [-0.0771731436252594, -0.05403580144047737, 0.07146421819925308, 0.36639419198036194], [-0.0782538577914238, 0.14000169932842255, 0.07879210263490677, 0.09707345813512802], [-0.07545382529497147, 0.33391115069389343, 0.08073357492685318, -0.16974739730358124], [-0.06877560168504715, 0.5277903079986572, 0.07733862847089767, -0.4359089732170105], [-0.058219797909259796, 0.3316636085510254, 0.06862044334411621, -0.11988339573144913], [-0.05158652737736702, 0.5257387161254883, 0.06622277945280075, -0.39015236496925354], [-0.041071753948926926, 0.7198613286018372, 0.05841973051428795, -0.6612427830696106], [-0.026674525812268257, 0.9141238331794739, 0.045194875448942184, -0.9349737763404846], [-0.008392048999667168, 0.7184223532676697, 0.026495398953557014, -0.6284385323524475], [0.005976397544145584, 0.5229408144950867, 0.013926628977060318, -0.3275304436683655], [0.01643521524965763, 0.3276234269142151, 0.0073760198429226875, -0.030488435178995132], [0.02298768237233162, 0.5226387977600098, 0.0067662508226931095, -0.32083505392074585], [0.03344045951962471, 0.7176637649536133, 0.00034954986767843366, -0.6113765239715576], [0.047793734818696976, 0.5225369334220886, -0.011877980083227158, -0.31858351826667786], [0.05824447423219681, 0.3275861442089081, -0.018249649554491043, -0.029670001938939095], [0.06479619443416595, 0.5229649543762207, -0.01884305104613304, -0.3280545771121979], [0.07525549829006195, 0.3281162977218628, -0.02540414221584797, -0.041372936218976974], [0.08181782066822052, 0.5235931277275085, -0.02623159997165203, -0.3419616222381592], [0.09228968620300293, 0.3288540244102478, -0.03307083249092102, -0.0576646514236927], [0.09886676073074341, 0.13422147929668427, -0.03422412648797035, 0.2244034856557846], [0.10155119746923447, 0.32981544733047485, -0.029736056923866272, -0.0788755714893341], [0.1081475019454956, 0.1351321041584015, -0.031313568353652954, 0.20427921414375305], [0.11085014790296555, -0.059528373181819916, -0.027227982878684998, 0.48692211508750916], [0.1096595749258995, 0.1359669715166092, -0.017489541321992874, 0.1857837438583374], [0.11237891763448715, -0.05890043079853058, -0.01377386599779129, 0.4728984832763672], [0.11120090633630753, 0.1364133208990097, -0.004315896891057491, 0.1759062558412552], [0.11392917484045029, 0.3315967619419098, -0.0007977716159075499, -0.11813505738973618], [0.12056110799312592, 0.1364862620830536, -0.0031604727264493704, 0.1742960661649704], [0.12329083681106567, 0.33165329694747925, 0.0003254485782235861, -0.11938221007585526], [0.12992389500141144, 0.1365266889333725, -0.00206219544634223, 0.17340338230133057], [0.13265442848205566, 0.3316780924797058, 0.0014058720553293824, -0.11992938816547394], [0.13928799331188202, 0.13653601706027985, -0.0009927158243954182, 0.17319674789905548], [0.14201872050762177, -0.058571707457304, 0.0024712190497666597, 0.46556633710861206], [0.14084728062152863, 0.13651524484157562, 0.01178254559636116, 0.17366334795951843], [0.14357759058475494, 0.33146658539772034, 0.015255812555551529, -0.11527939885854721], [0.15020692348480225, 0.526366651058197, 0.012950224801898003, -0.40311044454574585], [0.16073425114154816, 0.7213025689125061, 0.004888015799224377, -0.6916825175285339], [0.17516030371189117, 0.5261131525039673, -0.008945634588599205, -0.3974648118019104], [0.18568256497383118, 0.33111923933029175, -0.016894930973649025, -0.1076156497001648], [0.19230495393276215, 0.13624341785907745, -0.019047243520617485, 0.17968948185443878], [0.1950298249721527, 0.33163267374038696, -0.015453455038368702, -0.1189407929778099], [0.20166248083114624, 0.13673551380634308, -0.01783226989209652, 0.16882692277431488], [0.20439718663692474, 0.33210811018943787, -0.014455731958150864, -0.12942779064178467], [0.21103934943675995, 0.5274341106414795, -0.01704428717494011, -0.4266360402107239], [0.22158803045749664, 0.33255767822265625, -0.025577008724212646, -0.13937461376190186], [0.22823917865753174, 0.5280364751815796, -0.028364501893520355, -0.44001567363739014], [0.23879991471767426, 0.33332717418670654, -0.03716481477022171, -0.15640728175640106], [0.2454664558172226, 0.13875649869441986, -0.04029295966029167, 0.12432324886322021], [0.24824158847332, -0.055765729397535324, -0.037806496024131775, 0.4040268361568451], [0.2471262663602829, 0.13987143337726593, -0.02972595952451229, 0.09966833144426346], [0.2499237060546875, -0.05481215938925743, -0.027732592076063156, 0.382826566696167], [0.24882745742797852, -0.24952960014343262, -0.02007606066763401, 0.6666380763053894], [0.24383686482906342, -0.4443666636943817, -0.006743299309164286, 0.9529328346252441], [0.23494952917099, -0.6393972635269165, 0.012315357103943825, 1.2434895038604736], [0.22216159105300903, -0.8346750736236572, 0.037185147404670715, 1.5400046110153198], [0.205468088388443, -0.6400195360183716, 0.06798523664474487, 1.259153127670288], [0.19266769289970398, -0.835942268371582, 0.09316830337047577, 1.5723305940628052], [0.1759488433599472, -0.6420471668243408, 0.12461491674184799, 1.3101012706756592], [0.16310790181159973, -0.4487043619155884, 0.1508169323205948, 1.058877944946289], [0.15413381159305573, -0.2558668851852417, 0.17199449241161346, 0.8170773983001709], [0.14901648461818695, -0.06346412003040314, 0.18833604454994202, 0.583048939704895], [0.147747203707695, 0.12858973443508148, 0.19999702274799347, 0.35510629415512085], [0.15031899511814117, -0.06873030215501785, 0.20709915459156036, 0.7035945653915405]], "actions": [1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.00908152386546135, 0.22309507429599762, -0.02782844379544258, -0.2654072940349579], [-0.004619622603058815, 0.028381140902638435, -0.03313659131526947, 0.018370015546679497], [-0.004051999654620886, 0.22396224737167358, -0.03276918828487396, -0.2845809757709503], [0.0004272452206350863, 0.02932262234389782, -0.038460809737443924, -0.0024106898345053196], [0.0010136977070942521, -0.1652272492647171, -0.03850902244448662, 0.277893602848053], [-0.0022908472456038, 0.03042231872677803, -0.032951150089502335, -0.026682017371058464], [-0.0016824008198454976, 0.22600093483924866, -0.03348479047417641, -0.3295765817165375], [0.002837618114426732, 0.4215831756591797, -0.040076322853565216, -0.6326281428337097], [0.0112692816182971, 0.227042555809021, -0.05272888392210007, -0.35283082723617554], [0.015810132026672363, 0.4228731095790863, -0.05978550389409065, -0.6616635322570801], [0.024267595261335373, 0.22863174974918365, -0.07301877439022064, -0.3883885145187378], [0.028840230777859688, 0.03461809828877449, -0.08078654110431671, -0.11959194391965866], [0.029532592743635178, -0.15925903618335724, -0.08317837864160538, 0.14654985070228577], [0.026347411796450615, -0.35309740900993347, -0.08024738729000092, 0.4118759334087372], [0.01928546279668808, -0.15693503618240356, -0.0720098689198494, 0.09501183778047562], [0.016146762296557426, -0.35095497965812683, -0.07010962814092636, 0.36413490772247314], [0.00912766344845295, -0.15491029620170593, -0.06282693147659302, 0.050194963812828064], [0.0060294573195278645, -0.3490777313709259, -0.061823032796382904, 0.32241252064704895], [-0.0009520973544567823, -0.5432673096656799, -0.05537478253245354, 0.5949760675430298], [-0.011817444115877151, -0.34741586446762085, -0.043475259095430374, 0.28537726402282715], [-0.018765760585665703, -0.5418916940689087, -0.037767715752124786, 0.5640376806259155], [-0.029603594914078712, -0.3462607264518738, -0.026486961171030998, 0.25969940423965454], [-0.0365288071334362, -0.5409947633743286, -0.021292973309755325, 0.5439117550849915], [-0.04734870418906212, -0.345580130815506, -0.01041473913937807, 0.24459660053253174], [-0.05426030606031418, -0.5405517816543579, -0.005522807128727436, 0.5339763760566711], [-0.06507134437561035, -0.3453526198863983, 0.00515672005712986, 0.2395583540201187], [-0.07197839766740799, -0.15030470490455627, 0.009947887621819973, -0.05149354785680771], [-0.07498449087142944, 0.04467320814728737, 0.008918016217648983, -0.3410212993621826], [-0.07409102469682693, -0.1505744904279709, 0.0020975901279598475, -0.045539550483226776], [-0.07710251212120056, -0.34572646021842957, 0.0011867991415783763, 0.2478044480085373], [-0.08401704579591751, -0.5408653616905212, 0.006142888218164444, 0.5408614873886108], [-0.0948343500494957, -0.3458302617073059, 0.01696011796593666, 0.2501204013824463], [-0.10175095498561859, -0.15095455944538116, 0.021962525323033333, -0.0371650792658329], [-0.10477004945278168, 0.04384566843509674, 0.021219223737716675, -0.3228384852409363], [-0.10389313101768494, 0.23865912854671478, 0.014762453734874725, -0.6087549328804016], [-0.09911995381116867, 0.04333395138382912, 0.002587355440482497, -0.3114590644836426], [-0.0982532724738121, -0.15182477235794067, -0.0036418261006474495, -0.017961299046874046], [-0.101289764046669, 0.04334922507405281, -0.004001052118837833, -0.3117910325527191], [-0.10042278468608856, 0.23852795362472534, -0.010236873291432858, -0.6057330965995789], [-0.09565222263336182, 0.043550629168748856, -0.02235153503715992, -0.31629201769828796], [-0.09478121250867844, 0.23898370563983917, -0.028677374124526978, -0.615939199924469], [-0.09000153839588165, 0.04427390173077583, -0.040996160358190536, -0.3324245810508728], [-0.08911605924367905, -0.15024127066135406, -0.04764465242624283, -0.05294647440314293], [-0.09212088584899902, -0.3446488380432129, -0.04870358109474182, 0.22433170676231384], [-0.09901385754346848, -0.539042055606842, -0.04421694576740265, 0.5012626647949219], [-0.10979469865560532, -0.3433256447315216, -0.03419169411063194, 0.19497936964035034], [-0.11666121333837509, -0.5379422307014465, -0.030292106792330742, 0.47668322920799255], [-0.12742005288600922, -0.7326236963272095, -0.02075844071805477, 0.759666919708252], [-0.14207252860069275, -0.5372219681739807, -0.005565103143453598, 0.46052491664886475], [-0.15281696617603302, -0.34202176332473755, 0.0036453951615840197, 0.16609306633472443], [-0.15965740382671356, -0.5371957421302795, 0.006967256776988506, 0.45992377400398254], [-0.17040131986141205, -0.3421729505062103, 0.016165731474757195, 0.16944506764411926], [-0.17724478244781494, -0.5375224947929382, 0.019554633647203445, 0.4671836495399475], [-0.18799522519111633, -0.34268221259117126, 0.02889830619096756, 0.1807277798652649], [-0.19484888017177582, -0.14798544347286224, 0.032512862235307693, -0.10270050913095474], [-0.19780857861042023, -0.3435578942298889, 0.030458852648735046, 0.20006021857261658], [-0.20467974245548248, -0.5391019582748413, 0.03446005657315254, 0.5021937489509583], [-0.21546177566051483, -0.3444822430610657, 0.04450393095612526, 0.2205667644739151], [-0.22235143184661865, -0.15002374351024628, 0.04891526699066162, -0.0577523298561573], [-0.22535189986228943, 0.04436396807432175, 0.047760218381881714, -0.3346097767353058], [-0.22446462512016296, -0.1514040231704712, 0.041068024933338165, -0.02725646086037159], [-0.22749270498752594, 0.04310564696788788, 0.040522895753383636, -0.3067043721675873], [-0.2266305834054947, 0.23762743175029755, 0.03438880667090416, -0.5863370299339294], [-0.2218780368566513, 0.04204113408923149, 0.022662067785859108, -0.2830227315425873], [-0.22103720903396606, 0.2368326485157013, 0.01700161211192608, -0.5684728622436523], [-0.21630056202411652, 0.4317120611667633, 0.005632155109196901, -0.8557515144348145], [-0.2076663225889206, 0.23651380836963654, -0.011482874862849712, -0.5613029599189758], [-0.202936053276062, 0.04155487194657326, -0.022708933800458908, -0.2722597122192383], [-0.20210495591163635, -0.1532358080148697, -0.028154129162430763, 0.01317510660737753], [-0.2051696628332138, -0.34794291853904724, -0.027890626341104507, 0.2968437969684601], [-0.21212852001190186, -0.15243469178676605, -0.021953750401735306, -0.004503241740167141], [-0.21517722308635712, -0.3472350239753723, -0.02204381488263607, 0.2811729609966278], [-0.222121924161911, -0.15180569887161255, -0.016420355066657066, -0.01838018372654915], [-0.22515803575515747, 0.0435478501021862, -0.01678795926272869, -0.31619834899902344], [-0.22428707778453827, -0.15133100748062134, -0.023111926391720772, -0.028856704011559486], [-0.22731369733810425, -0.34611400961875916, -0.023689061403274536, 0.2564454972743988], [-0.2342359721660614, -0.5408898591995239, -0.018560150638222694, 0.5415633916854858], [-0.24505376815795898, -0.3455120623111725, -0.007728883530944586, 0.24309073388576508], [-0.2519640028476715, -0.15028056502342224, -0.0028670686297118664, -0.05202002450823784], [-0.25496962666511536, -0.34536129236221313, -0.003907469101250172, 0.23975694179534912], [-0.2618768513202667, -0.15018372237682343, 0.0008876697393134236, -0.054155945777893066], [-0.26488053798675537, -0.34531840682029724, -0.00019544913084246218, 0.23880691826343536], [-0.2717868983745575, -0.5404375791549683, 0.004580689128488302, 0.5314281582832336], [-0.2825956344604492, -0.34538033604621887, 0.015209252946078777, 0.24019214510917664], [-0.2895032465457916, -0.15047891438007355, 0.020013095811009407, -0.04765482619404793], [-0.29251283407211304, -0.34588202834129333, 0.01905999891459942, 0.25127461552619934], [-0.2994304597377777, -0.541270911693573, 0.02408549189567566, 0.5499079823493958], [-0.31025588512420654, -0.3464953899383545, 0.035083651542663574, 0.26490992307662964], [-0.31718578934669495, -0.1518913060426712, 0.04038184881210327, -0.016504114493727684], [-0.3202236294746399, 0.04262895509600639, 0.040051765739917755, -0.29617759585380554], [-0.3193710446357727, -0.15304040908813477, 0.03412821516394615, 0.008863129653036594], [-0.32243186235427856, 0.041575901210308075, 0.03430547937750816, -0.2728596031665802], [-0.3216003477573395, 0.236191987991333, 0.02884828671813011, -0.5545281171798706], [-0.31687650084495544, 0.04067709669470787, 0.017757723107933998, -0.25289759039878845], [-0.31606295704841614, 0.23554104566574097, 0.012699771672487259, -0.5399269461631775], [-0.3113521337509155, 0.4304821789264679, 0.001901233452372253, -0.8285814523696899], [-0.30274248123168945, 0.6255781054496765, -0.01467039529234171, -1.1206657886505127], [-0.290230929851532, 0.8208893537521362, -0.037083711475133896, -1.4179141521453857], [-0.2738131284713745, 0.6262456178665161, -0.06544199585914612, -1.1370493173599243], [-0.26128822565078735, 0.4320378005504608, -0.0881829783320427, -0.8655874133110046], [-0.2526474595069885, 0.23821960389614105, -0.10549473017454147, -0.6018819808959961], [-0.24788308143615723, 0.04471917077898979, -0.11753236502408981, -0.3442029058933258], [-0.2469886988401413, -0.14855177700519562, -0.12441642582416534, -0.09077156335115433], [-0.24995972216129303, -0.34169113636016846, -0.1262318640947342, 0.16021396219730377], [-0.2567935585975647, -0.5348011255264282, -0.12302757799625397, 0.4105604588985443], [-0.26748958230018616, -0.7279837131500244, -0.11481636762619019, 0.6620652079582214], [-0.2820492386817932, -0.5314672589302063, -0.10157506167888641, 0.335549533367157], [-0.2926785945892334, -0.33505749702453613, -0.09486407041549683, 0.012641659006476402], [-0.29937973618507385, -0.5286999940872192, -0.09461124241352081, 0.2739512026309967], [-0.3099537491798401, -0.33236438035964966, -0.08913221955299377, -0.04700933396816254], [-0.316601037979126, -0.1360848993062973, -0.090072400867939, -0.36643001437187195], [-0.31932273507118225, -0.3298191428184509, -0.09740100055932999, -0.1034521758556366], [-0.32591912150382996, -0.13344603776931763, -0.09947004914283752, -0.42520633339881897], [-0.3285880386829376, 0.06293384730815887, -0.10797417163848877, -0.7475160956382751], [-0.3273293673992157, 0.25936663150787354, -0.12292449921369553, -1.0721321105957031], [-0.3221420347690582, 0.06606503576040268, -0.14436714351177216, -0.8204164505004883], [-0.32082071900367737, -0.1268174946308136, -0.16077546775341034, -0.5763991475105286], [-0.32335707545280457, -0.3193640410900116, -0.1723034530878067, -0.338368684053421], [-0.3297443389892578, -0.12226273864507675, -0.1790708303451538, -0.6800497174263], [-0.3321896195411682, -0.3145051896572113, -0.19267182052135468, -0.44866296648979187], [-0.3384796977043152, -0.5064544677734375, -0.20164507627487183, -0.2223624587059021], [-0.3486087918281555, -0.3091072738170624, -0.20609232783317566, -0.5712681412696838], [-0.35479095578193665, -0.11178242415189743, -0.21751768887043, -0.9211548566818237], [-0.00821590330451727, -0.16737468540668488, 0.03303978964686394, 0.2673306167125702], [-0.011563397012650967, 0.027260536327958107, 0.038386400789022446, -0.014750929549336433], [-0.011018186807632446, 0.22181154787540436, 0.03809138387441635, -0.29507964849472046], [-0.006581955589354038, 0.026167839765548706, 0.03218979015946388, 0.009369206614792347], [-0.00605859886854887, 0.22081370651721954, 0.032377175986766815, -0.27298617362976074], [-0.0016423244960606098, 0.025245098397135735, 0.02691745199263096, 0.029730219393968582], [-0.0011374225141480565, 0.21997089684009552, 0.02751205489039421, -0.25433990359306335], [0.0032619955018162727, 0.024467147886753082, 0.02242525853216648, 0.04689227417111397], [0.0037513384595513344, 0.21926048398017883, 0.023363104090094566, -0.23863178491592407], [0.008136548101902008, 0.023812690749764442, 0.018590467050671577, 0.06132802367210388], [0.008612802252173424, -0.1715708076953888, 0.01981702819466591, 0.35981789231300354], [0.0051813856698572636, -0.3669687807559967, 0.02701338566839695, 0.6586831212043762], [-0.0021579896565526724, -0.5624560713768005, 0.0401870496571064, 0.9597480893135071], [-0.013407111167907715, -0.7580945491790771, 0.059382010251283646, 1.2647806406021118], [-0.028569001704454422, -0.5637796521186829, 0.08467762172222137, 0.991270124912262], [-0.03984459489583969, -0.36988672614097595, 0.10450302809476852, 0.726338267326355], [-0.04724232852458954, -0.5662864446640015, 0.11902979016304016, 1.0499986410140991], [-0.05856806039810181, -0.7627689242362976, 0.14002977311611176, 1.377549171447754], [-0.07382343709468842, -0.9593343734741211, 0.1675807535648346, 1.7105457782745361], [-0.09301012754440308, -0.7664874792098999, 0.2017916589975357, 1.4743661880493164], [-0.10833987593650818, -0.5743213891983032, 0.23127898573875427, 1.2508907318115234], [0.024683130905032158, 0.17912566661834717, 0.04500377178192139, -0.27501875162124634], [0.02826564386487007, -0.016608530655503273, 0.039503395557403564, 0.03151191398501396], [0.027933472767472267, 0.17792531847953796, 0.040133632719516754, -0.24845021963119507], [0.03149197995662689, 0.3724518120288849, 0.03516462817788124, -0.52820885181427], [0.03894101455807686, 0.1768532246351242, 0.024600451812148094, -0.2246561050415039], [0.042478080838918686, 0.37161508202552795, 0.02010732889175415, -0.509478747844696], [0.04991038143634796, 0.17621572315692902, 0.00991775467991829, -0.21052776277065277], [0.053434696048498154, -0.019046617671847343, 0.005707199685275555, 0.08526711910963058], [0.05305376276373863, -0.21424990892410278, 0.007412542123347521, 0.3797451853752136], [0.04876876622438431, -0.019234003499150276, 0.015007445588707924, 0.08940864354372025], [0.048384085297584534, 0.17566965520381927, 0.01679561845958233, -0.19850189983844757], [0.051897477358579636, 0.37054741382598877, 0.01282558124512434, -0.4858396053314209], [0.05930842459201813, 0.17524683475494385, 0.003108788514509797, -0.18914224207401276], [0.06281336396932602, -0.01991945132613182, -0.0006740562967024744, 0.10451975464820862], [0.062414973974227905, -0.21503174304962158, 0.0014163388404995203, 0.39698994159698486], [0.05811433866620064, -0.019929908215999603, 0.009356137365102768, 0.10475390404462814], [0.05771574005484581, -0.21518468856811523, 0.011451215483248234, 0.4003739058971405], [0.053412046283483505, -0.02022702246904373, 0.019458694383502007, 0.11132317781448364], [0.05300750583410263, -0.21562232077121735, 0.021685156971216202, 0.4100811183452606], [0.04869506135582924, -0.02081441506743431, 0.029886780306696892, 0.12431291490793228], [0.048278771340847015, 0.1738668978214264, 0.032373037189245224, -0.15879324078559875], [0.0517561100423336, -0.021703213453292847, 0.029197173193097115, 0.14392423629760742], [0.05132204666733742, -0.2172308713197708, 0.032075658440589905, 0.44567346572875977], [0.04697743058204651, -0.02257705293595791, 0.04098912701010704, 0.16327154636383057], [0.04652588814496994, -0.21826107800006866, 0.04425456002354622, 0.46859848499298096], [0.04216066747903824, -0.023791350424289703, 0.05362652614712715, 0.19018608331680298], [0.041684839874506, 0.17052403092384338, 0.05743024870753288, -0.08510934561491013], [0.04509532079100609, -0.025372110307216644, 0.055728062987327576, 0.22512564063072205], [0.0445878766477108, -0.22124440968036652, 0.06023057550191879, 0.5348535180091858], [0.040162988007068634, -0.02701886184513569, 0.07092764973640442, 0.2617405951023102], [0.03962261229753494, -0.22307781875133514, 0.07616245746612549, 0.5759248733520508], [0.035161055624485016, -0.41918015480041504, 0.08768095821142197, 0.891595721244812], [0.02677745185792446, -0.22535006701946259, 0.10551287233829498, 0.6277126669883728], [0.022270450368523598, -0.03184668347239494, 0.11806712299585342, 0.3700350821018219], [0.021633516997098923, -0.2284308820962906, 0.12546782195568085, 0.6974896192550659], [0.0170648992061615, -0.42504870891571045, 0.1394176185131073, 1.0268888473510742], [0.008563925512135029, -0.6217234134674072, 0.15995539724826813, 1.3598946332931519], [-0.0038705430924892426, -0.42892706394195557, 0.18715327978134155, 1.1212183237075806], [-0.012449083849787712, -0.6259435415267944, 0.20957764983177185, 1.4662851095199585], [0.042881421744823456, 0.15598808228969574, 0.021856550127267838, -0.2559332251548767], [0.04600118100643158, -0.03943900018930435, 0.016737885773181915, 0.043562695384025574], [0.04521240293979645, 0.15543898940086365, 0.017609139904379845, -0.24379262328147888], [0.048321180045604706, 0.35030505061149597, 0.012733287177979946, -0.5308696031570435], [0.05532728135585785, 0.5452455878257751, 0.0021158955059945583, -0.819513201713562], [0.06623219698667526, 0.350094735622406, -0.01427436899393797, -0.5261655449867249], [0.07323408871889114, 0.5454146265983582, -0.024797679856419563, -0.823311984539032], [0.08414237946271896, 0.35064053535461426, -0.041263919323682785, -0.5385304689407349], [0.09115519374608994, 0.15612223744392395, -0.05203452706336975, -0.2591295540332794], [0.09427763521671295, -0.03821974992752075, -0.05721712112426758, 0.016697624698281288], [0.09351324290037155, -0.23247644305229187, -0.05688316747546196, 0.29079318046569824], [0.08886371552944183, -0.036591485142707825, -0.051067303866147995, -0.019273661077022552], [0.08813188225030899, -0.23094528913497925, -0.05145277827978134, 0.25686973333358765], [0.08351297676563263, -0.035127945244312286, -0.04631538316607475, -0.051588013768196106], [0.0828104168176651, 0.16062647104263306, -0.04734714329242706, -0.3585166037082672], [0.08602295070886612, -0.033791542053222656, -0.0545174740254879, -0.08113126456737518], [0.08534711599349976, -0.2280913144350052, -0.056140098720788956, 0.19386519491672516], [0.08078528940677643, -0.422367125749588, -0.052262794226408005, 0.468323290348053], [0.07233794778585434, -0.616713285446167, -0.0428963303565979, 0.7440862059593201], [0.06000368297100067, -0.42102640867233276, -0.02801460586488247, 0.43821823596954346], [0.05158315598964691, -0.2255193591117859, -0.019250240176916122, 0.13683752715587616], [0.047072768211364746, -0.030127044767141342, -0.016513491049408913, -0.16185584664344788], [0.04647022485733032, 0.16522736847400665, -0.019750608131289482, -0.4597022533416748], [0.04977477341890335, -0.029609913006424904, -0.028944652527570724, -0.17330963909626007], [0.049182575196027756, 0.16591408848762512, -0.032410845160484314, -0.4749813377857208], [0.05250085890293121, -0.02873554825782776, -0.04191047325730324, -0.19268734753131866], [0.0519261471927166, -0.2232336848974228, -0.045764219015836716, 0.0864855945110321], [0.04746147245168686, -0.4176707863807678, -0.044034507125616074, 0.3643859028816223], [0.03910805657505989, -0.6121401786804199, -0.0367467887699604, 0.6428652405738831], [0.02686525322496891, -0.41652581095695496, -0.023889483883976936, 0.33884066343307495], [0.018534738570451736, -0.6112998127937317, -0.017112670466303825, 0.6238954663276672], [0.0063087414018809795, -0.4159431755542755, -0.004634760785847902, 0.3258725702762604], [-0.0020101224072277546, -0.22075554728507996, 0.0018826901214197278, 0.03173163905739784], [-0.00642523355782032, -0.4159044623374939, 0.002517322776839137, 0.32500797510147095], [-0.014743322506546974, -0.6110621690750122, 0.00901748239994049, 0.6184837222099304], [-0.026964565739035606, -0.8063088655471802, 0.02138715609908104, 0.9139930009841919], [-0.04309074208140373, -0.6114826798439026, 0.03966701775789261, 0.6281078457832336], [-0.05532039701938629, -0.41693612933158875, 0.052229173481464386, 0.34817662835121155], [-0.06365911662578583, -0.22259443998336792, 0.059192705899477005, 0.07241000235080719], [-0.06811100989580154, -0.41851285099983215, 0.06064090505242348, 0.3831654191017151], [-0.07648126780986786, -0.22430194914340973, 0.06830421090126038, 0.11020205169916153], [-0.08096730709075928, -0.030221879482269287, 0.07050825655460358, -0.16017338633537292], [-0.08157174289226532, -0.22627870738506317, 0.06730479001998901, 0.15389341115951538], [-0.08609731495380402, -0.03218178078532219, 0.07038265466690063, -0.11682012677192688], [-0.08674094825983047, 0.16186483204364777, 0.06804625689983368, -0.386493980884552], [-0.08350365608930588, -0.0341537781059742, 0.06031637266278267, -0.07315635681152344], [-0.08418673276901245, 0.16005392372608185, 0.05885324627161026, -0.3462159037590027], [-0.0809856504201889, -0.03585365042090416, 0.05192892998456955, -0.035570450127124786], [-0.08170272409915924, -0.23168033361434937, 0.051217518746852875, 0.27303385734558105], [-0.08633632957935333, -0.0373251810669899, 0.05667819827795029, -0.0030652107670903206], [-0.08708283305168152, -0.23321224749088287, 0.0566168911755085, 0.3069480359554291], [-0.09174708276987076, -0.03894084319472313, 0.06275585293769836, 0.032644327729940414], [-0.0925258994102478, 0.1552276462316513, 0.0634087398648262, -0.23959696292877197], [-0.089421346783638, -0.04074012115597725, 0.05861680209636688, 0.07239362597465515], [-0.09023614972829819, -0.23665130138397217, 0.06006467342376709, 0.382979154586792], [-0.09496917575597763, -0.042431317269802094, 0.06772425770759583, 0.10982294380664825], [-0.09581779688596725, -0.23845508694648743, 0.06992071866989136, 0.4230802655220032], [-0.100586898624897, -0.044389739632606506, 0.07838232070207596, 0.15323346853256226], [-0.10147469490766525, -0.24054141342639923, 0.08144699037075043, 0.46957844495773315], [-0.10628551989793777, -0.046658776700496674, 0.09083855897188187, 0.20363749563694], [-0.10721869766712189, 0.14705459773540497, 0.09491130709648132, -0.05906473845243454], [-0.104277603328228, 0.3406966030597687, 0.09373001009225845, -0.32035842537879944], [-0.09746367484331131, 0.5343674421310425, 0.08732284605503082, -0.5820732116699219], [-0.08677632361650467, 0.33813753724098206, 0.07568138092756271, -0.26320958137512207], [-0.08001357316970825, 0.14202149212360382, 0.07041718810796738, 0.05235152319073677], [-0.0771731436252594, -0.05403580144047737, 0.07146421819925308, 0.36639419198036194], [-0.0782538577914238, 0.14000169932842255, 0.07879210263490677, 0.09707345813512802], [-0.07545382529497147, 0.33391115069389343, 0.08073357492685318, -0.16974739730358124], [-0.06877560168504715, 0.5277903079986572, 0.07733862847089767, -0.4359089732170105], [-0.058219797909259796, 0.3316636085510254, 0.06862044334411621, -0.11988339573144913], [-0.05158652737736702, 0.5257387161254883, 0.06622277945280075, -0.39015236496925354], [-0.041071753948926926, 0.7198613286018372, 0.05841973051428795, -0.6612427830696106], [-0.026674525812268257, 0.9141238331794739, 0.045194875448942184, -0.9349737763404846], [-0.008392048999667168, 0.7184223532676697, 0.026495398953557014, -0.6284385323524475], [0.005976397544145584, 0.5229408144950867, 0.013926628977060318, -0.3275304436683655], [0.01643521524965763, 0.3276234269142151, 0.0073760198429226875, -0.030488435178995132], [0.02298768237233162, 0.5226387977600098, 0.0067662508226931095, -0.32083505392074585], [0.03344045951962471, 0.7176637649536133, 0.00034954986767843366, -0.6113765239715576], [0.047793734818696976, 0.5225369334220886, -0.011877980083227158, -0.31858351826667786], [0.05824447423219681, 0.3275861442089081, -0.018249649554491043, -0.029670001938939095], [0.06479619443416595, 0.5229649543762207, -0.01884305104613304, -0.3280545771121979], [0.07525549829006195, 0.3281162977218628, -0.02540414221584797, -0.041372936218976974], [0.08181782066822052, 0.5235931277275085, -0.02623159997165203, -0.3419616222381592], [0.09228968620300293, 0.3288540244102478, -0.03307083249092102, -0.0576646514236927], [0.09886676073074341, 0.13422147929668427, -0.03422412648797035, 0.2244034856557846], [0.10155119746923447, 0.32981544733047485, -0.029736056923866272, -0.0788755714893341], [0.1081475019454956, 0.1351321041584015, -0.031313568353652954, 0.20427921414375305], [0.11085014790296555, -0.059528373181819916, -0.027227982878684998, 0.48692211508750916], [0.1096595749258995, 0.1359669715166092, -0.017489541321992874, 0.1857837438583374], [0.11237891763448715, -0.05890043079853058, -0.01377386599779129, 0.4728984832763672], [0.11120090633630753, 0.1364133208990097, -0.004315896891057491, 0.1759062558412552], [0.11392917484045029, 0.3315967619419098, -0.0007977716159075499, -0.11813505738973618], [0.12056110799312592, 0.1364862620830536, -0.0031604727264493704, 0.1742960661649704], [0.12329083681106567, 0.33165329694747925, 0.0003254485782235861, -0.11938221007585526], [0.12992389500141144, 0.1365266889333725, -0.00206219544634223, 0.17340338230133057], [0.13265442848205566, 0.3316780924797058, 0.0014058720553293824, -0.11992938816547394], [0.13928799331188202, 0.13653601706027985, -0.0009927158243954182, 0.17319674789905548], [0.14201872050762177, -0.058571707457304, 0.0024712190497666597, 0.46556633710861206], [0.14084728062152863, 0.13651524484157562, 0.01178254559636116, 0.17366334795951843], [0.14357759058475494, 0.33146658539772034, 0.015255812555551529, -0.11527939885854721], [0.15020692348480225, 0.526366651058197, 0.012950224801898003, -0.40311044454574585], [0.16073425114154816, 0.7213025689125061, 0.004888015799224377, -0.6916825175285339], [0.17516030371189117, 0.5261131525039673, -0.008945634588599205, -0.3974648118019104], [0.18568256497383118, 0.33111923933029175, -0.016894930973649025, -0.1076156497001648], [0.19230495393276215, 0.13624341785907745, -0.019047243520617485, 0.17968948185443878], [0.1950298249721527, 0.33163267374038696, -0.015453455038368702, -0.1189407929778099], [0.20166248083114624, 0.13673551380634308, -0.01783226989209652, 0.16882692277431488], [0.20439718663692474, 0.33210811018943787, -0.014455731958150864, -0.12942779064178467], [0.21103934943675995, 0.5274341106414795, -0.01704428717494011, -0.4266360402107239], [0.22158803045749664, 0.33255767822265625, -0.025577008724212646, -0.13937461376190186], [0.22823917865753174, 0.5280364751815796, -0.028364501893520355, -0.44001567363739014], [0.23879991471767426, 0.33332717418670654, -0.03716481477022171, -0.15640728175640106], [0.2454664558172226, 0.13875649869441986, -0.04029295966029167, 0.12432324886322021], [0.24824158847332, -0.055765729397535324, -0.037806496024131775, 0.4040268361568451], [0.2471262663602829, 0.13987143337726593, -0.02972595952451229, 0.09966833144426346], [0.2499237060546875, -0.05481215938925743, -0.027732592076063156, 0.382826566696167], [0.24882745742797852, -0.24952960014343262, -0.02007606066763401, 0.6666380763053894], [0.24383686482906342, -0.4443666636943817, -0.006743299309164286, 0.9529328346252441], [0.23494952917099, -0.6393972635269165, 0.012315357103943825, 1.2434895038604736], [0.22216159105300903, -0.8346750736236572, 0.037185147404670715, 1.5400046110153198], [0.205468088388443, -0.6400195360183716, 0.06798523664474487, 1.259153127670288], [0.19266769289970398, -0.835942268371582, 0.09316830337047577, 1.5723305940628052], [0.1759488433599472, -0.6420471668243408, 0.12461491674184799, 1.3101012706756592], [0.16310790181159973, -0.4487043619155884, 0.1508169323205948, 1.058877944946289], [0.15413381159305573, -0.2558668851852417, 0.17199449241161346, 0.8170773983001709], [0.14901648461818695, -0.06346412003040314, 0.18833604454994202, 0.583048939704895], [0.147747203707695, 0.12858973443508148, 0.19999702274799347, 0.35510629415512085], [0.15031899511814117, -0.06873030215501785, 0.20709915459156036, 0.7035945653915405], [0.14894439280033112, 0.12301186472177505, 0.221171036362648, 0.4825800061225891]], "action_prob": [0.5088157653808594, 0.6176013946533203, 0.4960686266422272, 0.6244245171546936, 0.5186683535575867, 0.603756308555603, 0.47001734375953674, 0.3647386431694031, 0.6559449434280396, 0.3566640615463257, 0.6568465232849121, 0.65154629945755, 0.5965604782104492, 0.47326311469078064, 0.6192196011543274, 0.49650609493255615, 0.6096654534339905, 0.5172080397605896, 0.40041494369506836, 0.643744707107544, 0.4069594442844391, 0.6434674263000488, 0.4102075397968292, 0.6439294219017029, 0.4097940921783447, 0.6452333331108093, 0.5942932367324829, 0.4643977880477905, 0.6352165937423706, 0.5349031090736389, 0.4024955630302429, 0.6479877829551697, 0.6039853692054749, 0.4812195301055908, 0.37357839941978455, 0.6539193391799927, 0.6276758909225464, 0.48195338249206543, 0.37114694714546204, 0.6552954912185669, 0.36624056100845337, 0.6565184593200684, 0.6406711935997009, 0.5547349452972412, 0.42412394285202026, 0.6397863030433655, 0.430656373500824, 0.3609086275100708, 0.6523170471191406, 0.6411606669425964, 0.4270189702510834, 0.643390417098999, 0.4197719693183899, 0.64640873670578, 0.5904721617698669, 0.5377247929573059, 0.40066301822662354, 0.6520757675170898, 0.6115519404411316, 0.49726787209510803, 0.6133409142494202, 0.511880099773407, 0.3938343822956085, 0.6476497054100037, 0.396804541349411, 0.3519335389137268, 0.6483999490737915, 0.6503434181213379, 0.6124864220619202, 0.49443432688713074, 0.6177360415458679, 0.5006778240203857, 0.6152603030204773, 0.4949903190135956, 0.6218448281288147, 0.5131101012229919, 0.39181357622146606, 0.6516513228416443, 0.6091227531433105, 0.514542281627655, 0.609778642654419, 0.5129045248031616, 0.38882458209991455, 0.654116690158844, 0.6165621280670166, 0.49817442893981934, 0.378586083650589, 0.6572853922843933, 0.6295256614685059, 0.5305078625679016, 0.5925275087356567, 0.5422605276107788, 0.41507843136787415, 0.6415492296218872, 0.417762815952301, 0.3580365478992462, 0.35160234570503235, 0.3613570034503937, 0.6256346106529236, 0.6371983289718628, 0.649135172367096, 0.6564319133758545, 0.643456757068634, 0.577385663986206, 0.46074965596199036, 0.3789574205875397, 0.6492491364479065, 0.607092559337616, 0.5231854319572449, 0.5895103216171265, 0.44975754618644714, 0.647284209728241, 0.4212000370025635, 0.34410354495048523, 0.3406060039997101, 0.6417532563209534, 0.65799480676651, 0.6690025329589844, 0.33954519033432007, 0.6691239476203918, 0.6725881099700928, 0.3519040048122406, 0.32306191325187683, 0.5092047452926636, 0.6177842020988464, 0.5051289200782776, 0.6118040680885315, 0.5159171223640442, 0.6065367460250854, 0.5248114466667175, 0.601821780204773, 0.5320784449577332, 0.5976908206939697, 0.4620322585105896, 0.36385801434516907, 0.3462298512458801, 0.35588905215263367, 0.6292212009429932, 0.6424174308776855, 0.3445197641849518, 0.36114752292633057, 0.378989040851593, 0.6056170463562012, 0.6142578721046448, 0.5083431005477905, 0.6100479960441589, 0.5220322608947754, 0.3974672853946686, 0.6494346857070923, 0.400971919298172, 0.649743378162384, 0.5987834930419922, 0.4641411602497101, 0.632810652256012, 0.5421609878540039, 0.4080110788345337, 0.6487911343574524, 0.593286395072937, 0.4573443830013275, 0.6344630718231201, 0.45297136902809143, 0.6368427276611328, 0.44533708691596985, 0.640110194683075, 0.5653885006904602, 0.5697759389877319, 0.42582812905311584, 0.6461464166641235, 0.4129333198070526, 0.6499139070510864, 0.6020235419273376, 0.521562397480011, 0.3854932487010956, 0.6553643941879272, 0.3710714876651764, 0.3424872159957886, 0.6470699310302734, 0.6590922474861145, 0.34351563453674316, 0.34183746576309204, 0.3604922294616699, 0.6197212934494019, 0.3665260374546051, 0.5097176432609558, 0.6126583814620972, 0.515440821647644, 0.3900867700576782, 0.34730014204978943, 0.6520518064498901, 0.34493494033813477, 0.6524243950843811, 0.6579083800315857, 0.6333143711090088, 0.5351058840751648, 0.5890835523605347, 0.5518977642059326, 0.5776793360710144, 0.4335581362247467, 0.6507120132446289, 0.5838456153869629, 0.4527006447315216, 0.3716374337673187, 0.6475873589515686, 0.6278635263442993, 0.5351800322532654, 0.3972448706626892, 0.6565151214599609, 0.389305055141449, 0.6586847305297852, 0.620822012424469, 0.5026605129241943, 0.39156362414360046, 0.6455065608024597, 0.3928631842136383, 0.6464966535568237, 0.6093126535415649, 0.5080686211585999, 0.38829872012138367, 0.35097536444664, 0.6488999724388123, 0.6519712805747986, 0.6305270791053772, 0.45538076758384705, 0.6390724778175354, 0.5685299038887024, 0.5595396161079407, 0.5885186195373535, 0.46379199624061584, 0.6274262070655823, 0.4840129613876343, 0.6196345090866089, 0.49800264835357666, 0.6251528859138489, 0.47677063941955566, 0.6345996260643005, 0.5461093187332153, 0.5812018513679504, 0.43484967947006226, 0.6481695175170898, 0.4134502112865448, 0.6538678407669067, 0.3920763432979584, 0.6583407521247864, 0.6279435157775879, 0.5267759561538696, 0.41099023818969727, 0.6394004821777344, 0.5732546448707581, 0.42601415514945984, 0.654850423336029, 0.5969057083129883, 0.47227951884269714, 0.618644118309021, 0.49266287684440613, 0.3894208073616028, 0.3536701500415802, 0.6501420140266418, 0.6476911306381226, 0.6085909605026245, 0.5094485878944397, 0.39038193225860596, 0.6498979926109314, 0.6149850487709045, 0.49441859126091003, 0.6202621459960938, 0.48282870650291443, 0.6262848973274231, 0.5312836170196533, 0.5967398881912231, 0.5426961779594421, 0.4116017818450928, 0.6477714776992798, 0.41553327441215515, 0.6476632952690125, 0.583966076374054, 0.5545567870140076, 0.5824623703956604, 0.5559905767440796, 0.5812443494796753, 0.5570807456970215, 0.4196869432926178, 0.6471515893936157, 0.5842088460922241, 0.4485485255718231, 0.3632955551147461, 0.6556255221366882, 0.6402226686477661, 0.5636307597160339, 0.5708400011062622, 0.5696933269500732, 0.5648793578147888, 0.424681156873703, 0.6472223401069641, 0.4150174558162689, 0.6507633924484253, 0.5970383286476135, 0.47184258699417114, 0.6243851184844971, 0.4817199110984802, 0.37884461879730225, 0.35167431831359863, 0.35662609338760376, 0.36949554085731506, 0.6169954538345337, 0.37142297625541687, 0.6137068271636963, 0.6246073842048645, 0.6378666162490845, 0.6525634527206421, 0.6648767590522766, 0.3359527289867401, 0.6625622510910034], "advantages": [60.0850830078125, 59.96125030517578, 59.68342971801758, 59.59204864501953, 59.31051254272461, 59.27581787109375, 58.8343391418457, 58.7922248840332, 59.13050079345703, 58.651023864746094, 59.10540771484375, 58.69548034667969, 58.48833465576172, 58.52772903442383, 58.798583984375, 58.22465515136719, 58.433006286621094, 57.88117980957031, 58.03108215332031, 58.33951187133789, 57.390281677246094, 57.615684509277344, 56.62627029418945, 56.77862548828125, 55.740272521972656, 55.83068084716797, 54.7364501953125, 54.001380920410156, 53.68709945678711, 53.234073638916016, 53.06167221069336, 53.107730865478516, 51.94508743286133, 51.13101577758789, 50.72166442871094, 50.69715118408203, 50.001163482666016, 49.560943603515625, 49.221012115478516, 49.285518646240234, 48.67134094238281, 48.82034683227539, 48.277862548828125, 47.966888427734375, 47.90703201293945, 48.02971649169922, 47.03562927246094, 47.084312438964844, 47.201499938964844, 45.846473693847656, 44.72663116455078, 44.62712097167969, 43.4520149230957, 43.31584167480469, 42.082069396972656, 41.19466018676758, 40.79049301147461, 40.633209228515625, 39.313621520996094, 38.32167434692383, 37.69270706176758, 37.018211364746094, 36.38003158569336, 36.08710861206055, 35.23350524902344, 34.97962951660156, 35.038002014160156, 34.12879943847656, 33.40171432495117, 32.92251968383789, 32.704551696777344, 31.808706283569336, 31.55068016052246, 30.640562057495117, 30.139650344848633, 29.583234786987305, 29.289682388305664, 29.2006778717041, 27.898401260375977, 26.943195343017578, 26.551738739013672, 25.57399559020996, 25.158447265625, 24.96173667907715, 23.568601608276367, 22.50288963317871, 22.018890380859375, 21.760536193847656, 20.28765106201172, 19.122146606445312, 18.29212188720703, 17.509632110595703, 16.66322135925293, 16.136608123779297, 15.15781307220459, 14.657554626464844, 14.45730209350586, 14.50910472869873, 14.744093894958496, 13.841073989868164, 13.007997512817383, 12.286236763000488, 11.728032112121582, 11.378854751586914, 11.239956855773926, 11.237979888916016, 11.243559837341309, 10.02245044708252, 9.124353408813477, 8.888949394226074, 8.043601036071777, 7.612763404846191, 7.184744358062744, 6.844032287597656, 6.808350563049316, 6.895843982696533, 6.753068923950195, 6.673562526702881, 6.61690616607666, 6.5723090171813965, 6.603211402893066, 6.546738147735596, 6.351680278778076, 8.256518363952637, 7.534050464630127, 6.412839889526367, 5.610804557800293, 4.631770133972168, 3.8091607093811035, 2.839858055114746, 1.9965449571609497, 1.0316559076309204, 0.16769282519817352, -0.7971253395080566, -1.5214194059371948, -2.02962327003479, -2.3888559341430664, -2.6934866905212402, -4.7811784744262695, -6.670348644256592, -7.161866188049316, -7.583072185516357, -8.011861801147461, -10.201667785644531, 21.957963943481445, 21.255775451660156, 20.423276901245117, 19.699447631835938, 19.290019989013672, 18.263917922973633, 17.87127113342285, 16.87515640258789, 16.1173095703125, 15.61191463470459, 14.507190704345703, 13.74330997467041, 13.305685043334961, 12.29590129852295, 11.520195960998535, 10.990951538085938, 9.840761184692383, 9.275350570678711, 8.088486671447754, 7.490909099578857, 6.265582084655762, 5.355844497680664, 4.4826765060424805, 3.850625514984131, 2.5628843307495117, 1.9041577577590942, 0.5788694024085999, -0.469959557056427, -1.377331256866455, -2.0654332637786865, -3.448697328567505, -4.159695625305176, -4.696975231170654, -6.36993408203125, -7.798952579498291, -8.559803009033203, -9.174720764160156, -9.688361167907715, -11.530924797058105, 62.55788803100586, 62.299110412597656, 61.938812255859375, 61.67546081542969, 61.76630401611328, 62.167152404785156, 61.50618362426758, 62.016212463378906, 61.45028305053711, 61.051387786865234, 60.881614685058594, 60.96369552612305, 60.550418853759766, 60.59149169921875, 60.197425842285156, 60.268028259277344, 60.033016204833984, 60.049739837646484, 60.27859115600586, 60.608192443847656, 59.487178802490234, 58.67006301879883, 58.27531051635742, 58.32302474975586, 57.915164947509766, 58.0286979675293, 57.670799255371094, 57.554752349853516, 57.65821075439453, 57.87545394897461, 56.80146026611328, 56.937782287597656, 55.79330825805664, 54.9661979675293, 54.84675598144531, 54.894615173339844, 54.97768020629883, 53.45366668701172, 52.07807540893555, 50.996124267578125, 50.75006103515625, 49.618160247802734, 48.843284606933594, 48.35327911376953, 47.54794692993164, 47.089595794677734, 46.38947296142578, 45.92238998413086, 45.27162170410156, 44.91337585449219, 44.060333251953125, 43.71162796020508, 42.82602310180664, 42.24946594238281, 41.66766357421875, 41.35079574584961, 40.42045211791992, 40.103885650634766, 39.14765167236328, 38.83124542236328, 37.854408264160156, 37.12136459350586, 36.59396743774414, 36.246856689453125, 35.4161376953125, 34.77120590209961, 34.31275177001953, 33.533851623535156, 32.93509292602539, 32.491580963134766, 31.74387550354004, 31.28199577331543, 30.968612670898438, 30.81366729736328, 29.87786865234375, 29.057905197143555, 28.36553382873535, 27.915969848632812, 27.652753829956055, 26.831735610961914, 26.135164260864258, 25.71406364440918, 25.005456924438477, 24.601484298706055, 23.880001068115234, 23.303726196289062, 22.687929153442383, 22.087594985961914, 21.65118408203125, 20.76886558532715, 20.297231674194336, 19.39394187927246, 18.73039436340332, 18.037872314453125, 17.36115837097168, 16.651838302612305, 15.961237907409668, 15.235159873962402, 14.683096885681152, 13.70791244506836, 12.967727661132812, 12.452768325805664, 12.164347648620605, 11.098814010620117, 10.17460823059082, 9.413872718811035, 8.682778358459473, 7.8987555503845215, 7.16050910949707, 6.6918158531188965, 5.7122602462768555, 5.276860237121582, 4.29376220703125, 3.4803948402404785, 2.8540735244750977, 1.83710777759552, 1.1662193536758423, 0.6787793040275574, 0.33058401942253113, 0.0489732101559639, -0.24549973011016846, -2.367155075073242, -2.731349468231201, -4.879985809326172, -6.8488640785217285, -8.573487281799316, -10.059957504272461, -11.358094215393066, -12.267733573913574], "value_targets": [70.9511489868164, 70.65773010253906, 70.36134338378906, 70.06195831298828, 69.75955963134766, 69.45409393310547, 69.14555358886719, 68.83389282226562, 68.51908111572266, 68.20109558105469, 67.87989044189453, 67.55545043945312, 67.22772216796875, 66.89669036865234, 66.56231689453125, 66.22456359863281, 65.88339233398438, 65.53878021240234, 65.19068908691406, 64.83908081054688, 64.48391723632812, 64.12516784667969, 63.76279830932617, 63.396766662597656, 63.027034759521484, 62.65357208251953, 62.276336669921875, 61.895286560058594, 61.51039123535156, 61.12160873413086, 60.72889709472656, 60.332218170166016, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 72.65108489990234, 72.37483215332031, 72.09579467773438, 71.81392669677734, 71.52922058105469, 71.24163818359375, 70.9511489868164, 70.65773010253906, 70.36134338378906, 70.06195831298828, 69.75955963134766, 69.45409393310547, 69.14555358886719, 68.83389282226562, 68.51908111572266, 68.20109558105469, 67.87989044189453, 67.55545043945312, 67.22772216796875, 66.89669036865234, 66.56231689453125, 66.22456359863281, 65.88339233398438, 65.53878021240234, 65.19068908691406, 64.83908081054688, 64.48391723632812, 64.12516784667969, 63.76279830932617, 63.396766662597656, 63.027034759521484, 62.65357208251953, 62.276336669921875, 61.895286560058594, 61.51039123535156, 61.12160873413086, 60.72889709472656, 60.332218170166016, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 153171221, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 1011700322, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 330699492, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 1757350257, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065, 821888065], "obs": [[-0.0286868829280138, -0.028004536405205727, 0.04403194040060043, 0.04048096761107445], [-0.029246972873806953, 0.16645924746990204, 0.04484155774116516, -0.23799078166484833], [-0.025917788967490196, -0.029273677617311478, 0.04008174315094948, 0.06849247962236404], [-0.02650326117873192, 0.16525138914585114, 0.0414515919983387, -0.21127988398075104], [-0.023198233917355537, 0.3597569167613983, 0.03722599521279335, -0.4906042814254761], [-0.016003096476197243, 0.16413013637065887, 0.027413908392190933, -0.18642549216747284], [-0.012720493599772453, 0.35884934663772583, 0.023685399442911148, -0.4703359007835388], [-0.005543506238609552, 0.16340097784996033, 0.014278681017458439, -0.17028270661830902], [-0.0022754864767193794, 0.35831567645072937, 0.01087302714586258, -0.45842716097831726], [0.0048908269964158535, 0.5532822608947754, 0.0017044837586581707, -0.747663140296936], [0.015956472605466843, 0.3581368327140808, -0.013248778879642487, -0.4544442892074585], [0.023119209334254265, 0.5534436106681824, -0.022337663918733597, -0.7512737512588501], [0.034188080579042435, 0.3586367070674896, -0.03736313804984093, -0.4657030403614044], [0.04136081412434578, 0.554266095161438, -0.046677201986312866, -0.7699245810508728], [0.052446138113737106, 0.35981661081314087, -0.062075693160295486, -0.4922861158847809], [0.05964246764779091, 0.16562263667583466, -0.07192141562700272, -0.21979475021362305], [0.06295492500066757, -0.028401486575603485, -0.07631731033325195, 0.04936237260699272], [0.0623868927359581, 0.16772711277008057, -0.07533006370067596, -0.26638972759246826], [0.06574143469333649, -0.02624339610338211, -0.08065785467624664, 0.0016148037975654006], [0.065216563642025, -0.22012151777744293, -0.08062556385993958, 0.2677988111972809], [0.060814134776592255, -0.02394702099263668, -0.07526958733797073, -0.04918527230620384], [0.0603351965546608, 0.1721690148115158, -0.07625328749418259, -0.36463475227355957], [0.06377857178449631, 0.3682871460914612, -0.083545982837677, -0.6803538799285889], [0.07114432007074356, 0.17441889643669128, -0.09715306013822556, -0.41509976983070374], [0.07463269680738449, -0.01920148730278015, -0.10545505583286285, -0.15455682575702667], [0.07424866408109665, -0.21266785264015198, -0.1085461974143982, 0.10308424383401871], [0.06999530643224716, -0.40608033537864685, -0.10648451000452042, 0.3596455454826355], [0.06187370419502258, -0.20961855351924896, -0.0992916002869606, 0.03537473827600479], [0.057681333273649216, -0.013223282061517239, -0.09858410060405731, -0.2869109809398651], [0.05741686746478081, 0.18315626680850983, -0.10432232171297073, -0.6089867949485779], [0.06107999011874199, -0.010364515706896782, -0.1165020614862442, -0.35089895129203796], [0.060872700065374374, 0.18620486557483673, -0.12352003902196884, -0.6779285073280334], [0.06459680199623108, 0.3828066885471344, -0.13707861304283142, -1.0068069696426392], [0.07225292921066284, 0.5794661641120911, -0.15721474587917328, -1.3392040729522705], [0.08384225517511368, 0.38663387298583984, -0.18399883806705475, -1.0995538234710693], [0.09157493710517883, 0.5836371183395386, -0.20598991215229034, -1.443861484527588], [0.030552633106708527, -0.023318255320191383, 0.048968516290187836, -0.04276212677359581], [0.030086267739534378, 0.17106854915618896, 0.048113275319337845, -0.31960180401802063], [0.033507637679576874, -0.024704428389668465, 0.04172123968601227, -0.01214233785867691], [0.03301354870200157, -0.22039911150932312, 0.041478391736745834, 0.29340672492980957], [0.028605567291378975, -0.41608715057373047, 0.04734652489423752, 0.5988774299621582], [0.02028382383286953, -0.22165849804878235, 0.059324074536561966, 0.321476012468338], [0.015850653871893883, -0.027429327368736267, 0.06575359404087067, 0.04807581007480621], [0.015302067622542381, 0.16669116914272308, 0.06671511381864548, -0.223158061504364], [0.018635891377925873, -0.029317766427993774, 0.06225195154547691, 0.08980096131563187], [0.018049536272883415, 0.16485920548439026, 0.06404796987771988, -0.18261004984378815], [0.021346719935536385, 0.3590089976787567, 0.06039576977491379, -0.45442041754722595], [0.028526900336146355, 0.163087397813797, 0.05130736157298088, -0.1433282494544983], [0.031788647174835205, 0.35743844509124756, 0.04844079539179802, -0.4193934202194214], [0.038937415927648544, 0.16166475415229797, 0.040052928030490875, -0.1118413582444191], [0.04217071086168289, -0.03400755673646927, 0.03781609982252121, 0.1932041198015213], [0.04149056226015091, -0.22964948415756226, 0.04168018326163292, 0.49757248163223267], [0.03689756989479065, -0.03513924777507782, 0.051631633192300797, 0.21831095218658447], [0.03619478642940521, 0.15920807421207428, 0.055997852236032486, -0.05764857679605484], [0.039378948509693146, -0.03667021542787552, 0.05484487861394882, 0.2521630525588989], [0.03864554315805435, 0.1576274335384369, 0.05988813936710358, -0.022728877142071724], [0.04179809242486954, -0.038299959152936935, 0.05943356454372406, 0.2882319390773773], [0.0410320907831192, -0.23421688377857208, 0.06519820541143417, 0.5990515947341919], [0.036347754299640656, -0.43018755316734314, 0.07717923074960709, 0.911537766456604], [0.027744004502892494, -0.6262641549110413, 0.09540998935699463, 1.227445363998413], [0.015218720771372318, -0.43249091506004333, 0.11995889246463776, 0.9661153554916382], [0.006568902637809515, -0.6290018558502197, 0.13928119838237762, 1.2939468622207642], [-0.006011134944856167, -0.8255915641784668, 0.1651601344347, 1.6267921924591064], [-0.02252296730875969, -0.6327523589134216, 0.19769598543643951, 1.3898061513900757], [-0.03670455142855644, 0.04419868811964989, 0.01121390052139759, 0.0031842943280935287], [-0.035820577293634415, 0.239158034324646, 0.011277586221694946, -0.2859395146369934], [-0.03103741630911827, 0.4341173470020294, 0.005558795761317015, -0.5750443339347839], [-0.02235507033765316, 0.23891791701316833, -0.005942091345787048, -0.2806154489517212], [-0.017576711252331734, 0.04388122260570526, -0.011554400436580181, 0.010187455452978611], [-0.016699086874723434, -0.1510731279850006, -0.011350651271641254, 0.299202561378479], [-0.019720550626516342, -0.34603145718574524, -0.00536660011857748, 0.5882841944694519], [-0.026641178876161575, -0.5410778522491455, 0.006399083416908979, 0.8792718052864075], [-0.037462737411260605, -0.7362861633300781, 0.023984519764780998, 1.1739596128463745], [-0.052188459783792496, -0.9317114949226379, 0.047463711351156235, 1.4740639925003052], [-0.07082268595695496, -0.7372006773948669, 0.0769449919462204, 1.1965755224227905], [-0.0855666995048523, -0.5431544184684753, 0.10087650269269943, 0.9289668202400208], [-0.09642978757619858, -0.7394828200340271, 0.11945583671331406, 1.2515696287155151], [-0.11121944338083267, -0.5460765957832336, 0.14448723196983337, 0.9985644221305847], [-0.12214098125696182, -0.35315069556236267, 0.1644585132598877, 0.7545225620269775], [-0.12920399010181427, -0.1606316715478897, 0.1795489639043808, 0.5177736282348633], [-0.13241662085056305, 0.031568460166454315, 0.18990443646907806, 0.28661230206489563], [-0.13178525865077972, 0.22354650497436523, 0.19563668966293335, 0.059319134801626205], [-0.12731432914733887, 0.41540396213531494, 0.19682307541370392, -0.16582629084587097], [-0.11900624632835388, 0.2180889993906021, 0.19350653886795044, 0.18192486464977264], [-0.11464446783065796, 0.4099915027618408, 0.19714504480361938, -0.044019829481840134], [-0.10644463449716568, 0.6018206477165222, 0.19626463949680328, -0.26860398054122925], [-0.09440822154283524, 0.7936794757843018, 0.1908925622701645, -0.4935351610183716], [-0.07853463292121887, 0.9856691360473633, 0.18102186918258667, -0.7205063104629517], [-0.05882125347852707, 0.7885660529136658, 0.16661173105239868, -0.3767523765563965], [-0.04304993152618408, 0.5915181636810303, 0.15907669067382812, -0.03651592880487442], [-0.031219568103551865, 0.3945150077342987, 0.15834636986255646, 0.3018292784690857], [-0.023329267278313637, 0.5870674848556519, 0.1643829643726349, 0.06297348439693451], [-0.011587917804718018, 0.7794978022575378, 0.16564242541790009, -0.17366962134838104], [0.004002037923783064, 0.9719094634056091, 0.16216903924942017, -0.4098602533340454], [0.023440226912498474, 0.7749046087265015, 0.1539718359708786, -0.07076117396354675], [0.03893831744790077, 0.5779489278793335, 0.15255659818649292, 0.2662663757801056], [0.05049729719758034, 0.770601749420166, 0.1578819304704666, 0.02532125450670719], [0.06590933352708817, 0.9631486535072327, 0.15838836133480072, -0.21368227899074554], [0.08517230302095413, 0.7661586403846741, 0.1541147083044052, 0.1244758665561676], [0.10049548000097275, 0.5692031979560852, 0.15660423040390015, 0.46153807640075684], [0.11187954246997833, 0.7618053555488586, 0.16583499312400818, 0.22202394902706146], [0.1271156519651413, 0.9542166590690613, 0.1702754646539688, -0.014101093634963036], [0.14619998633861542, 0.7571137547492981, 0.16999344527721405, 0.3270969092845917], [0.16134226322174072, 0.9494593143463135, 0.17653538286685944, 0.0924750491976738], [0.18033143877983093, 0.7523042559623718, 0.17838488519191742, 0.4352436065673828], [0.19537752866744995, 0.5551648736000061, 0.18708975613117218, 0.7784276604652405], [0.20648083090782166, 0.3580309748649597, 0.20265831053256989, 1.1236525774002075], [0.0069489930756390095, 0.010335911065340042, 0.018377970904111862, -0.022429730743169785], [0.00715571129694581, -0.18504470586776733, 0.017929375171661377, 0.27599453926086426], [0.003454816760495305, 0.009816911071538925, 0.023449266329407692, -0.0109799699857831], [0.0036511551588773727, -0.1856333464384079, 0.02322966791689396, 0.2890082597732544], [-6.15118769928813e-05, -0.38107872009277344, 0.029009832069277763, 0.5889261364936829], [-0.007683086208999157, -0.5765946507453918, 0.040788356214761734, 0.8906043171882629], [-0.01921497844159603, -0.3820491135120392, 0.05860044062137604, 0.6110171675682068], [-0.026855960488319397, -0.1877930760383606, 0.07082078605890274, 0.3373519778251648], [-0.03061182238161564, 0.006253357976675034, 0.07756782323122025, 0.0678158700466156], [-0.030486755073070526, 0.2001824676990509, 0.07892414182424545, -0.19942103326320648], [-0.02648310549557209, 0.004025605041533709, 0.07493571937084198, 0.11707795411348343], [-0.02640259452164173, -0.19208559393882751, 0.0772772803902626, 0.432429701089859], [-0.030244305729866028, 0.001862007542513311, 0.0859258770942688, 0.1650734394788742], [-0.030207065865397453, -0.19437815248966217, 0.0892273411154747, 0.48357880115509033], [-0.03409462794661522, -0.0006213149172253907, 0.09889891743659973, 0.22029778361320496], [-0.03410705551505089, -0.19700762629508972, 0.10330487787723541, 0.5424667000770569], [-0.03804720565676689, -0.0034776765387505293, 0.11415421217679977, 0.2840370237827301], [-0.038116760551929474, 0.18984675407409668, 0.11983495205640793, 0.02942626178264618], [-0.03431982547044754, -0.006771688815206289, 0.12042347341775894, 0.3573860228061676], [-0.03445525839924812, -0.20338144898414612, 0.1275711953639984, 0.6854838728904724], [-0.03852288797497749, -0.01023970078676939, 0.1412808746099472, 0.43552976846694946], [-0.03872768208384514, 0.18262916803359985, 0.1499914675951004, 0.19050747156143188], [-0.035075098276138306, 0.3753226101398468, 0.15380162000656128, -0.05135510489344597], [-0.027568647637963295, 0.5679430365562439, 0.15277451276779175, -0.29183557629585266], [-0.016209786757826805, 0.7605941295623779, 0.1469378024339676, -0.5327051877975464], [-0.0009979037567973137, 0.5637443661689758, 0.13628369569778442, -0.19756795465946198], [0.010276983492076397, 0.3669629395008087, 0.13233233988285065, 0.13481071591377258], [0.017616242170333862, 0.5599656105041504, 0.13502855598926544, -0.11336984485387802], [0.028815554454922676, 0.7529203295707703, 0.132761150598526, -0.36058950424194336], [0.04387396201491356, 0.9459299445152283, 0.12554936110973358, -0.6086390018463135], [0.06279256194829941, 0.7492971420288086, 0.11337658762931824, -0.27919670939445496], [0.07777850329875946, 0.5527557730674744, 0.10779265314340591, 0.046983931213617325], [0.08883361518383026, 0.7461801767349243, 0.10873233526945114, -0.20983903110027313], [0.10375722497701645, 0.5496850609779358, 0.1045355498790741, 0.11506734788417816], [0.1147509217262268, 0.3532326817512512, 0.10683690011501312, 0.43881481885910034], [0.12181557714939117, 0.5466931462287903, 0.11561319231987, 0.1816290318965912], [0.13274943828582764, 0.7399872541427612, 0.11924577504396439, -0.07246197015047073], [0.14754918217658997, 0.9332157373428345, 0.11779654026031494, -0.3252711594104767], [0.1662134975194931, 0.7366307973861694, 0.11129111051559448, 0.0021148757077753544], [0.18094611167907715, 0.5401033163070679, 0.11133340746164322, 0.32773450016975403], [0.19174818694591522, 0.7334787249565125, 0.11788810044527054, 0.07213166356086731], [0.2064177542924881, 0.9267305731773376, 0.11933073401451111, -0.18115529417991638], [0.22495236992835999, 1.1199607849121094, 0.115707628428936, -0.4339393377304077], [0.24735158681869507, 1.3132708072662354, 0.10702884197235107, -0.6880232095718384], [0.2736169993877411, 1.1168389320373535, 0.09326837956905365, -0.3636550307273865], [0.29595378041267395, 0.9205237627029419, 0.08599527925252914, -0.04308094456791878], [0.3143642544746399, 1.1143139600753784, 0.08513365685939789, -0.30744072794914246], [0.3366505205631256, 0.9180886745452881, 0.07898484170436859, 0.01083037443459034], [0.35501229763031006, 0.7219280004501343, 0.07920145243406296, 0.3273513913154602], [0.3694508671760559, 0.5257730484008789, 0.08574847877025604, 0.6439223289489746], [0.3799663186073303, 0.7196018695831299, 0.09862692654132843, 0.379426509141922], [0.394358366727829, 0.5232278108596802, 0.1062154546380043, 0.7015055418014526], [0.4048229157924652, 0.7167296409606934, 0.1202455684542656, 0.4440571367740631], [0.4191575050354004, 0.5201298594474792, 0.12912671267986298, 0.7720944881439209], [0.429560124874115, 0.7132610082626343, 0.14456859230995178, 0.5226673483848572], [0.4438253343105316, 0.5164318084716797, 0.15502195060253143, 0.857186496257782], [0.45415398478507996, 0.7091405391693115, 0.1721656769514084, 0.6169840097427368], [0.4683367908000946, 0.9014924168586731, 0.18450535833835602, 0.38308876752853394], [0.4863666296005249, 1.0935810804367065, 0.19216713309288025, 0.15378345549106598], [0.5082382559776306, 0.8963015079498291, 0.19524279236793518, 0.5004058480262756], [0.5261642932891846, 0.6990407705307007, 0.20525091886520386, 0.8477126359939575], [0.029752200469374657, -0.01597285084426403, -0.03936419636011124, 0.03326830267906189], [0.029432743787765503, -0.21050883829593658, -0.03869882971048355, 0.31327614188194275], [0.025222565978765488, -0.014857579953968525, -0.03243330493569374, 0.00864437222480774], [0.024925414472818375, 0.18071413040161133, -0.03226041793823242, -0.29409265518188477], [0.02853969857096672, -0.013933378271758556, -0.03814227133989334, -0.01175620686262846], [0.028261030092835426, -0.20848815143108368, -0.03837739676237106, 0.2686525881290436], [0.024091267958283424, -0.01284012570977211, -0.03300434350967407, -0.035883549600839615], [0.023834465071558952, 0.18273918330669403, -0.03372201696038246, -0.3387942612171173], [0.027489248663187027, 0.37832435965538025, -0.04049789905548096, -0.6419175863265991], [0.0350557342171669, 0.18378962576389313, -0.053336251527071, -0.3622578978538513], [0.03873152658343315, 0.3796274960041046, -0.06058141216635704, -0.6712703704833984], [0.04632407799363136, 0.18539772927761078, -0.0740068182349205, -0.3982602655887604], [0.050032030791044235, 0.38148728013038635, -0.08197202533483505, -0.7133276462554932], [0.05766177922487259, 0.5776426792144775, -0.09623857587575912, -1.0306456089019775], [0.06921463459730148, 0.38392373919487, -0.11685148626565933, -0.7696622014045715], [0.07689310610294342, 0.19058731198310852, -0.13224473595619202, -0.5159114003181458], [0.08070485293865204, -0.002448753220960498, -0.14256295561790466, -0.26765233278274536], [0.08065588027238846, -0.1952788382768631, -0.1479160040616989, -0.023113245144486427], [0.07675030082464218, 0.0016206365544348955, -0.14837826788425446, -0.3585662543773651], [0.0767827108502388, -0.19111478328704834, -0.15554960072040558, -0.11610307544469833], [0.07296042144298553, -0.3837055563926697, -0.15787166357040405, 0.12374783307313919], [0.0652863085269928, -0.5762549042701721, -0.1553966999053955, 0.36275842785835266], [0.053761210292577744, -0.768866240978241, -0.1481415331363678, 0.6026909947395325], [0.038383882492780685, -0.9616395831108093, -0.13608771562576294, 0.845289409160614], [0.019151093438267708, -1.1546684503555298, -0.11918192356824875, 1.0922693014144897], [-0.0039422763511538506, -0.9581950306892395, -0.0973365381360054, 0.7646931409835815], [-0.023106176406145096, -0.7618770599365234, -0.08204267919063568, 0.44303831458091736], [-0.03834371641278267, -0.5656958222389221, -0.07318191230297089, 0.12566283345222473], [-0.049657635390758514, -0.7596972584724426, -0.07066865265369415, 0.3943897485733032], [-0.06485158205032349, -0.9537490010261536, -0.06278085708618164, 0.663981556892395], [-0.08392655849456787, -0.7578124403953552, -0.04950122907757759, 0.35221031308174133], [-0.09908280521631241, -0.9521968364715576, -0.04245702177286148, 0.6288822889328003], [-0.11812674254179001, -1.1467013359069824, -0.0298793762922287, 0.9078975319862366], [-0.14106076955795288, -0.9511879086494446, -0.01172142568975687, 0.6059750914573669], [-0.160084530711174, -0.7559040188789368, 0.00039807605207897723, 0.3096233606338501], [-0.1752026081085205, -0.5607877373695374, 0.0065905433148145676, 0.017065996304154396], [-0.18641836941242218, -0.3657609522342682, 0.006931863259524107, -0.2735302746295929], [-0.1937335878610611, -0.5609810948371887, 0.0014612575760111213, 0.021330896764993668], [-0.20495320856571198, -0.7561240196228027, 0.0018878754926845431, 0.31447452306747437], [-0.22007568180561066, -0.5610289573669434, 0.008177366107702255, 0.0223875530064106], [-0.23129627108573914, -0.36602526903152466, 0.008625117130577564, -0.2677041292190552], [-0.23861676454544067, -0.17102745175361633, 0.003271033987402916, -0.5576542019844055], [-0.2420373260974884, 0.024048427119851112, -0.00788205023854971, -0.8493047952651978], [-0.2415563464164734, -0.17096514999866486, -0.02486814558506012, -0.5591108202934265], [-0.24497565627098083, -0.36572936177253723, -0.03605036064982414, -0.27436527609825134], [-0.2522902488708496, -0.5603188872337341, -0.04153766855597496, 0.0067328582517802715], [-0.26349660754203796, -0.7548213005065918, -0.04140301048755646, 0.2860262095928192], [-0.2785930335521698, -0.9493290781974792, -0.03568248823285103, 0.5653688311576843], [-0.2975796163082123, -1.1439327001571655, -0.024375109001994133, 0.8466000556945801], [-0.3204582929611206, -0.948486864566803, -0.007443108595907688, 0.5463528037071228], [-0.33942800760269165, -1.1435034275054932, 0.0034839475993067026, 0.8366813063621521], [-0.3622981011867523, -0.94842928647995, 0.020217575132846832, 0.5450960993766785], [-0.38126668334007263, -0.7535971403121948, 0.031119495630264282, 0.25885120034217834], [-0.3963386118412018, -0.5589329600334167, 0.03629652038216591, -0.023856032639741898], [-0.40751728415489197, -0.3643498122692108, 0.0358194001019001, -0.3048696517944336], [-0.41480427980422974, -0.16975614428520203, 0.029722006991505623, -0.5860443115234375], [-0.4181993901729584, 0.02493717148900032, 0.018001120537519455, -0.8692182898521423], [-0.4177006483078003, -0.17042498290538788, 0.0006167549290694296, -0.5709304809570312], [-0.421109139919281, -0.3655555844306946, -0.01080185454338789, -0.278053343296051], [-0.4284202754497528, -0.17028121650218964, -0.01636292226612568, -0.5741235017776489], [-0.4318258762359619, -0.3651699721813202, -0.027845392003655434, -0.2866399586200714], [-0.4391292929649353, -0.169662207365036, -0.033578190952539444, -0.587973415851593], [-0.4425225257873535, 0.025913486257195473, -0.04533765837550163, -0.8910416960716248], [-0.4420042634010315, -0.16856501996517181, -0.06315848976373672, -0.6129484176635742], [-0.44537556171417236, 0.02738005667924881, -0.07541745901107788, -0.924836277961731], [-0.44482797384262085, -0.16664667427539825, -0.09391418844461441, -0.656775176525116], [-0.44816088676452637, -0.3603444993495941, -0.10704968869686127, -0.39507901668548584], [-0.455367773771286, -0.5537975430488586, -0.11495126783847809, -0.13797302544116974], [-0.4664437472820282, -0.35723286867141724, -0.11771073192358017, -0.4645954668521881], [-0.47358840703964233, -0.55051189661026, -0.12700264155864716, -0.2112102210521698], [-0.48459863662719727, -0.7436107993125916, -0.13122685253620148, 0.03886682912707329], [-0.49947085976600647, -0.5468750596046448, -0.13044950366020203, -0.29216957092285156], [-0.510408341884613, -0.35015782713890076, -0.13629290461540222, -0.6229817867279053], [-0.5174115300178528, -0.15342256426811218, -0.14875254034996033, -0.9552942514419556], [-0.5204799771308899, -0.3462645411491394, -0.16785842180252075, -0.7127978205680847], [-0.5274052619934082, -0.5387138724327087, -0.182114377617836, -0.47730013728141785], [-0.5381795167922974, -0.7308604717254639, -0.19166037440299988, -0.24709267914295197], [-0.5527967214584351, -0.9228023290634155, -0.1966022402048111, -0.020455656573176384], [-0.5712527632713318, -1.1146413087844849, -0.19701135158538818, 0.2043299674987793], [-0.5935456156730652, -0.9173275828361511, -0.19292475283145905, -0.14346270263195038], [-0.6118921637535095, -0.7200414538383484, -0.1957940012216568, -0.49027037620544434], [-0.6262930035591125, -0.5227746367454529, -0.20559941232204437, -0.8377133011817932]], "actions": [1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.029246972873806953, 0.16645924746990204, 0.04484155774116516, -0.23799078166484833], [-0.025917788967490196, -0.029273677617311478, 0.04008174315094948, 0.06849247962236404], [-0.02650326117873192, 0.16525138914585114, 0.0414515919983387, -0.21127988398075104], [-0.023198233917355537, 0.3597569167613983, 0.03722599521279335, -0.4906042814254761], [-0.016003096476197243, 0.16413013637065887, 0.027413908392190933, -0.18642549216747284], [-0.012720493599772453, 0.35884934663772583, 0.023685399442911148, -0.4703359007835388], [-0.005543506238609552, 0.16340097784996033, 0.014278681017458439, -0.17028270661830902], [-0.0022754864767193794, 0.35831567645072937, 0.01087302714586258, -0.45842716097831726], [0.0048908269964158535, 0.5532822608947754, 0.0017044837586581707, -0.747663140296936], [0.015956472605466843, 0.3581368327140808, -0.013248778879642487, -0.4544442892074585], [0.023119209334254265, 0.5534436106681824, -0.022337663918733597, -0.7512737512588501], [0.034188080579042435, 0.3586367070674896, -0.03736313804984093, -0.4657030403614044], [0.04136081412434578, 0.554266095161438, -0.046677201986312866, -0.7699245810508728], [0.052446138113737106, 0.35981661081314087, -0.062075693160295486, -0.4922861158847809], [0.05964246764779091, 0.16562263667583466, -0.07192141562700272, -0.21979475021362305], [0.06295492500066757, -0.028401486575603485, -0.07631731033325195, 0.04936237260699272], [0.0623868927359581, 0.16772711277008057, -0.07533006370067596, -0.26638972759246826], [0.06574143469333649, -0.02624339610338211, -0.08065785467624664, 0.0016148037975654006], [0.065216563642025, -0.22012151777744293, -0.08062556385993958, 0.2677988111972809], [0.060814134776592255, -0.02394702099263668, -0.07526958733797073, -0.04918527230620384], [0.0603351965546608, 0.1721690148115158, -0.07625328749418259, -0.36463475227355957], [0.06377857178449631, 0.3682871460914612, -0.083545982837677, -0.6803538799285889], [0.07114432007074356, 0.17441889643669128, -0.09715306013822556, -0.41509976983070374], [0.07463269680738449, -0.01920148730278015, -0.10545505583286285, -0.15455682575702667], [0.07424866408109665, -0.21266785264015198, -0.1085461974143982, 0.10308424383401871], [0.06999530643224716, -0.40608033537864685, -0.10648451000452042, 0.3596455454826355], [0.06187370419502258, -0.20961855351924896, -0.0992916002869606, 0.03537473827600479], [0.057681333273649216, -0.013223282061517239, -0.09858410060405731, -0.2869109809398651], [0.05741686746478081, 0.18315626680850983, -0.10432232171297073, -0.6089867949485779], [0.06107999011874199, -0.010364515706896782, -0.1165020614862442, -0.35089895129203796], [0.060872700065374374, 0.18620486557483673, -0.12352003902196884, -0.6779285073280334], [0.06459680199623108, 0.3828066885471344, -0.13707861304283142, -1.0068069696426392], [0.07225292921066284, 0.5794661641120911, -0.15721474587917328, -1.3392040729522705], [0.08384225517511368, 0.38663387298583984, -0.18399883806705475, -1.0995538234710693], [0.09157493710517883, 0.5836371183395386, -0.20598991215229034, -1.443861484527588], [0.10324767976999283, 0.7806114554405212, -0.2348671406507492, -1.7932102680206299], [0.030086267739534378, 0.17106854915618896, 0.048113275319337845, -0.31960180401802063], [0.033507637679576874, -0.024704428389668465, 0.04172123968601227, -0.01214233785867691], [0.03301354870200157, -0.22039911150932312, 0.041478391736745834, 0.29340672492980957], [0.028605567291378975, -0.41608715057373047, 0.04734652489423752, 0.5988774299621582], [0.02028382383286953, -0.22165849804878235, 0.059324074536561966, 0.321476012468338], [0.015850653871893883, -0.027429327368736267, 0.06575359404087067, 0.04807581007480621], [0.015302067622542381, 0.16669116914272308, 0.06671511381864548, -0.223158061504364], [0.018635891377925873, -0.029317766427993774, 0.06225195154547691, 0.08980096131563187], [0.018049536272883415, 0.16485920548439026, 0.06404796987771988, -0.18261004984378815], [0.021346719935536385, 0.3590089976787567, 0.06039576977491379, -0.45442041754722595], [0.028526900336146355, 0.163087397813797, 0.05130736157298088, -0.1433282494544983], [0.031788647174835205, 0.35743844509124756, 0.04844079539179802, -0.4193934202194214], [0.038937415927648544, 0.16166475415229797, 0.040052928030490875, -0.1118413582444191], [0.04217071086168289, -0.03400755673646927, 0.03781609982252121, 0.1932041198015213], [0.04149056226015091, -0.22964948415756226, 0.04168018326163292, 0.49757248163223267], [0.03689756989479065, -0.03513924777507782, 0.051631633192300797, 0.21831095218658447], [0.03619478642940521, 0.15920807421207428, 0.055997852236032486, -0.05764857679605484], [0.039378948509693146, -0.03667021542787552, 0.05484487861394882, 0.2521630525588989], [0.03864554315805435, 0.1576274335384369, 0.05988813936710358, -0.022728877142071724], [0.04179809242486954, -0.038299959152936935, 0.05943356454372406, 0.2882319390773773], [0.0410320907831192, -0.23421688377857208, 0.06519820541143417, 0.5990515947341919], [0.036347754299640656, -0.43018755316734314, 0.07717923074960709, 0.911537766456604], [0.027744004502892494, -0.6262641549110413, 0.09540998935699463, 1.227445363998413], [0.015218720771372318, -0.43249091506004333, 0.11995889246463776, 0.9661153554916382], [0.006568902637809515, -0.6290018558502197, 0.13928119838237762, 1.2939468622207642], [-0.006011134944856167, -0.8255915641784668, 0.1651601344347, 1.6267921924591064], [-0.02252296730875969, -0.6327523589134216, 0.19769598543643951, 1.3898061513900757], [-0.035178013145923615, -0.44056469202041626, 0.22549210488796234, 1.1648846864700317], [-0.035820577293634415, 0.239158034324646, 0.011277586221694946, -0.2859395146369934], [-0.03103741630911827, 0.4341173470020294, 0.005558795761317015, -0.5750443339347839], [-0.02235507033765316, 0.23891791701316833, -0.005942091345787048, -0.2806154489517212], [-0.017576711252331734, 0.04388122260570526, -0.011554400436580181, 0.010187455452978611], [-0.016699086874723434, -0.1510731279850006, -0.011350651271641254, 0.299202561378479], [-0.019720550626516342, -0.34603145718574524, -0.00536660011857748, 0.5882841944694519], [-0.026641178876161575, -0.5410778522491455, 0.006399083416908979, 0.8792718052864075], [-0.037462737411260605, -0.7362861633300781, 0.023984519764780998, 1.1739596128463745], [-0.052188459783792496, -0.9317114949226379, 0.047463711351156235, 1.4740639925003052], [-0.07082268595695496, -0.7372006773948669, 0.0769449919462204, 1.1965755224227905], [-0.0855666995048523, -0.5431544184684753, 0.10087650269269943, 0.9289668202400208], [-0.09642978757619858, -0.7394828200340271, 0.11945583671331406, 1.2515696287155151], [-0.11121944338083267, -0.5460765957832336, 0.14448723196983337, 0.9985644221305847], [-0.12214098125696182, -0.35315069556236267, 0.1644585132598877, 0.7545225620269775], [-0.12920399010181427, -0.1606316715478897, 0.1795489639043808, 0.5177736282348633], [-0.13241662085056305, 0.031568460166454315, 0.18990443646907806, 0.28661230206489563], [-0.13178525865077972, 0.22354650497436523, 0.19563668966293335, 0.059319134801626205], [-0.12731432914733887, 0.41540396213531494, 0.19682307541370392, -0.16582629084587097], [-0.11900624632835388, 0.2180889993906021, 0.19350653886795044, 0.18192486464977264], [-0.11464446783065796, 0.4099915027618408, 0.19714504480361938, -0.044019829481840134], [-0.10644463449716568, 0.6018206477165222, 0.19626463949680328, -0.26860398054122925], [-0.09440822154283524, 0.7936794757843018, 0.1908925622701645, -0.4935351610183716], [-0.07853463292121887, 0.9856691360473633, 0.18102186918258667, -0.7205063104629517], [-0.05882125347852707, 0.7885660529136658, 0.16661173105239868, -0.3767523765563965], [-0.04304993152618408, 0.5915181636810303, 0.15907669067382812, -0.03651592880487442], [-0.031219568103551865, 0.3945150077342987, 0.15834636986255646, 0.3018292784690857], [-0.023329267278313637, 0.5870674848556519, 0.1643829643726349, 0.06297348439693451], [-0.011587917804718018, 0.7794978022575378, 0.16564242541790009, -0.17366962134838104], [0.004002037923783064, 0.9719094634056091, 0.16216903924942017, -0.4098602533340454], [0.023440226912498474, 0.7749046087265015, 0.1539718359708786, -0.07076117396354675], [0.03893831744790077, 0.5779489278793335, 0.15255659818649292, 0.2662663757801056], [0.05049729719758034, 0.770601749420166, 0.1578819304704666, 0.02532125450670719], [0.06590933352708817, 0.9631486535072327, 0.15838836133480072, -0.21368227899074554], [0.08517230302095413, 0.7661586403846741, 0.1541147083044052, 0.1244758665561676], [0.10049548000097275, 0.5692031979560852, 0.15660423040390015, 0.46153807640075684], [0.11187954246997833, 0.7618053555488586, 0.16583499312400818, 0.22202394902706146], [0.1271156519651413, 0.9542166590690613, 0.1702754646539688, -0.014101093634963036], [0.14619998633861542, 0.7571137547492981, 0.16999344527721405, 0.3270969092845917], [0.16134226322174072, 0.9494593143463135, 0.17653538286685944, 0.0924750491976738], [0.18033143877983093, 0.7523042559623718, 0.17838488519191742, 0.4352436065673828], [0.19537752866744995, 0.5551648736000061, 0.18708975613117218, 0.7784276604652405], [0.20648083090782166, 0.3580309748649597, 0.20265831053256989, 1.1236525774002075], [0.2136414498090744, 0.16091375052928925, 0.22513136267662048, 1.47245192527771], [0.00715571129694581, -0.18504470586776733, 0.017929375171661377, 0.27599453926086426], [0.003454816760495305, 0.009816911071538925, 0.023449266329407692, -0.0109799699857831], [0.0036511551588773727, -0.1856333464384079, 0.02322966791689396, 0.2890082597732544], [-6.15118769928813e-05, -0.38107872009277344, 0.029009832069277763, 0.5889261364936829], [-0.007683086208999157, -0.5765946507453918, 0.040788356214761734, 0.8906043171882629], [-0.01921497844159603, -0.3820491135120392, 0.05860044062137604, 0.6110171675682068], [-0.026855960488319397, -0.1877930760383606, 0.07082078605890274, 0.3373519778251648], [-0.03061182238161564, 0.006253357976675034, 0.07756782323122025, 0.0678158700466156], [-0.030486755073070526, 0.2001824676990509, 0.07892414182424545, -0.19942103326320648], [-0.02648310549557209, 0.004025605041533709, 0.07493571937084198, 0.11707795411348343], [-0.02640259452164173, -0.19208559393882751, 0.0772772803902626, 0.432429701089859], [-0.030244305729866028, 0.001862007542513311, 0.0859258770942688, 0.1650734394788742], [-0.030207065865397453, -0.19437815248966217, 0.0892273411154747, 0.48357880115509033], [-0.03409462794661522, -0.0006213149172253907, 0.09889891743659973, 0.22029778361320496], [-0.03410705551505089, -0.19700762629508972, 0.10330487787723541, 0.5424667000770569], [-0.03804720565676689, -0.0034776765387505293, 0.11415421217679977, 0.2840370237827301], [-0.038116760551929474, 0.18984675407409668, 0.11983495205640793, 0.02942626178264618], [-0.03431982547044754, -0.006771688815206289, 0.12042347341775894, 0.3573860228061676], [-0.03445525839924812, -0.20338144898414612, 0.1275711953639984, 0.6854838728904724], [-0.03852288797497749, -0.01023970078676939, 0.1412808746099472, 0.43552976846694946], [-0.03872768208384514, 0.18262916803359985, 0.1499914675951004, 0.19050747156143188], [-0.035075098276138306, 0.3753226101398468, 0.15380162000656128, -0.05135510489344597], [-0.027568647637963295, 0.5679430365562439, 0.15277451276779175, -0.29183557629585266], [-0.016209786757826805, 0.7605941295623779, 0.1469378024339676, -0.5327051877975464], [-0.0009979037567973137, 0.5637443661689758, 0.13628369569778442, -0.19756795465946198], [0.010276983492076397, 0.3669629395008087, 0.13233233988285065, 0.13481071591377258], [0.017616242170333862, 0.5599656105041504, 0.13502855598926544, -0.11336984485387802], [0.028815554454922676, 0.7529203295707703, 0.132761150598526, -0.36058950424194336], [0.04387396201491356, 0.9459299445152283, 0.12554936110973358, -0.6086390018463135], [0.06279256194829941, 0.7492971420288086, 0.11337658762931824, -0.27919670939445496], [0.07777850329875946, 0.5527557730674744, 0.10779265314340591, 0.046983931213617325], [0.08883361518383026, 0.7461801767349243, 0.10873233526945114, -0.20983903110027313], [0.10375722497701645, 0.5496850609779358, 0.1045355498790741, 0.11506734788417816], [0.1147509217262268, 0.3532326817512512, 0.10683690011501312, 0.43881481885910034], [0.12181557714939117, 0.5466931462287903, 0.11561319231987, 0.1816290318965912], [0.13274943828582764, 0.7399872541427612, 0.11924577504396439, -0.07246197015047073], [0.14754918217658997, 0.9332157373428345, 0.11779654026031494, -0.3252711594104767], [0.1662134975194931, 0.7366307973861694, 0.11129111051559448, 0.0021148757077753544], [0.18094611167907715, 0.5401033163070679, 0.11133340746164322, 0.32773450016975403], [0.19174818694591522, 0.7334787249565125, 0.11788810044527054, 0.07213166356086731], [0.2064177542924881, 0.9267305731773376, 0.11933073401451111, -0.18115529417991638], [0.22495236992835999, 1.1199607849121094, 0.115707628428936, -0.4339393377304077], [0.24735158681869507, 1.3132708072662354, 0.10702884197235107, -0.6880232095718384], [0.2736169993877411, 1.1168389320373535, 0.09326837956905365, -0.3636550307273865], [0.29595378041267395, 0.9205237627029419, 0.08599527925252914, -0.04308094456791878], [0.3143642544746399, 1.1143139600753784, 0.08513365685939789, -0.30744072794914246], [0.3366505205631256, 0.9180886745452881, 0.07898484170436859, 0.01083037443459034], [0.35501229763031006, 0.7219280004501343, 0.07920145243406296, 0.3273513913154602], [0.3694508671760559, 0.5257730484008789, 0.08574847877025604, 0.6439223289489746], [0.3799663186073303, 0.7196018695831299, 0.09862692654132843, 0.379426509141922], [0.394358366727829, 0.5232278108596802, 0.1062154546380043, 0.7015055418014526], [0.4048229157924652, 0.7167296409606934, 0.1202455684542656, 0.4440571367740631], [0.4191575050354004, 0.5201298594474792, 0.12912671267986298, 0.7720944881439209], [0.429560124874115, 0.7132610082626343, 0.14456859230995178, 0.5226673483848572], [0.4438253343105316, 0.5164318084716797, 0.15502195060253143, 0.857186496257782], [0.45415398478507996, 0.7091405391693115, 0.1721656769514084, 0.6169840097427368], [0.4683367908000946, 0.9014924168586731, 0.18450535833835602, 0.38308876752853394], [0.4863666296005249, 1.0935810804367065, 0.19216713309288025, 0.15378345549106598], [0.5082382559776306, 0.8963015079498291, 0.19524279236793518, 0.5004058480262756], [0.5261642932891846, 0.6990407705307007, 0.20525091886520386, 0.8477126359939575], [0.5401450991630554, 0.890860915184021, 0.22220516204833984, 0.6259427666664124], [0.029432743787765503, -0.21050883829593658, -0.03869882971048355, 0.31327614188194275], [0.025222565978765488, -0.014857579953968525, -0.03243330493569374, 0.00864437222480774], [0.024925414472818375, 0.18071413040161133, -0.03226041793823242, -0.29409265518188477], [0.02853969857096672, -0.013933378271758556, -0.03814227133989334, -0.01175620686262846], [0.028261030092835426, -0.20848815143108368, -0.03837739676237106, 0.2686525881290436], [0.024091267958283424, -0.01284012570977211, -0.03300434350967407, -0.035883549600839615], [0.023834465071558952, 0.18273918330669403, -0.03372201696038246, -0.3387942612171173], [0.027489248663187027, 0.37832435965538025, -0.04049789905548096, -0.6419175863265991], [0.0350557342171669, 0.18378962576389313, -0.053336251527071, -0.3622578978538513], [0.03873152658343315, 0.3796274960041046, -0.06058141216635704, -0.6712703704833984], [0.04632407799363136, 0.18539772927761078, -0.0740068182349205, -0.3982602655887604], [0.050032030791044235, 0.38148728013038635, -0.08197202533483505, -0.7133276462554932], [0.05766177922487259, 0.5776426792144775, -0.09623857587575912, -1.0306456089019775], [0.06921463459730148, 0.38392373919487, -0.11685148626565933, -0.7696622014045715], [0.07689310610294342, 0.19058731198310852, -0.13224473595619202, -0.5159114003181458], [0.08070485293865204, -0.002448753220960498, -0.14256295561790466, -0.26765233278274536], [0.08065588027238846, -0.1952788382768631, -0.1479160040616989, -0.023113245144486427], [0.07675030082464218, 0.0016206365544348955, -0.14837826788425446, -0.3585662543773651], [0.0767827108502388, -0.19111478328704834, -0.15554960072040558, -0.11610307544469833], [0.07296042144298553, -0.3837055563926697, -0.15787166357040405, 0.12374783307313919], [0.0652863085269928, -0.5762549042701721, -0.1553966999053955, 0.36275842785835266], [0.053761210292577744, -0.768866240978241, -0.1481415331363678, 0.6026909947395325], [0.038383882492780685, -0.9616395831108093, -0.13608771562576294, 0.845289409160614], [0.019151093438267708, -1.1546684503555298, -0.11918192356824875, 1.0922693014144897], [-0.0039422763511538506, -0.9581950306892395, -0.0973365381360054, 0.7646931409835815], [-0.023106176406145096, -0.7618770599365234, -0.08204267919063568, 0.44303831458091736], [-0.03834371641278267, -0.5656958222389221, -0.07318191230297089, 0.12566283345222473], [-0.049657635390758514, -0.7596972584724426, -0.07066865265369415, 0.3943897485733032], [-0.06485158205032349, -0.9537490010261536, -0.06278085708618164, 0.663981556892395], [-0.08392655849456787, -0.7578124403953552, -0.04950122907757759, 0.35221031308174133], [-0.09908280521631241, -0.9521968364715576, -0.04245702177286148, 0.6288822889328003], [-0.11812674254179001, -1.1467013359069824, -0.0298793762922287, 0.9078975319862366], [-0.14106076955795288, -0.9511879086494446, -0.01172142568975687, 0.6059750914573669], [-0.160084530711174, -0.7559040188789368, 0.00039807605207897723, 0.3096233606338501], [-0.1752026081085205, -0.5607877373695374, 0.0065905433148145676, 0.017065996304154396], [-0.18641836941242218, -0.3657609522342682, 0.006931863259524107, -0.2735302746295929], [-0.1937335878610611, -0.5609810948371887, 0.0014612575760111213, 0.021330896764993668], [-0.20495320856571198, -0.7561240196228027, 0.0018878754926845431, 0.31447452306747437], [-0.22007568180561066, -0.5610289573669434, 0.008177366107702255, 0.0223875530064106], [-0.23129627108573914, -0.36602526903152466, 0.008625117130577564, -0.2677041292190552], [-0.23861676454544067, -0.17102745175361633, 0.003271033987402916, -0.5576542019844055], [-0.2420373260974884, 0.024048427119851112, -0.00788205023854971, -0.8493047952651978], [-0.2415563464164734, -0.17096514999866486, -0.02486814558506012, -0.5591108202934265], [-0.24497565627098083, -0.36572936177253723, -0.03605036064982414, -0.27436527609825134], [-0.2522902488708496, -0.5603188872337341, -0.04153766855597496, 0.0067328582517802715], [-0.26349660754203796, -0.7548213005065918, -0.04140301048755646, 0.2860262095928192], [-0.2785930335521698, -0.9493290781974792, -0.03568248823285103, 0.5653688311576843], [-0.2975796163082123, -1.1439327001571655, -0.024375109001994133, 0.8466000556945801], [-0.3204582929611206, -0.948486864566803, -0.007443108595907688, 0.5463528037071228], [-0.33942800760269165, -1.1435034275054932, 0.0034839475993067026, 0.8366813063621521], [-0.3622981011867523, -0.94842928647995, 0.020217575132846832, 0.5450960993766785], [-0.38126668334007263, -0.7535971403121948, 0.031119495630264282, 0.25885120034217834], [-0.3963386118412018, -0.5589329600334167, 0.03629652038216591, -0.023856032639741898], [-0.40751728415489197, -0.3643498122692108, 0.0358194001019001, -0.3048696517944336], [-0.41480427980422974, -0.16975614428520203, 0.029722006991505623, -0.5860443115234375], [-0.4181993901729584, 0.02493717148900032, 0.018001120537519455, -0.8692182898521423], [-0.4177006483078003, -0.17042498290538788, 0.0006167549290694296, -0.5709304809570312], [-0.421109139919281, -0.3655555844306946, -0.01080185454338789, -0.278053343296051], [-0.4284202754497528, -0.17028121650218964, -0.01636292226612568, -0.5741235017776489], [-0.4318258762359619, -0.3651699721813202, -0.027845392003655434, -0.2866399586200714], [-0.4391292929649353, -0.169662207365036, -0.033578190952539444, -0.587973415851593], [-0.4425225257873535, 0.025913486257195473, -0.04533765837550163, -0.8910416960716248], [-0.4420042634010315, -0.16856501996517181, -0.06315848976373672, -0.6129484176635742], [-0.44537556171417236, 0.02738005667924881, -0.07541745901107788, -0.924836277961731], [-0.44482797384262085, -0.16664667427539825, -0.09391418844461441, -0.656775176525116], [-0.44816088676452637, -0.3603444993495941, -0.10704968869686127, -0.39507901668548584], [-0.455367773771286, -0.5537975430488586, -0.11495126783847809, -0.13797302544116974], [-0.4664437472820282, -0.35723286867141724, -0.11771073192358017, -0.4645954668521881], [-0.47358840703964233, -0.55051189661026, -0.12700264155864716, -0.2112102210521698], [-0.48459863662719727, -0.7436107993125916, -0.13122685253620148, 0.03886682912707329], [-0.49947085976600647, -0.5468750596046448, -0.13044950366020203, -0.29216957092285156], [-0.510408341884613, -0.35015782713890076, -0.13629290461540222, -0.6229817867279053], [-0.5174115300178528, -0.15342256426811218, -0.14875254034996033, -0.9552942514419556], [-0.5204799771308899, -0.3462645411491394, -0.16785842180252075, -0.7127978205680847], [-0.5274052619934082, -0.5387138724327087, -0.182114377617836, -0.47730013728141785], [-0.5381795167922974, -0.7308604717254639, -0.19166037440299988, -0.24709267914295197], [-0.5527967214584351, -0.9228023290634155, -0.1966022402048111, -0.020455656573176384], [-0.5712527632713318, -1.1146413087844849, -0.19701135158538818, 0.2043299674987793], [-0.5935456156730652, -0.9173275828361511, -0.19292475283145905, -0.14346270263195038], [-0.6118921637535095, -0.7200414538383484, -0.1957940012216568, -0.49027037620544434], [-0.6262930035591125, -0.5227746367454529, -0.20559941232204437, -0.8377133011817932], [-0.6367484927177429, -0.7145851850509644, -0.22235368192195892, -0.6160783767700195]], "action_prob": [0.5358656644821167, 0.592189371585846, 0.5492844581604004, 0.4174622595310211, 0.643700361251831, 0.4228176772594452, 0.6433765292167664, 0.424747109413147, 0.35607051849365234, 0.6529425382614136, 0.35296475887298584, 0.653745174407959, 0.3486517071723938, 0.6540251970291138, 0.6559675931930542, 0.6235203146934509, 0.48189646005630493, 0.6365009546279907, 0.546987771987915, 0.5772851705551147, 0.42891308665275574, 0.346685528755188, 0.658739447593689, 0.6606625914573669, 0.6246354579925537, 0.518987238407135, 0.591073751449585, 0.44841572642326355, 0.34637463092803955, 0.6643224358558655, 0.3358594477176666, 0.3370431959629059, 0.3573317527770996, 0.6218216419219971, 0.36332938075065613, 0.38495004177093506, 0.4816237688064575, 0.62349933385849, 0.5039898157119751, 0.3800106644630432, 0.652492105960846, 0.6312481164932251, 0.5417842864990234, 0.5848103761672974, 0.5621334314346313, 0.43210726976394653, 0.6385298371315002, 0.4457706809043884, 0.6351704001426697, 0.5431810617446899, 0.4018603563308716, 0.6517906188964844, 0.6113705039024353, 0.5067486763000488, 0.6224328279495239, 0.48562341928482056, 0.36743906140327454, 0.3430594801902771, 0.35399535298347473, 0.6287620663642883, 0.35686543583869934, 0.3759194612503052, 0.607327938079834, 0.6174911856651306, 0.510557234287262, 0.3883862793445587, 0.6507793068885803, 0.6150972843170166, 0.4969349801540375, 0.3807547986507416, 0.3479873239994049, 0.3521404266357422, 0.3651559352874756, 0.6211063265800476, 0.6328058838844299, 0.35382694005966187, 0.6288591623306274, 0.6421567797660828, 0.6566460132598877, 0.6682811975479126, 0.6653844714164734, 0.6241113543510437, 0.46947458386421204, 0.6565691232681274, 0.5908933877944946, 0.48754963278770447, 0.40591609477996826, 0.6338390707969666, 0.5626264810562134, 0.4157082736492157, 0.6720260381698608, 0.6233291029930115, 0.5264790654182434, 0.569449245929718, 0.43201807141304016, 0.6665924191474915, 0.6061763167381287, 0.4926972985267639, 0.36514806747436523, 0.6833748817443848, 0.6582295894622803, 0.4084930419921875, 0.6735104918479919, 0.3740924298763275, 0.3167945444583893, 0.31588730216026306, 0.33816710114479065, 0.5114514231681824, 0.6144915223121643, 0.5023900866508484, 0.38028836250305176, 0.34730783104896545, 0.6474906802177429, 0.6551591157913208, 0.6412658095359802, 0.5659225583076477, 0.5618090629577637, 0.41213274002075195, 0.6540910005569458, 0.3894258439540863, 0.6585251092910767, 0.3687817454338074, 0.6611617803573608, 0.6483544111251831, 0.42251116037368774, 0.34074071049690247, 0.6600370407104492, 0.6669659614562988, 0.6439073085784912, 0.5615589022636414, 0.4493313431739807, 0.6200979351997375, 0.5129950046539307, 0.6289774179458618, 0.5286970734596252, 0.42287933826446533, 0.6321169137954712, 0.5528774857521057, 0.5907289981842041, 0.5251018404960632, 0.38609009981155396, 0.6721149682998657, 0.6358721852302551, 0.5415062308311462, 0.5654047131538391, 0.429891973733902, 0.661919891834259, 0.5983209013938904, 0.4918355643749237, 0.40373560786247253, 0.6398947238922119, 0.582899272441864, 0.5357339382171631, 0.5685632228851318, 0.44694826006889343, 0.35090139508247375, 0.6761676669120789, 0.34089046716690063, 0.6773676872253418, 0.33152562379837036, 0.6777022480964661, 0.32373949885368347, 0.6768879294395447, 0.6817386150360107, 0.665779173374176, 0.37991395592689514, 0.3229316174983978, 0.683292806148529, 0.5072172284126282, 0.6093976497650146, 0.4819159209728241, 0.6316437721252441, 0.5323242545127869, 0.5944988131523132, 0.4568016231060028, 0.3589007258415222, 0.6571769714355469, 0.351688027381897, 0.6577255725860596, 0.34444645047187805, 0.34262338280677795, 0.6416710615158081, 0.655962347984314, 0.666268527507782, 0.6574065685272217, 0.4020540714263916, 0.6680406928062439, 0.6343405246734619, 0.5400954484939575, 0.4328095614910126, 0.37461531162261963, 0.35499945282936096, 0.6477001309394836, 0.6447480320930481, 0.6075447797775269, 0.5081493258476257, 0.40188276767730713, 0.6421422958374023, 0.4075932800769806, 0.3580743074417114, 0.6529048085212708, 0.6440905332565308, 0.5965995192527771, 0.48036086559295654, 0.631008505821228, 0.516680896282196, 0.6022136807441711, 0.4897676706314087, 0.3750903010368347, 0.33735963702201843, 0.6564133167266846, 0.6645567417144775, 0.6346083879470825, 0.5313043594360352, 0.4127391576766968, 0.3574095368385315, 0.6559317708015442, 0.35510188341140747, 0.6575023531913757, 0.6489396691322327, 0.6048600077629089, 0.49869462847709656, 0.3874403238296509, 0.34449461102485657, 0.6545714735984802, 0.6567291021347046, 0.38673555850982666, 0.6578954458236694, 0.3814619183540344, 0.3403625190258026, 0.6551506519317627, 0.33733275532722473, 0.6545435786247253, 0.6653546690940857, 0.6540077924728394, 0.40611377358436584, 0.6625635027885437, 0.6200451850891113, 0.4733250141143799, 0.36024242639541626, 0.3285917341709137, 0.6611411571502686, 0.6736463904380798, 0.6712419986724854, 0.6402446627616882, 0.5723661184310913, 0.5140047669410706, 0.3894400894641876, 0.3272883892059326, 0.6783669590950012], "advantages": [19.501846313476562, 18.740066528320312, 17.93284034729004, 17.145652770996094, 16.656156539916992, 15.647771835327148, 15.164509773254395, 14.179577827453613, 13.707770347595215, 13.52881145477295, 12.4163236618042, 12.31791877746582, 11.253297805786133, 11.261115074157715, 10.259993553161621, 9.423649787902832, 8.806478500366211, 8.32577896118164, 7.695389747619629, 7.306921005249023, 6.467719554901123, 6.113421440124512, 6.1835713386535645, 5.417426586151123, 4.844336032867432, 4.4933271408081055, 4.3205366134643555, 3.397353410720825, 2.9572596549987793, 2.9364850521087646, 2.4590821266174316, 2.510125160217285, 2.67280912399292, 2.752802610397339, 2.8738062381744385, 2.772705078125, 14.58640193939209, 13.824645042419434, 12.861669540405273, 12.184621810913086, 11.755916595458984, 10.19831657409668, 8.957723617553711, 8.031682968139648, 7.082801342010498, 6.123274803161621, 5.441469192504883, 4.304318428039551, 3.609346866607666, 2.501413345336914, 1.6271849870681763, 0.9838491082191467, -0.3656485676765442, -1.4415497779846191, -2.3356502056121826, -3.4485762119293213, -4.344236373901367, -5.036323070526123, -5.559523582458496, -5.974609851837158, -7.898469924926758, -8.377206802368164, -8.81640911102295, -10.869946479797363, 23.88377571105957, 23.318151473999023, 23.05791664123535, 22.127077102661133, 21.409608840942383, 20.931554794311523, 20.67793846130371, 20.584400177001953, 20.55173683166504, 20.482515335083008, 18.520788192749023, 16.667409896850586, 16.492910385131836, 14.651559829711914, 13.044233322143555, 11.690533638000488, 10.551554679870605, 9.568924903869629, 8.693280220031738, 7.826020240783691, 6.933302879333496, 6.104182720184326, 5.323573112487793, 4.587957859039307, 3.571364402770996, 2.6367928981781006, 1.7657897472381592, 0.8741804361343384, 0.015321800485253334, -0.816006600856781, -1.7761930227279663, -2.6932566165924072, -3.6003975868225098, -4.4877214431762695, -5.446538925170898, -6.377511978149414, -7.3310627937316895, -8.271075248718262, -9.243802070617676, -10.208447456359863, -11.19198989868164, -12.162284851074219, -13.119444847106934, 35.36753845214844, 34.95883560180664, 34.12009811401367, 33.69795227050781, 33.517845153808594, 33.500553131103516, 31.945756912231445, 30.65952491760254, 29.66815948486328, 28.9505672454834, 28.243803024291992, 27.776670455932617, 26.741554260253906, 26.274198532104492, 25.218515396118164, 24.749526977539062, 23.68024253845215, 22.814359664916992, 22.178298950195312, 21.706918716430664, 20.631519317626953, 19.727968215942383, 18.94745445251465, 18.25757598876953, 17.643905639648438, 16.75443458557129, 15.970284461975098, 15.233736038208008, 14.559446334838867, 13.946181297302246, 13.040223121643066, 12.214170455932617, 11.493325233459473, 10.671605110168457, 9.909402847290039, 9.087955474853516, 8.312586784362793, 7.578022003173828, 6.703127861022949, 5.876213550567627, 5.054289817810059, 4.2656025886535645, 3.511815071105957, 2.8017899990081787, 1.826293706893921, 0.8976427316665649, 0.10429484397172928, -0.8325375914573669, -1.7357553243637085, -2.610572099685669, -3.539572238922119, -4.430995941162109, -5.383058547973633, -6.290979385375977, -7.265739917755127, -8.190276145935059, -9.187020301818848, -10.166852951049805, -11.1362943649292, -12.134434700012207, -13.120293617248535, 46.14875030517578, 46.02583694458008, 45.38694381713867, 45.16345977783203, 44.741722106933594, 44.57851791381836, 43.9708251953125, 43.79374313354492, 44.016353607177734, 43.40202331542969, 43.738277435302734, 43.21206283569336, 43.68001174926758, 44.403114318847656, 44.12928009033203, 43.99678039550781, 44.04443359375, 44.284915924072266, 44.56178283691406, 44.86261749267578, 45.26605224609375, 45.6482048034668, 45.872650146484375, 45.85352325439453, 45.57237243652344, 44.91510009765625, 44.26709747314453, 43.70219039916992, 43.41523361206055, 42.96232223510742, 42.219329833984375, 41.663455963134766, 40.94303894042969, 39.95432662963867, 38.93699264526367, 37.98410415649414, 37.200626373291016, 36.54987335205078, 35.885276794433594, 34.87926483154297, 34.05759811401367, 33.4749870300293, 33.101165771484375, 32.5848388671875, 32.07640838623047, 31.575124740600586, 31.036842346191406, 30.401227951049805, 29.63300323486328, 28.485933303833008, 27.64281463623047, 26.324485778808594, 24.993812561035156, 23.75865364074707, 22.722421646118164, 21.93854522705078, 21.393993377685547, 20.58125877380371, 19.812503814697266, 19.22942543029785, 18.528369903564453, 18.018930435180664, 17.715137481689453, 17.213947296142578, 16.999984741210938, 16.678117752075195, 16.348909378051758, 15.986052513122559, 15.660602569580078, 15.320712089538574, 14.880707740783691, 14.48033332824707, 14.148541450500488, 13.806905746459961, 13.710963249206543, 13.48619556427002, 13.110799789428711, 12.569506645202637, 11.854371070861816, 11.42985725402832, 10.928348541259766, 10.333455085754395], "value_targets": [30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 526170535, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1804566556, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 1893943449, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712, 579425712], "obs": [[-0.04736221209168434, 0.026181744411587715, -0.04731771722435951, 0.02832026220858097], [-0.04683857783675194, -0.1682308316230774, -0.04675131291151047, 0.3057065010070801], [-0.050203192979097366, -0.36265647411346436, -0.04063718020915985, 0.5832864046096802], [-0.05745632201433182, -0.16698946058750153, -0.02897145412862301, 0.2780841886997223], [-0.060796111822128296, -0.3616863787174225, -0.0234097708016634, 0.5614905953407288], [-0.06802984327077866, -0.55647212266922, -0.012179957702755928, 0.846707284450531], [-0.07915928214788437, -0.361186146736145, 0.004754188004881144, 0.5502192378044128], [-0.08638300746679306, -0.5563745498657227, 0.01575857400894165, 0.8443962931632996], [-0.09751049429178238, -0.36147114634513855, 0.03264649957418442, 0.5567103028297424], [-0.10473991930484772, -0.1668223738670349, 0.04378070309758186, 0.27448907494544983], [-0.10807636380195618, 0.02764846757054329, 0.04927048459649086, -0.004070250317454338], [-0.10752339661121368, 0.22203044593334198, 0.04918907955288887, -0.2808097302913666], [-0.10308279097080231, 0.026242611929774284, 0.043572887778282166, 0.026972571387887], [-0.10255793482065201, -0.1694762408733368, 0.04411233589053154, 0.3330785930156708], [-0.10594745725393295, 0.02499099262058735, 0.05077391117811203, 0.05462631210684776], [-0.10544764250516891, -0.17082083225250244, 0.05186643451452255, 0.3628866374492645], [-0.10886405408382416, 0.023527057841420174, 0.0591241680085659, 0.08699873834848404], [-0.10839351266622543, 0.21775387227535248, 0.06086414307355881, -0.18646003305912018], [-0.10403843969106674, 0.021816300228238106, 0.05713494122028351, 0.12478511780500412], [-0.10360211133956909, 0.21607515215873718, 0.05963064357638359, -0.14933915436267853], [-0.09928061068058014, 0.410294771194458, 0.05664386227726936, -0.4226297438144684], [-0.09107471257448196, 0.6045703887939453, 0.048191267997026443, -0.6969314217567444], [-0.07898330688476562, 0.4088144600391388, 0.03425263985991478, -0.38947564363479614], [-0.07080701738595963, 0.21322350203990936, 0.02646312490105629, -0.0861930176615715], [-0.06654255092144012, 0.017732415348291397, 0.02473926544189453, 0.21472018957138062], [-0.06618789583444595, 0.21249210834503174, 0.029033668339252472, -0.07005734741687775], [-0.06193805858492851, 0.40718603134155273, 0.027632521465420723, -0.35344046354293823], [-0.05379433557391167, 0.2116822898387909, 0.02056371234357357, -0.05217386409640312], [-0.04956069216132164, 0.01627160608768463, 0.019520234316587448, 0.246925488114357], [-0.049235258251428604, 0.21110941469669342, 0.0244587454944849, -0.03953694924712181], [-0.04501307010650635, 0.01564541459083557, 0.02366800606250763, 0.2607614994049072], [-0.04470016062259674, 0.21042165160179138, 0.028883235529065132, -0.02436327375471592], [-0.040491729974746704, 0.014897647313773632, 0.028395971283316612, 0.27729088068008423], [-0.04019377753138542, 0.2096032202243805, 0.033941786736249924, -0.0063024405390024185], [-0.03600171208381653, 0.40422236919403076, 0.033815737813711166, -0.28808605670928955], [-0.02791726402938366, 0.20863492786884308, 0.028054017573595047, 0.015067328698933125], [-0.02374456636607647, 0.01312210876494646, 0.028355365619063377, 0.31646794080734253], [-0.023482123389840126, 0.20782893896102905, 0.03468472510576248, 0.032860469073057175], [-0.01932554505765438, 0.012227204628288746, 0.035341933369636536, 0.3362818658351898], [-0.019081000238656998, -0.1833794116973877, 0.04206756874918938, 0.6398969292640686], [-0.022748589515686035, 0.011131568811833858, 0.054865509271621704, 0.36075282096862793], [-0.022525956854224205, 0.2054324597120285, 0.062080565840005875, 0.0858624055981636], [-0.01841730810701847, 0.3996121287345886, 0.06379781663417816, -0.1866060346364975], [-0.010425065644085407, 0.20363815128803253, 0.06006569415330887, 0.12550072371959686], [-0.006352302618324757, 0.007709424011409283, 0.06257570534944534, 0.4365125000476837], [-0.00619811424985528, 0.20189234614372253, 0.07130596041679382, 0.16419346630573273], [-0.0021602672059088945, 0.005825924687087536, 0.07458982616662979, 0.4784919321537018], [-0.002043748740106821, 0.1998199224472046, 0.08415966480970383, 0.2102191001176834], [0.0019526499090716243, 0.3936440050601959, 0.08836404979228973, -0.05477425828576088], [0.009825530461966991, 0.19737347960472107, 0.08726856112480164, 0.26442813873291016], [0.013772999867796898, 0.3911484479904175, 0.09255712479352951, 0.0004961864906363189], [0.021595967933535576, 0.5848295092582703, 0.09256704896688461, -0.26160889863967896], [0.033292558044195175, 0.38851648569107056, 0.08733487129211426, 0.05877579376101494], [0.041062887758016586, 0.582284688949585, 0.08851038664579391, -0.20512497425079346], [0.05270858108997345, 0.3860158622264862, 0.08440788835287094, 0.11411397159099579], [0.06042889878153801, 0.5798332691192627, 0.08669016510248184, -0.15079066157341003], [0.07202556729316711, 0.7736138105392456, 0.083674356341362, -0.41491493582725525], [0.08749784529209137, 0.9674563407897949, 0.07537605613470078, -0.6800898313522339], [0.10684696584939957, 0.7713727951049805, 0.06177425757050514, -0.3646601140499115], [0.12227442115545273, 0.9655649065971375, 0.054481055587530136, -0.6372426152229309], [0.14158572256565094, 1.1598864793777466, 0.04173620417714119, -0.9122829437255859], [0.16478344798088074, 0.9642254710197449, 0.0234905444085598, -0.6067801713943481], [0.184067964553833, 1.1590112447738647, 0.011354941874742508, -0.8919726014137268], [0.20724818110466003, 0.9637371301651001, -0.006484510377049446, -0.5957419872283936], [0.22652292251586914, 1.1589492559432983, -0.018399350345134735, -0.8904604315757751], [0.24970191717147827, 1.3543158769607544, -0.036208558827638626, -1.1888699531555176], [0.27678823471069336, 1.1596815586090088, -0.05998595803976059, -0.9077527523040771], [0.29998186230659485, 1.3555619716644287, -0.07814101129770279, -1.2186702489852905], [0.32709309458732605, 1.5515995025634766, -0.10251442342996597, -1.53477942943573], [0.35812509059906006, 1.3578507900238037, -0.13321000337600708, -1.275768518447876], [0.38528209924697876, 1.1646552085876465, -0.15872538089752197, -1.0275905132293701], [0.4085752069950104, 0.9719610214233398, -0.1792771965265274, -0.7886521816253662], [0.4280144274234772, 0.7796945571899414, -0.19505023956298828, -0.557300329208374], [0.4436083137989044, 0.9769424796104431, -0.20619623363018036, -0.9045437574386597], [0.03709660843014717, 0.011757790111005306, -0.020455816760659218, -0.02227775938808918], [0.03733176365494728, -0.18306492269039154, -0.020901372656226158, 0.2638815641403198], [0.033670466393232346, -0.3778823912143707, -0.01562374085187912, 0.5498993992805481], [0.026112819090485573, -0.1825445145368576, -0.004625752568244934, 0.25233516097068787], [0.02246192842721939, -0.3776001036167145, 0.00042095035314559937, 0.5435554385185242], [0.014909926801919937, -0.18248407542705536, 0.01129205897450447, 0.2510051727294922], [0.011260244995355606, -0.3777654469013214, 0.016312163323163986, 0.5472283363342285], [0.003704936010763049, -0.18287642300128937, 0.02725672908127308, 0.259729266166687], [4.740770236821845e-05, -0.37837666273117065, 0.032451316714286804, 0.5608831644058228], [-0.00752012524753809, -0.5739386677742004, 0.04366897791624069, 0.8636107444763184], [-0.018998898565769196, -0.37943753600120544, 0.060941193252801895, 0.5849718451499939], [-0.026587650179862976, -0.18521979451179504, 0.07264062762260437, 0.3120916187763214], [-0.030292045325040817, 0.00879615917801857, 0.07888246327638626, 0.04317273944616318], [-0.030116122215986252, -0.18736311793327332, 0.07974591851234436, 0.35966411232948303], [-0.033863384276628494, 0.0065400125458836555, 0.08693920075893402, 0.0931541919708252], [-0.0337325856089592, 0.20031523704528809, 0.0888022854924202, -0.1708829253911972], [-0.02972627989947796, 0.004041898529976606, 0.08538462221622467, 0.14844058454036713], [-0.029645441100001335, 0.19784395396709442, 0.08835344016551971, -0.11613085865974426], [-0.02568856254220009, 0.39159613847732544, 0.08603081852197647, -0.37968340516090393], [-0.017856640741229057, 0.1953645646572113, 0.07843714952468872, -0.06116274744272232], [-0.013949348591268063, 0.38927939534187317, 0.07721389830112457, -0.32810378074645996], [-0.006163761019706726, 0.1931479573249817, 0.0706518217921257, -0.012104873545467854], [-0.0023008016869425774, -0.0029123681597411633, 0.07040972262620926, 0.3020062744617462], [-0.002359048929065466, 0.1911391168832779, 0.07644984871149063, 0.0323336198925972], [0.0014637334970757365, -0.004991173278540373, 0.07709652185440063, 0.34812411665916443], [0.001363910036161542, 0.1889543980360031, 0.08405900746583939, 0.08071386069059372], [0.0051429979503154755, -0.007265665102750063, 0.08567328006029129, 0.3986889719963074], [0.004997684620320797, -0.20349189639091492, 0.0936470627784729, 0.7171059250831604], [0.0009278468205593526, -0.009782165288925171, 0.10798917710781097, 0.4553065001964569], [0.0007322034798562527, -0.20625203847885132, 0.11709530651569366, 0.7799817323684692], [-0.003392837243154645, -0.012917831540107727, 0.13269494473934174, 0.5263137221336365], [-0.0036511938087642193, 0.1801118552684784, 0.14322121441364288, 0.2782125174999237], [-4.8956702812574804e-05, 0.3729311227798462, 0.14878547191619873, 0.03390814736485481], [0.007409665733575821, 0.565640926361084, 0.14946362376213074, -0.20838123559951782], [0.01872248388826847, 0.3687330186367035, 0.14529600739479065, 0.12746655941009521], [0.026097144931554794, 0.17186078429222107, 0.1478453427553177, 0.4622301757335663], [0.029534360393881798, 0.36461785435676575, 0.1570899486541748, 0.21955719590187073], [0.0368267185986042, 0.5571862459182739, 0.1614810824394226, -0.01974400505423546], [0.04797044396400452, 0.7496683597564697, 0.16108620166778564, -0.25744158029556274], [0.0629638135433197, 0.9421678781509399, 0.15593737363815308, -0.4952978193759918], [0.08180716633796692, 1.1347867250442505, 0.1460314244031906, -0.7350603938102722], [0.10450290143489838, 1.3276220560073853, 0.131330206990242, -0.9784536957740784], [0.1310553401708603, 1.131007194519043, 0.11176113784313202, -0.6475710272789001], [0.15367548167705536, 1.3244092464447021, 0.09880971163511276, -0.9030748009681702], [0.1801636666059494, 1.128097653388977, 0.08074822276830673, -0.5810409784317017], [0.2027256339788437, 0.9319427013397217, 0.0691273957490921, -0.26405298709869385], [0.22136448323726654, 1.1260133981704712, 0.06384634226560593, -0.5341564416885376], [0.24388474225997925, 0.9300543665885925, 0.05316321179270744, -0.22205878794193268], [0.2624858319759369, 1.124377727508545, 0.0487220361828804, -0.4975093901157379], [0.2849733829498291, 0.9286038875579834, 0.038771845400333405, -0.18987847864627838], [0.3035454750061035, 0.7329493165016174, 0.03497427701950073, 0.11477887630462646], [0.31820446252822876, 0.927553117275238, 0.03726985678076744, -0.16666799783706665], [0.33675551414489746, 0.7319180369377136, 0.03393649682402611, 0.13753563165664673], [0.3513938784599304, 0.5363268852233887, 0.036687206476926804, 0.4407288730144501], [0.3621204197406769, 0.3407054543495178, 0.04550178349018097, 0.7447471618652344], [0.3689345121383667, 0.1449860781431198, 0.06039672717452049, 1.051395297050476], [0.37183424830436707, 0.33925727009773254, 0.08142463117837906, 0.778265655040741], [0.37861940264701843, 0.5331708192825317, 0.0969899445772171, 0.5122714638710022], [0.38928282260894775, 0.726802408695221, 0.1072353795170784, 0.25165945291519165], [0.40381884574890137, 0.5303256511688232, 0.11226856708526611, 0.5761485695838928], [0.4144253730773926, 0.3338238298892975, 0.12379153817892075, 0.9019833207130432], [0.421101838350296, 0.527070939540863, 0.1418312042951584, 0.6506326794624329], [0.4316432774066925, 0.7199623584747314, 0.15484385192394257, 0.4057595729827881], [0.4460425078868866, 0.5230225920677185, 0.1629590541124344, 0.7429772615432739], [0.4565029740333557, 0.3260713815689087, 0.17781859636306763, 1.0821882486343384], [0.463024377822876, 0.12910570204257965, 0.19946235418319702, 1.424981713294983], [0.04156698286533356, -0.03860153630375862, 0.003960105124861002, 0.006779628340154886], [0.04079495370388031, 0.1564633995294571, 0.004095697775483131, -0.2846512198448181], [0.04392421990633011, 0.3515267074108124, -0.0015973264817148447, -0.5760395526885986], [0.050954755395650864, 0.15642717480659485, -0.013118118047714233, -0.2838602662086487], [0.05408329889178276, 0.3517337441444397, -0.018795322626829147, -0.5806515216827393], [0.06111797317862511, 0.5471139550209045, -0.030408354476094246, -0.8791955709457397], [0.0720602497458458, 0.35241806507110596, -0.047992266714572906, -0.5962254405021667], [0.07910861074924469, 0.5481776595115662, -0.05991677567362785, -0.9036310315132141], [0.09007216989994049, 0.353916198015213, -0.07798939943313599, -0.6303667426109314], [0.09715048968791962, 0.5500348210334778, -0.09059672802686691, -0.9465560913085938], [0.10815118998289108, 0.35624203085899353, -0.10952785611152649, -0.6836580634117126], [0.1152760237455368, 0.16279760003089905, -0.12320101261138916, -0.42736703157424927], [0.1185319796204567, -0.030383719131350517, -0.13174834847450256, -0.17592096328735352], [0.11792430281639099, -0.22339823842048645, -0.13526678085327148, 0.07246968150138855], [0.11345633864402771, -0.41634777188301086, -0.1338173747062683, 0.31960293650627136], [0.10512938350439072, -0.21959906816482544, -0.12742532789707184, -0.01210664864629507], [0.10073740035295486, -0.022901825606822968, -0.12766745686531067, -0.3421221375465393], [0.10027936846017838, -0.21599817276000977, -0.1345098912715912, -0.0922672376036644], [0.09595940262079239, -0.4089614152908325, -0.1363552361726761, 0.155136376619339], [0.0877801775932312, -0.6018943190574646, -0.13325251638889313, 0.4018852114677429], [0.07574228942394257, -0.4051589071750641, -0.1252148151397705, 0.07033777236938477], [0.06763911247253418, -0.2084849774837494, -0.12380805611610413, -0.2590804994106293], [0.06346940994262695, -0.40164196491241455, -0.12898966670036316, -0.007869413122534752], [0.055436570197343826, -0.5947007536888123, -0.12914705276489258, 0.2414950728416443], [0.04354255646467209, -0.7877640724182129, -0.12431715428829193, 0.49081459641456604], [0.02778727374970913, -0.5911279320716858, -0.11450085788965225, 0.16168144345283508], [0.01596471481025219, -0.3945688307285309, -0.11126723140478134, -0.16481631994247437], [0.008073339238762856, -0.5879366993904114, -0.11456355452537537, 0.09079672396183014], [-0.003685394302010536, -0.3913749158382416, -0.11274762451648712, -0.23572121560573578], [-0.011512892320752144, -0.1948377937078476, -0.11746204644441605, -0.5617327094078064], [-0.015409648418426514, -0.3881324529647827, -0.12869669497013092, -0.3082430958747864], [-0.023172298446297646, -0.5812082290649414, -0.134861558675766, -0.05875704064965248], [-0.03479646146297455, -0.774164617061615, -0.1360367089509964, 0.18852029740810394], [-0.050279755145311356, -0.9671046733856201, -0.13226629793643951, 0.43538498878479004], [-0.06962184607982635, -0.7703825831413269, -0.12355859577655792, 0.10410628467798233], [-0.0850294977426529, -0.9635371565818787, -0.12147647142410278, 0.35539543628692627], [-0.10430024564266205, -0.7669163346290588, -0.11436856538057327, 0.027011290192604065], [-0.11963856965303421, -0.9602282047271729, -0.11382833868265152, 0.2815336585044861], [-0.1388431340456009, -1.1535580158233643, -0.1081976667046547, 0.5362583994865417], [-0.16191428899765015, -1.3470056056976318, -0.09747249633073807, 0.7929848432540894], [-0.1888544112443924, -1.1506903171539307, -0.08161280304193497, 0.4712981581687927], [-0.21186821162700653, -1.3445703983306885, -0.07218683511018753, 0.7371827363967896], [-0.2387596219778061, -1.5386251211166382, -0.05744318291544914, 1.0063021183013916], [-0.26953211426734924, -1.732934832572937, -0.03731713816523552, 1.2804070711135864], [-0.30419081449508667, -1.5373578071594238, -0.011708997189998627, 0.9762770533561707], [-0.3349379897117615, -1.732320785522461, 0.00781654380261898, 1.2652591466903687], [-0.3695843815803528, -1.927541732788086, 0.03312172740697861, 1.5603796243667603], [-0.40813523530960083, -2.123044013977051, 0.06432931870222092, 1.863208293914795], [-0.4505960941314697, -2.3188090324401855, 0.1015934869647026, 2.1751482486724854], [-0.49697229266166687, -2.124811887741089, 0.14509645104408264, 1.9154701232910156], [-0.53946852684021, -1.9315199851989746, 0.18340584635734558, 1.671087622642517], [0.04889354482293129, 0.014676018618047237, 0.021171128377318382, 0.03500877320766449], [0.0491870641708374, -0.1807430386543274, 0.021871304139494896, 0.33429551124572754], [0.04557220637798309, 0.014060918241739273, 0.02855721488595009, 0.04858911782503128], [0.045853421092033386, -0.18145863711833954, 0.029528995975852013, 0.35014355182647705], [0.042224250733852386, 0.01323118805885315, 0.03653186932206154, 0.06691639125347137], [0.04248887300491333, -0.18239496648311615, 0.037870194762945175, 0.3708977997303009], [0.03884097561240196, 0.01216906774789095, 0.04528815299272537, 0.09039219468832016], [0.039084356278181076, 0.20661360025405884, 0.047095995396375656, -0.1876654028892517], [0.04321662709116936, 0.4010312259197235, 0.04334268718957901, -0.4651273488998413], [0.05123725160956383, 0.20532448589801788, 0.034040141850709915, -0.15910416841506958], [0.05534374341368675, 0.009732136502861977, 0.030858056619763374, 0.1441202461719513], [0.05553838610649109, -0.18581783771514893, 0.033740460872650146, 0.44637638330459595], [0.051822029054164886, -0.381400465965271, 0.04266798868775368, 0.7495011687278748], [0.044194020330905914, -0.18689221143722534, 0.057658012956380844, 0.4705449044704437], [0.040456175804138184, -0.38277918100357056, 0.067068912088871, 0.7808291912078857], [0.032800592482089996, -0.18864016234874725, 0.08268549293279648, 0.5099788308143616], [0.02902778796851635, -0.38482367992401123, 0.09288506954908371, 0.827530562877655], [0.021331313997507095, -0.19108615815639496, 0.10943568497896194, 0.5654459595680237], [0.017509590834379196, -0.38755953311920166, 0.12074460089206696, 0.8905029296875], [0.009758400730788708, -0.1942644566297531, 0.1385546624660492, 0.6380840539932251], [0.005873111542314291, -0.001318691880442202, 0.1513163447380066, 0.3920438587665558], [0.005846737418323755, 0.19136837124824524, 0.15915721654891968, 0.150633305311203], [0.009674104861915112, 0.38389578461647034, 0.16216988861560822, -0.08791292458772659], [0.017352020367980003, 0.1868657022714615, 0.16041162610054016, 0.25122368335723877], [0.021089335903525352, -0.010139930061995983, 0.16543610394001007, 0.5898972749710083], [0.020886536687612534, 0.18232645094394684, 0.17723403871059418, 0.3535560965538025], [0.024533065035939217, -0.01481450442224741, 0.18430516123771667, 0.6964696645736694], [0.024236775934696198, -0.21194903552532196, 0.19823455810546875, 1.0410429239273071]], "actions": [0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.04683857783675194, -0.1682308316230774, -0.04675131291151047, 0.3057065010070801], [-0.050203192979097366, -0.36265647411346436, -0.04063718020915985, 0.5832864046096802], [-0.05745632201433182, -0.16698946058750153, -0.02897145412862301, 0.2780841886997223], [-0.060796111822128296, -0.3616863787174225, -0.0234097708016634, 0.5614905953407288], [-0.06802984327077866, -0.55647212266922, -0.012179957702755928, 0.846707284450531], [-0.07915928214788437, -0.361186146736145, 0.004754188004881144, 0.5502192378044128], [-0.08638300746679306, -0.5563745498657227, 0.01575857400894165, 0.8443962931632996], [-0.09751049429178238, -0.36147114634513855, 0.03264649957418442, 0.5567103028297424], [-0.10473991930484772, -0.1668223738670349, 0.04378070309758186, 0.27448907494544983], [-0.10807636380195618, 0.02764846757054329, 0.04927048459649086, -0.004070250317454338], [-0.10752339661121368, 0.22203044593334198, 0.04918907955288887, -0.2808097302913666], [-0.10308279097080231, 0.026242611929774284, 0.043572887778282166, 0.026972571387887], [-0.10255793482065201, -0.1694762408733368, 0.04411233589053154, 0.3330785930156708], [-0.10594745725393295, 0.02499099262058735, 0.05077391117811203, 0.05462631210684776], [-0.10544764250516891, -0.17082083225250244, 0.05186643451452255, 0.3628866374492645], [-0.10886405408382416, 0.023527057841420174, 0.0591241680085659, 0.08699873834848404], [-0.10839351266622543, 0.21775387227535248, 0.06086414307355881, -0.18646003305912018], [-0.10403843969106674, 0.021816300228238106, 0.05713494122028351, 0.12478511780500412], [-0.10360211133956909, 0.21607515215873718, 0.05963064357638359, -0.14933915436267853], [-0.09928061068058014, 0.410294771194458, 0.05664386227726936, -0.4226297438144684], [-0.09107471257448196, 0.6045703887939453, 0.048191267997026443, -0.6969314217567444], [-0.07898330688476562, 0.4088144600391388, 0.03425263985991478, -0.38947564363479614], [-0.07080701738595963, 0.21322350203990936, 0.02646312490105629, -0.0861930176615715], [-0.06654255092144012, 0.017732415348291397, 0.02473926544189453, 0.21472018957138062], [-0.06618789583444595, 0.21249210834503174, 0.029033668339252472, -0.07005734741687775], [-0.06193805858492851, 0.40718603134155273, 0.027632521465420723, -0.35344046354293823], [-0.05379433557391167, 0.2116822898387909, 0.02056371234357357, -0.05217386409640312], [-0.04956069216132164, 0.01627160608768463, 0.019520234316587448, 0.246925488114357], [-0.049235258251428604, 0.21110941469669342, 0.0244587454944849, -0.03953694924712181], [-0.04501307010650635, 0.01564541459083557, 0.02366800606250763, 0.2607614994049072], [-0.04470016062259674, 0.21042165160179138, 0.028883235529065132, -0.02436327375471592], [-0.040491729974746704, 0.014897647313773632, 0.028395971283316612, 0.27729088068008423], [-0.04019377753138542, 0.2096032202243805, 0.033941786736249924, -0.0063024405390024185], [-0.03600171208381653, 0.40422236919403076, 0.033815737813711166, -0.28808605670928955], [-0.02791726402938366, 0.20863492786884308, 0.028054017573595047, 0.015067328698933125], [-0.02374456636607647, 0.01312210876494646, 0.028355365619063377, 0.31646794080734253], [-0.023482123389840126, 0.20782893896102905, 0.03468472510576248, 0.032860469073057175], [-0.01932554505765438, 0.012227204628288746, 0.035341933369636536, 0.3362818658351898], [-0.019081000238656998, -0.1833794116973877, 0.04206756874918938, 0.6398969292640686], [-0.022748589515686035, 0.011131568811833858, 0.054865509271621704, 0.36075282096862793], [-0.022525956854224205, 0.2054324597120285, 0.062080565840005875, 0.0858624055981636], [-0.01841730810701847, 0.3996121287345886, 0.06379781663417816, -0.1866060346364975], [-0.010425065644085407, 0.20363815128803253, 0.06006569415330887, 0.12550072371959686], [-0.006352302618324757, 0.007709424011409283, 0.06257570534944534, 0.4365125000476837], [-0.00619811424985528, 0.20189234614372253, 0.07130596041679382, 0.16419346630573273], [-0.0021602672059088945, 0.005825924687087536, 0.07458982616662979, 0.4784919321537018], [-0.002043748740106821, 0.1998199224472046, 0.08415966480970383, 0.2102191001176834], [0.0019526499090716243, 0.3936440050601959, 0.08836404979228973, -0.05477425828576088], [0.009825530461966991, 0.19737347960472107, 0.08726856112480164, 0.26442813873291016], [0.013772999867796898, 0.3911484479904175, 0.09255712479352951, 0.0004961864906363189], [0.021595967933535576, 0.5848295092582703, 0.09256704896688461, -0.26160889863967896], [0.033292558044195175, 0.38851648569107056, 0.08733487129211426, 0.05877579376101494], [0.041062887758016586, 0.582284688949585, 0.08851038664579391, -0.20512497425079346], [0.05270858108997345, 0.3860158622264862, 0.08440788835287094, 0.11411397159099579], [0.06042889878153801, 0.5798332691192627, 0.08669016510248184, -0.15079066157341003], [0.07202556729316711, 0.7736138105392456, 0.083674356341362, -0.41491493582725525], [0.08749784529209137, 0.9674563407897949, 0.07537605613470078, -0.6800898313522339], [0.10684696584939957, 0.7713727951049805, 0.06177425757050514, -0.3646601140499115], [0.12227442115545273, 0.9655649065971375, 0.054481055587530136, -0.6372426152229309], [0.14158572256565094, 1.1598864793777466, 0.04173620417714119, -0.9122829437255859], [0.16478344798088074, 0.9642254710197449, 0.0234905444085598, -0.6067801713943481], [0.184067964553833, 1.1590112447738647, 0.011354941874742508, -0.8919726014137268], [0.20724818110466003, 0.9637371301651001, -0.006484510377049446, -0.5957419872283936], [0.22652292251586914, 1.1589492559432983, -0.018399350345134735, -0.8904604315757751], [0.24970191717147827, 1.3543158769607544, -0.036208558827638626, -1.1888699531555176], [0.27678823471069336, 1.1596815586090088, -0.05998595803976059, -0.9077527523040771], [0.29998186230659485, 1.3555619716644287, -0.07814101129770279, -1.2186702489852905], [0.32709309458732605, 1.5515995025634766, -0.10251442342996597, -1.53477942943573], [0.35812509059906006, 1.3578507900238037, -0.13321000337600708, -1.275768518447876], [0.38528209924697876, 1.1646552085876465, -0.15872538089752197, -1.0275905132293701], [0.4085752069950104, 0.9719610214233398, -0.1792771965265274, -0.7886521816253662], [0.4280144274234772, 0.7796945571899414, -0.19505023956298828, -0.557300329208374], [0.4436083137989044, 0.9769424796104431, -0.20619623363018036, -0.9045437574386597], [0.4631471633911133, 1.1741701364517212, -0.22428710758686066, -1.2543113231658936], [0.03733176365494728, -0.18306492269039154, -0.020901372656226158, 0.2638815641403198], [0.033670466393232346, -0.3778823912143707, -0.01562374085187912, 0.5498993992805481], [0.026112819090485573, -0.1825445145368576, -0.004625752568244934, 0.25233516097068787], [0.02246192842721939, -0.3776001036167145, 0.00042095035314559937, 0.5435554385185242], [0.014909926801919937, -0.18248407542705536, 0.01129205897450447, 0.2510051727294922], [0.011260244995355606, -0.3777654469013214, 0.016312163323163986, 0.5472283363342285], [0.003704936010763049, -0.18287642300128937, 0.02725672908127308, 0.259729266166687], [4.740770236821845e-05, -0.37837666273117065, 0.032451316714286804, 0.5608831644058228], [-0.00752012524753809, -0.5739386677742004, 0.04366897791624069, 0.8636107444763184], [-0.018998898565769196, -0.37943753600120544, 0.060941193252801895, 0.5849718451499939], [-0.026587650179862976, -0.18521979451179504, 0.07264062762260437, 0.3120916187763214], [-0.030292045325040817, 0.00879615917801857, 0.07888246327638626, 0.04317273944616318], [-0.030116122215986252, -0.18736311793327332, 0.07974591851234436, 0.35966411232948303], [-0.033863384276628494, 0.0065400125458836555, 0.08693920075893402, 0.0931541919708252], [-0.0337325856089592, 0.20031523704528809, 0.0888022854924202, -0.1708829253911972], [-0.02972627989947796, 0.004041898529976606, 0.08538462221622467, 0.14844058454036713], [-0.029645441100001335, 0.19784395396709442, 0.08835344016551971, -0.11613085865974426], [-0.02568856254220009, 0.39159613847732544, 0.08603081852197647, -0.37968340516090393], [-0.017856640741229057, 0.1953645646572113, 0.07843714952468872, -0.06116274744272232], [-0.013949348591268063, 0.38927939534187317, 0.07721389830112457, -0.32810378074645996], [-0.006163761019706726, 0.1931479573249817, 0.0706518217921257, -0.012104873545467854], [-0.0023008016869425774, -0.0029123681597411633, 0.07040972262620926, 0.3020062744617462], [-0.002359048929065466, 0.1911391168832779, 0.07644984871149063, 0.0323336198925972], [0.0014637334970757365, -0.004991173278540373, 0.07709652185440063, 0.34812411665916443], [0.001363910036161542, 0.1889543980360031, 0.08405900746583939, 0.08071386069059372], [0.0051429979503154755, -0.007265665102750063, 0.08567328006029129, 0.3986889719963074], [0.004997684620320797, -0.20349189639091492, 0.0936470627784729, 0.7171059250831604], [0.0009278468205593526, -0.009782165288925171, 0.10798917710781097, 0.4553065001964569], [0.0007322034798562527, -0.20625203847885132, 0.11709530651569366, 0.7799817323684692], [-0.003392837243154645, -0.012917831540107727, 0.13269494473934174, 0.5263137221336365], [-0.0036511938087642193, 0.1801118552684784, 0.14322121441364288, 0.2782125174999237], [-4.8956702812574804e-05, 0.3729311227798462, 0.14878547191619873, 0.03390814736485481], [0.007409665733575821, 0.565640926361084, 0.14946362376213074, -0.20838123559951782], [0.01872248388826847, 0.3687330186367035, 0.14529600739479065, 0.12746655941009521], [0.026097144931554794, 0.17186078429222107, 0.1478453427553177, 0.4622301757335663], [0.029534360393881798, 0.36461785435676575, 0.1570899486541748, 0.21955719590187073], [0.0368267185986042, 0.5571862459182739, 0.1614810824394226, -0.01974400505423546], [0.04797044396400452, 0.7496683597564697, 0.16108620166778564, -0.25744158029556274], [0.0629638135433197, 0.9421678781509399, 0.15593737363815308, -0.4952978193759918], [0.08180716633796692, 1.1347867250442505, 0.1460314244031906, -0.7350603938102722], [0.10450290143489838, 1.3276220560073853, 0.131330206990242, -0.9784536957740784], [0.1310553401708603, 1.131007194519043, 0.11176113784313202, -0.6475710272789001], [0.15367548167705536, 1.3244092464447021, 0.09880971163511276, -0.9030748009681702], [0.1801636666059494, 1.128097653388977, 0.08074822276830673, -0.5810409784317017], [0.2027256339788437, 0.9319427013397217, 0.0691273957490921, -0.26405298709869385], [0.22136448323726654, 1.1260133981704712, 0.06384634226560593, -0.5341564416885376], [0.24388474225997925, 0.9300543665885925, 0.05316321179270744, -0.22205878794193268], [0.2624858319759369, 1.124377727508545, 0.0487220361828804, -0.4975093901157379], [0.2849733829498291, 0.9286038875579834, 0.038771845400333405, -0.18987847864627838], [0.3035454750061035, 0.7329493165016174, 0.03497427701950073, 0.11477887630462646], [0.31820446252822876, 0.927553117275238, 0.03726985678076744, -0.16666799783706665], [0.33675551414489746, 0.7319180369377136, 0.03393649682402611, 0.13753563165664673], [0.3513938784599304, 0.5363268852233887, 0.036687206476926804, 0.4407288730144501], [0.3621204197406769, 0.3407054543495178, 0.04550178349018097, 0.7447471618652344], [0.3689345121383667, 0.1449860781431198, 0.06039672717452049, 1.051395297050476], [0.37183424830436707, 0.33925727009773254, 0.08142463117837906, 0.778265655040741], [0.37861940264701843, 0.5331708192825317, 0.0969899445772171, 0.5122714638710022], [0.38928282260894775, 0.726802408695221, 0.1072353795170784, 0.25165945291519165], [0.40381884574890137, 0.5303256511688232, 0.11226856708526611, 0.5761485695838928], [0.4144253730773926, 0.3338238298892975, 0.12379153817892075, 0.9019833207130432], [0.421101838350296, 0.527070939540863, 0.1418312042951584, 0.6506326794624329], [0.4316432774066925, 0.7199623584747314, 0.15484385192394257, 0.4057595729827881], [0.4460425078868866, 0.5230225920677185, 0.1629590541124344, 0.7429772615432739], [0.4565029740333557, 0.3260713815689087, 0.17781859636306763, 1.0821882486343384], [0.463024377822876, 0.12910570204257965, 0.19946235418319702, 1.424981713294983], [0.4656065106391907, 0.3212828040122986, 0.22796198725700378, 1.2006852626800537], [0.04079495370388031, 0.1564633995294571, 0.004095697775483131, -0.2846512198448181], [0.04392421990633011, 0.3515267074108124, -0.0015973264817148447, -0.5760395526885986], [0.050954755395650864, 0.15642717480659485, -0.013118118047714233, -0.2838602662086487], [0.05408329889178276, 0.3517337441444397, -0.018795322626829147, -0.5806515216827393], [0.06111797317862511, 0.5471139550209045, -0.030408354476094246, -0.8791955709457397], [0.0720602497458458, 0.35241806507110596, -0.047992266714572906, -0.5962254405021667], [0.07910861074924469, 0.5481776595115662, -0.05991677567362785, -0.9036310315132141], [0.09007216989994049, 0.353916198015213, -0.07798939943313599, -0.6303667426109314], [0.09715048968791962, 0.5500348210334778, -0.09059672802686691, -0.9465560913085938], [0.10815118998289108, 0.35624203085899353, -0.10952785611152649, -0.6836580634117126], [0.1152760237455368, 0.16279760003089905, -0.12320101261138916, -0.42736703157424927], [0.1185319796204567, -0.030383719131350517, -0.13174834847450256, -0.17592096328735352], [0.11792430281639099, -0.22339823842048645, -0.13526678085327148, 0.07246968150138855], [0.11345633864402771, -0.41634777188301086, -0.1338173747062683, 0.31960293650627136], [0.10512938350439072, -0.21959906816482544, -0.12742532789707184, -0.01210664864629507], [0.10073740035295486, -0.022901825606822968, -0.12766745686531067, -0.3421221375465393], [0.10027936846017838, -0.21599817276000977, -0.1345098912715912, -0.0922672376036644], [0.09595940262079239, -0.4089614152908325, -0.1363552361726761, 0.155136376619339], [0.0877801775932312, -0.6018943190574646, -0.13325251638889313, 0.4018852114677429], [0.07574228942394257, -0.4051589071750641, -0.1252148151397705, 0.07033777236938477], [0.06763911247253418, -0.2084849774837494, -0.12380805611610413, -0.2590804994106293], [0.06346940994262695, -0.40164196491241455, -0.12898966670036316, -0.007869413122534752], [0.055436570197343826, -0.5947007536888123, -0.12914705276489258, 0.2414950728416443], [0.04354255646467209, -0.7877640724182129, -0.12431715428829193, 0.49081459641456604], [0.02778727374970913, -0.5911279320716858, -0.11450085788965225, 0.16168144345283508], [0.01596471481025219, -0.3945688307285309, -0.11126723140478134, -0.16481631994247437], [0.008073339238762856, -0.5879366993904114, -0.11456355452537537, 0.09079672396183014], [-0.003685394302010536, -0.3913749158382416, -0.11274762451648712, -0.23572121560573578], [-0.011512892320752144, -0.1948377937078476, -0.11746204644441605, -0.5617327094078064], [-0.015409648418426514, -0.3881324529647827, -0.12869669497013092, -0.3082430958747864], [-0.023172298446297646, -0.5812082290649414, -0.134861558675766, -0.05875704064965248], [-0.03479646146297455, -0.774164617061615, -0.1360367089509964, 0.18852029740810394], [-0.050279755145311356, -0.9671046733856201, -0.13226629793643951, 0.43538498878479004], [-0.06962184607982635, -0.7703825831413269, -0.12355859577655792, 0.10410628467798233], [-0.0850294977426529, -0.9635371565818787, -0.12147647142410278, 0.35539543628692627], [-0.10430024564266205, -0.7669163346290588, -0.11436856538057327, 0.027011290192604065], [-0.11963856965303421, -0.9602282047271729, -0.11382833868265152, 0.2815336585044861], [-0.1388431340456009, -1.1535580158233643, -0.1081976667046547, 0.5362583994865417], [-0.16191428899765015, -1.3470056056976318, -0.09747249633073807, 0.7929848432540894], [-0.1888544112443924, -1.1506903171539307, -0.08161280304193497, 0.4712981581687927], [-0.21186821162700653, -1.3445703983306885, -0.07218683511018753, 0.7371827363967896], [-0.2387596219778061, -1.5386251211166382, -0.05744318291544914, 1.0063021183013916], [-0.26953211426734924, -1.732934832572937, -0.03731713816523552, 1.2804070711135864], [-0.30419081449508667, -1.5373578071594238, -0.011708997189998627, 0.9762770533561707], [-0.3349379897117615, -1.732320785522461, 0.00781654380261898, 1.2652591466903687], [-0.3695843815803528, -1.927541732788086, 0.03312172740697861, 1.5603796243667603], [-0.40813523530960083, -2.123044013977051, 0.06432931870222092, 1.863208293914795], [-0.4505960941314697, -2.3188090324401855, 0.1015934869647026, 2.1751482486724854], [-0.49697229266166687, -2.124811887741089, 0.14509645104408264, 1.9154701232910156], [-0.53946852684021, -1.9315199851989746, 0.18340584635734558, 1.671087622642517], [-0.5780989527702332, -1.7389415502548218, 0.2168276011943817, 1.4406843185424805], [0.0491870641708374, -0.1807430386543274, 0.021871304139494896, 0.33429551124572754], [0.04557220637798309, 0.014060918241739273, 0.02855721488595009, 0.04858911782503128], [0.045853421092033386, -0.18145863711833954, 0.029528995975852013, 0.35014355182647705], [0.042224250733852386, 0.01323118805885315, 0.03653186932206154, 0.06691639125347137], [0.04248887300491333, -0.18239496648311615, 0.037870194762945175, 0.3708977997303009], [0.03884097561240196, 0.01216906774789095, 0.04528815299272537, 0.09039219468832016], [0.039084356278181076, 0.20661360025405884, 0.047095995396375656, -0.1876654028892517], [0.04321662709116936, 0.4010312259197235, 0.04334268718957901, -0.4651273488998413], [0.05123725160956383, 0.20532448589801788, 0.034040141850709915, -0.15910416841506958], [0.05534374341368675, 0.009732136502861977, 0.030858056619763374, 0.1441202461719513], [0.05553838610649109, -0.18581783771514893, 0.033740460872650146, 0.44637638330459595], [0.051822029054164886, -0.381400465965271, 0.04266798868775368, 0.7495011687278748], [0.044194020330905914, -0.18689221143722534, 0.057658012956380844, 0.4705449044704437], [0.040456175804138184, -0.38277918100357056, 0.067068912088871, 0.7808291912078857], [0.032800592482089996, -0.18864016234874725, 0.08268549293279648, 0.5099788308143616], [0.02902778796851635, -0.38482367992401123, 0.09288506954908371, 0.827530562877655], [0.021331313997507095, -0.19108615815639496, 0.10943568497896194, 0.5654459595680237], [0.017509590834379196, -0.38755953311920166, 0.12074460089206696, 0.8905029296875], [0.009758400730788708, -0.1942644566297531, 0.1385546624660492, 0.6380840539932251], [0.005873111542314291, -0.001318691880442202, 0.1513163447380066, 0.3920438587665558], [0.005846737418323755, 0.19136837124824524, 0.15915721654891968, 0.150633305311203], [0.009674104861915112, 0.38389578461647034, 0.16216988861560822, -0.08791292458772659], [0.017352020367980003, 0.1868657022714615, 0.16041162610054016, 0.25122368335723877], [0.021089335903525352, -0.010139930061995983, 0.16543610394001007, 0.5898972749710083], [0.020886536687612534, 0.18232645094394684, 0.17723403871059418, 0.3535560965538025], [0.024533065035939217, -0.01481450442224741, 0.18430516123771667, 0.6964696645736694], [0.024236775934696198, -0.21194903552532196, 0.19823455810546875, 1.0410429239273071], [0.019997794181108475, -0.019932851195335388, 0.2190554141998291, 0.816559374332428]], "action_prob": [0.49751731753349304, 0.3850826025009155, 0.6501398086547852, 0.38849136233329773, 0.3493909239768982, 0.6494950652122498, 0.3473324775695801, 0.6500719785690308, 0.6553202271461487, 0.6298614144325256, 0.5294822454452515, 0.5946071147918701, 0.45607849955558777, 0.6421706676483154, 0.4384501576423645, 0.6481589078903198, 0.5806140899658203, 0.5496326684951782, 0.5962029099464417, 0.46862655878067017, 0.376852422952652, 0.6485322713851929, 0.6211353540420532, 0.5134183764457703, 0.6172553896903992, 0.49601081013679504, 0.6146604418754578, 0.49879828095436096, 0.6244204640388489, 0.49077165126800537, 0.6287561655044556, 0.4811129570007324, 0.6335479617118835, 0.5303288102149963, 0.5951328873634338, 0.4617004096508026, 0.6409788131713867, 0.4502451717853546, 0.354518860578537, 0.6587651968002319, 0.6521772742271423, 0.5852561593055725, 0.5441438555717468, 0.39957645535469055, 0.6601212024688721, 0.38247373700141907, 0.6634414792060852, 0.6342549920082092, 0.46669870615005493, 0.6469289660453796, 0.5623918175697327, 0.5599040389060974, 0.5862943530082703, 0.5369412302970886, 0.6065447330474854, 0.4876886010169983, 0.3912920355796814, 0.6462460160255432, 0.39849957823753357, 0.35437899827957153, 0.655035138130188, 0.35292091965675354, 0.6564863920211792, 0.3498871326446533, 0.3422180712223053, 0.6523789167404175, 0.3411029875278473, 0.3488388955593109, 0.6404669284820557, 0.6482043266296387, 0.6563048362731934, 0.6638348698616028, 0.33171507716178894, 0.3402884900569916, 0.5303375720977783, 0.4017045497894287, 0.6465060114860535, 0.400489866733551, 0.6478197574615479, 0.3957825005054474, 0.649712860584259, 0.3879881501197815, 0.34807735681533813, 0.6486108303070068, 0.6549170017242432, 0.6368399262428284, 0.44626548886299133, 0.6463454961776733, 0.581758439540863, 0.5436144471168518, 0.6042882800102234, 0.4853544533252716, 0.6138514876365662, 0.5111446380615234, 0.6014788150787354, 0.46568307280540466, 0.6426345109939575, 0.44012680649757385, 0.6511307954788208, 0.41441774368286133, 0.3420797884464264, 0.6576463580131531, 0.3359447717666626, 0.655591607093811, 0.667596697807312, 0.658015787601471, 0.5964012742042542, 0.5150538086891174, 0.37117794156074524, 0.6732035279273987, 0.6541933417320251, 0.5817244648933411, 0.47382959723472595, 0.39480265974998474, 0.35896122455596924, 0.6527314186096191, 0.36363527178764343, 0.6531931161880493, 0.6325517892837524, 0.44049400091171265, 0.6288090944290161, 0.4493938386440277, 0.6261550188064575, 0.5451462864875793, 0.5807952284812927, 0.5388798713684082, 0.41409358382225037, 0.34125739336013794, 0.3304530680179596, 0.6539484858512878, 0.6703063249588013, 0.6704487800598145, 0.3659501373767853, 0.3257031738758087, 0.6681020855903625, 0.6776671409606934, 0.33395111560821533, 0.3214609920978546, 0.3378676176071167, 0.6378632187843323, 0.4899478256702423, 0.37509530782699585, 0.6554974317550659, 0.3710494935512543, 0.3431411683559418, 0.6499674916267395, 0.34105944633483887, 0.6489979028701782, 0.33968544006347656, 0.646772563457489, 0.660186231136322, 0.6655510067939758, 0.6407602429389954, 0.552982747554779, 0.5621236562728882, 0.4086664319038391, 0.6667602062225342, 0.6251549124717712, 0.5202775001525879, 0.5838310122489929, 0.44071030616760254, 0.6619765162467957, 0.596717119216919, 0.48121345043182373, 0.6053286790847778, 0.485895037651062, 0.6432856321334839, 0.4513615667819977, 0.34165719151496887, 0.6769042611122131, 0.6710812449455261, 0.6175516843795776, 0.5126745700836182, 0.583163321018219, 0.5461490750312805, 0.5600804090499878, 0.575144350528717, 0.46499133110046387, 0.38886910676956177, 0.6443098187446594, 0.39695098996162415, 0.35707443952560425, 0.34463194012641907, 0.6559363007545471, 0.34257644414901733, 0.34294307231903076, 0.34847962856292725, 0.35603561997413635, 0.6357028484344482, 0.6406564116477966, 0.6458765268325806, 0.48276323080062866, 0.6276708841323853, 0.47180476784706116, 0.632698118686676, 0.45825111865997314, 0.638174831867218, 0.5577548742294312, 0.42545169591903687, 0.641671359539032, 0.5669139623641968, 0.42294180393218994, 0.35253384709358215, 0.6521002054214478, 0.3474331498146057, 0.6517812013626099, 0.3427512049674988, 0.6503546833992004, 0.33961760997772217, 0.6474987268447876, 0.6610761284828186, 0.6638162136077881, 0.6315733790397644, 0.4603675901889801, 0.3451939523220062, 0.6682456731796265, 0.3302273452281952, 0.334471732378006, 0.6412723660469055], "advantages": [41.65803146362305, 41.48064422607422, 41.523128509521484, 40.50852584838867, 40.49465560913086, 40.63951110839844, 39.266300201416016, 39.34459686279297, 37.93157196044922, 36.7945556640625, 35.960533142089844, 35.414093017578125, 34.76123809814453, 34.352012634277344, 33.47389602661133, 33.058990478515625, 32.15245819091797, 31.498376846313477, 30.870059967041016, 30.189558029174805, 29.725603103637695, 29.465221405029297, 28.531509399414062, 27.769805908203125, 27.196937561035156, 26.483352661132812, 25.991905212402344, 25.233213424682617, 24.656431198120117, 23.909223556518555, 23.320674896240234, 22.54953384399414, 21.9495906829834, 21.153366088867188, 20.560680389404297, 19.780378341674805, 19.169132232666016, 18.331207275390625, 17.70636558532715, 17.247262954711914, 16.150259017944336, 15.251869201660156, 14.518842697143555, 13.715744972229004, 13.057730674743652, 12.112793922424316, 11.443036079406738, 10.474571228027344, 9.640202522277832, 8.836673736572266, 7.974212646484375, 7.212347984313965, 6.310791492462158, 5.520359992980957, 4.624729633331299, 3.805880546569824, 3.0686452388763428, 2.419703245162964, 1.3604398965835571, 0.7019262909889221, 0.15662771463394165, -0.9769958853721619, -1.4944566488265991, -2.628200054168701, -3.098283529281616, -3.386643648147583, -4.555391311645508, -4.707739353179932, -4.651360511779785, -5.670603275299072, -6.633082389831543, -7.528431415557861, -8.341958999633789, -8.078737258911133, 38.49376678466797, 38.20043182373047, 38.14195251464844, 37.0303955078125, 36.918190002441406, 35.76642990112305, 35.607933044433594, 34.414554595947266, 34.217369079589844, 34.1902961730957, 32.6371955871582, 31.35661506652832, 30.37605857849121, 29.876379013061523, 28.866661071777344, 28.116722106933594, 27.418350219726562, 26.638710021972656, 26.07065200805664, 25.22563362121582, 24.633155822753906, 23.82146644592285, 23.20148468017578, 22.356834411621094, 21.740259170532227, 20.868690490722656, 20.253459930419922, 19.796388626098633, 18.697465896606445, 18.217697143554688, 17.118074417114258, 16.182405471801758, 15.362748146057129, 14.626677513122559, 13.813651084899902, 13.093217849731445, 12.23669147491455, 11.44589614868164, 10.703195571899414, 10.003390312194824, 9.350461959838867, 8.755293846130371, 7.743400573730469, 7.1404008865356445, 6.14049768447876, 5.203132629394531, 4.512016773223877, 3.569718360900879, 2.8661201000213623, 1.9149835109710693, 1.0103927850723267, 0.21499355137348175, -0.7043094038963318, -1.582684874534607, -2.420823335647583, -3.2151551246643066, -4.2706708908081055, -5.263055801391602, -6.211982727050781, -7.1441168785095215, -8.044031143188477, -9.079401969909668, -10.079938888549805, -11.041842460632324, -11.97989273071289, -12.89201831817627, 30.372936248779297, 29.86773681640625, 29.73341178894043, 28.864198684692383, 28.791879653930664, 29.0379581451416, 28.167205810546875, 28.54501724243164, 27.82742691040039, 28.342004776000977, 27.839235305786133, 27.482213973999023, 27.314762115478516, 27.346899032592773, 27.51485824584961, 27.04292869567871, 27.015687942504883, 27.033710479736328, 27.140846252441406, 27.2159423828125, 26.693336486816406, 26.45025062561035, 26.449596405029297, 26.38461685180664, 26.148164749145508, 25.605182647705078, 25.178022384643555, 24.94760513305664, 24.529586791992188, 24.174556732177734, 24.09464454650879, 23.883726119995117, 23.48130989074707, 22.847679138183594, 22.41897201538086, 21.71054458618164, 21.234159469604492, 20.473291397094727, 19.493919372558594, 18.31321144104004, 17.763538360595703, 16.48760986328125, 15.047924041748047, 13.480138778686523, 12.596384048461914, 10.912415504455566, 9.159485816955566, 7.3671159744262695, 5.556756019592285, 3.9105136394500732, 2.0555319786071777, 13.720742225646973, 13.119091987609863, 12.02326774597168, 11.400839805603027, 10.267521858215332, 9.626664161682129, 8.455345153808594, 7.579642295837402, 6.976961612701416, 5.880390167236328, 5.008805274963379, 4.366434097290039, 3.9232068061828613, 2.365817070007324, 1.8758946657180786, 0.2978225648403168, -0.23322327435016632, -1.8186240196228027, -2.3872029781341553, -3.9648239612579346, -5.314981460571289, -6.48883581161499, -7.536246299743652, -8.551626205444336, -9.446617126464844, -10.645462989807129, -11.545631408691406, -12.352807998657227], "value_targets": [52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [365965731, 365965731, 365965731, 365965731, 365965731, 365965731, 365965731, 365965731, 365965731, 365965731, 365965731, 365965731, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 53913026, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 731271860, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 1708140011, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 828827825, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1430218404, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551, 1629283551], "obs": [[0.04564739763736725, 0.026045044884085655, 0.02006727084517479, -0.02303975634276867], [0.04616829752922058, -0.16935884952545166, 0.01960647664964199, 0.2759064733982086], [0.04278112202882767, -0.36475497484207153, 0.025124605745077133, 0.5747082233428955], [0.035486020147800446, -0.560219943523407, 0.03661876916885376, 0.8751990795135498], [0.02428162284195423, -0.3656144440174103, 0.05412274971604347, 0.594249963760376], [0.016969332471489906, -0.17129014432430267, 0.06600774824619293, 0.3190946578979492], [0.013543530367314816, -0.3672870397567749, 0.0723896473646164, 0.6318419575691223], [0.006197789218276739, -0.5633403658866882, 0.08502648770809174, 0.9464157223701477], [-0.005069017875939608, -0.759498119354248, 0.10395479947328568, 1.2645570039749146], [-0.020258979871869087, -0.9557836651802063, 0.12924593687057495, 1.587903618812561], [-0.03937465324997902, -1.1521828174591064, 0.16100400686264038, 1.9179378747940063], [-0.06241830810904503, -0.9591179490089417, 0.19936276972293854, 1.6792168617248535], [0.03267543762922287, 0.022108225151896477, 0.026787562295794487, -0.023095007985830307], [0.03311759978532791, -0.17338743805885315, 0.026325661689043045, 0.27791789174079895], [0.029649851843714714, -0.3688748776912689, 0.03188401833176613, 0.5787862539291382], [0.02227235585451126, -0.1742139309644699, 0.04345974698662758, 0.29631558060646057], [0.01878807693719864, 0.02026239223778248, 0.04938605800271034, 0.017649689689278603], [0.01919332519173622, -0.17553174495697021, 0.0497390516102314, 0.3254964053630829], [0.01568268984556198, 0.018848029896616936, 0.0562489777803421, 0.048904597759246826], [0.016059650108218193, -0.17703348398208618, 0.05722707137465477, 0.35879063606262207], [0.012518980540335178, 0.01723022200167179, 0.06440288573503494, 0.08468768745660782], [0.0128635847941041, 0.21137270331382751, 0.06609664112329483, -0.18700094521045685], [0.017091039568185806, 0.01537040714174509, 0.0623566210269928, 0.12577879428863525], [0.017398446798324585, 0.20954617857933044, 0.06487219780683517, -0.14659781754016876], [0.021589370444417, 0.40368202328681946, 0.06194023787975311, -0.4181300103664398], [0.02966301143169403, 0.20773953199386597, 0.053577639162540436, -0.10658111423254013], [0.033817801624536514, 0.011892363429069519, 0.05144601687788963, 0.20251239836215973], [0.03405565023422241, 0.20624226331710815, 0.05549626424908638, -0.07350828498601913], [0.03818049654364586, 0.4005264937877655, 0.05402609705924988, -0.3481784760951996], [0.0461910255253315, 0.5948400497436523, 0.047062527388334274, -0.6233475804328918], [0.058087825775146484, 0.7892743945121765, 0.03459557518362999, -0.900844931602478], [0.07387331128120422, 0.5937012434005737, 0.01657867804169655, -0.5974915623664856], [0.08574733883142471, 0.39835125207901, 0.004628846421837807, -0.2996329963207245], [0.09371436387300491, 0.20316362380981445, -0.0013638132950291038, -0.005493819713592529], [0.09777763485908508, 0.39830511808395386, -0.0014736896846443415, -0.2986067235469818], [0.10574373602867126, 0.5934480428695679, -0.007445824332535267, -0.5917540788650513], [0.11761269718408585, 0.788673460483551, -0.01928090490400791, -0.8867731094360352], [0.13338616490364075, 0.9840517044067383, -0.0370163694024086, -1.185454249382019], [0.1530672013759613, 0.7894289493560791, -0.06072545424103737, -0.9046003818511963], [0.16885578632354736, 0.5951796174049377, -0.0788174644112587, -0.631605863571167], [0.18075937032699585, 0.7913076281547546, -0.09144958108663559, -0.9480329155921936], [0.1965855211019516, 0.5975281000137329, -0.11041023582220078, -0.6854268908500671], [0.2085360884666443, 0.4040980935096741, -0.12411877512931824, -0.42944326996803284], [0.21661804616451263, 0.21093229949474335, -0.1327076405286789, -0.17832088470458984], [0.22083669900894165, 0.017934445291757584, -0.136274054646492, 0.0697287991642952], [0.22119538486003876, -0.17499734461307526, -0.1348794847726822, 0.31650280952453613], [0.2176954448223114, 0.021762125194072723, -0.12854942679405212, -0.015490245074033737], [0.2181306779384613, -0.1713043451309204, -0.1288592368364334, 0.23403042554855347], [0.21470458805561066, -0.36437225341796875, -0.12417861819267273, 0.48345136642456055], [0.20741714537143707, -0.5575429797172546, -0.11450959742069244, 0.7345614433288574], [0.1962662935256958, -0.36104094982147217, -0.09981836378574371, 0.4081465005874634], [0.1890454739332199, -0.554616391658783, -0.091655433177948, 0.6677664518356323], [0.17795313894748688, -0.35834741592407227, -0.0783001035451889, 0.34768974781036377], [0.17078618705272675, -0.16220416128635406, -0.07134631276130676, 0.0313795730471611], [0.16754211485385895, -0.35623428225517273, -0.07071872055530548, 0.3007262945175171], [0.16041742265224457, -0.16017936170101166, -0.06470419466495514, -0.01339498907327652], [0.15721383690834045, -0.3543165922164917, -0.06497209519147873, 0.25819167494773865], [0.15012750029563904, -0.548453688621521, -0.05980825796723366, 0.5296945571899414], [0.1391584277153015, -0.7426855564117432, -0.04921436682343483, 0.8029482960700989], [0.12430471926927567, -0.5469245314598083, -0.0331554040312767, 0.4951991140842438], [0.11336623132228851, -0.741563618183136, -0.023251419886946678, 0.7772513628005981], [0.09853495657444, -0.5461297631263733, -0.007706393022090197, 0.4773445129394531], [0.08761236071586609, -0.3508998453617096, 0.0018404977163299918, 0.18224270641803741], [0.08059436827898026, -0.546048104763031, 0.005485351663082838, 0.47550567984580994], [0.06967340409755707, -0.351004034280777, 0.01499546505510807, 0.18455666303634644], [0.0626533254981041, -0.5463373064994812, 0.018686598166823387, 0.4819321036338806], [0.051726579666137695, -0.3514840006828308, 0.028325241059064865, 0.19519677758216858], [0.04469689726829529, -0.546999454498291, 0.03222917765378952, 0.49667876958847046], [0.033756908029317856, -0.7425606846809387, 0.04216275364160538, 0.7993420362472534], [0.018905695527791977, -0.5480417013168335, 0.05814959108829498, 0.5202150344848633], [0.007944862358272076, -0.7439319491386414, 0.06855389475822449, 0.8306401371955872], [-0.0069337766617536545, -0.9399206042289734, 0.08516669273376465, 1.1440715789794922], [-0.025732187554240227, -1.1360455751419067, 0.10804812610149384, 1.4622015953063965], [-0.04845310002565384, -0.9424009919166565, 0.13729216158390045, 1.2051329612731934], [-0.06730112433433533, -0.7492941617965698, 0.16139481961727142, 0.9584354758262634], [-0.0822870060801506, -0.5566667914390564, 0.1805635243654251, 0.7204938530921936], [-0.09342034161090851, -0.3644411265850067, 0.1949734091758728, 0.4896406829357147], [-0.10070916265249252, -0.17252682149410248, 0.20476622879505157, 0.26418328285217285], [0.00836584810167551, 0.013558722101151943, 0.019360128790140152, -0.044864438474178314], [0.008637022227048874, -0.18183541297912598, 0.018462838605046272, 0.2538633644580841], [0.0050003137439489365, 0.013018112629652023, 0.023540107533335686, -0.03293934836983681], [0.005260676145553589, -0.1824333667755127, 0.022881319746375084, 0.2670767903327942], [0.0016120088985189795, -0.3778742849826813, 0.028222855180501938, 0.5668879151344299], [-0.005945476703345776, -0.18315936625003815, 0.03956061601638794, 0.2832283079624176], [-0.009608663618564606, -0.37882259488105774, 0.04522518068552017, 0.5881212949752808], [-0.017185116186738014, -0.5745477080345154, 0.05698760598897934, 0.8947004675865173], [-0.028676070272922516, -0.3802429437637329, 0.07488161325454712, 0.6204617023468018], [-0.036280930042266846, -0.5763263702392578, 0.08729085326194763, 0.9357572793960571], [-0.04780745506286621, -0.3824833035469055, 0.10600599646568298, 0.671730637550354], [-0.05545712262392044, -0.18898218870162964, 0.11944060772657394, 0.41421571373939514], [-0.059236764907836914, 0.004262239206582308, 0.12772493064403534, 0.16144634783267975], [-0.05915152281522751, 0.1973462998867035, 0.130953848361969, -0.0883714035153389], [-0.0552045963704586, 0.000614116492215544, 0.12918642163276672, 0.24259065091609955], [-0.055192314088344574, 0.19367682933807373, 0.13403823971748352, -0.0067149922251701355], [-0.05131877586245537, 0.3866472542285919, 0.13390393555164337, -0.25428497791290283], [-0.04358582943677902, 0.5796284675598145, 0.12881824374198914, -0.5019152760505676], [-0.031993262469768524, 0.38294848799705505, 0.11877993494272232, -0.17157183587551117], [-0.024334292858839035, 0.1863444596529007, 0.11534849554300308, 0.15609554946422577], [-0.02060740254819393, -0.01022386271506548, 0.11847040802240372, 0.48282596468925476], [-0.020811880007386208, 0.1830442249774933, 0.12812691926956177, 0.22970475256443024], [-0.0171509962528944, -0.013653641566634178, 0.13272102177143097, 0.5598993897438049], [-0.017424067482352257, 0.17938029766082764, 0.14391900599002838, 0.31180045008659363], [-0.013836462050676346, 0.37219002842903137, 0.15015502274036407, 0.06774217635393143], [-0.006392661947757006, 0.5648759007453918, 0.1515098661184311, -0.17405462265014648], [0.004904856439679861, 0.36794692277908325, 0.14802876114845276, 0.16232864558696747], [0.012263794429600239, 0.1710500717163086, 0.15127533674240112, 0.4978056252002716], [0.01568479649722576, 0.36375167965888977, 0.16123145818710327, 0.2563597857952118], [0.02295983023941517, 0.1667390912771225, 0.16635864973068237, 0.5952427983283997], [0.026294611394405365, 0.35919010639190674, 0.17826350033283234, 0.35923585295677185], [0.03347841277718544, 0.1620413213968277, 0.18544822931289673, 0.7024050951004028], [0.03671924024820328, 0.35417500138282776, 0.199496328830719, 0.4733559191226959], [0.043802741914987564, 0.15687759220600128, 0.20896343886852264, 0.8216960430145264], [-0.02748679369688034, -0.0374392531812191, -0.007910864427685738, -0.03355800360441208], [-0.028235578909516335, -0.23244687914848328, -0.008582024835050106, 0.2566184997558594], [-0.032884515821933746, -0.03720345348119736, -0.003449654672294855, -0.03875892981886864], [-0.03362858295440674, 0.15796779096126556, -0.004224833101034164, -0.3325282633304596], [-0.030469229444861412, -0.037093766033649445, -0.01087539829313755, -0.04118062183260918], [-0.03121110424399376, 0.15818242728710175, -0.011699010618031025, -0.3372749090194702], [-0.028047455474734306, 0.3534688949584961, -0.01844450831413269, -0.6336239576339722], [-0.02097807638347149, 0.1586090326309204, -0.031116988509893417, -0.34680628776550293], [-0.01780589669942856, -0.03605680540204048, -0.03805311396718025, -0.06409579515457153], [-0.018527032807469368, -0.2306130975484848, -0.03933503106236458, 0.21634244918823242], [-0.023139294236898422, -0.03495154157280922, -0.035008180886507034, -0.08848437666893005], [-0.023838326334953308, -0.2295546531677246, -0.03677786886692047, 0.19295114278793335], [-0.028429418802261353, -0.03392641991376877, -0.03291884437203407, -0.11110303550958633], [-0.029107946902513504, 0.1616514027118683, -0.035140905529260635, -0.4139872193336487], [-0.025874918326735497, 0.35725337266921997, -0.04342065006494522, -0.7175382971763611], [-0.01872985251247883, 0.16275835037231445, -0.05777141824364662, -0.43883246183395386], [-0.015474684536457062, -0.03150037303566933, -0.06654806435108185, -0.1649058312177658], [-0.016104692593216896, 0.16450797021389008, -0.06984618306159973, -0.47781825065612793], [-0.012814532965421677, 0.3605429530143738, -0.07940255105495453, -0.7916718125343323], [-0.005603673402220011, 0.5566601157188416, -0.09523598849773407, -1.1082404851913452], [0.005529528483748436, 0.7528958320617676, -0.11740079522132874, -1.4292173385620117], [0.02058744616806507, 0.5594030022621155, -0.14598514139652252, -1.1754125356674194], [0.03177550435066223, 0.7560883164405823, -0.1694933921098709, -1.510069727897644], [0.046897273510694504, 0.5633768439292908, -0.19969478249549866, -1.2747374773025513], [-0.01720239222049713, 0.013725927099585533, -0.03560846298933029, 0.0090573038905859], [-0.016927873715758324, -0.1808677315711975, -0.03542731702327728, 0.2902960777282715], [-0.020545227453112602, 0.014741002582013607, -0.029621392488479614, -0.013346358202397823], [-0.020250407978892326, -0.17994388937950134, -0.029888320714235306, 0.26984545588493347], [-0.023849286139011383, 0.015591545961797237, -0.024491410702466965, -0.03211255744099617], [-0.02353745512664318, 0.21105599403381348, -0.025133661925792694, -0.33242106437683105], [-0.019316334277391434, 0.016300639137625694, -0.031782083213329315, -0.04776880890130997], [-0.018990322947502136, -0.1783515065908432, -0.03273745998740196, 0.23471960425376892], [-0.022557351738214493, 0.01722252182662487, -0.028043067082762718, -0.06810734421014786], [-0.022212902083992958, 0.21273507177829742, -0.02940521575510502, -0.369504451751709], [-0.017958199605345726, 0.01804298348724842, -0.03679530322551727, -0.08623644709587097], [-0.017597340047359467, -0.17653274536132812, -0.03852003440260887, 0.1946142166852951], [-0.02112799510359764, -0.3710831105709076, -0.03462774679064751, 0.4749011993408203], [-0.02854965813457966, -0.5656993985176086, -0.02512972429394722, 0.756472110748291], [-0.039863646030426025, -0.7604661583900452, -0.01000028196722269, 1.0411425828933716], [-0.05507297068834305, -0.9554538130760193, 0.010822569951415062, 1.3306695222854614], [-0.07418204843997955, -0.7604700326919556, 0.03743596002459526, 1.0413926839828491], [-0.08939144760370255, -0.956068754196167, 0.05826381593942642, 1.3455888032913208], [-0.10851281881332397, -0.7617258429527283, 0.08517558872699738, 1.0716890096664429], [-0.1237473413348198, -0.5678269267082214, 0.10660936683416367, 0.8069062829017639], [-0.13510388135910034, -0.3743150532245636, 0.1227474957704544, 0.5495703220367432], [-0.14259018003940582, -0.18111170828342438, 0.1337389051914215, 0.29794299602508545], [-0.1462124139070511, 0.011875506490468979, 0.13969776034355164, 0.05024930089712143], [-0.14597490429878235, -0.18494437634944916, 0.1407027542591095, 0.38354071974754333], [-0.14967378973960876, -0.3817543387413025, 0.1483735591173172, 0.7170684933662415], [-0.15730887651443481, -0.5785841941833496, 0.16271492838859558, 1.052531361579895], [-0.16888056695461273, -0.38594967126846313, 0.18376556038856506, 0.81502366065979], [-0.17659954726696014, -0.5830481648445129, 0.20006603002548218, 1.159416913986206], [0.015553594566881657, -0.03333761543035507, 0.00871417485177517, -0.049486178904771805], [0.014886842109262943, -0.228583425283432, 0.007724451832473278, 0.24593335390090942], [0.01031517330557108, -0.4238148629665375, 0.012643118388950825, 0.541042685508728], [0.0018388766329735518, -0.2288728654384613, 0.02346397377550602, 0.25237008929252625], [-0.0027385808061808348, -0.42432186007499695, 0.028511375188827515, 0.5523606538772583], [-0.01122501865029335, -0.22961169481277466, 0.039558589458465576, 0.26879531145095825], [-0.015817251056432724, -0.035075947642326355, 0.04493449628353119, -0.011152821592986584], [-0.016518771648406982, -0.23081254959106445, 0.044711437076330185, 0.29536202549934387], [-0.02113502286374569, -0.4265424609184265, 0.05061867833137512, 0.601804256439209], [-0.0296658705919981, -0.23216375708580017, 0.0626547634601593, 0.3254851698875427], [-0.03430914506316185, -0.4281192421913147, 0.0691644698381424, 0.6372501254081726], [-0.04287153109908104, -0.2340264916419983, 0.08190947026014328, 0.3671252131462097], [-0.04755206033587456, -0.43021103739738464, 0.08925197273492813, 0.6844698786735535], [-0.056156281381845474, -0.2364342212677002, 0.1029413715004921, 0.4211668372154236], [-0.06088496744632721, -0.042909927666187286, 0.1113647073507309, 0.16262847185134888], [-0.06174316629767418, -0.2394353747367859, 0.11461728066205978, 0.4882641136646271], [-0.06653187423944473, -0.43597203493118286, 0.12438256293535233, 0.8147585391998291], [-0.07525131106376648, -0.63255774974823, 0.14067773520946503, 1.1438332796096802], [-0.08790246397256851, -0.8292088508605957, 0.16355440020561218, 1.4771188497543335], [-0.10448664426803589, -0.6364182829856873, 0.19309677183628082, 1.2396631240844727], [-0.04517751187086105, 0.04248572885990143, -0.027639275416731834, -0.0003390698984730989], [-0.04432779923081398, 0.23799294233322144, -0.027646057307720184, -0.3016127943992615], [-0.039567939937114716, 0.4334977865219116, -0.033678311854600906, -0.6028848886489868], [-0.03089798428118229, 0.23886267840862274, -0.04573601111769676, -0.32099735736846924], [-0.026120729744434357, 0.04442087560892105, -0.052155956625938416, -0.043081339448690414], [-0.025232313200831413, -0.1499158889055252, -0.05301758274435997, 0.23270051181316376], [-0.028230631723999977, 0.04592195153236389, -0.0483635738492012, -0.07622335851192474], [-0.02731219120323658, -0.14847451448440552, -0.049888040870428085, 0.2008170187473297], [-0.030281681567430496, 0.04732413589954376, -0.04587170109152794, -0.1071765348315239], [-0.029335198923945427, 0.24307240545749664, -0.048015233129262924, -0.41397160291671753], [-0.024473750963807106, 0.4388408660888672, -0.05629466474056244, -0.7213969230651855], [-0.01569693349301815, 0.634694516658783, -0.07072260230779648, -1.0312539339065552], [-0.0030030428897589445, 0.8306824564933777, -0.09134767949581146, -1.3452759981155396], [0.013610606081783772, 0.6368202567100525, -0.1182532012462616, -1.0825140476226807], [0.02634701132774353, 0.4434405267238617, -0.1399034857749939, -0.829155683517456], [0.035215821117162704, 0.6401693820953369, -0.1564866006374359, -1.1623632907867432], [0.04801920801401138, 0.44739240407943726, -0.17973385751247406, -0.9225506782531738], [0.056967057287693024, 0.25509417057037354, -0.19818487763404846, -0.691307544708252]], "actions": [0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[0.04616829752922058, -0.16935884952545166, 0.01960647664964199, 0.2759064733982086], [0.04278112202882767, -0.36475497484207153, 0.025124605745077133, 0.5747082233428955], [0.035486020147800446, -0.560219943523407, 0.03661876916885376, 0.8751990795135498], [0.02428162284195423, -0.3656144440174103, 0.05412274971604347, 0.594249963760376], [0.016969332471489906, -0.17129014432430267, 0.06600774824619293, 0.3190946578979492], [0.013543530367314816, -0.3672870397567749, 0.0723896473646164, 0.6318419575691223], [0.006197789218276739, -0.5633403658866882, 0.08502648770809174, 0.9464157223701477], [-0.005069017875939608, -0.759498119354248, 0.10395479947328568, 1.2645570039749146], [-0.020258979871869087, -0.9557836651802063, 0.12924593687057495, 1.587903618812561], [-0.03937465324997902, -1.1521828174591064, 0.16100400686264038, 1.9179378747940063], [-0.06241830810904503, -0.9591179490089417, 0.19936276972293854, 1.6792168617248535], [-0.08160066604614258, -1.155914306640625, 0.23294711112976074, 2.026789665222168], [0.03311759978532791, -0.17338743805885315, 0.026325661689043045, 0.27791789174079895], [0.029649851843714714, -0.3688748776912689, 0.03188401833176613, 0.5787862539291382], [0.02227235585451126, -0.1742139309644699, 0.04345974698662758, 0.29631558060646057], [0.01878807693719864, 0.02026239223778248, 0.04938605800271034, 0.017649689689278603], [0.01919332519173622, -0.17553174495697021, 0.0497390516102314, 0.3254964053630829], [0.01568268984556198, 0.018848029896616936, 0.0562489777803421, 0.048904597759246826], [0.016059650108218193, -0.17703348398208618, 0.05722707137465477, 0.35879063606262207], [0.012518980540335178, 0.01723022200167179, 0.06440288573503494, 0.08468768745660782], [0.0128635847941041, 0.21137270331382751, 0.06609664112329483, -0.18700094521045685], [0.017091039568185806, 0.01537040714174509, 0.0623566210269928, 0.12577879428863525], [0.017398446798324585, 0.20954617857933044, 0.06487219780683517, -0.14659781754016876], [0.021589370444417, 0.40368202328681946, 0.06194023787975311, -0.4181300103664398], [0.02966301143169403, 0.20773953199386597, 0.053577639162540436, -0.10658111423254013], [0.033817801624536514, 0.011892363429069519, 0.05144601687788963, 0.20251239836215973], [0.03405565023422241, 0.20624226331710815, 0.05549626424908638, -0.07350828498601913], [0.03818049654364586, 0.4005264937877655, 0.05402609705924988, -0.3481784760951996], [0.0461910255253315, 0.5948400497436523, 0.047062527388334274, -0.6233475804328918], [0.058087825775146484, 0.7892743945121765, 0.03459557518362999, -0.900844931602478], [0.07387331128120422, 0.5937012434005737, 0.01657867804169655, -0.5974915623664856], [0.08574733883142471, 0.39835125207901, 0.004628846421837807, -0.2996329963207245], [0.09371436387300491, 0.20316362380981445, -0.0013638132950291038, -0.005493819713592529], [0.09777763485908508, 0.39830511808395386, -0.0014736896846443415, -0.2986067235469818], [0.10574373602867126, 0.5934480428695679, -0.007445824332535267, -0.5917540788650513], [0.11761269718408585, 0.788673460483551, -0.01928090490400791, -0.8867731094360352], [0.13338616490364075, 0.9840517044067383, -0.0370163694024086, -1.185454249382019], [0.1530672013759613, 0.7894289493560791, -0.06072545424103737, -0.9046003818511963], [0.16885578632354736, 0.5951796174049377, -0.0788174644112587, -0.631605863571167], [0.18075937032699585, 0.7913076281547546, -0.09144958108663559, -0.9480329155921936], [0.1965855211019516, 0.5975281000137329, -0.11041023582220078, -0.6854268908500671], [0.2085360884666443, 0.4040980935096741, -0.12411877512931824, -0.42944326996803284], [0.21661804616451263, 0.21093229949474335, -0.1327076405286789, -0.17832088470458984], [0.22083669900894165, 0.017934445291757584, -0.136274054646492, 0.0697287991642952], [0.22119538486003876, -0.17499734461307526, -0.1348794847726822, 0.31650280952453613], [0.2176954448223114, 0.021762125194072723, -0.12854942679405212, -0.015490245074033737], [0.2181306779384613, -0.1713043451309204, -0.1288592368364334, 0.23403042554855347], [0.21470458805561066, -0.36437225341796875, -0.12417861819267273, 0.48345136642456055], [0.20741714537143707, -0.5575429797172546, -0.11450959742069244, 0.7345614433288574], [0.1962662935256958, -0.36104094982147217, -0.09981836378574371, 0.4081465005874634], [0.1890454739332199, -0.554616391658783, -0.091655433177948, 0.6677664518356323], [0.17795313894748688, -0.35834741592407227, -0.0783001035451889, 0.34768974781036377], [0.17078618705272675, -0.16220416128635406, -0.07134631276130676, 0.0313795730471611], [0.16754211485385895, -0.35623428225517273, -0.07071872055530548, 0.3007262945175171], [0.16041742265224457, -0.16017936170101166, -0.06470419466495514, -0.01339498907327652], [0.15721383690834045, -0.3543165922164917, -0.06497209519147873, 0.25819167494773865], [0.15012750029563904, -0.548453688621521, -0.05980825796723366, 0.5296945571899414], [0.1391584277153015, -0.7426855564117432, -0.04921436682343483, 0.8029482960700989], [0.12430471926927567, -0.5469245314598083, -0.0331554040312767, 0.4951991140842438], [0.11336623132228851, -0.741563618183136, -0.023251419886946678, 0.7772513628005981], [0.09853495657444, -0.5461297631263733, -0.007706393022090197, 0.4773445129394531], [0.08761236071586609, -0.3508998453617096, 0.0018404977163299918, 0.18224270641803741], [0.08059436827898026, -0.546048104763031, 0.005485351663082838, 0.47550567984580994], [0.06967340409755707, -0.351004034280777, 0.01499546505510807, 0.18455666303634644], [0.0626533254981041, -0.5463373064994812, 0.018686598166823387, 0.4819321036338806], [0.051726579666137695, -0.3514840006828308, 0.028325241059064865, 0.19519677758216858], [0.04469689726829529, -0.546999454498291, 0.03222917765378952, 0.49667876958847046], [0.033756908029317856, -0.7425606846809387, 0.04216275364160538, 0.7993420362472534], [0.018905695527791977, -0.5480417013168335, 0.05814959108829498, 0.5202150344848633], [0.007944862358272076, -0.7439319491386414, 0.06855389475822449, 0.8306401371955872], [-0.0069337766617536545, -0.9399206042289734, 0.08516669273376465, 1.1440715789794922], [-0.025732187554240227, -1.1360455751419067, 0.10804812610149384, 1.4622015953063965], [-0.04845310002565384, -0.9424009919166565, 0.13729216158390045, 1.2051329612731934], [-0.06730112433433533, -0.7492941617965698, 0.16139481961727142, 0.9584354758262634], [-0.0822870060801506, -0.5566667914390564, 0.1805635243654251, 0.7204938530921936], [-0.09342034161090851, -0.3644411265850067, 0.1949734091758728, 0.4896406829357147], [-0.10070916265249252, -0.17252682149410248, 0.20476622879505157, 0.26418328285217285], [-0.10415969789028168, -0.36989307403564453, 0.21004988253116608, 0.6138291954994202], [0.008637022227048874, -0.18183541297912598, 0.018462838605046272, 0.2538633644580841], [0.0050003137439489365, 0.013018112629652023, 0.023540107533335686, -0.03293934836983681], [0.005260676145553589, -0.1824333667755127, 0.022881319746375084, 0.2670767903327942], [0.0016120088985189795, -0.3778742849826813, 0.028222855180501938, 0.5668879151344299], [-0.005945476703345776, -0.18315936625003815, 0.03956061601638794, 0.2832283079624176], [-0.009608663618564606, -0.37882259488105774, 0.04522518068552017, 0.5881212949752808], [-0.017185116186738014, -0.5745477080345154, 0.05698760598897934, 0.8947004675865173], [-0.028676070272922516, -0.3802429437637329, 0.07488161325454712, 0.6204617023468018], [-0.036280930042266846, -0.5763263702392578, 0.08729085326194763, 0.9357572793960571], [-0.04780745506286621, -0.3824833035469055, 0.10600599646568298, 0.671730637550354], [-0.05545712262392044, -0.18898218870162964, 0.11944060772657394, 0.41421571373939514], [-0.059236764907836914, 0.004262239206582308, 0.12772493064403534, 0.16144634783267975], [-0.05915152281522751, 0.1973462998867035, 0.130953848361969, -0.0883714035153389], [-0.0552045963704586, 0.000614116492215544, 0.12918642163276672, 0.24259065091609955], [-0.055192314088344574, 0.19367682933807373, 0.13403823971748352, -0.0067149922251701355], [-0.05131877586245537, 0.3866472542285919, 0.13390393555164337, -0.25428497791290283], [-0.04358582943677902, 0.5796284675598145, 0.12881824374198914, -0.5019152760505676], [-0.031993262469768524, 0.38294848799705505, 0.11877993494272232, -0.17157183587551117], [-0.024334292858839035, 0.1863444596529007, 0.11534849554300308, 0.15609554946422577], [-0.02060740254819393, -0.01022386271506548, 0.11847040802240372, 0.48282596468925476], [-0.020811880007386208, 0.1830442249774933, 0.12812691926956177, 0.22970475256443024], [-0.0171509962528944, -0.013653641566634178, 0.13272102177143097, 0.5598993897438049], [-0.017424067482352257, 0.17938029766082764, 0.14391900599002838, 0.31180045008659363], [-0.013836462050676346, 0.37219002842903137, 0.15015502274036407, 0.06774217635393143], [-0.006392661947757006, 0.5648759007453918, 0.1515098661184311, -0.17405462265014648], [0.004904856439679861, 0.36794692277908325, 0.14802876114845276, 0.16232864558696747], [0.012263794429600239, 0.1710500717163086, 0.15127533674240112, 0.4978056252002716], [0.01568479649722576, 0.36375167965888977, 0.16123145818710327, 0.2563597857952118], [0.02295983023941517, 0.1667390912771225, 0.16635864973068237, 0.5952427983283997], [0.026294611394405365, 0.35919010639190674, 0.17826350033283234, 0.35923585295677185], [0.03347841277718544, 0.1620413213968277, 0.18544822931289673, 0.7024050951004028], [0.03671924024820328, 0.35417500138282776, 0.199496328830719, 0.4733559191226959], [0.043802741914987564, 0.15687759220600128, 0.20896343886852264, 0.8216960430145264], [0.04694029316306114, 0.34862205386161804, 0.22539736330509186, 0.6013251543045044], [-0.028235578909516335, -0.23244687914848328, -0.008582024835050106, 0.2566184997558594], [-0.032884515821933746, -0.03720345348119736, -0.003449654672294855, -0.03875892981886864], [-0.03362858295440674, 0.15796779096126556, -0.004224833101034164, -0.3325282633304596], [-0.030469229444861412, -0.037093766033649445, -0.01087539829313755, -0.04118062183260918], [-0.03121110424399376, 0.15818242728710175, -0.011699010618031025, -0.3372749090194702], [-0.028047455474734306, 0.3534688949584961, -0.01844450831413269, -0.6336239576339722], [-0.02097807638347149, 0.1586090326309204, -0.031116988509893417, -0.34680628776550293], [-0.01780589669942856, -0.03605680540204048, -0.03805311396718025, -0.06409579515457153], [-0.018527032807469368, -0.2306130975484848, -0.03933503106236458, 0.21634244918823242], [-0.023139294236898422, -0.03495154157280922, -0.035008180886507034, -0.08848437666893005], [-0.023838326334953308, -0.2295546531677246, -0.03677786886692047, 0.19295114278793335], [-0.028429418802261353, -0.03392641991376877, -0.03291884437203407, -0.11110303550958633], [-0.029107946902513504, 0.1616514027118683, -0.035140905529260635, -0.4139872193336487], [-0.025874918326735497, 0.35725337266921997, -0.04342065006494522, -0.7175382971763611], [-0.01872985251247883, 0.16275835037231445, -0.05777141824364662, -0.43883246183395386], [-0.015474684536457062, -0.03150037303566933, -0.06654806435108185, -0.1649058312177658], [-0.016104692593216896, 0.16450797021389008, -0.06984618306159973, -0.47781825065612793], [-0.012814532965421677, 0.3605429530143738, -0.07940255105495453, -0.7916718125343323], [-0.005603673402220011, 0.5566601157188416, -0.09523598849773407, -1.1082404851913452], [0.005529528483748436, 0.7528958320617676, -0.11740079522132874, -1.4292173385620117], [0.02058744616806507, 0.5594030022621155, -0.14598514139652252, -1.1754125356674194], [0.03177550435066223, 0.7560883164405823, -0.1694933921098709, -1.510069727897644], [0.046897273510694504, 0.5633768439292908, -0.19969478249549866, -1.2747374773025513], [0.0581648088991642, 0.3712818920612335, -0.22518953680992126, -1.0506421327590942], [-0.016927873715758324, -0.1808677315711975, -0.03542731702327728, 0.2902960777282715], [-0.020545227453112602, 0.014741002582013607, -0.029621392488479614, -0.013346358202397823], [-0.020250407978892326, -0.17994388937950134, -0.029888320714235306, 0.26984545588493347], [-0.023849286139011383, 0.015591545961797237, -0.024491410702466965, -0.03211255744099617], [-0.02353745512664318, 0.21105599403381348, -0.025133661925792694, -0.33242106437683105], [-0.019316334277391434, 0.016300639137625694, -0.031782083213329315, -0.04776880890130997], [-0.018990322947502136, -0.1783515065908432, -0.03273745998740196, 0.23471960425376892], [-0.022557351738214493, 0.01722252182662487, -0.028043067082762718, -0.06810734421014786], [-0.022212902083992958, 0.21273507177829742, -0.02940521575510502, -0.369504451751709], [-0.017958199605345726, 0.01804298348724842, -0.03679530322551727, -0.08623644709587097], [-0.017597340047359467, -0.17653274536132812, -0.03852003440260887, 0.1946142166852951], [-0.02112799510359764, -0.3710831105709076, -0.03462774679064751, 0.4749011993408203], [-0.02854965813457966, -0.5656993985176086, -0.02512972429394722, 0.756472110748291], [-0.039863646030426025, -0.7604661583900452, -0.01000028196722269, 1.0411425828933716], [-0.05507297068834305, -0.9554538130760193, 0.010822569951415062, 1.3306695222854614], [-0.07418204843997955, -0.7604700326919556, 0.03743596002459526, 1.0413926839828491], [-0.08939144760370255, -0.956068754196167, 0.05826381593942642, 1.3455888032913208], [-0.10851281881332397, -0.7617258429527283, 0.08517558872699738, 1.0716890096664429], [-0.1237473413348198, -0.5678269267082214, 0.10660936683416367, 0.8069062829017639], [-0.13510388135910034, -0.3743150532245636, 0.1227474957704544, 0.5495703220367432], [-0.14259018003940582, -0.18111170828342438, 0.1337389051914215, 0.29794299602508545], [-0.1462124139070511, 0.011875506490468979, 0.13969776034355164, 0.05024930089712143], [-0.14597490429878235, -0.18494437634944916, 0.1407027542591095, 0.38354071974754333], [-0.14967378973960876, -0.3817543387413025, 0.1483735591173172, 0.7170684933662415], [-0.15730887651443481, -0.5785841941833496, 0.16271492838859558, 1.052531361579895], [-0.16888056695461273, -0.38594967126846313, 0.18376556038856506, 0.81502366065979], [-0.17659954726696014, -0.5830481648445129, 0.20006603002548218, 1.159416913986206], [-0.1882605105638504, -0.39101383090019226, 0.22325436770915985, 0.9355388879776001], [0.014886842109262943, -0.228583425283432, 0.007724451832473278, 0.24593335390090942], [0.01031517330557108, -0.4238148629665375, 0.012643118388950825, 0.541042685508728], [0.0018388766329735518, -0.2288728654384613, 0.02346397377550602, 0.25237008929252625], [-0.0027385808061808348, -0.42432186007499695, 0.028511375188827515, 0.5523606538772583], [-0.01122501865029335, -0.22961169481277466, 0.039558589458465576, 0.26879531145095825], [-0.015817251056432724, -0.035075947642326355, 0.04493449628353119, -0.011152821592986584], [-0.016518771648406982, -0.23081254959106445, 0.044711437076330185, 0.29536202549934387], [-0.02113502286374569, -0.4265424609184265, 0.05061867833137512, 0.601804256439209], [-0.0296658705919981, -0.23216375708580017, 0.0626547634601593, 0.3254851698875427], [-0.03430914506316185, -0.4281192421913147, 0.0691644698381424, 0.6372501254081726], [-0.04287153109908104, -0.2340264916419983, 0.08190947026014328, 0.3671252131462097], [-0.04755206033587456, -0.43021103739738464, 0.08925197273492813, 0.6844698786735535], [-0.056156281381845474, -0.2364342212677002, 0.1029413715004921, 0.4211668372154236], [-0.06088496744632721, -0.042909927666187286, 0.1113647073507309, 0.16262847185134888], [-0.06174316629767418, -0.2394353747367859, 0.11461728066205978, 0.4882641136646271], [-0.06653187423944473, -0.43597203493118286, 0.12438256293535233, 0.8147585391998291], [-0.07525131106376648, -0.63255774974823, 0.14067773520946503, 1.1438332796096802], [-0.08790246397256851, -0.8292088508605957, 0.16355440020561218, 1.4771188497543335], [-0.10448664426803589, -0.6364182829856873, 0.19309677183628082, 1.2396631240844727], [-0.11721500754356384, -0.8334226608276367, 0.21789003908634186, 1.586095929145813], [-0.04432779923081398, 0.23799294233322144, -0.027646057307720184, -0.3016127943992615], [-0.039567939937114716, 0.4334977865219116, -0.033678311854600906, -0.6028848886489868], [-0.03089798428118229, 0.23886267840862274, -0.04573601111769676, -0.32099735736846924], [-0.026120729744434357, 0.04442087560892105, -0.052155956625938416, -0.043081339448690414], [-0.025232313200831413, -0.1499158889055252, -0.05301758274435997, 0.23270051181316376], [-0.028230631723999977, 0.04592195153236389, -0.0483635738492012, -0.07622335851192474], [-0.02731219120323658, -0.14847451448440552, -0.049888040870428085, 0.2008170187473297], [-0.030281681567430496, 0.04732413589954376, -0.04587170109152794, -0.1071765348315239], [-0.029335198923945427, 0.24307240545749664, -0.048015233129262924, -0.41397160291671753], [-0.024473750963807106, 0.4388408660888672, -0.05629466474056244, -0.7213969230651855], [-0.01569693349301815, 0.634694516658783, -0.07072260230779648, -1.0312539339065552], [-0.0030030428897589445, 0.8306824564933777, -0.09134767949581146, -1.3452759981155396], [0.013610606081783772, 0.6368202567100525, -0.1182532012462616, -1.0825140476226807], [0.02634701132774353, 0.4434405267238617, -0.1399034857749939, -0.829155683517456], [0.035215821117162704, 0.6401693820953369, -0.1564866006374359, -1.1623632907867432], [0.04801920801401138, 0.44739240407943726, -0.17973385751247406, -0.9225506782531738], [0.056967057287693024, 0.25509417057037354, -0.19818487763404846, -0.691307544708252], [0.062068939208984375, 0.06319316476583481, -0.21201102435588837, -0.4669762849807739]], "action_prob": [0.5152292251586914, 0.38767725229263306, 0.3490338623523712, 0.6476350426673889, 0.653829038143158, 0.3650861084461212, 0.34467756748199463, 0.3553321361541748, 0.37146154046058655, 0.38665157556533813, 0.6004917025566101, 0.3931941092014313, 0.511197030544281, 0.3846288025379181, 0.6518797278404236, 0.6249390840530396, 0.47709304094314575, 0.6331339478492737, 0.4566805064678192, 0.6408519744873047, 0.5653498768806458, 0.5645133256912231, 0.5836623907089233, 0.45466676354408264, 0.6300148963928223, 0.529649019241333, 0.60948646068573, 0.4889121353626251, 0.3835158348083496, 0.35014140605926514, 0.6507266759872437, 0.6514838933944702, 0.6171806454658508, 0.4975198805332184, 0.380865216255188, 0.34626007080078125, 0.3476625978946686, 0.6415442228317261, 0.6522362232208252, 0.34052208065986633, 0.650462806224823, 0.6602355241775513, 0.6614453196525574, 0.6338891983032227, 0.5464661121368408, 0.5669603943824768, 0.5869499444961548, 0.4700978398323059, 0.3871001899242401, 0.6407747268676758, 0.40073585510253906, 0.6388577222824097, 0.5861766338348389, 0.5542327165603638, 0.5710979700088501, 0.5738216042518616, 0.44467198848724365, 0.3717379570007324, 0.6462525129318237, 0.37218812108039856, 0.6474329829216003, 0.6299499869346619, 0.450369268655777, 0.6325186491012573, 0.44260600209236145, 0.636173665523529, 0.43120402097702026, 0.3594447076320648, 0.650779128074646, 0.3534198999404907, 0.34902483224868774, 0.3596383035182953, 0.627128005027771, 0.6363130807876587, 0.6466145515441895, 0.6567586064338684, 0.6626442074775696, 0.34703654050827026, 0.5238867998123169, 0.6076184511184692, 0.5150070190429688, 0.3867890238761902, 0.6518644690513611, 0.37754327058792114, 0.346100777387619, 0.6474415063858032, 0.34382304549217224, 0.6456034183502197, 0.6570347547531128, 0.6578491926193237, 0.6224069595336914, 0.47857677936553955, 0.6439039707183838, 0.5665105581283569, 0.44879859685897827, 0.623389720916748, 0.5166232585906982, 0.37393760681152344, 0.6665852665901184, 0.3521481156349182, 0.6680092811584473, 0.6636449098587036, 0.6121804118156433, 0.4944283962249756, 0.35910341143608093, 0.6746947765350342, 0.3374995291233063, 0.6748751401901245, 0.32390421628952026, 0.6722028851509094, 0.31733638048171997, 0.6671673655509949, 0.5276223421096802, 0.6018133163452148, 0.4719020426273346, 0.6323737502098083, 0.46741315722465515, 0.36515098810195923, 0.6554149985313416, 0.640512228012085, 0.5566725134849548, 0.5763272643089294, 0.5673836469650269, 0.5672001838684082, 0.4229954779148102, 0.34961116313934326, 0.6555086374282837, 0.6556277871131897, 0.3891929090023041, 0.3406844139099121, 0.3461940884590149, 0.36342746019363403, 0.6193029880523682, 0.3680821359157562, 0.6136528253555298, 0.6251773238182068, 0.5099340677261353, 0.6092214584350586, 0.5200253129005432, 0.6041481494903564, 0.4717354476451874, 0.6337328553199768, 0.5403435230255127, 0.5903311371803284, 0.45044422149658203, 0.641452431678772, 0.5626952648162842, 0.4286840856075287, 0.3602845072746277, 0.3494679033756256, 0.35706573724746704, 0.6311565041542053, 0.35718104243278503, 0.6294139623641968, 0.6409654021263123, 0.6529014110565186, 0.6607654690742493, 0.6507707834243774, 0.4080328047275543, 0.3386874496936798, 0.34170475602149963, 0.6392902135848999, 0.3459813892841339, 0.632192850112915, 0.5361813902854919, 0.401945024728775, 0.6478694677352905, 0.39440640807151794, 0.6502537727355957, 0.6157490611076355, 0.4959818720817566, 0.375411719083786, 0.6539258360862732, 0.36438992619514465, 0.6553906202316284, 0.3537200689315796, 0.6558018326759338, 0.6551777720451355, 0.3841812014579773, 0.3398769497871399, 0.3480667769908905, 0.36638781428337097, 0.615969717502594, 0.3729386329650879, 0.4946940243244171, 0.3762824237346649, 0.6539488434791565, 0.6327064633369446, 0.5414676070213318, 0.5867111682891846, 0.5575050115585327, 0.5741962194442749, 0.42810162901878357, 0.3515651226043701, 0.34509310126304626, 0.35788628458976746, 0.6265639066696167, 0.6387869715690613, 0.34757107496261597, 0.6334806680679321, 0.6474016308784485, 0.6622921228408813], "advantages": [0.8816801905632019, 0.10938403010368347, -0.4229792356491089, -0.793014645576477, -2.6834144592285156, -4.303712368011475, -4.93167781829834, -5.394564151763916, -5.787874221801758, -6.200602054595947, -6.691302299499512, -9.01885986328125, 37.93800735473633, 37.530147552490234, 37.36771011352539, 36.171836853027344, 35.295780181884766, 34.85598373413086, 33.94633865356445, 33.50620651245117, 32.564208984375, 31.90101432800293, 31.238601684570312, 30.546241760253906, 30.09457015991211, 29.263042449951172, 28.64707374572754, 27.911890029907227, 27.405105590820312, 27.112146377563477, 27.02830696105957, 25.980792999267578, 25.07288360595703, 24.334680557250977, 23.866064071655273, 23.658336639404297, 23.707660675048828, 23.989971160888672, 23.03312110900879, 22.15251922607422, 22.52911949157715, 21.769119262695312, 21.124143600463867, 20.63895606994629, 20.356000900268555, 20.28795051574707, 19.761266708374023, 19.65878677368164, 19.726579666137695, 19.852903366088867, 18.637556076049805, 18.645671844482422, 17.40683364868164, 16.531291961669922, 16.265092849731445, 15.408027648925781, 15.0792236328125, 14.846219062805176, 14.580288887023926, 13.03537654876709, 12.658916473388672, 10.995451927185059, 9.521726608276367, 8.963580131530762, 7.40905237197876, 6.802192687988281, 5.161106109619141, 4.517011642456055, 3.9623634815216064, 1.9174445867538452, 1.3351863622665405, 0.749751627445221, 0.08686789125204086, -2.310314416885376, -4.739136695861816, -7.0509114265441895, -9.118672370910645, -10.892333984375, 18.63544273376465, 18.03765296936035, 17.043045043945312, 16.430652618408203, 16.064001083374023, 14.653133392333984, 14.248653411865234, 14.011543273925781, 12.254827499389648, 11.968606948852539, 10.197136878967285, 8.68932819366455, 7.442546367645264, 6.4144439697265625, 5.538414478302002, 4.485599517822266, 3.588892698287964, 2.819753408432007, 1.7182470560073853, 0.7707358002662659, -0.03482335805892944, -1.14069402217865, -1.950257658958435, -3.0724081993103027, -4.086236953735352, -5.02409553527832, -6.019506454467773, -6.93214750289917, -7.988949775695801, -8.907413482666016, -9.982977867126465, -10.911391258239746, -12.003311157226562, -12.945290565490723, 11.802562713623047, 11.227606773376465, 10.18412971496582, 9.539047241210938, 8.66478443145752, 8.0348539352417, 7.784497261047363, 6.730290412902832, 5.899438381195068, 5.329737663269043, 4.369681358337402, 3.7601847648620605, 2.8033854961395264, 2.2919669151306152, 2.170705556869507, 1.1577166318893433, 0.3405432105064392, 0.030878139659762383, 0.09357937425374985, 0.3460562229156494, 0.6110695004463196, 0.2738035321235657, 0.504275918006897, 0.5954087376594543, 14.073386192321777, 13.59014892578125, 12.655519485473633, 12.132506370544434, 11.188169479370117, 10.635294914245605, 9.817181587219238, 9.25232982635498, 8.322088241577148, 7.799790382385254, 6.942831039428711, 6.341007232666016, 5.978271007537842, 5.770268440246582, 5.594826698303223, 5.344276428222656, 3.2342612743377686, 2.913017749786377, 0.7100564241409302, -1.4124776124954224, -3.3278236389160156, -4.97122049331665, -6.349482536315918, -7.252601146697998, -7.946023941040039, -8.487170219421387, -10.336282730102539, -10.920129776000977, 8.773490905761719, 8.103592872619629, 7.678624153137207, 6.1470537185668945, 5.674966335296631, 4.0892333984375, 2.840804100036621, 2.071411609649658, 1.5498377084732056, -0.11531975865364075, -0.6682556867599487, -2.3704006671905518, -2.9493484497070312, -4.674943447113037, -6.123140335083008, -6.934205532073975, -7.546889305114746, -8.029541015625, -8.464332580566406, -10.580709457397461, 5.629360198974609, 4.987417221069336, 4.694122791290283, 3.65677547454834, 2.8216562271118164, 2.2252049446105957, 1.2996097803115845, 0.6628603935241699, -0.2501906156539917, -0.7409383058547974, -0.847837507724762, -0.6676802039146423, -0.33848896622657776, -1.102973222732544, -1.7553526163101196, -1.2763217687606812, -1.5593092441558838, -1.6640434265136719], "value_targets": [11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 721233968, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 1875270588, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492, 768898492], "obs": [[-0.04253757372498512, 0.04699067398905754, -0.04415322095155716, 0.048727549612522125], [-0.04159776121377945, -0.14747126400470734, -0.04317866638302803, 0.3271593451499939], [-0.0445471853017807, -0.34195274114608765, -0.03663548082113266, 0.6059190630912781], [-0.05138624086976051, -0.14633816480636597, -0.024517100304365158, 0.3019256591796875], [-0.05431300401687622, 0.04912448301911354, -0.01847858726978302, 0.0016125087859109044], [-0.05333051458001137, -0.14572764933109283, -0.018446337431669235, 0.28840842843055725], [-0.05624506622552872, 0.049652427434921265, -0.012678168714046478, -0.010034757666289806], [-0.05525201931595802, 0.24495388567447662, -0.012878863140940666, -0.30669069290161133], [-0.05035294219851494, 0.05001780018210411, -0.019012676551938057, -0.018097082152962685], [-0.04935258626937866, -0.14482639729976654, -0.01937461830675602, 0.26852700114250183], [-0.052249111235141754, 0.05056660994887352, -0.014004078693687916, -0.030203288421034813], [-0.05123778060078621, 0.24588656425476074, -0.014608144760131836, -0.32727155089378357], [-0.046320050954818726, 0.05097559839487076, -0.02115357480943203, -0.039230942726135254], [-0.04530053585767746, 0.24639439582824707, -0.02193819358944893, -0.33851224184036255], [-0.04037264734506607, 0.44182154536247253, -0.02870843932032585, -0.6380317211151123], [-0.03153621777892113, 0.24711142480373383, -0.04146907478570938, -0.3545260429382324], [-0.026593990623950958, 0.052602898329496384, -0.04855959489941597, -0.07520248740911484], [-0.02554193139076233, -0.1417904794216156, -0.05006364360451698, 0.20177295804023743], [-0.02837774157524109, -0.3361620306968689, -0.04602818563580513, 0.4782523810863495], [-0.03510098159313202, -0.14042147994041443, -0.036463137716054916, 0.17142504453659058], [-0.037909410893917084, 0.055202875286340714, -0.033034637570381165, -0.1325342357158661], [-0.03680535405874252, 0.2507820725440979, -0.03568532317876816, -0.4354533851146698], [-0.031789712607860565, 0.05618298798799515, -0.04439438879489899, -0.15422984957695007], [-0.030666053295135498, 0.25191155076026917, -0.04747898504137993, -0.46058109402656555], [-0.025627821683883667, 0.057491712272167206, -0.056690607219934464, -0.18323355913162231], [-0.024477986618876457, 0.2533770799636841, -0.060355279594659805, -0.4932476878166199], [-0.019410446286201477, 0.4492960274219513, -0.0702202320098877, -0.8043246865272522], [-0.01042452547699213, 0.2552034556865692, -0.08630672842264175, -0.5345311164855957], [-0.00532045541331172, 0.06139449030160904, -0.09699735045433044, -0.2702424228191376], [-0.0040925657376646996, -0.1322191208600998, -0.10240219533443451, -0.00965967122465372], [-0.006736948154866695, 0.06421098858118057, -0.10259538888931274, -0.3328149914741516], [-0.0054527283646166325, -0.1293124407529831, -0.10925169289112091, -0.07416639477014542], [-0.008038977161049843, -0.32271236181259155, -0.11073502153158188, 0.18214774131774902], [-0.014493224211037159, -0.516089916229248, -0.10709206759929657, 0.4379478991031647], [-0.024815022945404053, -0.7095460295677185, -0.09833310544490814, 0.6950446963310242], [-0.03900594264268875, -0.5132076144218445, -0.0844322144985199, 0.37309643626213074], [-0.04927009716629982, -0.3169941008090973, -0.07697028666734695, 0.05503101646900177], [-0.05560997873544693, -0.5109328627586365, -0.07586966454982758, 0.32247093319892883], [-0.06582863628864288, -0.3148171305656433, -0.06942024827003479, 0.006859300192445517], [-0.07212498039007187, -0.5088783502578735, -0.06928306072950363, 0.2768568694591522], [-0.08230254799127579, -0.31283989548683167, -0.06374592334032059, -0.036848291754722595], [-0.0885593444108963, -0.11686449497938156, -0.06448289006948471, -0.34894296526908875], [-0.09089663624763489, -0.3110128939151764, -0.0714617446064949, -0.07727043330669403], [-0.09711689502000809, -0.5050414800643921, -0.07300715893507004, 0.19203777611255646], [-0.10721772164106369, -0.30895519256591797, -0.069166399538517, -0.12275321036577225], [-0.11339682340621948, -0.5030215382575989, -0.07162146270275116, 0.1473315805196762], [-0.12345725297927856, -0.6970486640930176, -0.06867483258247375, 0.4165874123573303], [-0.13739822804927826, -0.8911335468292236, -0.06034308299422264, 0.6868539452552795], [-0.1552208960056305, -0.6952282190322876, -0.04660600423812866, 0.37580063939094543], [-0.16912546753883362, -0.4994763135910034, -0.03908999264240265, 0.06879448145627975], [-0.17911499738693237, -0.30381637811660767, -0.03771410137414932, -0.23596076667308807], [-0.1851913183927536, -0.49837976694107056, -0.04243331775069237, 0.04459148272871971], [-0.195158913731575, -0.6928683519363403, -0.041541486978530884, 0.32359012961387634], [-0.20901627838611603, -0.4971802830696106, -0.03506968542933464, 0.018101535737514496], [-0.21895988285541534, -0.30157339572906494, -0.034707654267549515, -0.285436749458313], [-0.2249913513660431, -0.10597408562898636, -0.04041638970375061, -0.5888610482215881], [-0.2271108329296112, 0.08968982100486755, -0.05219361186027527, -0.8939964175224304], [-0.22531704604625702, -0.1046869233250618, -0.07007353752851486, -0.6181662678718567], [-0.22741077840328217, 0.09134028106927872, -0.08243686705827713, -0.932070255279541], [-0.2255839705467224, 0.28747203946113586, -0.10107827186584473, -1.249477744102478], [-0.21983453631401062, 0.09378047287464142, -0.12606783211231232, -0.9900897741317749], [-0.21795892715454102, 0.290343701839447, -0.14586962759494781, -1.3195605278015137], [-0.21215204894542694, 0.09733562916517258, -0.1722608357667923, -1.0758568048477173], [-0.2102053314447403, -0.09514418989419937, -0.19377796351909637, -0.8418048620223999], [0.02610521763563156, 0.008239185437560081, 0.00043478922452777624, 0.004702997859567404], [0.026270000264048576, -0.18688899278640747, 0.0005288491956889629, 0.2975230813026428], [0.02253222092986107, 0.008225410245358944, 0.006479310803115368, 0.00500698434188962], [0.022696729749441147, -0.18698886036872864, 0.006579450331628323, 0.2997271418571472], [0.018956951797008514, -0.38220396637916565, 0.012573993764817715, 0.5944778323173523], [0.011312872171401978, -0.5774996280670166, 0.024463549256324768, 0.8910948038101196], [-0.0002371205628151074, -0.38271796703338623, 0.04228544607758522, 0.6062012910842896], [-0.007891479879617691, -0.18821200728416443, 0.05440947413444519, 0.32713139057159424], [-0.011655719950795174, 0.006094798911362886, 0.06095210090279579, 0.052090976387262344], [-0.011533823795616627, -0.18984577059745789, 0.06199391931295395, 0.3633648753166199], [-0.015330739319324493, 0.0043428149074316025, 0.06926121562719345, 0.09085608273744583], [-0.01524388324469328, 0.19840717315673828, 0.0710783377289772, -0.17919601500034332], [-0.011275739409029484, 0.002343872794881463, 0.06749441474676132, 0.13503579795360565], [-0.011228862218558788, 0.19643738865852356, 0.07019513100385666, -0.13561329245567322], [-0.007300114259123802, 0.3904873728752136, 0.06748286634683609, -0.4053509831428528], [0.0005096327513456345, 0.19447655975818634, 0.05937584862112999, -0.09217910468578339], [0.004399164114147425, 0.38869941234588623, 0.05753226578235626, -0.36555376648902893], [0.012173152528703213, 0.5829585790634155, 0.050221189856529236, -0.6395552754402161], [0.023832324892282486, 0.7773457169532776, 0.037430085241794586, -0.9160094857215881], [0.039379239082336426, 0.5817381143569946, 0.019109897315502167, -0.6118017435073853], [0.0510140024125576, 0.7765878438949585, 0.006873862352222204, -0.8984049558639526], [0.0665457546710968, 0.581373393535614, -0.011094237677752972, -0.6035693287849426], [0.07817322760820389, 0.38640835881233215, -0.02316562458872795, -0.31440141797065735], [0.08590139448642731, 0.19162394106388092, -0.02945365197956562, -0.029113247990608215], [0.08973387628793716, 0.3871556222438812, -0.030035916715860367, -0.33094167709350586], [0.09747698903083801, 0.19247381389141083, -0.0366547517478466, -0.047879911959171295], [0.10132645815610886, -0.002103887964040041, -0.037612348794937134, 0.2330165058374405], [0.10128438472747803, -0.19666878879070282, -0.032952018082141876, 0.5136020183563232], [0.09735100716352463, -0.0010986151173710823, -0.022679978981614113, 0.21071986854076385], [0.0973290354013443, -0.19588907063007355, -0.01846558041870594, 0.4961630702018738], [0.09341125190258026, -0.3907458186149597, -0.008542319759726524, 0.7829698324203491], [0.08559633791446686, -0.19550752639770508, 0.007117076311260462, 0.4876116216182709], [0.08168618381023407, -0.390729159116745, 0.016869308426976204, 0.7825290560722351], [0.07387160509824753, -0.19584308564662933, 0.03251989185810089, 0.49520087242126465], [0.06995474547147751, -0.0011944614816457033, 0.04242390766739845, 0.2129414826631546], [0.06993085145950317, 0.19329607486724854, 0.04668273776769638, -0.06606294214725494], [0.07379677146673203, 0.38771870732307434, 0.04536147788167, -0.3436594605445862], [0.08155114948749542, 0.19198179244995117, 0.03848829120397568, -0.0370243638753891], [0.08539078384637833, -0.003670350182801485, 0.03774780407547951, 0.2675492465496063], [0.08531738072633743, -0.19931012392044067, 0.04309878870844841, 0.5718950629234314], [0.08133117854595184, -0.004818175919353962, 0.054536689072847366, 0.293095201253891], [0.08123481273651123, -0.20067356526851654, 0.06039859354496002, 0.6024673581123352], [0.0772213414311409, -0.006446117535233498, 0.07244794070720673, 0.3294037878513336], [0.07709241658449173, -0.20252060890197754, 0.07903601974248886, 0.6440250873565674], [0.07304200530052185, -0.008583949878811836, 0.0919165164232254, 0.3772406280040741], [0.07287032902240753, 0.18512052297592163, 0.09946133196353912, 0.11489587277173996], [0.07657273858785629, 0.3786870837211609, 0.10175924748182297, -0.1448255330324173], [0.08414647728204727, 0.5722156763076782, 0.09886273741722107, -0.40375110507011414], [0.09559079259634018, 0.7658066749572754, 0.09078771620988846, -0.6637014150619507], [0.1109069287776947, 0.5695468783378601, 0.077513687312603, -0.3438691198825836], [0.12229786068201065, 0.3734126687049866, 0.07063630223274231, -0.027785036712884903], [0.12976612150669098, 0.17735257744789124, 0.07008060067892075, 0.2863215506076813], [0.1333131641149521, 0.37140873074531555, 0.07580703496932983, 0.016538653522729874], [0.14074134826660156, 0.565366268157959, 0.07613781094551086, -0.25129616260528564], [0.15204866230487823, 0.7593231201171875, 0.07111188769340515, -0.5190256237983704], [0.1672351360321045, 0.5632758140563965, 0.060731373727321625, -0.20480868220329285], [0.17850065231323242, 0.7574790716171265, 0.05663519725203514, -0.47773247957229614], [0.1936502307653427, 0.9517576098442078, 0.04708055034279823, -0.7520411610603333], [0.21268537640571594, 1.1461998224258423, 0.03203972801566124, -1.029544711112976], [0.23560938239097595, 1.340881109237671, 0.011448833160102367, -1.3119986057281494], [0.2624270021915436, 1.145616054534912, -0.014791140332818031, -1.0157544612884521], [0.2853393256664276, 1.340932011604309, -0.03510623052716255, -1.3130449056625366], [0.3121579587459564, 1.1462717056274414, -0.06136712431907654, -1.0315532684326172], [0.33508339524269104, 0.9520174264907837, -0.08199819177389145, -0.7587510347366333], [0.3541237413883209, 0.7581153512001038, -0.09717321395874023, -0.49295562505722046], [0.36928606033325195, 0.5644885897636414, -0.10703232884407043, -0.23240968585014343], [0.38057583570480347, 0.371045857667923, -0.1116805225610733, 0.024686511605978012], [0.38799673318862915, 0.5675775408744812, -0.11118678748607635, -0.30104029178619385], [0.39934828877449036, 0.3742014169692993, -0.1172075942158699, -0.045388881117105484], [0.4068323075771332, 0.570792019367218, -0.1181153729557991, -0.3726317584514618], [0.41824814677238464, 0.7673764824867249, -0.12556800246238708, -0.7000991106033325], [0.4335956871509552, 0.9639948606491089, -0.1395699828863144, -1.0295246839523315], [0.4528755843639374, 0.7709781527519226, -0.16016048192977905, -0.7837154865264893], [0.468295156955719, 0.9678959250450134, -0.1758347898721695, -1.1221979856491089], [0.48765307664871216, 0.7754600048065186, -0.1982787549495697, -0.8894243240356445], [-0.03583930805325508, 0.012690034694969654, 0.03194832056760788, 0.0485382154583931], [-0.03558550775051117, 0.20733965933322906, 0.03291908651590347, -0.23389600217342377], [-0.031438715755939484, 0.011763193644583225, 0.028241164982318878, 0.0689862072467804], [-0.03120345063507557, 0.2064691185951233, 0.029620889574289322, -0.21465441584587097], [-0.027074068784713745, 0.01093648374080658, 0.02532779984176159, 0.08722313493490219], [-0.026855338364839554, 0.20568640530109406, 0.02707226388156414, -0.19736246764659882], [-0.022741610184311867, 0.010187894105911255, 0.02312501333653927, 0.10373611003160477], [-0.022537853568792343, 0.20497094094753265, 0.025199735537171364, -0.18156218528747559], [-0.01843843422830105, 0.009497631341218948, 0.02156849205493927, 0.1189626157283783], [-0.018248481675982475, -0.18592660129070282, 0.023947743698954582, 0.41837143898010254], [-0.02196701429784298, -0.3813795745372772, 0.032315172255039215, 0.7185068130493164], [-0.029594605788588524, -0.18671934306621552, 0.04668530821800232, 0.4361678957939148], [-0.03332899138331413, -0.3824700117111206, 0.05540866777300835, 0.7431944608688354], [-0.04097839072346687, -0.18815483152866364, 0.07027255743741989, 0.4684508144855499], [-0.04474148899316788, 0.005907649639993906, 0.07964157313108444, 0.19871868193149567], [-0.04462333768606186, -0.1902577430009842, 0.08361594378948212, 0.5154239535331726], [-0.0484284907579422, 0.0035933242179453373, 0.09392442554235458, 0.2502177357673645], [-0.04835662245750427, 0.19725725054740906, 0.0989287793636322, -0.011424563825130463], [-0.04441148042678833, 0.0008659533341415226, 0.09870028495788574, 0.31075966358184814], [-0.04439416155219078, 0.19445331394672394, 0.10491548478603363, 0.05076267570257187], [-0.04050509259104729, 0.3879266381263733, 0.10593073815107346, -0.2070629894733429], [-0.032746560871601105, 0.581386923789978, 0.10178947448730469, -0.46454131603240967], [-0.021118823438882828, 0.7749342918395996, 0.09249865263700485, -0.7234851717948914], [-0.005620136857032776, 0.5786629915237427, 0.07802894711494446, -0.4031810164451599], [0.005953123327344656, 0.38252609968185425, 0.06996532529592514, -0.08695361763238907], [0.013603645376861095, 0.5765790343284607, 0.06822625547647476, -0.356767863035202], [0.025135226547718048, 0.7706680297851562, 0.06109089404344559, -0.6271810531616211], [0.04054858535528183, 0.5747489929199219, 0.048547275364398956, -0.31590116024017334], [0.05204356834292412, 0.37897035479545593, 0.04222925007343292, -0.00831189751625061], [0.05962297320365906, 0.5734620094299316, 0.04206301271915436, -0.28737762570381165], [0.07109221816062927, 0.3777662515640259, 0.03631545975804329, 0.018269281834363937], [0.07864753901958466, 0.18214282393455505, 0.03668084740638733, 0.32218536734580994], [0.0822903960943222, 0.3767237663269043, 0.04312455281615257, 0.041292037814855576], [0.0898248702287674, 0.5712016224861145, 0.0439503937959671, -0.23747886717319489], [0.10124890506267548, 0.3754802346229553, 0.03920081630349159, 0.0687369778752327], [0.10875850915908813, 0.17981883883476257, 0.040575556457042694, 0.3735256791114807], [0.11235488951206207, 0.37434160709381104, 0.04804607108235359, 0.09390762448310852], [0.11984171718358994, 0.1785651296377182, 0.049924224615097046, 0.4013535678386688], [0.12341301888227463, 0.372944712638855, 0.057951293885707855, 0.12481912225484848], [0.13087192177772522, 0.5671905875205994, 0.060447677969932556, -0.14903247356414795], [0.14221572875976562, 0.7613972425460815, 0.0574670284986496, -0.42204952239990234], [0.15744367241859436, 0.5655101537704468, 0.049026038497686386, -0.11181801557540894], [0.16875387728214264, 0.7598965764045715, 0.04678967595100403, -0.3886393904685974], [0.18395181000232697, 0.5641428232192993, 0.03901688754558563, -0.08157894760370255], [0.19523465633392334, 0.36848390102386475, 0.03738531097769737, 0.22315409779548645], [0.20260433852672577, 0.5630521178245544, 0.04184839129447937, -0.05750557407736778], [0.21386538445949554, 0.36735591292381287, 0.04069828242063522, 0.24808159470558167], [0.2212125062942505, 0.561873733997345, 0.04565991088747978, -0.031491514295339584], [0.2324499785900116, 0.36612772941589355, 0.04503008350729942, 0.27524080872535706], [0.23977252840995789, 0.1703931987285614, 0.050534896552562714, 0.5817793607711792], [0.24318039417266846, 0.3647720217704773, 0.06217048689723015, 0.3054342567920685], [0.25047582387924194, 0.5589554905891418, 0.06827916949987411, 0.032988179475069046], [0.26165494322776794, 0.36292415857315063, 0.06893893331289291, 0.3464084267616272], [0.2689134180545807, 0.16689278185367584, 0.07586710155010223, 0.6600090265274048], [0.27225127816200256, 0.3608815371990204, 0.08906728029251099, 0.392146497964859], [0.27946892380714417, 0.1646159440279007, 0.09691021591424942, 0.7115290760993958], [0.28276124596595764, 0.35827186703681946, 0.11114079505205154, 0.45085519552230835], [0.289926677942276, 0.5516608953475952, 0.12015789747238159, 0.19516955316066742], [0.30095988512039185, 0.7448774576187134, 0.12406128644943237, -0.05732409656047821], [0.3158574402332306, 0.5482152700424194, 0.12291480600833893, 0.2717825472354889], [0.3268217444419861, 0.7413884997367859, 0.12835045158863068, 0.02025480754673481], [0.34164950251579285, 0.9344584345817566, 0.12875555455684662, -0.2293364554643631], [0.3603386878967285, 1.1275278329849243, 0.12416882812976837, -0.478793740272522], [0.3828892409801483, 0.9308918118476868, 0.11459295451641083, -0.14969861507415771], [0.40150707960128784, 1.1242022514343262, 0.11159897595643997, -0.40414586663246155], [0.4239911139011383, 1.3175792694091797, 0.10351606458425522, -0.6596648693084717], [0.45034271478652954, 1.121180534362793, 0.09032276272773743, -0.3362644910812378], [0.47276630997657776, 0.9248971343040466, 0.08359747380018234, -0.016520662233233452], [0.4912642538547516, 1.1187268495559692, 0.08326706290245056, -0.28170090913772583], [0.5136387944221497, 0.9225220084190369, 0.07763304561376572, 0.03603893518447876], [0.5320892333984375, 1.1164498329162598, 0.07835382223129272, -0.23117542266845703], [0.5544182062149048, 1.3103697299957275, 0.07373031228780746, -0.498150497674942], [0.5806256532669067, 1.1142899990081787, 0.06376730650663376, -0.18317273259162903], [0.6029114127159119, 0.9183163046836853, 0.060103848576545715, 0.12892520427703857], [0.6212777495384216, 1.1125279664993286, 0.06268235296010971, -0.14420649409294128], [0.6435283422470093, 0.9165670275688171, 0.0597982220351696, 0.16757431626319885], [0.6618596315383911, 0.7206423282623291, 0.06314971297979355, 0.4785062074661255], [0.6762725114822388, 0.5246883630752563, 0.07271983474493027, 0.7904050350189209], [0.6867662668228149, 0.3286471664905548, 0.08852793276309967, 1.1050504446029663], [0.6933392286300659, 0.5225005745887756, 0.11062894016504288, 0.8414022326469421], [0.703789234161377, 0.7159525752067566, 0.12745699286460876, 0.5854567289352417], [0.7181082963943481, 0.5192974209785461, 0.13916611671447754, 0.9154176115989685], [0.7284942269325256, 0.71229088306427, 0.15747447311878204, 0.6695091128349304], [0.7427400350570679, 0.9049135446548462, 0.17086465656757355, 0.4302566647529602], [0.7608383297920227, 1.0972563028335571, 0.17946979403495789, 0.19593402743339539], [0.7827834486961365, 1.2894178628921509, 0.18338847160339355, -0.035197507590055466], [0.8085718154907227, 1.4815012216567993, 0.182684525847435, -0.26487645506858826], [0.8382018208503723, 1.2843058109283447, 0.17738698422908783, 0.07940544188022614], [0.8638879060745239, 1.0871431827545166, 0.17897510528564453, 0.4223873019218445], [0.8856307864189148, 0.8899970650672913, 0.18742284178733826, 0.7657210230827332], [0.9034307599067688, 1.082112193107605, 0.20273727178573608, 0.537375271320343]], "actions": [0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[-0.04159776121377945, -0.14747126400470734, -0.04317866638302803, 0.3271593451499939], [-0.0445471853017807, -0.34195274114608765, -0.03663548082113266, 0.6059190630912781], [-0.05138624086976051, -0.14633816480636597, -0.024517100304365158, 0.3019256591796875], [-0.05431300401687622, 0.04912448301911354, -0.01847858726978302, 0.0016125087859109044], [-0.05333051458001137, -0.14572764933109283, -0.018446337431669235, 0.28840842843055725], [-0.05624506622552872, 0.049652427434921265, -0.012678168714046478, -0.010034757666289806], [-0.05525201931595802, 0.24495388567447662, -0.012878863140940666, -0.30669069290161133], [-0.05035294219851494, 0.05001780018210411, -0.019012676551938057, -0.018097082152962685], [-0.04935258626937866, -0.14482639729976654, -0.01937461830675602, 0.26852700114250183], [-0.052249111235141754, 0.05056660994887352, -0.014004078693687916, -0.030203288421034813], [-0.05123778060078621, 0.24588656425476074, -0.014608144760131836, -0.32727155089378357], [-0.046320050954818726, 0.05097559839487076, -0.02115357480943203, -0.039230942726135254], [-0.04530053585767746, 0.24639439582824707, -0.02193819358944893, -0.33851224184036255], [-0.04037264734506607, 0.44182154536247253, -0.02870843932032585, -0.6380317211151123], [-0.03153621777892113, 0.24711142480373383, -0.04146907478570938, -0.3545260429382324], [-0.026593990623950958, 0.052602898329496384, -0.04855959489941597, -0.07520248740911484], [-0.02554193139076233, -0.1417904794216156, -0.05006364360451698, 0.20177295804023743], [-0.02837774157524109, -0.3361620306968689, -0.04602818563580513, 0.4782523810863495], [-0.03510098159313202, -0.14042147994041443, -0.036463137716054916, 0.17142504453659058], [-0.037909410893917084, 0.055202875286340714, -0.033034637570381165, -0.1325342357158661], [-0.03680535405874252, 0.2507820725440979, -0.03568532317876816, -0.4354533851146698], [-0.031789712607860565, 0.05618298798799515, -0.04439438879489899, -0.15422984957695007], [-0.030666053295135498, 0.25191155076026917, -0.04747898504137993, -0.46058109402656555], [-0.025627821683883667, 0.057491712272167206, -0.056690607219934464, -0.18323355913162231], [-0.024477986618876457, 0.2533770799636841, -0.060355279594659805, -0.4932476878166199], [-0.019410446286201477, 0.4492960274219513, -0.0702202320098877, -0.8043246865272522], [-0.01042452547699213, 0.2552034556865692, -0.08630672842264175, -0.5345311164855957], [-0.00532045541331172, 0.06139449030160904, -0.09699735045433044, -0.2702424228191376], [-0.0040925657376646996, -0.1322191208600998, -0.10240219533443451, -0.00965967122465372], [-0.006736948154866695, 0.06421098858118057, -0.10259538888931274, -0.3328149914741516], [-0.0054527283646166325, -0.1293124407529831, -0.10925169289112091, -0.07416639477014542], [-0.008038977161049843, -0.32271236181259155, -0.11073502153158188, 0.18214774131774902], [-0.014493224211037159, -0.516089916229248, -0.10709206759929657, 0.4379478991031647], [-0.024815022945404053, -0.7095460295677185, -0.09833310544490814, 0.6950446963310242], [-0.03900594264268875, -0.5132076144218445, -0.0844322144985199, 0.37309643626213074], [-0.04927009716629982, -0.3169941008090973, -0.07697028666734695, 0.05503101646900177], [-0.05560997873544693, -0.5109328627586365, -0.07586966454982758, 0.32247093319892883], [-0.06582863628864288, -0.3148171305656433, -0.06942024827003479, 0.006859300192445517], [-0.07212498039007187, -0.5088783502578735, -0.06928306072950363, 0.2768568694591522], [-0.08230254799127579, -0.31283989548683167, -0.06374592334032059, -0.036848291754722595], [-0.0885593444108963, -0.11686449497938156, -0.06448289006948471, -0.34894296526908875], [-0.09089663624763489, -0.3110128939151764, -0.0714617446064949, -0.07727043330669403], [-0.09711689502000809, -0.5050414800643921, -0.07300715893507004, 0.19203777611255646], [-0.10721772164106369, -0.30895519256591797, -0.069166399538517, -0.12275321036577225], [-0.11339682340621948, -0.5030215382575989, -0.07162146270275116, 0.1473315805196762], [-0.12345725297927856, -0.6970486640930176, -0.06867483258247375, 0.4165874123573303], [-0.13739822804927826, -0.8911335468292236, -0.06034308299422264, 0.6868539452552795], [-0.1552208960056305, -0.6952282190322876, -0.04660600423812866, 0.37580063939094543], [-0.16912546753883362, -0.4994763135910034, -0.03908999264240265, 0.06879448145627975], [-0.17911499738693237, -0.30381637811660767, -0.03771410137414932, -0.23596076667308807], [-0.1851913183927536, -0.49837976694107056, -0.04243331775069237, 0.04459148272871971], [-0.195158913731575, -0.6928683519363403, -0.041541486978530884, 0.32359012961387634], [-0.20901627838611603, -0.4971802830696106, -0.03506968542933464, 0.018101535737514496], [-0.21895988285541534, -0.30157339572906494, -0.034707654267549515, -0.285436749458313], [-0.2249913513660431, -0.10597408562898636, -0.04041638970375061, -0.5888610482215881], [-0.2271108329296112, 0.08968982100486755, -0.05219361186027527, -0.8939964175224304], [-0.22531704604625702, -0.1046869233250618, -0.07007353752851486, -0.6181662678718567], [-0.22741077840328217, 0.09134028106927872, -0.08243686705827713, -0.932070255279541], [-0.2255839705467224, 0.28747203946113586, -0.10107827186584473, -1.249477744102478], [-0.21983453631401062, 0.09378047287464142, -0.12606783211231232, -0.9900897741317749], [-0.21795892715454102, 0.290343701839447, -0.14586962759494781, -1.3195605278015137], [-0.21215204894542694, 0.09733562916517258, -0.1722608357667923, -1.0758568048477173], [-0.2102053314447403, -0.09514418989419937, -0.19377796351909637, -0.8418048620223999], [-0.21210822463035583, -0.2871682345867157, -0.21061407029628754, -0.6157745718955994], [0.026270000264048576, -0.18688899278640747, 0.0005288491956889629, 0.2975230813026428], [0.02253222092986107, 0.008225410245358944, 0.006479310803115368, 0.00500698434188962], [0.022696729749441147, -0.18698886036872864, 0.006579450331628323, 0.2997271418571472], [0.018956951797008514, -0.38220396637916565, 0.012573993764817715, 0.5944778323173523], [0.011312872171401978, -0.5774996280670166, 0.024463549256324768, 0.8910948038101196], [-0.0002371205628151074, -0.38271796703338623, 0.04228544607758522, 0.6062012910842896], [-0.007891479879617691, -0.18821200728416443, 0.05440947413444519, 0.32713139057159424], [-0.011655719950795174, 0.006094798911362886, 0.06095210090279579, 0.052090976387262344], [-0.011533823795616627, -0.18984577059745789, 0.06199391931295395, 0.3633648753166199], [-0.015330739319324493, 0.0043428149074316025, 0.06926121562719345, 0.09085608273744583], [-0.01524388324469328, 0.19840717315673828, 0.0710783377289772, -0.17919601500034332], [-0.011275739409029484, 0.002343872794881463, 0.06749441474676132, 0.13503579795360565], [-0.011228862218558788, 0.19643738865852356, 0.07019513100385666, -0.13561329245567322], [-0.007300114259123802, 0.3904873728752136, 0.06748286634683609, -0.4053509831428528], [0.0005096327513456345, 0.19447655975818634, 0.05937584862112999, -0.09217910468578339], [0.004399164114147425, 0.38869941234588623, 0.05753226578235626, -0.36555376648902893], [0.012173152528703213, 0.5829585790634155, 0.050221189856529236, -0.6395552754402161], [0.023832324892282486, 0.7773457169532776, 0.037430085241794586, -0.9160094857215881], [0.039379239082336426, 0.5817381143569946, 0.019109897315502167, -0.6118017435073853], [0.0510140024125576, 0.7765878438949585, 0.006873862352222204, -0.8984049558639526], [0.0665457546710968, 0.581373393535614, -0.011094237677752972, -0.6035693287849426], [0.07817322760820389, 0.38640835881233215, -0.02316562458872795, -0.31440141797065735], [0.08590139448642731, 0.19162394106388092, -0.02945365197956562, -0.029113247990608215], [0.08973387628793716, 0.3871556222438812, -0.030035916715860367, -0.33094167709350586], [0.09747698903083801, 0.19247381389141083, -0.0366547517478466, -0.047879911959171295], [0.10132645815610886, -0.002103887964040041, -0.037612348794937134, 0.2330165058374405], [0.10128438472747803, -0.19666878879070282, -0.032952018082141876, 0.5136020183563232], [0.09735100716352463, -0.0010986151173710823, -0.022679978981614113, 0.21071986854076385], [0.0973290354013443, -0.19588907063007355, -0.01846558041870594, 0.4961630702018738], [0.09341125190258026, -0.3907458186149597, -0.008542319759726524, 0.7829698324203491], [0.08559633791446686, -0.19550752639770508, 0.007117076311260462, 0.4876116216182709], [0.08168618381023407, -0.390729159116745, 0.016869308426976204, 0.7825290560722351], [0.07387160509824753, -0.19584308564662933, 0.03251989185810089, 0.49520087242126465], [0.06995474547147751, -0.0011944614816457033, 0.04242390766739845, 0.2129414826631546], [0.06993085145950317, 0.19329607486724854, 0.04668273776769638, -0.06606294214725494], [0.07379677146673203, 0.38771870732307434, 0.04536147788167, -0.3436594605445862], [0.08155114948749542, 0.19198179244995117, 0.03848829120397568, -0.0370243638753891], [0.08539078384637833, -0.003670350182801485, 0.03774780407547951, 0.2675492465496063], [0.08531738072633743, -0.19931012392044067, 0.04309878870844841, 0.5718950629234314], [0.08133117854595184, -0.004818175919353962, 0.054536689072847366, 0.293095201253891], [0.08123481273651123, -0.20067356526851654, 0.06039859354496002, 0.6024673581123352], [0.0772213414311409, -0.006446117535233498, 0.07244794070720673, 0.3294037878513336], [0.07709241658449173, -0.20252060890197754, 0.07903601974248886, 0.6440250873565674], [0.07304200530052185, -0.008583949878811836, 0.0919165164232254, 0.3772406280040741], [0.07287032902240753, 0.18512052297592163, 0.09946133196353912, 0.11489587277173996], [0.07657273858785629, 0.3786870837211609, 0.10175924748182297, -0.1448255330324173], [0.08414647728204727, 0.5722156763076782, 0.09886273741722107, -0.40375110507011414], [0.09559079259634018, 0.7658066749572754, 0.09078771620988846, -0.6637014150619507], [0.1109069287776947, 0.5695468783378601, 0.077513687312603, -0.3438691198825836], [0.12229786068201065, 0.3734126687049866, 0.07063630223274231, -0.027785036712884903], [0.12976612150669098, 0.17735257744789124, 0.07008060067892075, 0.2863215506076813], [0.1333131641149521, 0.37140873074531555, 0.07580703496932983, 0.016538653522729874], [0.14074134826660156, 0.565366268157959, 0.07613781094551086, -0.25129616260528564], [0.15204866230487823, 0.7593231201171875, 0.07111188769340515, -0.5190256237983704], [0.1672351360321045, 0.5632758140563965, 0.060731373727321625, -0.20480868220329285], [0.17850065231323242, 0.7574790716171265, 0.05663519725203514, -0.47773247957229614], [0.1936502307653427, 0.9517576098442078, 0.04708055034279823, -0.7520411610603333], [0.21268537640571594, 1.1461998224258423, 0.03203972801566124, -1.029544711112976], [0.23560938239097595, 1.340881109237671, 0.011448833160102367, -1.3119986057281494], [0.2624270021915436, 1.145616054534912, -0.014791140332818031, -1.0157544612884521], [0.2853393256664276, 1.340932011604309, -0.03510623052716255, -1.3130449056625366], [0.3121579587459564, 1.1462717056274414, -0.06136712431907654, -1.0315532684326172], [0.33508339524269104, 0.9520174264907837, -0.08199819177389145, -0.7587510347366333], [0.3541237413883209, 0.7581153512001038, -0.09717321395874023, -0.49295562505722046], [0.36928606033325195, 0.5644885897636414, -0.10703232884407043, -0.23240968585014343], [0.38057583570480347, 0.371045857667923, -0.1116805225610733, 0.024686511605978012], [0.38799673318862915, 0.5675775408744812, -0.11118678748607635, -0.30104029178619385], [0.39934828877449036, 0.3742014169692993, -0.1172075942158699, -0.045388881117105484], [0.4068323075771332, 0.570792019367218, -0.1181153729557991, -0.3726317584514618], [0.41824814677238464, 0.7673764824867249, -0.12556800246238708, -0.7000991106033325], [0.4335956871509552, 0.9639948606491089, -0.1395699828863144, -1.0295246839523315], [0.4528755843639374, 0.7709781527519226, -0.16016048192977905, -0.7837154865264893], [0.468295156955719, 0.9678959250450134, -0.1758347898721695, -1.1221979856491089], [0.48765307664871216, 0.7754600048065186, -0.1982787549495697, -0.8894243240356445], [0.5031622648239136, 0.5835006833076477, -0.21606723964214325, -0.6650396585464478], [-0.03558550775051117, 0.20733965933322906, 0.03291908651590347, -0.23389600217342377], [-0.031438715755939484, 0.011763193644583225, 0.028241164982318878, 0.0689862072467804], [-0.03120345063507557, 0.2064691185951233, 0.029620889574289322, -0.21465441584587097], [-0.027074068784713745, 0.01093648374080658, 0.02532779984176159, 0.08722313493490219], [-0.026855338364839554, 0.20568640530109406, 0.02707226388156414, -0.19736246764659882], [-0.022741610184311867, 0.010187894105911255, 0.02312501333653927, 0.10373611003160477], [-0.022537853568792343, 0.20497094094753265, 0.025199735537171364, -0.18156218528747559], [-0.01843843422830105, 0.009497631341218948, 0.02156849205493927, 0.1189626157283783], [-0.018248481675982475, -0.18592660129070282, 0.023947743698954582, 0.41837143898010254], [-0.02196701429784298, -0.3813795745372772, 0.032315172255039215, 0.7185068130493164], [-0.029594605788588524, -0.18671934306621552, 0.04668530821800232, 0.4361678957939148], [-0.03332899138331413, -0.3824700117111206, 0.05540866777300835, 0.7431944608688354], [-0.04097839072346687, -0.18815483152866364, 0.07027255743741989, 0.4684508144855499], [-0.04474148899316788, 0.005907649639993906, 0.07964157313108444, 0.19871868193149567], [-0.04462333768606186, -0.1902577430009842, 0.08361594378948212, 0.5154239535331726], [-0.0484284907579422, 0.0035933242179453373, 0.09392442554235458, 0.2502177357673645], [-0.04835662245750427, 0.19725725054740906, 0.0989287793636322, -0.011424563825130463], [-0.04441148042678833, 0.0008659533341415226, 0.09870028495788574, 0.31075966358184814], [-0.04439416155219078, 0.19445331394672394, 0.10491548478603363, 0.05076267570257187], [-0.04050509259104729, 0.3879266381263733, 0.10593073815107346, -0.2070629894733429], [-0.032746560871601105, 0.581386923789978, 0.10178947448730469, -0.46454131603240967], [-0.021118823438882828, 0.7749342918395996, 0.09249865263700485, -0.7234851717948914], [-0.005620136857032776, 0.5786629915237427, 0.07802894711494446, -0.4031810164451599], [0.005953123327344656, 0.38252609968185425, 0.06996532529592514, -0.08695361763238907], [0.013603645376861095, 0.5765790343284607, 0.06822625547647476, -0.356767863035202], [0.025135226547718048, 0.7706680297851562, 0.06109089404344559, -0.6271810531616211], [0.04054858535528183, 0.5747489929199219, 0.048547275364398956, -0.31590116024017334], [0.05204356834292412, 0.37897035479545593, 0.04222925007343292, -0.00831189751625061], [0.05962297320365906, 0.5734620094299316, 0.04206301271915436, -0.28737762570381165], [0.07109221816062927, 0.3777662515640259, 0.03631545975804329, 0.018269281834363937], [0.07864753901958466, 0.18214282393455505, 0.03668084740638733, 0.32218536734580994], [0.0822903960943222, 0.3767237663269043, 0.04312455281615257, 0.041292037814855576], [0.0898248702287674, 0.5712016224861145, 0.0439503937959671, -0.23747886717319489], [0.10124890506267548, 0.3754802346229553, 0.03920081630349159, 0.0687369778752327], [0.10875850915908813, 0.17981883883476257, 0.040575556457042694, 0.3735256791114807], [0.11235488951206207, 0.37434160709381104, 0.04804607108235359, 0.09390762448310852], [0.11984171718358994, 0.1785651296377182, 0.049924224615097046, 0.4013535678386688], [0.12341301888227463, 0.372944712638855, 0.057951293885707855, 0.12481912225484848], [0.13087192177772522, 0.5671905875205994, 0.060447677969932556, -0.14903247356414795], [0.14221572875976562, 0.7613972425460815, 0.0574670284986496, -0.42204952239990234], [0.15744367241859436, 0.5655101537704468, 0.049026038497686386, -0.11181801557540894], [0.16875387728214264, 0.7598965764045715, 0.04678967595100403, -0.3886393904685974], [0.18395181000232697, 0.5641428232192993, 0.03901688754558563, -0.08157894760370255], [0.19523465633392334, 0.36848390102386475, 0.03738531097769737, 0.22315409779548645], [0.20260433852672577, 0.5630521178245544, 0.04184839129447937, -0.05750557407736778], [0.21386538445949554, 0.36735591292381287, 0.04069828242063522, 0.24808159470558167], [0.2212125062942505, 0.561873733997345, 0.04565991088747978, -0.031491514295339584], [0.2324499785900116, 0.36612772941589355, 0.04503008350729942, 0.27524080872535706], [0.23977252840995789, 0.1703931987285614, 0.050534896552562714, 0.5817793607711792], [0.24318039417266846, 0.3647720217704773, 0.06217048689723015, 0.3054342567920685], [0.25047582387924194, 0.5589554905891418, 0.06827916949987411, 0.032988179475069046], [0.26165494322776794, 0.36292415857315063, 0.06893893331289291, 0.3464084267616272], [0.2689134180545807, 0.16689278185367584, 0.07586710155010223, 0.6600090265274048], [0.27225127816200256, 0.3608815371990204, 0.08906728029251099, 0.392146497964859], [0.27946892380714417, 0.1646159440279007, 0.09691021591424942, 0.7115290760993958], [0.28276124596595764, 0.35827186703681946, 0.11114079505205154, 0.45085519552230835], [0.289926677942276, 0.5516608953475952, 0.12015789747238159, 0.19516955316066742], [0.30095988512039185, 0.7448774576187134, 0.12406128644943237, -0.05732409656047821], [0.3158574402332306, 0.5482152700424194, 0.12291480600833893, 0.2717825472354889], [0.3268217444419861, 0.7413884997367859, 0.12835045158863068, 0.02025480754673481], [0.34164950251579285, 0.9344584345817566, 0.12875555455684662, -0.2293364554643631], [0.3603386878967285, 1.1275278329849243, 0.12416882812976837, -0.478793740272522], [0.3828892409801483, 0.9308918118476868, 0.11459295451641083, -0.14969861507415771], [0.40150707960128784, 1.1242022514343262, 0.11159897595643997, -0.40414586663246155], [0.4239911139011383, 1.3175792694091797, 0.10351606458425522, -0.6596648693084717], [0.45034271478652954, 1.121180534362793, 0.09032276272773743, -0.3362644910812378], [0.47276630997657776, 0.9248971343040466, 0.08359747380018234, -0.016520662233233452], [0.4912642538547516, 1.1187268495559692, 0.08326706290245056, -0.28170090913772583], [0.5136387944221497, 0.9225220084190369, 0.07763304561376572, 0.03603893518447876], [0.5320892333984375, 1.1164498329162598, 0.07835382223129272, -0.23117542266845703], [0.5544182062149048, 1.3103697299957275, 0.07373031228780746, -0.498150497674942], [0.5806256532669067, 1.1142899990081787, 0.06376730650663376, -0.18317273259162903], [0.6029114127159119, 0.9183163046836853, 0.060103848576545715, 0.12892520427703857], [0.6212777495384216, 1.1125279664993286, 0.06268235296010971, -0.14420649409294128], [0.6435283422470093, 0.9165670275688171, 0.0597982220351696, 0.16757431626319885], [0.6618596315383911, 0.7206423282623291, 0.06314971297979355, 0.4785062074661255], [0.6762725114822388, 0.5246883630752563, 0.07271983474493027, 0.7904050350189209], [0.6867662668228149, 0.3286471664905548, 0.08852793276309967, 1.1050504446029663], [0.6933392286300659, 0.5225005745887756, 0.11062894016504288, 0.8414022326469421], [0.703789234161377, 0.7159525752067566, 0.12745699286460876, 0.5854567289352417], [0.7181082963943481, 0.5192974209785461, 0.13916611671447754, 0.9154176115989685], [0.7284942269325256, 0.71229088306427, 0.15747447311878204, 0.6695091128349304], [0.7427400350570679, 0.9049135446548462, 0.17086465656757355, 0.4302566647529602], [0.7608383297920227, 1.0972563028335571, 0.17946979403495789, 0.19593402743339539], [0.7827834486961365, 1.2894178628921509, 0.18338847160339355, -0.035197507590055466], [0.8085718154907227, 1.4815012216567993, 0.182684525847435, -0.26487645506858826], [0.8382018208503723, 1.2843058109283447, 0.17738698422908783, 0.07940544188022614], [0.8638879060745239, 1.0871431827545166, 0.17897510528564453, 0.4223873019218445], [0.8856307864189148, 0.8899970650672913, 0.18742284178733826, 0.7657210230827332], [0.9034307599067688, 1.082112193107605, 0.20273727178573608, 0.537375271320343], [0.925072968006134, 0.8848037123680115, 0.2134847640991211, 0.8864735960960388]], "action_prob": [0.4831140637397766, 0.37746450304985046, 0.6516517996788025, 0.6204363107681274, 0.4986465573310852, 0.6180919408798218, 0.49714216589927673, 0.6207694411277771, 0.5107873678207397, 0.6114992499351501, 0.4844578206539154, 0.6266438364982605, 0.475750595331192, 0.3690272271633148, 0.6541916728019714, 0.6382954716682434, 0.5566278696060181, 0.42506054043769836, 0.6405121088027954, 0.5664094090461731, 0.42181316018104553, 0.6488502621650696, 0.40805214643478394, 0.6526894569396973, 0.3926132321357727, 0.34378287196159363, 0.6525338888168335, 0.659909188747406, 0.6422709226608276, 0.438944935798645, 0.653675377368927, 0.5942734479904175, 0.4740460515022278, 0.3853282928466797, 0.6447737216949463, 0.6036368608474731, 0.5263593196868896, 0.5905382037162781, 0.5477102398872375, 0.5765588879585266, 0.43375474214553833, 0.6547590494155884, 0.5869402885437012, 0.5396824479103088, 0.603703498840332, 0.48070865869522095, 0.3856007158756256, 0.6476362943649292, 0.6103057265281677, 0.49623796343803406, 0.6275830268859863, 0.5158237814903259, 0.5988963842391968, 0.4758412837982178, 0.36332952976226807, 0.3354473114013672, 0.6532625555992126, 0.3335592746734619, 0.34824827313423157, 0.6306302547454834, 0.3509894013404846, 0.6263396143913269, 0.6444087624549866, 0.6638405919075012, 0.505584180355072, 0.6152550578117371, 0.5025634169578552, 0.38249725103378296, 0.3486858606338501, 0.6472265720367432, 0.6538005471229553, 0.6354761719703674, 0.4506644606590271, 0.6433363556861877, 0.5724892020225525, 0.5566145181655884, 0.5915884971618652, 0.46510928869247437, 0.6251282095909119, 0.48341992497444153, 0.381584495306015, 0.35046467185020447, 0.6497114896774292, 0.3489014208316803, 0.6507982015609741, 0.6534093618392944, 0.626724362373352, 0.4734559655189514, 0.6325168609619141, 0.5411427617073059, 0.41126251220703125, 0.6448618173599243, 0.4156773090362549, 0.3552040755748749, 0.6496280431747437, 0.35287830233573914, 0.6503018736839294, 0.6506761908531189, 0.6062444448471069, 0.4834114909172058, 0.620596170425415, 0.5048676133155823, 0.37879645824432373, 0.6549662947654724, 0.3683663010597229, 0.6566122174263, 0.35739484429359436, 0.6575278639793396, 0.652747392654419, 0.5964385867118835, 0.4765106737613678, 0.3843725025653839, 0.647902250289917, 0.6053903698921204, 0.4767177402973175, 0.6388875842094421, 0.5474919676780701, 0.4249090850353241, 0.6378570795059204, 0.43760597705841064, 0.36531195044517517, 0.34556978940963745, 0.3462353050708771, 0.6465410590171814, 0.34503617882728577, 0.646252453327179, 0.6549944281578064, 0.661456286907196, 0.659179151058197, 0.6309515237808228, 0.4514853358268738, 0.6470419764518738, 0.4143373966217041, 0.3415989577770233, 0.33519071340560913, 0.6526923179626465, 0.33685868978500366, 0.6474295854568481, 0.6585854887962341, 0.5409071445465088, 0.589931845664978, 0.550007164478302, 0.5834970474243164, 0.5579493045806885, 0.5773042440414429, 0.5650012493133545, 0.5712703466415405, 0.4286031424999237, 0.3531875014305115, 0.6537330150604248, 0.34821075201034546, 0.6538121104240417, 0.6568766236305237, 0.377886563539505, 0.6599932312965393, 0.6391614675521851, 0.4487888813018799, 0.6512924432754517, 0.5841100811958313, 0.46165236830711365, 0.37931984663009644, 0.6472312808036804, 0.6123211979866028, 0.5071690678596497, 0.3973366618156433, 0.6451205015182495, 0.5964123010635376, 0.5340707898139954, 0.5897553563117981, 0.4563610851764679, 0.644859254360199, 0.5565038919448853, 0.5725938677787781, 0.4335569143295288, 0.6521941423416138, 0.4201970398426056, 0.656433641910553, 0.5949394106864929, 0.4693882167339325, 0.6211320161819458, 0.48125961422920227, 0.616777777671814, 0.5098077654838562, 0.6181442737579346, 0.4985472857952118, 0.6247530579566956, 0.48593127727508545, 0.36849501729011536, 0.6641499400138855, 0.6410602331161499, 0.44904935359954834, 0.3510410785675049, 0.66587233543396, 0.3419203460216522, 0.6661285161972046, 0.6661813855171204, 0.6255596876144409, 0.47038576006889343, 0.6437833905220032, 0.564194917678833, 0.4582917094230652, 0.6147869229316711, 0.48520123958587646, 0.3996855914592743, 0.6425869464874268, 0.5877131819725037, 0.5265395045280457, 0.5741183757781982, 0.5432370901107788, 0.4396804869174957, 0.626073956489563, 0.5499580502510071, 0.5664677619934082, 0.5385702252388, 0.4234970211982727, 0.34840819239616394, 0.32942745089530945, 0.6611632704734802, 0.6722466945648193, 0.33243799209594727, 0.6725718379020691, 0.6738916039466858, 0.6539572477340698, 0.6043853759765625, 0.5305467844009399, 0.5442366600036621, 0.43584370613098145, 0.3532716631889343, 0.6773198843002319, 0.3373884856700897], "advantages": [36.2447624206543, 35.997066497802734, 35.96256637573242, 34.90070724487305, 34.17264175415039, 33.832969665527344, 33.09205627441406, 32.69356155395508, 32.08399963378906, 31.714210510253906, 30.969186782836914, 30.576709747314453, 29.934858322143555, 29.565893173217773, 29.546489715576172, 28.72989845275879, 28.116792678833008, 27.74763298034668, 27.615116119384766, 26.56014060974121, 25.904239654541016, 25.66071319580078, 24.958332061767578, 24.783123016357422, 24.101177215576172, 24.013425827026367, 24.302846908569336, 23.59832000732422, 23.066497802734375, 22.760332107543945, 22.607999801635742, 22.32196044921875, 22.24661636352539, 22.298036575317383, 22.336402893066406, 21.153541564941406, 20.269746780395508, 20.081148147583008, 19.219987869262695, 18.953826904296875, 18.113557815551758, 17.668262481689453, 17.227487564086914, 16.890968322753906, 16.166297912597656, 15.779576301574707, 15.391071319580078, 14.897308349609375, 13.675190925598145, 12.596246719360352, 11.780536651611328, 11.142011642456055, 10.519749641418457, 9.444140434265137, 8.621695518493652, 8.07107925415039, 7.7076849937438965, 7.181106090545654, 6.880003929138184, 6.578182220458984, 6.516676425933838, 6.164999008178711, 6.364455223083496, 6.546551704406738, 42.51231002807617, 42.22963333129883, 41.487300872802734, 41.182071685791016, 41.11277389526367, 41.1988525390625, 39.7299919128418, 38.53096389770508, 37.63894271850586, 37.23960494995117, 36.316749572753906, 35.67002487182617, 35.0528564453125, 34.377498626708984, 33.93736267089844, 33.155555725097656, 32.69844055175781, 32.45730972290039, 32.425872802734375, 31.420331954956055, 31.459766387939453, 30.500436782836914, 29.672826766967773, 29.013341903686523, 28.680814743041992, 28.012418746948242, 27.542329788208008, 27.278705596923828, 26.313535690307617, 26.003738403320312, 25.87782859802246, 24.554035186767578, 24.368579864501953, 23.012845993041992, 21.93654441833496, 21.129980087280273, 20.570499420166016, 19.70549201965332, 19.046707153320312, 18.589357376098633, 17.44980239868164, 16.965078353881836, 15.801480293273926, 15.292823791503906, 14.111288070678711, 13.136889457702637, 12.329071998596191, 11.662016868591309, 11.128570556640625, 10.048476219177246, 9.10805892944336, 8.302454948425293, 7.425912857055664, 6.676381587982178, 6.048098564147949, 5.016467571258545, 4.371492385864258, 3.860898733139038, 3.5025861263275146, 3.3103976249694824, 2.0961360931396484, 2.0255212783813477, 0.8799968361854553, -0.21363385021686554, -1.2411999702453613, -2.1847684383392334, -3.022258996963501, -3.4837570190429688, -4.328895092010498, -4.677290916442871, -4.681040287017822, -4.40980339050293, -5.181405544281006, -4.754636287689209, -5.23646879196167, 48.614681243896484, 48.19743728637695, 47.71570587158203, 47.283138275146484, 46.81161880493164, 46.36342239379883, 45.8988037109375, 45.43461227416992, 44.97422409057617, 44.745811462402344, 44.72406768798828, 43.60731887817383, 43.54581832885742, 42.413108825683594, 41.54303741455078, 41.247100830078125, 40.36058044433594, 39.68783950805664, 39.214290618896484, 38.51984786987305, 37.98438262939453, 37.58343505859375, 37.311492919921875, 36.4926872253418, 35.812278747558594, 35.385555267333984, 35.090457916259766, 34.321346282958984, 33.67337417602539, 33.22504425048828, 32.58034896850586, 32.052032470703125, 31.431669235229492, 30.940771102905273, 30.291513442993164, 29.751907348632812, 29.094093322753906, 28.544477462768555, 27.864856719970703, 27.297517776489258, 26.836990356445312, 26.083309173583984, 25.609466552734375, 24.858366012573242, 24.199495315551758, 23.58293342590332, 22.916141510009766, 22.27823829650879, 21.603273391723633, 21.013938903808594, 20.227243423461914, 19.537715911865234, 18.843996047973633, 18.227678298950195, 17.401880264282227, 16.770118713378906, 15.926481246948242, 15.157439231872559, 14.444673538208008, 13.669590950012207, 12.93069076538086, 12.236034393310547, 11.587924003601074, 10.708131790161133, 10.037031173706055, 9.420587539672852, 8.490174293518066, 7.613265037536621, 6.905394554138184, 6.022566318511963, 5.293800354003906, 4.619964122772217, 3.678194046020508, 2.7786223888397217, 2.014737844467163, 1.102739930152893, 0.225285604596138, -0.6208505034446716, -1.436601996421814, -2.4381182193756104, -3.392970561981201, -4.278507232666016, -5.257473945617676, -6.207446098327637, -7.136166095733643, -8.04660701751709, -8.938042640686035, -9.97353458404541, -10.984552383422852, -11.977559089660645, -12.986820220947266], "value_targets": [47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 969587050, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334, 76431334], "obs": [[0.04396471753716469, 0.039110057055950165, 0.024596597999334335, 0.010587934404611588], [0.044746916741132736, 0.23387078940868378, 0.024808356538414955, -0.2742341160774231], [0.04942433536052704, 0.03840380907058716, 0.019323673099279404, 0.026169029995799065], [0.05019240826368332, 0.23324339091777802, 0.019847054034471512, -0.2603549659252167], [0.0548572763800621, 0.037843819707632065, 0.014639955013990402, 0.038521308451890945], [0.055614154785871506, 0.23275281488895416, 0.015410381369292736, -0.2495068460702896], [0.06026921048760414, 0.03741421550512314, 0.010420244187116623, 0.04799672216176987], [0.06101749464869499, 0.23238520324230194, 0.011380178853869438, -0.24138039350509644], [0.06566520035266876, 0.4273427724838257, 0.006552570965141058, -0.5304520726203918], [0.07421205192804337, 0.2321292608976364, -0.004056470934301615, -0.23571167886257172], [0.07885464280843735, 0.42730891704559326, -0.00877070426940918, -0.5296713709831238], [0.08740081638097763, 0.2323114573955536, -0.01936413161456585, -0.2397649586200714], [0.09204705059528351, 0.03747139871120453, -0.02415943145751953, 0.04674762487411499], [0.09279647469520569, -0.15729594230651855, -0.0232244785875082, 0.33171120285987854], [0.08965055644512177, 0.03814876079559326, -0.01659025438129902, 0.03179582580924034], [0.09041353315114975, -0.15673139691352844, -0.015954338014125824, 0.31919851899147034], [0.08727890253067017, -0.3516225218772888, -0.009570367634296417, 0.6068076491355896], [0.0802464559674263, -0.15636809170246124, 0.0025657855439931154, 0.3111257553100586], [0.07711908966302872, -0.35152649879455566, 0.008788300678133965, 0.6046167612075806], [0.07008855789899826, -0.1565285474061966, 0.02088063582777977, 0.31471481919288635], [0.066957987844944, 0.038289837539196014, 0.0271749310195446, 0.028689419850707054], [0.06772378832101822, 0.23301175236701965, 0.027748720720410347, -0.25529715418815613], [0.07238402217626572, 0.03750482574105263, 0.022642776370048523, 0.04600740224123001], [0.07313411682844162, -0.15793436765670776, 0.023562924936413765, 0.3457474410533905], [0.06997542828321457, 0.03684461861848831, 0.030477873980998993, 0.06058693677186966], [0.07071232050657272, -0.15870076417922974, 0.031689614057540894, 0.36272791028022766], [0.0675383061170578, 0.03595678508281708, 0.038944169878959656, 0.08020336180925369], [0.06825744360685349, 0.23049944639205933, 0.04054823890328407, -0.1999426782131195], [0.07286743074655533, 0.03482172638177872, 0.03654938563704491, 0.10525055974721909], [0.07356386631727219, 0.2294013500213623, 0.0386543944478035, -0.17568083107471466], [0.0781518965959549, 0.42394939064979553, 0.03514077886939049, -0.4559233486652374], [0.08663088083267212, 0.618557333946228, 0.02602231130003929, -0.7373257875442505], [0.09900202602148056, 0.4230858385562897, 0.011275796219706535, -0.43656811118125916], [0.10746374726295471, 0.22780610620975494, 0.0025444338098168373, -0.14035211503505707], [0.1120198667049408, 0.032647814601659775, -0.0002626085188239813, 0.15313245356082916], [0.1126728281378746, 0.227773517370224, 0.0028000404126942158, -0.13963331282138824], [0.11722829192876816, 0.4228552579879761, 7.374198503384832e-06, -0.4314315617084503], [0.12568539381027222, 0.22773320972919464, -0.008621256798505783, -0.13874630630016327], [0.1302400678396225, 0.03273578733205795, -0.01139618270099163, 0.15120433270931244], [0.13089478015899658, -0.16222114861011505, -0.008372096344828606, 0.440270334482193], [0.12765035033226013, 0.033018287271261215, 0.0004333099932409823, 0.14496007561683655], [0.12831072509288788, -0.1621098667383194, 0.0033325115218758583, 0.43777966499328613], [0.1250685304403305, 0.03296475484967232, 0.012088105082511902, 0.14614912867546082], [0.1257278174161911, -0.16232819855213165, 0.015011087991297245, 0.4426209628582001], [0.12248125672340393, 0.032578159123659134, 0.02386350743472576, 0.15470746159553528], [0.12313281744718552, 0.22735044360160828, 0.02695765718817711, -0.13035257160663605], [0.12767982482910156, 0.4220760762691498, 0.02435060404241085, -0.4144102931022644], [0.13612134754657745, 0.22661758959293365, 0.016062399372458458, -0.11415112018585205], [0.14065369963645935, 0.03126920759677887, 0.01377937663346529, 0.18355579674243927], [0.14127908647060394, 0.22619131207466125, 0.017450492829084396, -0.10474859923124313], [0.14580291509628296, 0.030823687091469765, 0.015355520881712437, 0.19338840246200562], [0.14641939103603363, 0.22572265565395355, 0.01922328770160675, -0.09441123157739639], [0.15093384683132172, 0.03033052757382393, 0.017335064709186554, 0.20427410304546356], [0.15154044330120087, 0.2252003401517868, 0.021420545876026154, -0.08289044350385666], [0.15604445338249207, 0.4200087785720825, 0.019762737676501274, -0.36873891949653625], [0.16444462537765503, 0.6148444414138794, 0.012387959286570549, -0.6551254391670227], [0.17674152553081512, 0.8097917437553406, -0.0007145503186620772, -0.9438819885253906], [0.19293735921382904, 1.0049233436584473, -0.01959219016134739, -1.236789345741272], [0.21303582191467285, 0.8100585341453552, -0.044327978044748306, -0.9503080248832703], [0.22923699021339417, 0.6155603528022766, -0.0633341372013092, -0.671875536441803], [0.24154819548130035, 0.4213733375072479, -0.07677164673805237, -0.3997867703437805], [0.24997566640377045, 0.617495596408844, -0.08476738631725311, -0.715652346611023], [0.26232558488845825, 0.8136821985244751, -0.09908042848110199, -1.0337674617767334], [0.27859923243522644, 0.6200074553489685, -0.11975578218698502, -0.7737621068954468], [0.2909993827342987, 0.8165555000305176, -0.13523101806640625, -1.101596713066101], [0.30733048915863037, 0.6234465837478638, -0.15726295113563538, -0.8542147278785706], [0.31979942321777344, 0.43077731132507324, -0.17434725165367126, -0.6148222088813782], [0.3284149467945099, 0.2384648472070694, -0.18664368987083435, -0.3817255198955536], [0.33318427205085754, 0.43567854166030884, -0.19427821040153503, -0.7269636392593384], [0.3418978154659271, 0.24369728565216064, -0.2088174819946289, -0.501168429851532], [-0.01654447242617607, -0.04988615959882736, -0.029269184917211533, 0.01102899294346571], [-0.017542196437716484, -0.24457639455795288, -0.029048604890704155, 0.29433533549308777], [-0.022433724254369736, -0.439272403717041, -0.02316189929842949, 0.5777170658111572], [-0.03121917136013508, -0.6340622305870056, -0.011607557535171509, 0.8630144000053406], [-0.04390041530132294, -0.4387841522693634, 0.005652730818837881, 0.566704511642456], [-0.05267610028386116, -0.2437419593334198, 0.016986820846796036, 0.27580779790878296], [-0.05755093693733215, -0.048866428434848785, 0.022502977401018143, -0.01146943960338831], [-0.058528266847133636, 0.14592568576335907, 0.022273588925600052, -0.29696834087371826], [-0.055609751492738724, -0.04950657859444618, 0.01633422262966633, 0.002655260032042861], [-0.05659988522529602, 0.14537735283374786, 0.016387326642870903, -0.28482958674430847], [-0.05369233712553978, 0.3402617871761322, 0.010690735653042793, -0.5722993612289429], [-0.0468871034681797, 0.5352322459220886, -0.000755251559894532, -0.8615952730178833], [-0.0361824557185173, 0.3401205539703369, -0.01798715628683567, -0.569149911403656], [-0.02938004583120346, 0.535490095615387, -0.029370155185461044, -0.8674447536468506], [-0.01867024414241314, 0.3407798707485199, -0.04671904817223549, -0.5841389298439026], [-0.011854646727442741, 0.1463424414396286, -0.05840182676911354, -0.3065314292907715], [-0.00892779789865017, -0.04790077731013298, -0.06453245878219604, -0.03282373026013374], [-0.009885813109576702, -0.24204079806804657, -0.065188929438591, 0.23882077634334564], [-0.014726629480719566, -0.04605107009410858, -0.060412514954805374, -0.07369136065244675], [-0.015647651627659798, -0.24025724828243256, -0.061886344105005264, 0.1993359923362732], [-0.020452795550227165, -0.4344419836997986, -0.05789962410926819, 0.4718725085258484], [-0.029141634702682495, -0.6287003755569458, -0.04846217483282089, 0.7457588315010071], [-0.04171564429998398, -0.8231213092803955, -0.033546995371580124, 1.0228055715560913], [-0.058178067207336426, -0.6275689005851746, -0.013090885244309902, 0.7197810411453247], [-0.07072944939136505, -0.43226832151412964, 0.0013047355460003018, 0.4230066239833832], [-0.07937481254339218, -0.23716488480567932, 0.009764867834746838, 0.13073530793190002], [-0.08411811292171478, -0.04218415915966034, 0.012379574589431286, -0.1588509976863861], [-0.08496179431676865, 0.15275838971138, 0.009202554821968079, -0.44760289788246155], [-0.08190662413835526, -0.04249252378940582, 0.0002504963194951415, -0.15203343331813812], [-0.08275647461414337, -0.23761805891990662, -0.002790172351524234, 0.14072851836681366], [-0.08750883489847183, -0.042456261813640594, 2.439801028231159e-05, -0.15283335745334625], [-0.08835796266794205, -0.23757855594158173, -0.00303226918913424, 0.13985726237297058], [-0.09310953319072723, -0.4326569437980652, -0.00023512383631896228, 0.4315820336341858], [-0.10176267474889755, -0.23753167688846588, 0.008396516554057598, 0.13882498443126678], [-0.10651330649852753, -0.042530983686447144, 0.011173016391694546, -0.15119719505310059], [-0.10736392438411713, -0.2378111183643341, 0.008149072527885437, 0.14498953521251678], [-0.11212015151977539, -0.04280681908130646, 0.011048862710595131, -0.14511141180992126], [-0.11297628283500671, 0.15215517580509186, 0.008146634325385094, -0.43428826332092285], [-0.10993318259716034, -0.04308116063475609, -0.0005391302402131259, -0.13904838263988495], [-0.1107948049902916, 0.1520485132932663, -0.0033200979232788086, -0.43190133571624756], [-0.10775383561849594, 0.347217321395874, -0.011958125047385693, -0.7256290316581726], [-0.1008094921708107, 0.15226274728775024, -0.02647070586681366, -0.4367336928844452], [-0.09776423126459122, -0.04247470200061798, -0.035205379128456116, -0.1525113433599472], [-0.09861373156309128, 0.15313319861888885, -0.03825560584664345, -0.45608964562416077], [-0.09555106610059738, -0.04142758622765541, -0.04737740010023117, -0.1757063865661621], [-0.09637961536645889, -0.23584061861038208, -0.05089152604341507, 0.10166217386722565], [-0.10109642893075943, -0.04002765193581581, -0.04885828495025635, -0.20663264393806458], [-0.1018969789147377, -0.234418123960495, -0.05299093574285507, 0.07024648785591125], [-0.10658534616231918, -0.038578081876039505, -0.051586005836725235, -0.23867326974868774], [-0.10735690593719482, -0.23292657732963562, -0.05635947361588478, 0.03730212152004242], [-0.11201544106006622, -0.4271969497203827, -0.055613428354263306, 0.3116840422153473], [-0.12055937945842743, -0.6214842796325684, -0.04937974736094475, 0.5863226056098938], [-0.1329890638589859, -0.42570677399635315, -0.03765329718589783, 0.27850255370140076], [-0.1415031999349594, -0.23006847500801086, -0.03208324685692787, -0.025814369320869446], [-0.1461045742034912, -0.03450145944952965, -0.03259953111410141, -0.32844477891921997], [-0.14679460227489471, -0.22914451360702515, -0.039168428629636765, -0.04621788114309311], [-0.15137748420238495, -0.033483441919088364, -0.04009278491139412, -0.3509969711303711], [-0.15204715728759766, -0.22801296412944794, -0.04711272567510605, -0.07122128456830978], [-0.15660741925239563, -0.4224289357662201, -0.04853715002536774, 0.20623306930065155], [-0.1650559902191162, -0.22664771974086761, -0.04441248998045921, -0.10135722905397415], [-0.16958895325660706, -0.030918341130018234, -0.04643963277339935, -0.40771475434303284], [-0.17020732164382935, -0.22535210847854614, -0.054593928158283234, -0.1300269067287445], [-0.1747143566608429, -0.41965121030807495, -0.05719446763396263, 0.1449449062347412], [-0.1831073760986328, -0.22375881671905518, -0.05429556965827942, -0.1652192324399948], [-0.18758255243301392, -0.4180631935596466, -0.057599954307079315, 0.10985276848077774], [-0.19594381749629974, -0.6123144626617432, -0.05540289729833603, 0.38382142782211304], [-0.20819011330604553, -0.41645148396492004, -0.04772647097706795, 0.07419763505458832], [-0.21651914715766907, -0.22067897021770477, -0.04624251648783684, -0.23315301537513733], [-0.2209327220916748, -0.4151107370853424, -0.05090557783842087, 0.04459240287542343], [-0.22923493385314941, -0.6094671487808228, -0.05001372843980789, 0.3207896053791046], [-0.24142427742481232, -0.41366997361183167, -0.04359793663024902, 0.012763150036334991], [-0.24969768524169922, -0.6081404089927673, -0.043342676013708115, 0.2913779318332672], [-0.2618604898452759, -0.8026184439659119, -0.03751511499285698, 0.5700821876525879], [-0.27791285514831543, -0.6069909930229187, -0.026113472878932953, 0.2658206522464752], [-0.2900526821613312, -0.8017306923866272, -0.020797058939933777, 0.5501541495323181], [-0.30608728528022766, -0.996554434299469, -0.009793976321816444, 0.836212694644928], [-0.326018363237381, -0.8013001084327698, 0.0069302767515182495, 0.5404658317565918], [-0.3420443832874298, -0.6062762141227722, 0.017739592120051384, 0.24997453391551971], [-0.35416990518569946, -0.8016469478607178, 0.02273908443748951, 0.5481997132301331], [-0.37020283937454224, -0.9970808625221252, 0.03370307758450508, 0.8479594588279724], [-0.3901444673538208, -0.8024344444274902, 0.050662267953157425, 0.5660624504089355], [-0.4061931371688843, -0.6080584526062012, 0.061983514577150345, 0.28976088762283325], [-0.418354332447052, -0.8040069937705994, 0.06777873635292053, 0.6013307571411133], [-0.4344344735145569, -0.6098953485488892, 0.07980534434318542, 0.33074355125427246], [-0.44663235545158386, -0.8060572743415833, 0.0864202156662941, 0.6474877595901489], [-0.4627535045146942, -0.612238883972168, 0.09936997294425964, 0.3832210898399353], [-0.4749982953071594, -0.4186578691005707, 0.10703439265489578, 0.12344873696565628], [-0.48337143659591675, -0.22521919012069702, 0.109503373503685, -0.13364072144031525], [-0.4878758192062378, -0.03182226046919823, 0.10683055967092514, -0.38986891508102417], [-0.4885122776031494, 0.16163408756256104, 0.0990331768989563, -0.6470506191253662], [-0.4852795898914337, -0.03471804037690163, 0.08609216660261154, -0.3248973488807678], [-0.48597395420074463, -0.23095357418060303, 0.0795942172408104, -0.006354403216391802], [-0.4905930161476135, -0.42712146043777466, 0.07946713268756866, 0.31034183502197266], [-0.49913546442985535, -0.23321634531021118, 0.08567396551370621, 0.04374082386493683], [-0.5037997961044312, -0.03942074626684189, 0.08654878288507462, -0.2207290232181549], [-0.5045881867408752, -0.23566633462905884, 0.0821342021226883, 0.09795112907886505], [-0.5093015432357788, -0.041811730712652206, 0.08409322798252106, -0.1677302122116089], [-0.5101377367973328, 0.15201212465763092, 0.0807386189699173, -0.4327443242073059], [-0.5070975422859192, -0.04415460675954819, 0.0720837339758873, -0.11574140191078186], [-0.5079805850982666, 0.14986443519592285, 0.06976890563964844, -0.3848399221897125], [-0.5049833059310913, 0.34393009543418884, 0.062072109431028366, -0.6547347903251648], [-0.4981047213077545, 0.14800134301185608, 0.04897741228342056, -0.343170166015625], [-0.49514469504356384, -0.04778192937374115, 0.04211400821805, -0.03545382246375084], [-0.4961003363132477, -0.24348171055316925, 0.041404932737350464, 0.27021342515945435], [-0.5009699463844299, -0.439169317483902, 0.04680920019745827, 0.5756627917289734], [-0.5097533464431763, -0.24473370611667633, 0.05832245573401451, 0.2980857789516449], [-0.5146480202674866, -0.050489529967308044, 0.06428417563438416, 0.02435198426246643], [-0.5156578421592712, 0.14365443587303162, 0.06477121263742447, -0.24737593531608582], [-0.5127847194671631, -0.052329882979393005, 0.059823691844940186, 0.06501353532075882], [-0.5138313174247742, 0.14188560843467712, 0.061123963445425034, -0.20821087062358856], [-0.5109935998916626, 0.33608269691467285, 0.05695974826812744, -0.4810032546520233], [-0.5042719841003418, 0.14020492136478424, 0.047339681535959244, -0.17092597484588623], [-0.5014678835868835, -0.05556151270866394, 0.04392116144299507, 0.13630735874176025], [-0.5025790929794312, 0.13890472054481506, 0.04664731025695801, -0.14220201969146729], [-0.49980098009109497, 0.33332863450050354, 0.04380326718091965, -0.41981130838394165], [-0.49313440918922424, 0.5278034210205078, 0.03540704399347305, -0.6983696818351746], [-0.4825783669948578, 0.33220890164375305, 0.021439649164676666, -0.39475423097610474], [-0.4759341776371002, 0.13678939640522003, 0.013544565066695213, -0.09538957476615906], [-0.47319838404655457, 0.3317146301269531, 0.011636773124337196, -0.38376861810684204], [-0.4665640890598297, 0.526669442653656, 0.003961400594562292, -0.6727598905563354], [-0.4560306966304779, 0.33149266242980957, -0.009493797086179256, -0.3788323700428009], [-0.4494008421897888, 0.5267481207847595, -0.01707044430077076, -0.6744935512542725], [-0.43886590003967285, 0.331867516040802, -0.030560316517949104, -0.3872336745262146], [-0.43222853541374207, 0.5274096727371216, -0.03830498829483986, -0.6893932819366455], [-0.42168036103248596, 0.7230416536331177, -0.05209285393357277, -0.9938849210739136], [-0.4072194993495941, 0.5286538600921631, -0.07197055220603943, -0.7180070877075195], [-0.3966464400291443, 0.33459773659706116, -0.08633069694042206, -0.44881758093833923], [-0.38995447754859924, 0.1407962441444397, -0.09530704468488693, -0.18454766273498535], [-0.3871385455131531, 0.33714351058006287, -0.09899800270795822, -0.5057098269462585], [-0.38039568066596985, 0.5335109233856201, -0.1091121956706047, -0.8278766870498657], [-0.36972546577453613, 0.7299420833587646, -0.12566973268985748, -1.1527864933013916], [-0.35512661933898926, 0.5366631746292114, -0.1487254649400711, -0.9020042419433594], [-0.34439337253570557, 0.3438350260257721, -0.16676554083824158, -0.6595192551612854], [-0.3375166654586792, 0.15137822926044464, -0.17995592951774597, -0.423641175031662], [-0.334489107131958, -0.040799111127853394, -0.18842875957489014, -0.19265216588974], [-0.3353050649166107, -0.2327960878610611, -0.1922817975282669, 0.0351749025285244], [-0.3399609923362732, -0.4247153103351593, -0.19157829880714417, 0.2615651786327362], [-0.3484553098678589, -0.22744859755039215, -0.18634699285030365, -0.08490147441625595], [-0.3530042767524719, -0.03021228313446045, -0.18804502487182617, -0.43010348081588745], [-0.35360851883888245, -0.22224323451519012, -0.19664709270000458, -0.20209486782550812], [-0.35805338621139526, -0.41408902406692505, -0.20068898797035217, 0.022685380652546883], [-0.3663351833820343, -0.6058520078659058, -0.2002352774143219, 0.24594934284687042], [-0.37845221161842346, -0.797635018825531, -0.19531629979610443, 0.46939948201179504], [-0.39440491795539856, -0.9895393252372742, -0.1859283149242401, 0.6947242021560669], [-0.4141956865787506, -0.7923919558525085, -0.17203381657600403, 0.3497513234615326], [-0.4300435483455658, -0.9847031235694885, -0.1650387942790985, 0.5836310982704163], [-0.4497376084327698, -0.7877007126808167, -0.15336617827415466, 0.24384133517742157], [-0.4654916226863861, -0.980337381362915, -0.1484893560409546, 0.48449164628982544], [-0.48509836196899414, -0.7834662199020386, -0.1387995183467865, 0.14893893897533417], [-0.500767707824707, -0.5866578221321106, -0.13582073152065277, -0.18411074578762054], [-0.5125008225440979, -0.7796013951301575, -0.13950295746326447, 0.06283064186573029], [-0.5280928611755371, -0.5827836394309998, -0.1382463425397873, -0.2704089283943176], [-0.5397485494613647, -0.7756898403167725, -0.14365451037883759, -0.02432538941502571], [-0.5552623271942139, -0.9684907793998718, -0.14414101839065552, 0.2198077291250229], [-0.5746321678161621, -1.1612896919250488, -0.13974487781524658, 0.46377620100975037], [-0.5978579521179199, -0.9644982218742371, -0.13046935200691223, 0.1305151730775833], [-0.6171479225158691, -0.7677721381187439, -0.12785904109477997, -0.20031526684761047], [-0.63250333070755, -0.9608556032180786, -0.13186535239219666, 0.04945755377411842], [-0.6517204642295837, -1.1538643836975098, -0.13087619841098785, 0.2978011667728424], [-0.674797773361206, -0.9571433067321777, -0.12492017447948456, -0.033124782145023346], [-0.6939406394958496, -1.150273084640503, -0.12558266520500183, 0.21768134832382202], [-0.7169460654258728, -0.9536004662513733, -0.12122904509305954, -0.11182858794927597], [-0.7360181212425232, -1.1467955112457275, -0.12346561253070831, 0.14028306305408478], [-0.7589539885520935, -1.339952826499939, -0.1206599548459053, 0.3916066288948059], [-0.785753071308136, -1.1433435678482056, -0.11282782256603241, 0.06344900280237198], [-0.8086199164390564, -1.3366822004318237, -0.11155883967876434, 0.318511962890625], [-0.8353535532951355, -1.1401628255844116, -0.10518860071897507, -0.007165013812482357], [-0.8581568598747253, -1.3336312770843506, -0.1053319051861763, 0.25056520104408264], [-0.8848294615745544, -1.5271037817001343, -0.10032059997320175, 0.5082550644874573], [-0.9153715372085571, -1.3307220935821533, -0.09015549719333649, 0.1857188194990158], [-0.9419859647750854, -1.134433627128601, -0.08644112199544907, -0.1339879333972931], [-0.9646746516227722, -0.9381866455078125, -0.08912087976932526, -0.4526413083076477], [-0.9834383726119995, -1.1319427490234375, -0.09817370772361755, -0.18932747840881348], [-1.0060772895812988, -1.3255330324172974, -0.10196025669574738, 0.07084308564662933], [-1.0325878858566284, -1.5190566778182983, -0.10054339468479156, 0.32969650626182556], [-1.0629689693450928, -1.3226579427719116, -0.09394945949316025, 0.007076171226799488], [-1.0894222259521484, -1.1263229846954346, -0.09380793571472168, -0.3137080669403076], [-1.1119486093521118, -1.3199920654296875, -0.10008209943771362, -0.05202072113752365], [-1.1383484601974487, -1.5135471820831299, -0.10112251341342926, 0.20748400688171387], [-1.1686193943023682, -1.707088589668274, -0.09697283059358597, 0.46663379669189453], [-1.202761173248291, -1.9007163047790527, -0.08764015883207321, 0.7272454500198364], [-1.2407755851745605, -1.7044990062713623, -0.07309524714946747, 0.40831589698791504], [-1.2748655080795288, -1.5084209442138672, -0.06492893397808075, 0.09351323544979095], [-1.3050339221954346, -1.7025550603866577, -0.06305866688489914, 0.3650251626968384], [-1.3390849828720093, -1.8967268466949463, -0.05575816333293915, 0.6371769309043884], [-1.3770195245742798, -1.7008734941482544, -0.04301462322473526, 0.3274690508842468], [-1.4110370874404907, -1.5051664113998413, -0.03646524250507355, 0.021537531167268753], [-1.4411404132843018, -1.3095409870147705, -0.03603449463844299, -0.2824239134788513], [-1.4673311710357666, -1.5041309595108032, -0.04168296977877617, -0.0013203497510403395], [-1.4974137544631958, -1.6986310482025146, -0.041709378361701965, 0.27792519330978394], [-1.531386375427246, -1.8931338787078857, -0.03615087643265724, 0.5571667551994324], [-1.569249153137207, -1.697523593902588, -0.025007540360093117, 0.2533169388771057], [-1.6031996011734009, -1.8922797441482544, -0.01994120143353939, 0.5380083322525024], [-1.6410452127456665, -1.696883201599121, -0.009181033819913864, 0.23910945653915405], [-1.6749827861785889, -1.891872763633728, -0.004398845136165619, 0.5288823246955872], [-1.712820291519165, -2.08693265914917, 0.006178801413625479, 0.8201759457588196], [-1.7545589208602905, -1.8918956518173218, 0.022582320496439934, 0.5294427871704102], [-1.792396903038025, -2.0873279571533203, 0.03317117691040039, 0.8291550278663635], [-1.8341434001922607, -1.8926748037338257, 0.04975427687168121, 0.5470864772796631], [-1.8719968795776367, -1.6982858180999756, 0.06069600582122803, 0.27048563957214355]], "actions": [1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[0.044746916741132736, 0.23387078940868378, 0.024808356538414955, -0.2742341160774231], [0.04942433536052704, 0.03840380907058716, 0.019323673099279404, 0.026169029995799065], [0.05019240826368332, 0.23324339091777802, 0.019847054034471512, -0.2603549659252167], [0.0548572763800621, 0.037843819707632065, 0.014639955013990402, 0.038521308451890945], [0.055614154785871506, 0.23275281488895416, 0.015410381369292736, -0.2495068460702896], [0.06026921048760414, 0.03741421550512314, 0.010420244187116623, 0.04799672216176987], [0.06101749464869499, 0.23238520324230194, 0.011380178853869438, -0.24138039350509644], [0.06566520035266876, 0.4273427724838257, 0.006552570965141058, -0.5304520726203918], [0.07421205192804337, 0.2321292608976364, -0.004056470934301615, -0.23571167886257172], [0.07885464280843735, 0.42730891704559326, -0.00877070426940918, -0.5296713709831238], [0.08740081638097763, 0.2323114573955536, -0.01936413161456585, -0.2397649586200714], [0.09204705059528351, 0.03747139871120453, -0.02415943145751953, 0.04674762487411499], [0.09279647469520569, -0.15729594230651855, -0.0232244785875082, 0.33171120285987854], [0.08965055644512177, 0.03814876079559326, -0.01659025438129902, 0.03179582580924034], [0.09041353315114975, -0.15673139691352844, -0.015954338014125824, 0.31919851899147034], [0.08727890253067017, -0.3516225218772888, -0.009570367634296417, 0.6068076491355896], [0.0802464559674263, -0.15636809170246124, 0.0025657855439931154, 0.3111257553100586], [0.07711908966302872, -0.35152649879455566, 0.008788300678133965, 0.6046167612075806], [0.07008855789899826, -0.1565285474061966, 0.02088063582777977, 0.31471481919288635], [0.066957987844944, 0.038289837539196014, 0.0271749310195446, 0.028689419850707054], [0.06772378832101822, 0.23301175236701965, 0.027748720720410347, -0.25529715418815613], [0.07238402217626572, 0.03750482574105263, 0.022642776370048523, 0.04600740224123001], [0.07313411682844162, -0.15793436765670776, 0.023562924936413765, 0.3457474410533905], [0.06997542828321457, 0.03684461861848831, 0.030477873980998993, 0.06058693677186966], [0.07071232050657272, -0.15870076417922974, 0.031689614057540894, 0.36272791028022766], [0.0675383061170578, 0.03595678508281708, 0.038944169878959656, 0.08020336180925369], [0.06825744360685349, 0.23049944639205933, 0.04054823890328407, -0.1999426782131195], [0.07286743074655533, 0.03482172638177872, 0.03654938563704491, 0.10525055974721909], [0.07356386631727219, 0.2294013500213623, 0.0386543944478035, -0.17568083107471466], [0.0781518965959549, 0.42394939064979553, 0.03514077886939049, -0.4559233486652374], [0.08663088083267212, 0.618557333946228, 0.02602231130003929, -0.7373257875442505], [0.09900202602148056, 0.4230858385562897, 0.011275796219706535, -0.43656811118125916], [0.10746374726295471, 0.22780610620975494, 0.0025444338098168373, -0.14035211503505707], [0.1120198667049408, 0.032647814601659775, -0.0002626085188239813, 0.15313245356082916], [0.1126728281378746, 0.227773517370224, 0.0028000404126942158, -0.13963331282138824], [0.11722829192876816, 0.4228552579879761, 7.374198503384832e-06, -0.4314315617084503], [0.12568539381027222, 0.22773320972919464, -0.008621256798505783, -0.13874630630016327], [0.1302400678396225, 0.03273578733205795, -0.01139618270099163, 0.15120433270931244], [0.13089478015899658, -0.16222114861011505, -0.008372096344828606, 0.440270334482193], [0.12765035033226013, 0.033018287271261215, 0.0004333099932409823, 0.14496007561683655], [0.12831072509288788, -0.1621098667383194, 0.0033325115218758583, 0.43777966499328613], [0.1250685304403305, 0.03296475484967232, 0.012088105082511902, 0.14614912867546082], [0.1257278174161911, -0.16232819855213165, 0.015011087991297245, 0.4426209628582001], [0.12248125672340393, 0.032578159123659134, 0.02386350743472576, 0.15470746159553528], [0.12313281744718552, 0.22735044360160828, 0.02695765718817711, -0.13035257160663605], [0.12767982482910156, 0.4220760762691498, 0.02435060404241085, -0.4144102931022644], [0.13612134754657745, 0.22661758959293365, 0.016062399372458458, -0.11415112018585205], [0.14065369963645935, 0.03126920759677887, 0.01377937663346529, 0.18355579674243927], [0.14127908647060394, 0.22619131207466125, 0.017450492829084396, -0.10474859923124313], [0.14580291509628296, 0.030823687091469765, 0.015355520881712437, 0.19338840246200562], [0.14641939103603363, 0.22572265565395355, 0.01922328770160675, -0.09441123157739639], [0.15093384683132172, 0.03033052757382393, 0.017335064709186554, 0.20427410304546356], [0.15154044330120087, 0.2252003401517868, 0.021420545876026154, -0.08289044350385666], [0.15604445338249207, 0.4200087785720825, 0.019762737676501274, -0.36873891949653625], [0.16444462537765503, 0.6148444414138794, 0.012387959286570549, -0.6551254391670227], [0.17674152553081512, 0.8097917437553406, -0.0007145503186620772, -0.9438819885253906], [0.19293735921382904, 1.0049233436584473, -0.01959219016134739, -1.236789345741272], [0.21303582191467285, 0.8100585341453552, -0.044327978044748306, -0.9503080248832703], [0.22923699021339417, 0.6155603528022766, -0.0633341372013092, -0.671875536441803], [0.24154819548130035, 0.4213733375072479, -0.07677164673805237, -0.3997867703437805], [0.24997566640377045, 0.617495596408844, -0.08476738631725311, -0.715652346611023], [0.26232558488845825, 0.8136821985244751, -0.09908042848110199, -1.0337674617767334], [0.27859923243522644, 0.6200074553489685, -0.11975578218698502, -0.7737621068954468], [0.2909993827342987, 0.8165555000305176, -0.13523101806640625, -1.101596713066101], [0.30733048915863037, 0.6234465837478638, -0.15726295113563538, -0.8542147278785706], [0.31979942321777344, 0.43077731132507324, -0.17434725165367126, -0.6148222088813782], [0.3284149467945099, 0.2384648472070694, -0.18664368987083435, -0.3817255198955536], [0.33318427205085754, 0.43567854166030884, -0.19427821040153503, -0.7269636392593384], [0.3418978154659271, 0.24369728565216064, -0.2088174819946289, -0.501168429851532], [0.346771776676178, 0.052035655826330185, -0.2188408374786377, -0.28086838126182556], [-0.017542196437716484, -0.24457639455795288, -0.029048604890704155, 0.29433533549308777], [-0.022433724254369736, -0.439272403717041, -0.02316189929842949, 0.5777170658111572], [-0.03121917136013508, -0.6340622305870056, -0.011607557535171509, 0.8630144000053406], [-0.04390041530132294, -0.4387841522693634, 0.005652730818837881, 0.566704511642456], [-0.05267610028386116, -0.2437419593334198, 0.016986820846796036, 0.27580779790878296], [-0.05755093693733215, -0.048866428434848785, 0.022502977401018143, -0.01146943960338831], [-0.058528266847133636, 0.14592568576335907, 0.022273588925600052, -0.29696834087371826], [-0.055609751492738724, -0.04950657859444618, 0.01633422262966633, 0.002655260032042861], [-0.05659988522529602, 0.14537735283374786, 0.016387326642870903, -0.28482958674430847], [-0.05369233712553978, 0.3402617871761322, 0.010690735653042793, -0.5722993612289429], [-0.0468871034681797, 0.5352322459220886, -0.000755251559894532, -0.8615952730178833], [-0.0361824557185173, 0.3401205539703369, -0.01798715628683567, -0.569149911403656], [-0.02938004583120346, 0.535490095615387, -0.029370155185461044, -0.8674447536468506], [-0.01867024414241314, 0.3407798707485199, -0.04671904817223549, -0.5841389298439026], [-0.011854646727442741, 0.1463424414396286, -0.05840182676911354, -0.3065314292907715], [-0.00892779789865017, -0.04790077731013298, -0.06453245878219604, -0.03282373026013374], [-0.009885813109576702, -0.24204079806804657, -0.065188929438591, 0.23882077634334564], [-0.014726629480719566, -0.04605107009410858, -0.060412514954805374, -0.07369136065244675], [-0.015647651627659798, -0.24025724828243256, -0.061886344105005264, 0.1993359923362732], [-0.020452795550227165, -0.4344419836997986, -0.05789962410926819, 0.4718725085258484], [-0.029141634702682495, -0.6287003755569458, -0.04846217483282089, 0.7457588315010071], [-0.04171564429998398, -0.8231213092803955, -0.033546995371580124, 1.0228055715560913], [-0.058178067207336426, -0.6275689005851746, -0.013090885244309902, 0.7197810411453247], [-0.07072944939136505, -0.43226832151412964, 0.0013047355460003018, 0.4230066239833832], [-0.07937481254339218, -0.23716488480567932, 0.009764867834746838, 0.13073530793190002], [-0.08411811292171478, -0.04218415915966034, 0.012379574589431286, -0.1588509976863861], [-0.08496179431676865, 0.15275838971138, 0.009202554821968079, -0.44760289788246155], [-0.08190662413835526, -0.04249252378940582, 0.0002504963194951415, -0.15203343331813812], [-0.08275647461414337, -0.23761805891990662, -0.002790172351524234, 0.14072851836681366], [-0.08750883489847183, -0.042456261813640594, 2.439801028231159e-05, -0.15283335745334625], [-0.08835796266794205, -0.23757855594158173, -0.00303226918913424, 0.13985726237297058], [-0.09310953319072723, -0.4326569437980652, -0.00023512383631896228, 0.4315820336341858], [-0.10176267474889755, -0.23753167688846588, 0.008396516554057598, 0.13882498443126678], [-0.10651330649852753, -0.042530983686447144, 0.011173016391694546, -0.15119719505310059], [-0.10736392438411713, -0.2378111183643341, 0.008149072527885437, 0.14498953521251678], [-0.11212015151977539, -0.04280681908130646, 0.011048862710595131, -0.14511141180992126], [-0.11297628283500671, 0.15215517580509186, 0.008146634325385094, -0.43428826332092285], [-0.10993318259716034, -0.04308116063475609, -0.0005391302402131259, -0.13904838263988495], [-0.1107948049902916, 0.1520485132932663, -0.0033200979232788086, -0.43190133571624756], [-0.10775383561849594, 0.347217321395874, -0.011958125047385693, -0.7256290316581726], [-0.1008094921708107, 0.15226274728775024, -0.02647070586681366, -0.4367336928844452], [-0.09776423126459122, -0.04247470200061798, -0.035205379128456116, -0.1525113433599472], [-0.09861373156309128, 0.15313319861888885, -0.03825560584664345, -0.45608964562416077], [-0.09555106610059738, -0.04142758622765541, -0.04737740010023117, -0.1757063865661621], [-0.09637961536645889, -0.23584061861038208, -0.05089152604341507, 0.10166217386722565], [-0.10109642893075943, -0.04002765193581581, -0.04885828495025635, -0.20663264393806458], [-0.1018969789147377, -0.234418123960495, -0.05299093574285507, 0.07024648785591125], [-0.10658534616231918, -0.038578081876039505, -0.051586005836725235, -0.23867326974868774], [-0.10735690593719482, -0.23292657732963562, -0.05635947361588478, 0.03730212152004242], [-0.11201544106006622, -0.4271969497203827, -0.055613428354263306, 0.3116840422153473], [-0.12055937945842743, -0.6214842796325684, -0.04937974736094475, 0.5863226056098938], [-0.1329890638589859, -0.42570677399635315, -0.03765329718589783, 0.27850255370140076], [-0.1415031999349594, -0.23006847500801086, -0.03208324685692787, -0.025814369320869446], [-0.1461045742034912, -0.03450145944952965, -0.03259953111410141, -0.32844477891921997], [-0.14679460227489471, -0.22914451360702515, -0.039168428629636765, -0.04621788114309311], [-0.15137748420238495, -0.033483441919088364, -0.04009278491139412, -0.3509969711303711], [-0.15204715728759766, -0.22801296412944794, -0.04711272567510605, -0.07122128456830978], [-0.15660741925239563, -0.4224289357662201, -0.04853715002536774, 0.20623306930065155], [-0.1650559902191162, -0.22664771974086761, -0.04441248998045921, -0.10135722905397415], [-0.16958895325660706, -0.030918341130018234, -0.04643963277339935, -0.40771475434303284], [-0.17020732164382935, -0.22535210847854614, -0.054593928158283234, -0.1300269067287445], [-0.1747143566608429, -0.41965121030807495, -0.05719446763396263, 0.1449449062347412], [-0.1831073760986328, -0.22375881671905518, -0.05429556965827942, -0.1652192324399948], [-0.18758255243301392, -0.4180631935596466, -0.057599954307079315, 0.10985276848077774], [-0.19594381749629974, -0.6123144626617432, -0.05540289729833603, 0.38382142782211304], [-0.20819011330604553, -0.41645148396492004, -0.04772647097706795, 0.07419763505458832], [-0.21651914715766907, -0.22067897021770477, -0.04624251648783684, -0.23315301537513733], [-0.2209327220916748, -0.4151107370853424, -0.05090557783842087, 0.04459240287542343], [-0.22923493385314941, -0.6094671487808228, -0.05001372843980789, 0.3207896053791046], [-0.24142427742481232, -0.41366997361183167, -0.04359793663024902, 0.012763150036334991], [-0.24969768524169922, -0.6081404089927673, -0.043342676013708115, 0.2913779318332672], [-0.2618604898452759, -0.8026184439659119, -0.03751511499285698, 0.5700821876525879], [-0.27791285514831543, -0.6069909930229187, -0.026113472878932953, 0.2658206522464752], [-0.2900526821613312, -0.8017306923866272, -0.020797058939933777, 0.5501541495323181], [-0.30608728528022766, -0.996554434299469, -0.009793976321816444, 0.836212694644928], [-0.326018363237381, -0.8013001084327698, 0.0069302767515182495, 0.5404658317565918], [-0.3420443832874298, -0.6062762141227722, 0.017739592120051384, 0.24997453391551971], [-0.35416990518569946, -0.8016469478607178, 0.02273908443748951, 0.5481997132301331], [-0.37020283937454224, -0.9970808625221252, 0.03370307758450508, 0.8479594588279724], [-0.3901444673538208, -0.8024344444274902, 0.050662267953157425, 0.5660624504089355], [-0.4061931371688843, -0.6080584526062012, 0.061983514577150345, 0.28976088762283325], [-0.418354332447052, -0.8040069937705994, 0.06777873635292053, 0.6013307571411133], [-0.4344344735145569, -0.6098953485488892, 0.07980534434318542, 0.33074355125427246], [-0.44663235545158386, -0.8060572743415833, 0.0864202156662941, 0.6474877595901489], [-0.4627535045146942, -0.612238883972168, 0.09936997294425964, 0.3832210898399353], [-0.4749982953071594, -0.4186578691005707, 0.10703439265489578, 0.12344873696565628], [-0.48337143659591675, -0.22521919012069702, 0.109503373503685, -0.13364072144031525], [-0.4878758192062378, -0.03182226046919823, 0.10683055967092514, -0.38986891508102417], [-0.4885122776031494, 0.16163408756256104, 0.0990331768989563, -0.6470506191253662], [-0.4852795898914337, -0.03471804037690163, 0.08609216660261154, -0.3248973488807678], [-0.48597395420074463, -0.23095357418060303, 0.0795942172408104, -0.006354403216391802], [-0.4905930161476135, -0.42712146043777466, 0.07946713268756866, 0.31034183502197266], [-0.49913546442985535, -0.23321634531021118, 0.08567396551370621, 0.04374082386493683], [-0.5037997961044312, -0.03942074626684189, 0.08654878288507462, -0.2207290232181549], [-0.5045881867408752, -0.23566633462905884, 0.0821342021226883, 0.09795112907886505], [-0.5093015432357788, -0.041811730712652206, 0.08409322798252106, -0.1677302122116089], [-0.5101377367973328, 0.15201212465763092, 0.0807386189699173, -0.4327443242073059], [-0.5070975422859192, -0.04415460675954819, 0.0720837339758873, -0.11574140191078186], [-0.5079805850982666, 0.14986443519592285, 0.06976890563964844, -0.3848399221897125], [-0.5049833059310913, 0.34393009543418884, 0.062072109431028366, -0.6547347903251648], [-0.4981047213077545, 0.14800134301185608, 0.04897741228342056, -0.343170166015625], [-0.49514469504356384, -0.04778192937374115, 0.04211400821805, -0.03545382246375084], [-0.4961003363132477, -0.24348171055316925, 0.041404932737350464, 0.27021342515945435], [-0.5009699463844299, -0.439169317483902, 0.04680920019745827, 0.5756627917289734], [-0.5097533464431763, -0.24473370611667633, 0.05832245573401451, 0.2980857789516449], [-0.5146480202674866, -0.050489529967308044, 0.06428417563438416, 0.02435198426246643], [-0.5156578421592712, 0.14365443587303162, 0.06477121263742447, -0.24737593531608582], [-0.5127847194671631, -0.052329882979393005, 0.059823691844940186, 0.06501353532075882], [-0.5138313174247742, 0.14188560843467712, 0.061123963445425034, -0.20821087062358856], [-0.5109935998916626, 0.33608269691467285, 0.05695974826812744, -0.4810032546520233], [-0.5042719841003418, 0.14020492136478424, 0.047339681535959244, -0.17092597484588623], [-0.5014678835868835, -0.05556151270866394, 0.04392116144299507, 0.13630735874176025], [-0.5025790929794312, 0.13890472054481506, 0.04664731025695801, -0.14220201969146729], [-0.49980098009109497, 0.33332863450050354, 0.04380326718091965, -0.41981130838394165], [-0.49313440918922424, 0.5278034210205078, 0.03540704399347305, -0.6983696818351746], [-0.4825783669948578, 0.33220890164375305, 0.021439649164676666, -0.39475423097610474], [-0.4759341776371002, 0.13678939640522003, 0.013544565066695213, -0.09538957476615906], [-0.47319838404655457, 0.3317146301269531, 0.011636773124337196, -0.38376861810684204], [-0.4665640890598297, 0.526669442653656, 0.003961400594562292, -0.6727598905563354], [-0.4560306966304779, 0.33149266242980957, -0.009493797086179256, -0.3788323700428009], [-0.4494008421897888, 0.5267481207847595, -0.01707044430077076, -0.6744935512542725], [-0.43886590003967285, 0.331867516040802, -0.030560316517949104, -0.3872336745262146], [-0.43222853541374207, 0.5274096727371216, -0.03830498829483986, -0.6893932819366455], [-0.42168036103248596, 0.7230416536331177, -0.05209285393357277, -0.9938849210739136], [-0.4072194993495941, 0.5286538600921631, -0.07197055220603943, -0.7180070877075195], [-0.3966464400291443, 0.33459773659706116, -0.08633069694042206, -0.44881758093833923], [-0.38995447754859924, 0.1407962441444397, -0.09530704468488693, -0.18454766273498535], [-0.3871385455131531, 0.33714351058006287, -0.09899800270795822, -0.5057098269462585], [-0.38039568066596985, 0.5335109233856201, -0.1091121956706047, -0.8278766870498657], [-0.36972546577453613, 0.7299420833587646, -0.12566973268985748, -1.1527864933013916], [-0.35512661933898926, 0.5366631746292114, -0.1487254649400711, -0.9020042419433594], [-0.34439337253570557, 0.3438350260257721, -0.16676554083824158, -0.6595192551612854], [-0.3375166654586792, 0.15137822926044464, -0.17995592951774597, -0.423641175031662], [-0.334489107131958, -0.040799111127853394, -0.18842875957489014, -0.19265216588974], [-0.3353050649166107, -0.2327960878610611, -0.1922817975282669, 0.0351749025285244], [-0.3399609923362732, -0.4247153103351593, -0.19157829880714417, 0.2615651786327362], [-0.3484553098678589, -0.22744859755039215, -0.18634699285030365, -0.08490147441625595], [-0.3530042767524719, -0.03021228313446045, -0.18804502487182617, -0.43010348081588745], [-0.35360851883888245, -0.22224323451519012, -0.19664709270000458, -0.20209486782550812], [-0.35805338621139526, -0.41408902406692505, -0.20068898797035217, 0.022685380652546883], [-0.3663351833820343, -0.6058520078659058, -0.2002352774143219, 0.24594934284687042], [-0.37845221161842346, -0.797635018825531, -0.19531629979610443, 0.46939948201179504], [-0.39440491795539856, -0.9895393252372742, -0.1859283149242401, 0.6947242021560669], [-0.4141956865787506, -0.7923919558525085, -0.17203381657600403, 0.3497513234615326], [-0.4300435483455658, -0.9847031235694885, -0.1650387942790985, 0.5836310982704163], [-0.4497376084327698, -0.7877007126808167, -0.15336617827415466, 0.24384133517742157], [-0.4654916226863861, -0.980337381362915, -0.1484893560409546, 0.48449164628982544], [-0.48509836196899414, -0.7834662199020386, -0.1387995183467865, 0.14893893897533417], [-0.500767707824707, -0.5866578221321106, -0.13582073152065277, -0.18411074578762054], [-0.5125008225440979, -0.7796013951301575, -0.13950295746326447, 0.06283064186573029], [-0.5280928611755371, -0.5827836394309998, -0.1382463425397873, -0.2704089283943176], [-0.5397485494613647, -0.7756898403167725, -0.14365451037883759, -0.02432538941502571], [-0.5552623271942139, -0.9684907793998718, -0.14414101839065552, 0.2198077291250229], [-0.5746321678161621, -1.1612896919250488, -0.13974487781524658, 0.46377620100975037], [-0.5978579521179199, -0.9644982218742371, -0.13046935200691223, 0.1305151730775833], [-0.6171479225158691, -0.7677721381187439, -0.12785904109477997, -0.20031526684761047], [-0.63250333070755, -0.9608556032180786, -0.13186535239219666, 0.04945755377411842], [-0.6517204642295837, -1.1538643836975098, -0.13087619841098785, 0.2978011667728424], [-0.674797773361206, -0.9571433067321777, -0.12492017447948456, -0.033124782145023346], [-0.6939406394958496, -1.150273084640503, -0.12558266520500183, 0.21768134832382202], [-0.7169460654258728, -0.9536004662513733, -0.12122904509305954, -0.11182858794927597], [-0.7360181212425232, -1.1467955112457275, -0.12346561253070831, 0.14028306305408478], [-0.7589539885520935, -1.339952826499939, -0.1206599548459053, 0.3916066288948059], [-0.785753071308136, -1.1433435678482056, -0.11282782256603241, 0.06344900280237198], [-0.8086199164390564, -1.3366822004318237, -0.11155883967876434, 0.318511962890625], [-0.8353535532951355, -1.1401628255844116, -0.10518860071897507, -0.007165013812482357], [-0.8581568598747253, -1.3336312770843506, -0.1053319051861763, 0.25056520104408264], [-0.8848294615745544, -1.5271037817001343, -0.10032059997320175, 0.5082550644874573], [-0.9153715372085571, -1.3307220935821533, -0.09015549719333649, 0.1857188194990158], [-0.9419859647750854, -1.134433627128601, -0.08644112199544907, -0.1339879333972931], [-0.9646746516227722, -0.9381866455078125, -0.08912087976932526, -0.4526413083076477], [-0.9834383726119995, -1.1319427490234375, -0.09817370772361755, -0.18932747840881348], [-1.0060772895812988, -1.3255330324172974, -0.10196025669574738, 0.07084308564662933], [-1.0325878858566284, -1.5190566778182983, -0.10054339468479156, 0.32969650626182556], [-1.0629689693450928, -1.3226579427719116, -0.09394945949316025, 0.007076171226799488], [-1.0894222259521484, -1.1263229846954346, -0.09380793571472168, -0.3137080669403076], [-1.1119486093521118, -1.3199920654296875, -0.10008209943771362, -0.05202072113752365], [-1.1383484601974487, -1.5135471820831299, -0.10112251341342926, 0.20748400688171387], [-1.1686193943023682, -1.707088589668274, -0.09697283059358597, 0.46663379669189453], [-1.202761173248291, -1.9007163047790527, -0.08764015883207321, 0.7272454500198364], [-1.2407755851745605, -1.7044990062713623, -0.07309524714946747, 0.40831589698791504], [-1.2748655080795288, -1.5084209442138672, -0.06492893397808075, 0.09351323544979095], [-1.3050339221954346, -1.7025550603866577, -0.06305866688489914, 0.3650251626968384], [-1.3390849828720093, -1.8967268466949463, -0.05575816333293915, 0.6371769309043884], [-1.3770195245742798, -1.7008734941482544, -0.04301462322473526, 0.3274690508842468], [-1.4110370874404907, -1.5051664113998413, -0.03646524250507355, 0.021537531167268753], [-1.4411404132843018, -1.3095409870147705, -0.03603449463844299, -0.2824239134788513], [-1.4673311710357666, -1.5041309595108032, -0.04168296977877617, -0.0013203497510403395], [-1.4974137544631958, -1.6986310482025146, -0.041709378361701965, 0.27792519330978394], [-1.531386375427246, -1.8931338787078857, -0.03615087643265724, 0.5571667551994324], [-1.569249153137207, -1.697523593902588, -0.025007540360093117, 0.2533169388771057], [-1.6031996011734009, -1.8922797441482544, -0.01994120143353939, 0.5380083322525024], [-1.6410452127456665, -1.696883201599121, -0.009181033819913864, 0.23910945653915405], [-1.6749827861785889, -1.891872763633728, -0.004398845136165619, 0.5288823246955872], [-1.712820291519165, -2.08693265914917, 0.006178801413625479, 0.8201759457588196], [-1.7545589208602905, -1.8918956518173218, 0.022582320496439934, 0.5294427871704102], [-1.792396903038025, -2.0873279571533203, 0.03317117691040039, 0.8291550278663635], [-1.8341434001922607, -1.8926748037338257, 0.04975427687168121, 0.5470864772796631], [-1.8719968795776367, -1.6982858180999756, 0.06069600582122803, 0.27048563957214355], [-1.905962586402893, -1.5040801763534546, 0.06610572338104248, -0.002452741377055645]], "action_prob": [0.5249334573745728, 0.6855826377868652, 0.5337754487991333, 0.6818234920501709, 0.5396736264228821, 0.6794508695602417, 0.5429192185401917, 0.3215319514274597, 0.7543482780456543, 0.31118038296699524, 0.7576514482498169, 0.7035927176475525, 0.5121743679046631, 0.6914016604423523, 0.5190887451171875, 0.31039541959762573, 0.7535455226898193, 0.30114781856536865, 0.756508469581604, 0.7126927971839905, 0.5378842949867249, 0.6773438453674316, 0.4506838023662567, 0.7256978750228882, 0.4255852699279785, 0.7347291111946106, 0.6037964224815369, 0.6251339316368103, 0.6226971745491028, 0.39305004477500916, 0.2661568820476532, 0.7576315402984619, 0.7392891645431519, 0.6217226982116699, 0.6166462898254395, 0.3773752450942993, 0.7434046864509583, 0.6367747187614441, 0.4028984606266022, 0.7345330119132996, 0.39603549242019653, 0.7381044030189514, 0.38268938660621643, 0.743035078048706, 0.6364037394523621, 0.4062120020389557, 0.73150235414505, 0.5940804481506348, 0.6449945569038391, 0.5853321552276611, 0.652233362197876, 0.5750429630279541, 0.6602439284324646, 0.4371468126773834, 0.278204083442688, 0.24133941531181335, 0.24871045351028442, 0.7313666343688965, 0.7493873834609985, 0.7642034888267517, 0.23539400100708008, 0.23829904198646545, 0.7372084856033325, 0.2441985011100769, 0.726478099822998, 0.7451782822608948, 0.7638283967971802, 0.22192524373531342, 0.7506722807884216, 0.7694736123085022, 0.5419188141822815, 0.32614150643348694, 0.2506018579006195, 0.7530834674835205, 0.7546654939651489, 0.7012525200843811, 0.5107324719429016, 0.6939697861671448, 0.5185555219650269, 0.30863767862319946, 0.2439587563276291, 0.754277229309082, 0.2394062578678131, 0.753373384475708, 0.7642735242843628, 0.7436412572860718, 0.626557469367981, 0.5958317518234253, 0.6554049253463745, 0.437573105096817, 0.28679829835891724, 0.24790921807289124, 0.7482134699821472, 0.7559290528297424, 0.7289999127388, 0.5942228436470032, 0.3607463240623474, 0.7471376657485962, 0.6449437737464905, 0.5923356413841248, 0.6439616680145264, 0.4066449999809265, 0.7335146069526672, 0.608854353427887, 0.6262202858924866, 0.6162819266319275, 0.38104769587516785, 0.742422342300415, 0.37477439641952515, 0.2544984817504883, 0.7596405148506165, 0.7531296610832214, 0.3309638500213623, 0.7582103610038757, 0.6929821372032166, 0.5039167404174805, 0.7090999484062195, 0.46973976492881775, 0.7235254645347595, 0.5664335489273071, 0.3549184501171112, 0.7381333112716675, 0.6409559845924377, 0.40944549441337585, 0.7395967841148376, 0.385585218667984, 0.7467449903488159, 0.6408250331878662, 0.5754081010818481, 0.3425247371196747, 0.7563883066177368, 0.6824270486831665, 0.5115711092948914, 0.6989431381225586, 0.5197964310646057, 0.6673286557197571, 0.4627877175807953, 0.7189926505088806, 0.5645941495895386, 0.6370131969451904, 0.5795673131942749, 0.37395164370536804, 0.7307405471801758, 0.3709659278392792, 0.2660011351108551, 0.756443440914154, 0.7432882189750671, 0.33123862743377686, 0.24955163896083832, 0.7594034075737, 0.7596661448478699, 0.27446916699409485, 0.7645930647850037, 0.2525082528591156, 0.7665781378746033, 0.7632454633712769, 0.7198153138160706, 0.5887991786003113, 0.39514392614364624, 0.721227765083313, 0.5672152638435364, 0.33132967352867126, 0.7617752552032471, 0.7056730389595032, 0.45477789640426636, 0.7289953827857971, 0.5960770845413208, 0.6074178218841553, 0.6299042105674744, 0.42361292243003845, 0.715503454208374, 0.5617163777351379, 0.33643630146980286, 0.24200516939163208, 0.763178825378418, 0.7650330662727356, 0.7154549956321716, 0.44355809688568115, 0.7296445369720459, 0.5891382098197937, 0.6181694865226746, 0.39359399676322937, 0.7444160580635071, 0.6293569207191467, 0.41742056608200073, 0.7203940153121948, 0.5878520607948303, 0.6311252117156982, 0.4091487526893616, 0.7288467884063721, 0.3876981735229492, 0.7391130328178406, 0.35705286264419556, 0.24967285990715027, 0.7649690508842468, 0.7628418803215027, 0.7243128418922424, 0.40236085653305054, 0.2516372799873352, 0.2307329773902893, 0.7519567608833313, 0.765548586845398, 0.7744167447090149, 0.7689948678016663, 0.7266203761100769, 0.6134429574012756, 0.5500930547714233, 0.30678850412368774, 0.7736966013908386, 0.7464093565940857, 0.6637901663780212, 0.5234458446502686, 0.3870565593242645, 0.6957464218139648, 0.4487769305706024, 0.6645009517669678, 0.5090748071670532, 0.6265041828155518, 0.4377160370349884, 0.719836950302124, 0.38269656896591187, 0.7409718632698059, 0.6647569537162781, 0.538469135761261, 0.5928112268447876, 0.4212331473827362, 0.715129554271698, 0.621394693851471, 0.5065651535987854, 0.6514923572540283, 0.46769091486930847, 0.676395058631897, 0.5690028667449951, 0.5530756711959839, 0.594490110874176, 0.5261494517326355, 0.6158372759819031, 0.49897050857543945, 0.6105416417121887, 0.4867023229598999, 0.3579026162624359, 0.7283511161804199, 0.6620290279388428, 0.563136875629425, 0.5456432104110718, 0.4220716059207916, 0.684677004814148, 0.5987496972084045, 0.4964238703250885, 0.4007440209388733, 0.6717325448989868, 0.5981279611587524, 0.5027512311935425, 0.40472984313964844, 0.6703445911407471, 0.601672887802124, 0.5083504915237427, 0.5955575108528137, 0.4931023418903351, 0.39837148785591125, 0.6736496090888977, 0.3884948492050171, 0.6812992095947266, 0.37547120451927185, 0.3090895712375641, 0.7317245006561279, 0.29378896951675415, 0.7418193817138672, 0.722939133644104, 0.6909089684486389], "advantages": [28.775314331054688, 28.500743865966797, 27.76310157775879, 27.451231002807617, 26.73845863342285, 26.397232055664062, 25.69953155517578, 25.336219787597656, 25.89904022216797, 24.357168197631836, 25.017295837402344, 23.423799514770508, 22.664331436157227, 22.928022384643555, 21.53953742980957, 21.752182006835938, 23.296245574951172, 20.493738174438477, 22.021028518676758, 19.219423294067383, 17.776899337768555, 17.343414306640625, 16.536623001098633, 16.781206130981445, 15.220087051391602, 15.5027437210083, 13.873823165893555, 13.213380813598633, 12.549322128295898, 11.818106651306152, 11.833479881286621, 12.761516571044922, 10.573561668395996, 9.204902648925781, 8.611741065979004, 7.819441795349121, 7.900196075439453, 6.481253623962402, 5.846309661865234, 6.275506973266602, 4.342168807983398, 4.749301433563232, 2.798809766769409, 3.204662799835205, 1.2174032926559448, 0.29134276509284973, 0.15650728344917297, -1.2667933702468872, -1.8946950435638428, -2.900601387023926, -3.5201668739318848, -4.57071590423584, -5.179555892944336, -6.278278350830078, -6.582672595977783, -5.975947380065918, -4.155144691467285, -1.164343237876892, -4.69895601272583, -7.850595951080322, -10.348257064819336, -8.34423828125, -4.748455047607422, -7.971456050872803, -3.7424468994140625, -6.6598734855651855, -9.50732421875, -12.025967597961426, -7.816045761108398, -10.303750991821289, 65.40158081054688, 66.12979888916016, 68.20989227294922, 70.82599639892578, 67.73377990722656, 65.30785369873047, 64.2911148071289, 64.38880157470703, 63.986244201660156, 64.05634307861328, 65.13502502441406, 67.4488525390625, 65.1964340209961, 67.87899780273438, 65.55514526367188, 64.06501770019531, 63.48067855834961, 63.99338912963867, 63.348628997802734, 63.7070198059082, 65.43860626220703, 67.966796875, 70.05757904052734, 67.315185546875, 64.25159454345703, 62.2568473815918, 61.758121490478516, 62.50672912597656, 61.44184494018555, 61.56266403198242, 61.06117248535156, 61.17832565307617, 62.73672103881836, 60.71157455444336, 60.15896987915039, 60.2997932434082, 59.71723556518555, 60.3288688659668, 59.362430572509766, 60.02021789550781, 61.98801803588867, 59.95108413696289, 58.9052848815918, 59.919105529785156, 58.760597229003906, 58.71030044555664, 58.58000564575195, 58.39412307739258, 58.4435920715332, 58.10993194580078, 59.165382385253906, 61.40935516357422, 58.55781936645508, 57.23220443725586, 57.64683151245117, 56.922386169433594, 57.51000213623047, 56.66313171386719, 57.23371887207031, 56.326080322265625, 57.29660415649414, 56.1551399230957, 56.424556732177734, 55.92579650878906, 56.01480484008789, 57.58919906616211, 55.4969367980957, 55.36195755004883, 55.10441207885742, 56.39924621582031, 54.59954071044922, 55.75395584106445, 57.81839370727539, 54.983428955078125, 57.01777267456055, 58.79478454589844, 56.119754791259766, 53.27256774902344, 55.328460693359375, 57.16854476928711, 54.47600555419922, 51.57041931152344, 53.742889404296875, 50.81046676635742, 53.0479736328125, 50.1070442199707, 47.79439163208008, 46.57786560058594, 46.22908020019531, 46.55045700073242, 45.316959381103516, 45.02934265136719, 45.928382873535156, 44.25673294067383, 43.523651123046875, 43.53037643432617, 42.684356689453125, 42.450618743896484, 41.892452239990234, 41.57783508300781, 41.765445709228516, 40.77094268798828, 40.3674430847168, 40.74558639526367, 42.28764724731445, 39.97999954223633, 38.734432220458984, 38.16459274291992, 37.933502197265625, 37.30216598510742, 37.09154510498047, 36.457977294921875, 36.32219696044922, 35.5899772644043, 35.291839599609375, 35.39357376098633, 34.43803405761719, 33.88627624511719, 33.56853485107422, 33.70106887817383, 32.73622512817383, 32.94407653808594, 31.93475914001465, 32.270843505859375, 33.50680160522461, 31.83692741394043, 30.617788314819336, 29.820011138916016, 30.100065231323242, 31.54195213317871, 34.53074264526367, 32.411312103271484, 30.57912826538086, 29.141454696655273, 28.189788818359375, 27.8825740814209, 28.492671966552734, 27.552459716796875, 28.962934494018555, 27.86185646057129, 27.63450050354004, 28.473424911499023, 30.052621841430664, 31.531286239624023, 28.97909164428711, 30.37989616394043, 28.055147171020508, 29.283918380737305, 27.26639175415039, 26.974571228027344, 26.841842651367188, 27.253307342529297, 26.706052780151367, 27.054536819458008, 27.578197479248047, 26.30919647216797, 26.304542541503906, 25.897233963012695, 25.953523635864258, 25.390186309814453, 25.179479598999023, 24.953792572021484, 24.49081039428711, 24.116296768188477, 23.611663818359375, 23.057382583618164, 22.70726203918457, 21.988080978393555, 21.203811645507812, 20.651731491088867, 20.49064826965332, 21.09674644470215, 19.77835464477539, 18.70823097229004, 17.653162002563477, 17.463159561157227, 17.718461990356445, 16.475727081298828, 15.257204055786133, 13.980966567993164, 12.683966636657715, 12.137557983398438, 11.758386611938477, 10.338123321533203, 8.95661449432373, 8.241552352905273, 7.687946796417236, 7.387645721435547, 5.861902713775635, 4.404642105102539, 3.0176680088043213, 2.147969961166382, 0.766270101070404, -0.2167152613401413, -1.5743435621261597, -2.8196799755096436, -4.147350311279297, -5.3384690284729, -6.810678482055664, -8.258934020996094], "value_targets": [50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0, 86.60203552246094, 86.4666976928711, 86.33000183105469, 86.1919174194336, 86.05244445800781, 85.91156005859375, 85.76924896240234, 85.62550354003906, 85.48030853271484, 85.33364868164062, 85.18550109863281, 85.03585815429688, 84.88470458984375, 84.73202514648438, 84.57780456542969, 84.42202758789062, 84.2646713256836, 84.10572814941406, 83.94518280029297, 83.78301239013672, 83.61920166015625, 83.45374298095703, 83.28660583496094, 83.11778259277344, 82.94725799560547, 82.77500915527344, 82.60102081298828, 82.4252700805664, 82.24774932861328, 82.06842803955078, 81.8873062133789, 81.704345703125, 81.51954650878906, 81.33287048339844, 81.14431762695312, 80.953857421875, 80.76146697998047, 80.567138671875, 80.370849609375, 80.17257690429688, 79.97229766845703, 79.7699966430664, 79.5656509399414, 79.35924530029297, 79.1507568359375, 78.94015502929688, 78.72743225097656, 78.51255798339844, 78.2955093383789, 78.0762710571289, 77.85482025146484, 77.63113403320312, 77.40518188476562, 77.17695617675781, 76.94641876220703, 76.71355438232422, 76.47834014892578, 76.2407455444336, 76.0007553100586, 75.75833892822266, 75.51347351074219, 75.26612854003906, 75.01629638671875, 74.76393127441406, 74.50902557373047, 74.25154113769531, 73.991455078125, 73.72874450683594, 73.46337127685547, 73.19532775878906, 72.92457580566406, 72.65108489990234, 72.37483215332031, 72.09579467773438, 71.81392669677734, 71.52922058105469, 71.24163818359375, 70.9511489868164, 70.65773010253906, 70.36134338378906, 70.06195831298828, 69.75955963134766, 69.45409393310547, 69.14555358886719, 68.83389282226562, 68.51908111572266, 68.20109558105469, 67.87989044189453, 67.55545043945312, 67.22772216796875, 66.89669036865234, 66.56231689453125, 66.22456359863281, 65.88339233398438, 65.53878021240234, 65.19068908691406, 64.83908081054688, 64.48391723632812, 64.12516784667969, 63.76279830932617, 63.396766662597656, 63.027034759521484, 62.65357208251953, 62.276336669921875, 61.895286560058594, 61.51039123535156, 61.12160873413086, 60.72889709472656, 60.332218170166016, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}
{"type": "SampleBatch", "eps_id": [1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783, 1337984783], "obs": [[0.010039509274065495, 0.007557542063295841, -0.030501922592520714, 0.026214968413114548], [0.010190660133957863, -0.18711401522159576, -0.029977623373270035, 0.3091202974319458], [0.006448379717767239, 0.008421958424150944, -0.023795217275619507, 0.007136020343750715], [0.006616818718612194, -0.18635079264640808, -0.023652497678995132, 0.29221731424331665], [0.002889802912250161, 0.00910026952624321, -0.017808152362704277, -0.007830471731722355], [0.0030718082562088966, 0.20447303354740143, -0.017964761704206467, -0.3060784637928009], [0.007161268964409828, 0.39984631538391113, -0.024086330085992813, -0.6043724417686462], [0.015158195048570633, 0.20506934821605682, -0.036173779517412186, -0.3193724453449249], [0.019259581342339516, 0.010480747558176517, -0.042561229318380356, -0.03831326961517334], [0.01946919597685337, -0.18400584161281586, -0.043327491730451584, 0.2406432181596756], [0.015789080411195755, -0.3784829378128052, -0.0385146290063858, 0.5193507671356201], [0.008219420909881592, -0.573042094707489, -0.02812761254608631, 0.799652636051178], [-0.0032414214219897985, -0.3775458335876465, -0.012134561315178871, 0.49825575947761536], [-0.010792338289320469, -0.18225492537021637, -0.0021694456227123737, 0.2017734944820404], [-0.014437437057495117, 0.012897985987365246, 0.0018660241039469838, -0.09159300476312637], [-0.014179476536810398, -0.18225066363811493, 3.4163986128987744e-05, 0.201678067445755], [-0.017824489623308182, 0.01287080068141222, 0.0040677255019545555, -0.09099408239126205], [-0.017567073926329613, -0.18230922520160675, 0.0022478436585515738, 0.20296943187713623], [-0.021213257685303688, 0.012780514545738697, 0.006307232193648815, -0.0890035629272461], [-0.020957648754119873, 0.20781148970127106, 0.00452716089785099, -0.37968990206718445], [-0.016801418736577034, 0.4028688669204712, -0.0030666368547827005, -0.670941948890686], [-0.008744041435420513, 0.5980333089828491, -0.01648547686636448, -0.9645888805389404], [0.003216625191271305, 0.403136670589447, -0.0357772521674633, -0.6771301031112671], [0.01127935852855444, 0.20852959156036377, -0.049319855868816376, -0.39592257142066956], [0.01544994954019785, 0.014140836894512177, -0.05723830685019493, -0.11918817460536957], [0.015732767060399055, -0.18011629581451416, -0.05962207168340683, 0.15490145981311798], [0.012130441144108772, 0.015806397423148155, -0.056524042040109634, -0.15597890317440033], [0.012446568347513676, -0.17846260964870453, -0.059643618762493134, 0.11835001409053802], [0.008877316489815712, -0.37268152832984924, -0.05727661773562431, 0.391635537147522], [0.0014236855786293745, -0.17679548263549805, -0.04944390803575516, 0.081458181142807], [-0.0021122239995747805, -0.371175080537796, -0.0478147454559803, 0.35814064741134644], [-0.009535725228488445, -0.17540714144706726, -0.04065193235874176, 0.050772182643413544], [-0.013043868355453014, 0.020273428410291672, -0.03963648900389671, -0.2544545531272888], [-0.012638399377465248, -0.17426082491874695, -0.044725578278303146, 0.02546757273375988], [-0.016123617067933083, 0.02147304266691208, -0.044216226786375046, -0.2809845507144928], [-0.015694156289100647, -0.17299121618270874, -0.049835920333862305, -0.0025686072185635567], [-0.019153980538249016, -0.3673643469810486, -0.049887292087078094, 0.2739833891391754], [-0.026501266285777092, -0.1715673953294754, -0.04440762475132942, -0.03400741517543793], [-0.029932614415884018, -0.36602532863616943, -0.045087773352861404, 0.24434036016464233], [-0.03725311905145645, -0.56047523021698, -0.040200963616371155, 0.5224674940109253], [-0.048462625592947006, -0.3648112118244171, -0.02975161373615265, 0.2173926830291748], [-0.055758848786354065, -0.5594955086708069, -0.025403760373592377, 0.5005441904067993], [-0.06694875657558441, -0.7542502880096436, -0.015392877161502838, 0.7851142287254333], [-0.08203376084566116, -0.5589202642440796, 0.0003094076528213918, 0.4876285493373871], [-0.09321217238903046, -0.7540465593338013, 0.010061979293823242, 0.7804089784622192], [-0.10829310119152069, -0.5590643882751465, 0.025670157745480537, 0.490908682346344], [-0.1194743886590004, -0.7545388340950012, 0.03548833355307579, 0.7915700078010559], [-0.13456515967845917, -0.5599216818809509, 0.05131973326206207, 0.5102593898773193], [-0.1457636058330536, -0.36555880308151245, 0.06152492016553879, 0.23418034613132477], [-0.15307477116584778, -0.17136742174625397, 0.06620852649211884, -0.03847869485616684], [-0.1565021276473999, -0.3673732578754425, 0.06543895602226257, 0.27433696389198303], [-0.1638495922088623, -0.17324306070804596, 0.07092569023370743, 0.0029902656096965075], [-0.16731445491313934, 0.020793817937374115, 0.07098549604415894, -0.2664986252784729], [-0.16689857840538025, -0.17526566982269287, 0.06565552204847336, 0.04770219698548317], [-0.1704038828611374, -0.37126463651657104, 0.06660956889390945, 0.36035606265068054], [-0.17782917618751526, -0.17714963853359222, 0.0738166868686676, 0.08939800411462784], [-0.18137216567993164, 0.016840888187289238, 0.075604647397995, -0.17911295592784882], [-0.1810353547334671, -0.1792769879102707, 0.07202239334583282, 0.1364300698041916], [-0.18462088704109192, -0.375352680683136, 0.07475098967552185, 0.450937420129776], [-0.19212794303894043, -0.18136312067508698, 0.08376973867416382, 0.18272200226783752], [-0.1957552134990692, 0.012466493993997574, 0.08742418140172958, -0.08240337669849396], [-0.19550588726997375, 0.20623353123664856, 0.08577611297369003, -0.34627392888069153], [-0.19138121604919434, 0.4000372886657715, 0.0788506343960762, -0.6107235550880432], [-0.18338046967983246, 0.20390689373016357, 0.06663616746664047, -0.2942839562892914], [-0.17930231988430023, 0.39801865816116333, 0.060750484466552734, -0.5652288794517517], [-0.17134195566177368, 0.20209936797618866, 0.04944590851664543, -0.254042387008667], [-0.16729997098445892, 0.006307550705969334, 0.044365059584379196, 0.05381755530834198], [-0.1671738177537918, 0.20076622068881989, 0.045441411435604095, -0.22454437613487244], [-0.16315849125385284, 0.39521023631095886, 0.04095052182674408, -0.502554178237915], [-0.1552542895078659, 0.5897318124771118, 0.030899440869688988, -0.7820557951927185], [-0.14345964789390564, 0.39419907331466675, 0.015258324332535267, -0.47981372475624084], [-0.13557566702365875, 0.19886508584022522, 0.005662050098180771, -0.18236106634140015], [-0.1315983682870865, 0.0036625699140131474, 0.0020148290786892176, 0.11210264265537262], [-0.13152511417865753, -0.19148819148540497, 0.004256881773471832, 0.40542054176330566], [-0.1353548765182495, 0.0035731319803744555, 0.012365292757749557, 0.11408273875713348], [-0.13528341054916382, 0.19851574301719666, 0.014646947383880615, -0.17467351257801056], [-0.13131310045719147, 0.0031872631516307592, 0.011153477244079113, 0.12259382009506226], [-0.1312493532896042, 0.19814765453338623, 0.01360535342246294, -0.16654953360557556], [-0.1272864043712616, 0.002833625068888068, 0.010274362750351429, 0.13039425015449524], [-0.1272297352552414, 0.19780689477920532, 0.012882248498499393, -0.15902961790561676], [-0.12327359616756439, 0.3927420675754547, 0.009701656177639961, -0.44762083888053894], [-0.11541875451803207, 0.19748423993587494, 0.0007492390577681363, -0.15189562737941742], [-0.11146906763315201, 0.39259544014930725, -0.0022886733058840036, -0.44434207677841187], [-0.10361715406179428, 0.19750595092773438, -0.011175515130162239, -0.15238147974014282], [-0.0996670350432396, 0.0025457940064370632, -0.014223144389688969, 0.13675497472286224], [-0.09961612522602081, 0.19786854088306427, -0.011488045565783978, -0.1603809893131256], [-0.09565874934196472, 0.0029129318427294493, -0.014695664867758751, 0.12865573167800903], [-0.09560049325227737, -0.19199545681476593, -0.012122550047934055, 0.4166663587093353], [-0.09944040328264236, -0.386943519115448, -0.0037892230320721865, 0.7055030465126038], [-0.10717926919460297, -0.19176927208900452, 0.01032083760946989, 0.41162973642349243], [-0.11101465672254562, 0.003204860957339406, 0.01855343207716942, 0.12221838533878326], [-0.11095055937767029, -0.1921779215335846, 0.020997799932956696, 0.42069652676582336], [-0.11479412019252777, 0.002640319988131523, 0.02941173128783703, 0.13470648229122162], [-0.11474131047725677, 0.19732891023159027, 0.032105859369039536, -0.14855431020259857], [-0.11079473793506622, 0.0017622647574171424, 0.029134774580597878, 0.15408198535442352], [-0.11075948923826218, -0.19376446306705475, 0.03221641480922699, 0.4558120369911194], [-0.11463478207588196, 0.0008875220082700253, 0.041332654654979706, 0.17345553636550903], [-0.11461702734231949, -0.19480086863040924, 0.04480176419019699, 0.4788857698440552], [-0.11851304769515991, -0.3905257284641266, 0.054379481822252274, 0.7853457927703857], [-0.12632356584072113, -0.1961914300918579, 0.07008639723062515, 0.5102549195289612], [-0.13024738430976868, -0.0021231798455119133, 0.0802914947271347, 0.2404557466506958], [-0.13028985261917114, 0.19176547229290009, 0.08510060608386993, -0.02585994079709053], [-0.12645454704761505, -0.004467266611754894, 0.08458340913057327, 0.2924133539199829], [-0.12654389441013336, 0.18935324251651764, 0.09043167531490326, 0.027559852227568626], [-0.12275682389736176, 0.383069783449173, 0.09098287671804428, -0.2352769523859024], [-0.11509542912244797, 0.18677367269992828, 0.08627733588218689, 0.08466144651174545], [-0.11135995388031006, 0.3805597424507141, 0.0879705622792244, -0.17960235476493835], [-0.10374876111745834, 0.5743198990821838, 0.08437851816415787, -0.4432886838912964], [-0.09226236492395401, 0.7681528925895691, 0.07551274448633194, -0.7082259058952332], [-0.07689930498600006, 0.5720706582069397, 0.06134822592139244, -0.39276108145713806], [-0.06545788794755936, 0.3761341869831085, 0.05349300429224968, -0.08138424158096313], [-0.0579352080821991, 0.5704501271247864, 0.051865316927433014, -0.35672178864479065], [-0.04652620479464531, 0.7647978067398071, 0.044730883091688156, -0.6326097249984741], [-0.031230248510837555, 0.5690813064575195, 0.032078687101602554, -0.32618212699890137], [-0.019848620519042015, 0.3735176622867584, 0.025555046275258064, -0.023558061569929123], [-0.0123782679438591, 0.5682640075683594, 0.025083884596824646, -0.30806979537010193], [-0.001012988155707717, 0.7630197405815125, 0.018922489136457443, -0.59273761510849], [0.014247406274080276, 0.5676380395889282, 0.007067736238241196, -0.29415470361709595], [0.025600166991353035, 0.7626585364341736, 0.0011846426641568542, -0.5846002101898193], [0.040853336453437805, 0.9577638506889343, -0.01050736103206873, -0.8769097328186035], [0.060008615255355835, 0.7627862691879272, -0.02804555557668209, -0.5875486135482788], [0.0752643421292305, 0.9582895636558533, -0.03979652747511864, -0.888932466506958], [0.09443013370037079, 0.7637295722961426, -0.057575177401304245, -0.6090207099914551], [0.10970472544431686, 0.5694577693939209, -0.06975559145212173, -0.33501359820365906], [0.12109387665987015, 0.7654995918273926, -0.07645586133003235, -0.6488526463508606], [0.1364038735628128, 0.5715212821960449, -0.08943291753530502, -0.3811913728713989], [0.14783430099487305, 0.37777552008628845, -0.09705674648284912, -0.11799241602420807], [0.15538980066776276, 0.1841684877872467, -0.0994165912270546, 0.14256145060062408], [0.15907317399978638, 0.38056331872940063, -0.0965653657913208, -0.1797565072774887], [0.16668444871902466, 0.1869463175535202, -0.10016049444675446, 0.08096984028816223], [0.17042337357997894, -0.006607807707041502, -0.09854109585285187, 0.34044796228408813], [0.1702912151813507, -0.200199693441391, -0.09173213690519333, 0.6005027890205383], [0.16628721356391907, -0.003922268748283386, -0.0797220841050148, 0.2803930938243866], [0.16620877385139465, -0.19782185554504395, -0.07411421835422516, 0.5469052195549011], [0.16225233674049377, -0.3918285667896271, -0.06317611783742905, 0.8153467774391174], [0.1544157713651657, -0.5860311985015869, -0.0468691810965538, 1.087508201599121], [0.14269514381885529, -0.39032354950904846, -0.02511901780962944, 0.7804945707321167], [0.1348886787891388, -0.19486545026302338, -0.009509125724434853, 0.48001569509506226], [0.1309913694858551, -0.3898518979549408, 9.118805610341951e-05, 0.7696864604949951], [0.12319432199001312, -0.5849750638008118, 0.015484917908906937, 1.062398076057434], [0.11149482429027557, -0.39006155729293823, 0.03673287853598595, 0.7746152281761169], [0.10369358956813812, -0.195463627576828, 0.05222518369555473, 0.49371230602264404], [0.09978432208299637, -0.0011156421387568116, 0.062099430710077286, 0.2179350107908249], [0.09976200759410858, -0.19706781208515167, 0.06645812839269638, 0.5295422077178955], [0.09582065045833588, -0.0029406333342194557, 0.07704897224903107, 0.2585185468196869], [0.09576183557510376, -0.1990731656551361, 0.08221934735774994, 0.5744745135307312], [0.09178037196397781, -0.005194293800741434, 0.093708835542202, 0.3087838888168335], [0.0916764885187149, -0.20151783525943756, 0.0998845100402832, 0.6294872164726257], [0.08764613419771194, -0.007921172305941582, 0.11247425526380539, 0.36985692381858826], [0.08748770505189896, 0.18543805181980133, 0.11987139284610748, 0.11464846134185791], [0.0911964699625969, 0.37865665555000305, 0.12216436862945557, -0.13794177770614624], [0.09876960515975952, 0.5718362927436829, 0.11940553039312363, -0.38972464203834534], [0.11020632833242416, 0.37523993849754333, 0.11161103844642639, -0.06190795078873634], [0.1177111268043518, 0.5685994029045105, 0.1103728786110878, -0.3173969089984894], [0.12908311188220978, 0.7619903683662415, 0.10402493923902512, -0.5733345150947571], [0.14432291686534882, 0.5655755400657654, 0.09255824983119965, -0.2497767060995102], [0.15563443303108215, 0.36926209926605225, 0.08756271749734879, 0.07060631364583969], [0.16301967203617096, 0.5630266666412354, 0.08897484093904495, -0.1932164877653122], [0.17428021132946014, 0.3667520582675934, 0.08511051535606384, 0.12615495920181274], [0.18161524832248688, 0.17052045464515686, 0.08763360977172852, 0.4444291889667511], [0.1850256621837616, 0.36430028080940247, 0.09652219712734222, 0.1806061714887619], [0.19231165945529938, 0.5579180121421814, 0.10013432055711746, -0.08013513684272766], [0.20347002148628235, 0.7514725923538208, 0.09853161871433258, -0.3396223187446594], [0.21849948167800903, 0.5550968050956726, 0.09173917025327682, -0.017565902322530746], [0.2296014130115509, 0.3587871193885803, 0.09138785302639008, 0.302593857049942], [0.2367771565914154, 0.5524958372116089, 0.0974397286772728, 0.04007395729422569], [0.24782706797122955, 0.7460952401161194, 0.09824120998382568, -0.22034570574760437], [0.26274898648262024, 0.5497162938117981, 0.0938342958688736, 0.10163883864879608], [0.27374330163002014, 0.7433769702911377, 0.09586706757545471, -0.1600273996591568], [0.2886108458042145, 0.5470225811004639, 0.09266652166843414, 0.16129353642463684], [0.2995513081550598, 0.3507046103477478, 0.09589239209890366, 0.4817120432853699], [0.30656537413597107, 0.15436920523643494, 0.1055266335606575, 0.8030113577842712], [0.30965277552604675, 0.34789812564849854, 0.1215868592262268, 0.5453000664710999], [0.316610723733902, 0.15129636228084564, 0.13249285519123077, 0.8736841082572937], [0.31963667273521423, 0.34439215064048767, 0.1499665379524231, 0.6254180073738098], [0.3265244960784912, 0.5371376276016235, 0.16247490048408508, 0.3834698498249054], [0.3372672498226166, 0.34012678265571594, 0.17014430463314056, 0.7226519584655762], [0.34406977891921997, 0.5325380563735962, 0.18459734320640564, 0.4879840016365051], [0.3547205626964569, 0.7246413826942444, 0.1943570226430893, 0.2586885392665863], [0.36921337246894836, 0.9165345430374146, 0.19953079521656036, 0.03305020183324814], [0.38754406571388245, 1.1083191633224487, 0.20019179582595825, -0.19064557552337646], [0.40971046686172485, 0.9109802842140198, 0.1963788866996765, 0.15791501104831696], [0.4279300570487976, 1.102828025817871, 0.19953718781471252, -0.06696050614118576], [0.44998663663864136, 1.294613242149353, 0.19819797575473785, -0.29065486788749695], [0.47587889432907104, 1.0972986221313477, 0.19238486886024475, 0.05741218850016594], [0.49782484769821167, 1.28921639919281, 0.19353312253952026, -0.1689404398202896], [0.5236091613769531, 1.4811174869537354, 0.1901543140411377, -0.3948740065097809], [0.5532315373420715, 1.6731045246124268, 0.18225683271884918, -0.6220946311950684], [0.5866936445236206, 1.8652766942977905, 0.16981494426727295, -0.8522911071777344], [0.6239991784095764, 1.668297290802002, 0.15276911854743958, -0.5113860368728638], [0.657365083694458, 1.8609745502471924, 0.14254139363765717, -0.7522963285446167], [0.6945846080780029, 2.0538735389709473, 0.12749546766281128, -0.9969447255134583], [0.735662043094635, 2.2470815181732178, 0.10755657404661179, -1.2470221519470215], [0.7806037068367004, 2.0507571697235107, 0.08261612802743912, -0.9226769208908081], [0.8216188549995422, 1.8546221256256104, 0.06416258960962296, -0.6052162051200867], [0.858711302280426, 1.658664345741272, 0.05205826833844185, -0.29303354024887085], [0.8918845653533936, 1.8530068397521973, 0.046197596937417984, -0.5688542127609253], [0.9289447069168091, 1.6572685241699219, 0.03482051193714142, -0.26198258996009827], [0.9620900750160217, 1.4616671800613403, 0.0295808594673872, 0.04147659242153168], [0.9913234114646912, 1.2661339044570923, 0.030410392209887505, 0.3433438539505005]], "actions": [0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1], "rewards": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "prev_actions": [0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0], "prev_rewards": [0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "dones": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "new_obs": [[0.010190660133957863, -0.18711401522159576, -0.029977623373270035, 0.3091202974319458], [0.006448379717767239, 0.008421958424150944, -0.023795217275619507, 0.007136020343750715], [0.006616818718612194, -0.18635079264640808, -0.023652497678995132, 0.29221731424331665], [0.002889802912250161, 0.00910026952624321, -0.017808152362704277, -0.007830471731722355], [0.0030718082562088966, 0.20447303354740143, -0.017964761704206467, -0.3060784637928009], [0.007161268964409828, 0.39984631538391113, -0.024086330085992813, -0.6043724417686462], [0.015158195048570633, 0.20506934821605682, -0.036173779517412186, -0.3193724453449249], [0.019259581342339516, 0.010480747558176517, -0.042561229318380356, -0.03831326961517334], [0.01946919597685337, -0.18400584161281586, -0.043327491730451584, 0.2406432181596756], [0.015789080411195755, -0.3784829378128052, -0.0385146290063858, 0.5193507671356201], [0.008219420909881592, -0.573042094707489, -0.02812761254608631, 0.799652636051178], [-0.0032414214219897985, -0.3775458335876465, -0.012134561315178871, 0.49825575947761536], [-0.010792338289320469, -0.18225492537021637, -0.0021694456227123737, 0.2017734944820404], [-0.014437437057495117, 0.012897985987365246, 0.0018660241039469838, -0.09159300476312637], [-0.014179476536810398, -0.18225066363811493, 3.4163986128987744e-05, 0.201678067445755], [-0.017824489623308182, 0.01287080068141222, 0.0040677255019545555, -0.09099408239126205], [-0.017567073926329613, -0.18230922520160675, 0.0022478436585515738, 0.20296943187713623], [-0.021213257685303688, 0.012780514545738697, 0.006307232193648815, -0.0890035629272461], [-0.020957648754119873, 0.20781148970127106, 0.00452716089785099, -0.37968990206718445], [-0.016801418736577034, 0.4028688669204712, -0.0030666368547827005, -0.670941948890686], [-0.008744041435420513, 0.5980333089828491, -0.01648547686636448, -0.9645888805389404], [0.003216625191271305, 0.403136670589447, -0.0357772521674633, -0.6771301031112671], [0.01127935852855444, 0.20852959156036377, -0.049319855868816376, -0.39592257142066956], [0.01544994954019785, 0.014140836894512177, -0.05723830685019493, -0.11918817460536957], [0.015732767060399055, -0.18011629581451416, -0.05962207168340683, 0.15490145981311798], [0.012130441144108772, 0.015806397423148155, -0.056524042040109634, -0.15597890317440033], [0.012446568347513676, -0.17846260964870453, -0.059643618762493134, 0.11835001409053802], [0.008877316489815712, -0.37268152832984924, -0.05727661773562431, 0.391635537147522], [0.0014236855786293745, -0.17679548263549805, -0.04944390803575516, 0.081458181142807], [-0.0021122239995747805, -0.371175080537796, -0.0478147454559803, 0.35814064741134644], [-0.009535725228488445, -0.17540714144706726, -0.04065193235874176, 0.050772182643413544], [-0.013043868355453014, 0.020273428410291672, -0.03963648900389671, -0.2544545531272888], [-0.012638399377465248, -0.17426082491874695, -0.044725578278303146, 0.02546757273375988], [-0.016123617067933083, 0.02147304266691208, -0.044216226786375046, -0.2809845507144928], [-0.015694156289100647, -0.17299121618270874, -0.049835920333862305, -0.0025686072185635567], [-0.019153980538249016, -0.3673643469810486, -0.049887292087078094, 0.2739833891391754], [-0.026501266285777092, -0.1715673953294754, -0.04440762475132942, -0.03400741517543793], [-0.029932614415884018, -0.36602532863616943, -0.045087773352861404, 0.24434036016464233], [-0.03725311905145645, -0.56047523021698, -0.040200963616371155, 0.5224674940109253], [-0.048462625592947006, -0.3648112118244171, -0.02975161373615265, 0.2173926830291748], [-0.055758848786354065, -0.5594955086708069, -0.025403760373592377, 0.5005441904067993], [-0.06694875657558441, -0.7542502880096436, -0.015392877161502838, 0.7851142287254333], [-0.08203376084566116, -0.5589202642440796, 0.0003094076528213918, 0.4876285493373871], [-0.09321217238903046, -0.7540465593338013, 0.010061979293823242, 0.7804089784622192], [-0.10829310119152069, -0.5590643882751465, 0.025670157745480537, 0.490908682346344], [-0.1194743886590004, -0.7545388340950012, 0.03548833355307579, 0.7915700078010559], [-0.13456515967845917, -0.5599216818809509, 0.05131973326206207, 0.5102593898773193], [-0.1457636058330536, -0.36555880308151245, 0.06152492016553879, 0.23418034613132477], [-0.15307477116584778, -0.17136742174625397, 0.06620852649211884, -0.03847869485616684], [-0.1565021276473999, -0.3673732578754425, 0.06543895602226257, 0.27433696389198303], [-0.1638495922088623, -0.17324306070804596, 0.07092569023370743, 0.0029902656096965075], [-0.16731445491313934, 0.020793817937374115, 0.07098549604415894, -0.2664986252784729], [-0.16689857840538025, -0.17526566982269287, 0.06565552204847336, 0.04770219698548317], [-0.1704038828611374, -0.37126463651657104, 0.06660956889390945, 0.36035606265068054], [-0.17782917618751526, -0.17714963853359222, 0.0738166868686676, 0.08939800411462784], [-0.18137216567993164, 0.016840888187289238, 0.075604647397995, -0.17911295592784882], [-0.1810353547334671, -0.1792769879102707, 0.07202239334583282, 0.1364300698041916], [-0.18462088704109192, -0.375352680683136, 0.07475098967552185, 0.450937420129776], [-0.19212794303894043, -0.18136312067508698, 0.08376973867416382, 0.18272200226783752], [-0.1957552134990692, 0.012466493993997574, 0.08742418140172958, -0.08240337669849396], [-0.19550588726997375, 0.20623353123664856, 0.08577611297369003, -0.34627392888069153], [-0.19138121604919434, 0.4000372886657715, 0.0788506343960762, -0.6107235550880432], [-0.18338046967983246, 0.20390689373016357, 0.06663616746664047, -0.2942839562892914], [-0.17930231988430023, 0.39801865816116333, 0.060750484466552734, -0.5652288794517517], [-0.17134195566177368, 0.20209936797618866, 0.04944590851664543, -0.254042387008667], [-0.16729997098445892, 0.006307550705969334, 0.044365059584379196, 0.05381755530834198], [-0.1671738177537918, 0.20076622068881989, 0.045441411435604095, -0.22454437613487244], [-0.16315849125385284, 0.39521023631095886, 0.04095052182674408, -0.502554178237915], [-0.1552542895078659, 0.5897318124771118, 0.030899440869688988, -0.7820557951927185], [-0.14345964789390564, 0.39419907331466675, 0.015258324332535267, -0.47981372475624084], [-0.13557566702365875, 0.19886508584022522, 0.005662050098180771, -0.18236106634140015], [-0.1315983682870865, 0.0036625699140131474, 0.0020148290786892176, 0.11210264265537262], [-0.13152511417865753, -0.19148819148540497, 0.004256881773471832, 0.40542054176330566], [-0.1353548765182495, 0.0035731319803744555, 0.012365292757749557, 0.11408273875713348], [-0.13528341054916382, 0.19851574301719666, 0.014646947383880615, -0.17467351257801056], [-0.13131310045719147, 0.0031872631516307592, 0.011153477244079113, 0.12259382009506226], [-0.1312493532896042, 0.19814765453338623, 0.01360535342246294, -0.16654953360557556], [-0.1272864043712616, 0.002833625068888068, 0.010274362750351429, 0.13039425015449524], [-0.1272297352552414, 0.19780689477920532, 0.012882248498499393, -0.15902961790561676], [-0.12327359616756439, 0.3927420675754547, 0.009701656177639961, -0.44762083888053894], [-0.11541875451803207, 0.19748423993587494, 0.0007492390577681363, -0.15189562737941742], [-0.11146906763315201, 0.39259544014930725, -0.0022886733058840036, -0.44434207677841187], [-0.10361715406179428, 0.19750595092773438, -0.011175515130162239, -0.15238147974014282], [-0.0996670350432396, 0.0025457940064370632, -0.014223144389688969, 0.13675497472286224], [-0.09961612522602081, 0.19786854088306427, -0.011488045565783978, -0.1603809893131256], [-0.09565874934196472, 0.0029129318427294493, -0.014695664867758751, 0.12865573167800903], [-0.09560049325227737, -0.19199545681476593, -0.012122550047934055, 0.4166663587093353], [-0.09944040328264236, -0.386943519115448, -0.0037892230320721865, 0.7055030465126038], [-0.10717926919460297, -0.19176927208900452, 0.01032083760946989, 0.41162973642349243], [-0.11101465672254562, 0.003204860957339406, 0.01855343207716942, 0.12221838533878326], [-0.11095055937767029, -0.1921779215335846, 0.020997799932956696, 0.42069652676582336], [-0.11479412019252777, 0.002640319988131523, 0.02941173128783703, 0.13470648229122162], [-0.11474131047725677, 0.19732891023159027, 0.032105859369039536, -0.14855431020259857], [-0.11079473793506622, 0.0017622647574171424, 0.029134774580597878, 0.15408198535442352], [-0.11075948923826218, -0.19376446306705475, 0.03221641480922699, 0.4558120369911194], [-0.11463478207588196, 0.0008875220082700253, 0.041332654654979706, 0.17345553636550903], [-0.11461702734231949, -0.19480086863040924, 0.04480176419019699, 0.4788857698440552], [-0.11851304769515991, -0.3905257284641266, 0.054379481822252274, 0.7853457927703857], [-0.12632356584072113, -0.1961914300918579, 0.07008639723062515, 0.5102549195289612], [-0.13024738430976868, -0.0021231798455119133, 0.0802914947271347, 0.2404557466506958], [-0.13028985261917114, 0.19176547229290009, 0.08510060608386993, -0.02585994079709053], [-0.12645454704761505, -0.004467266611754894, 0.08458340913057327, 0.2924133539199829], [-0.12654389441013336, 0.18935324251651764, 0.09043167531490326, 0.027559852227568626], [-0.12275682389736176, 0.383069783449173, 0.09098287671804428, -0.2352769523859024], [-0.11509542912244797, 0.18677367269992828, 0.08627733588218689, 0.08466144651174545], [-0.11135995388031006, 0.3805597424507141, 0.0879705622792244, -0.17960235476493835], [-0.10374876111745834, 0.5743198990821838, 0.08437851816415787, -0.4432886838912964], [-0.09226236492395401, 0.7681528925895691, 0.07551274448633194, -0.7082259058952332], [-0.07689930498600006, 0.5720706582069397, 0.06134822592139244, -0.39276108145713806], [-0.06545788794755936, 0.3761341869831085, 0.05349300429224968, -0.08138424158096313], [-0.0579352080821991, 0.5704501271247864, 0.051865316927433014, -0.35672178864479065], [-0.04652620479464531, 0.7647978067398071, 0.044730883091688156, -0.6326097249984741], [-0.031230248510837555, 0.5690813064575195, 0.032078687101602554, -0.32618212699890137], [-0.019848620519042015, 0.3735176622867584, 0.025555046275258064, -0.023558061569929123], [-0.0123782679438591, 0.5682640075683594, 0.025083884596824646, -0.30806979537010193], [-0.001012988155707717, 0.7630197405815125, 0.018922489136457443, -0.59273761510849], [0.014247406274080276, 0.5676380395889282, 0.007067736238241196, -0.29415470361709595], [0.025600166991353035, 0.7626585364341736, 0.0011846426641568542, -0.5846002101898193], [0.040853336453437805, 0.9577638506889343, -0.01050736103206873, -0.8769097328186035], [0.060008615255355835, 0.7627862691879272, -0.02804555557668209, -0.5875486135482788], [0.0752643421292305, 0.9582895636558533, -0.03979652747511864, -0.888932466506958], [0.09443013370037079, 0.7637295722961426, -0.057575177401304245, -0.6090207099914551], [0.10970472544431686, 0.5694577693939209, -0.06975559145212173, -0.33501359820365906], [0.12109387665987015, 0.7654995918273926, -0.07645586133003235, -0.6488526463508606], [0.1364038735628128, 0.5715212821960449, -0.08943291753530502, -0.3811913728713989], [0.14783430099487305, 0.37777552008628845, -0.09705674648284912, -0.11799241602420807], [0.15538980066776276, 0.1841684877872467, -0.0994165912270546, 0.14256145060062408], [0.15907317399978638, 0.38056331872940063, -0.0965653657913208, -0.1797565072774887], [0.16668444871902466, 0.1869463175535202, -0.10016049444675446, 0.08096984028816223], [0.17042337357997894, -0.006607807707041502, -0.09854109585285187, 0.34044796228408813], [0.1702912151813507, -0.200199693441391, -0.09173213690519333, 0.6005027890205383], [0.16628721356391907, -0.003922268748283386, -0.0797220841050148, 0.2803930938243866], [0.16620877385139465, -0.19782185554504395, -0.07411421835422516, 0.5469052195549011], [0.16225233674049377, -0.3918285667896271, -0.06317611783742905, 0.8153467774391174], [0.1544157713651657, -0.5860311985015869, -0.0468691810965538, 1.087508201599121], [0.14269514381885529, -0.39032354950904846, -0.02511901780962944, 0.7804945707321167], [0.1348886787891388, -0.19486545026302338, -0.009509125724434853, 0.48001569509506226], [0.1309913694858551, -0.3898518979549408, 9.118805610341951e-05, 0.7696864604949951], [0.12319432199001312, -0.5849750638008118, 0.015484917908906937, 1.062398076057434], [0.11149482429027557, -0.39006155729293823, 0.03673287853598595, 0.7746152281761169], [0.10369358956813812, -0.195463627576828, 0.05222518369555473, 0.49371230602264404], [0.09978432208299637, -0.0011156421387568116, 0.062099430710077286, 0.2179350107908249], [0.09976200759410858, -0.19706781208515167, 0.06645812839269638, 0.5295422077178955], [0.09582065045833588, -0.0029406333342194557, 0.07704897224903107, 0.2585185468196869], [0.09576183557510376, -0.1990731656551361, 0.08221934735774994, 0.5744745135307312], [0.09178037196397781, -0.005194293800741434, 0.093708835542202, 0.3087838888168335], [0.0916764885187149, -0.20151783525943756, 0.0998845100402832, 0.6294872164726257], [0.08764613419771194, -0.007921172305941582, 0.11247425526380539, 0.36985692381858826], [0.08748770505189896, 0.18543805181980133, 0.11987139284610748, 0.11464846134185791], [0.0911964699625969, 0.37865665555000305, 0.12216436862945557, -0.13794177770614624], [0.09876960515975952, 0.5718362927436829, 0.11940553039312363, -0.38972464203834534], [0.11020632833242416, 0.37523993849754333, 0.11161103844642639, -0.06190795078873634], [0.1177111268043518, 0.5685994029045105, 0.1103728786110878, -0.3173969089984894], [0.12908311188220978, 0.7619903683662415, 0.10402493923902512, -0.5733345150947571], [0.14432291686534882, 0.5655755400657654, 0.09255824983119965, -0.2497767060995102], [0.15563443303108215, 0.36926209926605225, 0.08756271749734879, 0.07060631364583969], [0.16301967203617096, 0.5630266666412354, 0.08897484093904495, -0.1932164877653122], [0.17428021132946014, 0.3667520582675934, 0.08511051535606384, 0.12615495920181274], [0.18161524832248688, 0.17052045464515686, 0.08763360977172852, 0.4444291889667511], [0.1850256621837616, 0.36430028080940247, 0.09652219712734222, 0.1806061714887619], [0.19231165945529938, 0.5579180121421814, 0.10013432055711746, -0.08013513684272766], [0.20347002148628235, 0.7514725923538208, 0.09853161871433258, -0.3396223187446594], [0.21849948167800903, 0.5550968050956726, 0.09173917025327682, -0.017565902322530746], [0.2296014130115509, 0.3587871193885803, 0.09138785302639008, 0.302593857049942], [0.2367771565914154, 0.5524958372116089, 0.0974397286772728, 0.04007395729422569], [0.24782706797122955, 0.7460952401161194, 0.09824120998382568, -0.22034570574760437], [0.26274898648262024, 0.5497162938117981, 0.0938342958688736, 0.10163883864879608], [0.27374330163002014, 0.7433769702911377, 0.09586706757545471, -0.1600273996591568], [0.2886108458042145, 0.5470225811004639, 0.09266652166843414, 0.16129353642463684], [0.2995513081550598, 0.3507046103477478, 0.09589239209890366, 0.4817120432853699], [0.30656537413597107, 0.15436920523643494, 0.1055266335606575, 0.8030113577842712], [0.30965277552604675, 0.34789812564849854, 0.1215868592262268, 0.5453000664710999], [0.316610723733902, 0.15129636228084564, 0.13249285519123077, 0.8736841082572937], [0.31963667273521423, 0.34439215064048767, 0.1499665379524231, 0.6254180073738098], [0.3265244960784912, 0.5371376276016235, 0.16247490048408508, 0.3834698498249054], [0.3372672498226166, 0.34012678265571594, 0.17014430463314056, 0.7226519584655762], [0.34406977891921997, 0.5325380563735962, 0.18459734320640564, 0.4879840016365051], [0.3547205626964569, 0.7246413826942444, 0.1943570226430893, 0.2586885392665863], [0.36921337246894836, 0.9165345430374146, 0.19953079521656036, 0.03305020183324814], [0.38754406571388245, 1.1083191633224487, 0.20019179582595825, -0.19064557552337646], [0.40971046686172485, 0.9109802842140198, 0.1963788866996765, 0.15791501104831696], [0.4279300570487976, 1.102828025817871, 0.19953718781471252, -0.06696050614118576], [0.44998663663864136, 1.294613242149353, 0.19819797575473785, -0.29065486788749695], [0.47587889432907104, 1.0972986221313477, 0.19238486886024475, 0.05741218850016594], [0.49782484769821167, 1.28921639919281, 0.19353312253952026, -0.1689404398202896], [0.5236091613769531, 1.4811174869537354, 0.1901543140411377, -0.3948740065097809], [0.5532315373420715, 1.6731045246124268, 0.18225683271884918, -0.6220946311950684], [0.5866936445236206, 1.8652766942977905, 0.16981494426727295, -0.8522911071777344], [0.6239991784095764, 1.668297290802002, 0.15276911854743958, -0.5113860368728638], [0.657365083694458, 1.8609745502471924, 0.14254139363765717, -0.7522963285446167], [0.6945846080780029, 2.0538735389709473, 0.12749546766281128, -0.9969447255134583], [0.735662043094635, 2.2470815181732178, 0.10755657404661179, -1.2470221519470215], [0.7806037068367004, 2.0507571697235107, 0.08261612802743912, -0.9226769208908081], [0.8216188549995422, 1.8546221256256104, 0.06416258960962296, -0.6052162051200867], [0.858711302280426, 1.658664345741272, 0.05205826833844185, -0.29303354024887085], [0.8918845653533936, 1.8530068397521973, 0.046197596937417984, -0.5688542127609253], [0.9289447069168091, 1.6572685241699219, 0.03482051193714142, -0.26198258996009827], [0.9620900750160217, 1.4616671800613403, 0.0295808594673872, 0.04147659242153168], [0.9913234114646912, 1.2661339044570923, 0.030410392209887505, 0.3433438539505005], [1.016646146774292, 1.4608103036880493, 0.03727727010846138, 0.06040350720286369]], "action_prob": [0.5175093412399292, 0.6875422596931458, 0.5295204520225525, 0.682706356048584, 0.46228447556495667, 0.27726247906684875, 0.7621508836746216, 0.7368318438529968, 0.6035043597221375, 0.3741706907749176, 0.2628467381000519, 0.7544750571250916, 0.7422745227813721, 0.6403242945671082, 0.5972186326980591, 0.6432556509971619, 0.5930286645889282, 0.6472556591033936, 0.41264864802360535, 0.26517918705940247, 0.23988671600818634, 0.7461951971054077, 0.7617210149765015, 0.7568281888961792, 0.6816123723983765, 0.5249503254890442, 0.7024214267730713, 0.513938844203949, 0.6802708506584167, 0.5381057262420654, 0.6689469814300537, 0.44329899549484253, 0.7321743965148926, 0.4140508472919464, 0.7414822578430176, 0.6167399287223816, 0.6071280837059021, 0.6355425715446472, 0.41169294714927673, 0.7234145402908325, 0.41501834988594055, 0.2751935124397278, 0.7558556199073792, 0.2660660147666931, 0.758280873298645, 0.25464966893196106, 0.7596147060394287, 0.756356954574585, 0.7015859484672546, 0.4715173840522766, 0.7242290377616882, 0.5824083685874939, 0.6334033608436584, 0.3783823251724243, 0.7509492039680481, 0.6665957570075989, 0.5393946766853333, 0.30313563346862793, 0.7638047933578491, 0.7275634407997131, 0.5847131609916687, 0.3724174499511719, 0.7331855893135071, 0.39555028080940247, 0.7289407253265381, 0.5882362127304077, 0.6567630171775818, 0.4353964626789093, 0.2810675799846649, 0.757016658782959, 0.7251664996147156, 0.5769761800765991, 0.34388110041618347, 0.7507181763648987, 0.6666961312294006, 0.5594523549079895, 0.6705901622772217, 0.5537251830101013, 0.6741415858268738, 0.4517737329006195, 0.7190046906471252, 0.4409599006175995, 0.7251191139221191, 0.5773656368255615, 0.6522626876831055, 0.5874138474464417, 0.35559165477752686, 0.25375911593437195, 0.7549622058868408, 0.7515518069267273, 0.32943210005760193, 0.7550182342529297, 0.6871606707572937, 0.5206036567687988, 0.3028276264667511, 0.7595278024673462, 0.2857041656970978, 0.23806531727313995, 0.749110996723175, 0.7640381455421448, 0.7518104910850525, 0.34099113941192627, 0.7603772282600403, 0.6963557004928589, 0.4818814694881439, 0.7196506261825562, 0.56695955991745, 0.3685418367385864, 0.7305391430854797, 0.6198252439498901, 0.6084669828414917, 0.39555978775024414, 0.725974977016449, 0.6054643988609314, 0.6177165508270264, 0.3974079191684723, 0.7294291853904724, 0.38377949595451355, 0.263470321893692, 0.7608022689819336, 0.25089961290359497, 0.7624770998954773, 0.760564923286438, 0.2796003520488739, 0.7664551138877869, 0.7475021481513977, 0.6604338884353638, 0.5325992703437805, 0.7037039995193481, 0.539890706539154, 0.34521663188934326, 0.7378695011138916, 0.37395891547203064, 0.26737746596336365, 0.2480143904685974, 0.7411465644836426, 0.754821240901947, 0.2593299448490143, 0.2436329871416092, 0.740443766117096, 0.7571555376052856, 0.7585773468017578, 0.2941673696041107, 0.7626469135284424, 0.26918378472328186, 0.7644055485725403, 0.24945764243602753, 0.7633261680603027, 0.7635097503662109, 0.7141349911689758, 0.5658862590789795, 0.6205641627311707, 0.6187753081321716, 0.42680832743644714, 0.701795756816864, 0.5369036197662354, 0.6818332672119141, 0.4924739897251129, 0.29495367407798767, 0.7636314630508423, 0.7292724847793579, 0.6100348234176636, 0.5719967484474182, 0.3579511344432831, 0.7514099478721619, 0.6768248081207275, 0.4814109206199646, 0.6997572183609009, 0.4403539299964905, 0.2819165289402008, 0.23589755594730377, 0.753979504108429, 0.23361413180828094, 0.7488815188407898, 0.7653635740280151, 0.2325817495584488, 0.7609432339668274, 0.7705773115158081, 0.7621049284934998, 0.7252062559127808, 0.34751665592193604, 0.7471452355384827, 0.6961379051208496, 0.38638681173324585, 0.7236313223838806, 0.6589236259460449, 0.5689250826835632, 0.46877244114875793, 0.6205497980117798, 0.4980238676071167, 0.40076175332069397, 0.3268614113330841, 0.7189487814903259, 0.6755150556564331, 0.5994820594787598, 0.5049768090248108, 0.6040036082267761, 0.5042694807052612, 0.3976629376411438, 0.6897073984146118], "advantages": [65.07020568847656, 65.74015808105469, 64.82101440429688, 65.43494415283203, 64.558349609375, 64.86185455322266, 66.34040069580078, 64.87236022949219, 64.28449249267578, 64.72274780273438, 66.49376678466797, 69.09212493896484, 65.98890686035156, 63.904396057128906, 63.2788200378418, 63.574588775634766, 62.939002990722656, 63.237152099609375, 62.58668899536133, 63.06370162963867, 64.71572875976562, 67.7505874633789, 65.08605194091797, 63.22376251220703, 62.28325271606445, 62.389522552490234, 62.1884880065918, 62.14595413208008, 63.45584487915039, 61.82421875, 62.99941635131836, 61.492042541503906, 61.71745681762695, 61.261444091796875, 61.65990447998047, 61.069095611572266, 61.87977600097656, 60.79090118408203, 61.46296691894531, 63.53250503540039, 60.937782287597656, 62.93840026855469, 65.3224105834961, 62.258934020996094, 64.67164611816406, 61.6085090637207, 64.04985809326172, 61.00095748901367, 58.38166427612305, 57.07927703857422, 57.88327407836914, 56.440887451171875, 56.12803649902344, 55.88209915161133, 56.99592590332031, 55.29522705078125, 54.70582580566406, 54.7697868347168, 56.164920806884766, 54.22292709350586, 53.38187026977539, 53.240509033203125, 53.67807388305664, 52.614749908447266, 52.984107971191406, 52.033538818359375, 51.77152633666992, 51.433265686035156, 51.68737030029297, 52.67179870605469, 51.197059631347656, 50.401309967041016, 50.23717498779297, 50.988525390625, 49.64826202392578, 49.23119354248047, 49.07849884033203, 48.640567779541016, 48.49745559692383, 48.03948974609375, 48.2364387512207, 47.47464370727539, 47.70448684692383, 46.922035217285156, 46.76630401611328, 46.33074188232422, 46.14948272705078, 46.899810791015625, 48.88417434692383, 46.17500305175781, 44.75533676147461, 45.50044631958008, 44.049034118652344, 43.50853729248047, 43.360572814941406, 44.181175231933594, 42.63010787963867, 43.50058364868164, 45.60898971557617, 42.803504943847656, 41.12834167480469, 40.32524490356445, 40.41713333129883, 39.528053283691406, 39.11021423339844, 38.74814987182617, 38.26304626464844, 38.09172439575195, 38.29186248779297, 37.248130798339844, 36.635520935058594, 36.392173767089844, 36.5296516418457, 35.56935119628906, 34.998050689697266, 34.723175048828125, 34.866432189941406, 33.907413482666016, 34.10166931152344, 35.05186462402344, 33.47590255737305, 34.73307418823242, 33.020931243896484, 31.814279556274414, 32.70759201049805, 31.31878089904785, 30.40036964416504, 29.96086311340332, 29.735740661621094, 29.150693893432617, 29.266725540161133, 30.452625274658203, 28.21649169921875, 29.25935935974121, 31.32685661315918, 33.36408996582031, 29.98841667175293, 26.752355575561523, 28.77556037902832, 30.896312713623047, 27.54107666015625, 24.36266326904297, 22.359771728515625, 23.285749435424805, 21.188451766967773, 22.222251892089844, 20.019702911376953, 21.180620193481445, 18.864139556884766, 17.547574996948242, 16.79896354675293, 16.400348663330078, 15.5011568069458, 15.007741928100586, 14.856807708740234, 13.663432121276855, 12.933156967163086, 12.296913146972656, 11.625007629394531, 11.4944429397583, 10.281388282775879, 9.500345230102539, 8.986893653869629, 8.108373641967773, 7.601161479949951, 6.6818437576293945, 6.032909393310547, 5.252676963806152, 4.543684005737305, 3.803632974624634, 3.461355447769165, 3.884486675262451, 2.021986722946167, 2.554100513458252, 0.5886266827583313, -0.7249689102172852, -0.8124238848686218, -2.2397050857543945, -3.2996022701263428, -4.188738822937012, -4.9835076332092285, -5.8296308517456055, -6.68121337890625, -7.456789016723633, -8.383384704589844, -9.213141441345215, -9.965304374694824, -10.604227066040039, -11.059999465942383, -12.438786506652832, -12.94234848022461, -13.156770706176758, -12.94666862487793, -14.922598838806152, -16.532800674438477, -17.862979888916016, -18.336570739746094, -19.693920135498047, -20.849578857421875, -21.8323974609375], "value_targets": [86.60203552246094, 86.4666976928711, 86.33000183105469, 86.1919174194336, 86.05244445800781, 85.91156005859375, 85.76924896240234, 85.62550354003906, 85.48030853271484, 85.33364868164062, 85.18550109863281, 85.03585815429688, 84.88470458984375, 84.73202514648438, 84.57780456542969, 84.42202758789062, 84.2646713256836, 84.10572814941406, 83.94518280029297, 83.78301239013672, 83.61920166015625, 83.45374298095703, 83.28660583496094, 83.11778259277344, 82.94725799560547, 82.77500915527344, 82.60102081298828, 82.4252700805664, 82.24774932861328, 82.06842803955078, 81.8873062133789, 81.704345703125, 81.51954650878906, 81.33287048339844, 81.14431762695312, 80.953857421875, 80.76146697998047, 80.567138671875, 80.370849609375, 80.17257690429688, 79.97229766845703, 79.7699966430664, 79.5656509399414, 79.35924530029297, 79.1507568359375, 78.94015502929688, 78.72743225097656, 78.51255798339844, 78.2955093383789, 78.0762710571289, 77.85482025146484, 77.63113403320312, 77.40518188476562, 77.17695617675781, 76.94641876220703, 76.71355438232422, 76.47834014892578, 76.2407455444336, 76.0007553100586, 75.75833892822266, 75.51347351074219, 75.26612854003906, 75.01629638671875, 74.76393127441406, 74.50902557373047, 74.25154113769531, 73.991455078125, 73.72874450683594, 73.46337127685547, 73.19532775878906, 72.92457580566406, 72.65108489990234, 72.37483215332031, 72.09579467773438, 71.81392669677734, 71.52922058105469, 71.24163818359375, 70.9511489868164, 70.65773010253906, 70.36134338378906, 70.06195831298828, 69.75955963134766, 69.45409393310547, 69.14555358886719, 68.83389282226562, 68.51908111572266, 68.20109558105469, 67.87989044189453, 67.55545043945312, 67.22772216796875, 66.89669036865234, 66.56231689453125, 66.22456359863281, 65.88339233398438, 65.53878021240234, 65.19068908691406, 64.83908081054688, 64.48391723632812, 64.12516784667969, 63.76279830932617, 63.396766662597656, 63.027034759521484, 62.65357208251953, 62.276336669921875, 61.895286560058594, 61.51039123535156, 61.12160873413086, 60.72889709472656, 60.332218170166016, 59.93153381347656, 59.52680206298828, 59.11798095703125, 58.70503234863281, 58.28791046142578, 57.8665771484375, 57.44098663330078, 57.0110969543457, 56.576866149902344, 56.138248443603516, 55.6952018737793, 55.247676849365234, 54.79563522338867, 54.33902359008789, 53.877803802490234, 53.411922454833984, 52.94133758544922, 52.46599578857422, 51.98585510253906, 51.50086212158203, 51.01097106933594, 50.51613235473633, 50.01629638671875, 49.511409759521484, 49.001426696777344, 48.486289978027344, 47.965946197509766, 47.44034957885742, 46.909446716308594, 46.37317657470703, 45.83149337768555, 45.28433609008789, 44.731651306152344, 44.17338562011719, 43.60948181152344, 43.039878845214844, 42.46452331542969, 41.883358001708984, 41.296321868896484, 40.70335388183594, 40.104400634765625, 39.499393463134766, 38.888275146484375, 38.2709846496582, 37.6474609375, 37.017635345458984, 36.38145065307617, 35.73883819580078, 35.08973693847656, 34.434078216552734, 33.77179718017578, 33.10282516479492, 32.427093505859375, 31.74454116821289, 31.055091857910156, 30.358678817749023, 29.655229568481445, 28.944677352905273, 28.226945877075195, 27.50196647644043, 26.769662857055664, 26.02996253967285, 25.282791137695312, 24.5280704498291, 23.765727996826172, 22.995685577392578, 22.217864990234375, 21.432186126708984, 20.63857078552246, 19.83694076538086, 19.02721405029297, 18.209306716918945, 17.383136749267578, 16.54862403869629, 15.705680847167969, 14.854223251342773, 13.99416446685791, 13.125418663024902, 12.24789810180664, 11.361513137817383, 10.466174125671387, 9.561792373657227, 8.648275375366211, 7.725530624389648, 6.7934651374816895, 5.851984977722168, 4.900994777679443, 3.940398931503296, 2.970099925994873, 1.9900000095367432, 1.0]}