{"global_step": 84167, "epoch": 500, "test/sim_max_reward_100650": 1.0, "test/sim_max_reward_100651": 0.9836272611798609, "test/sim_max_reward_100652": 1.0, "test/sim_max_reward_100653": 0.9984529698054456, "test/sim_max_reward_100654": 0.6993084780416883, "test/sim_max_reward_100655": 1.0, "test/sim_max_reward_100656": 1.0, "test/sim_max_reward_100657": 0.6949983604832853, "test/sim_max_reward_100658": 0.9987650781039431, "test/sim_max_reward_100659": 1.0, "test/sim_max_reward_100660": 1.0, "test/sim_max_reward_100661": 1.0, "test/sim_max_reward_100662": 1.0, "test/sim_max_reward_100663": 0.4838603510489545, "test/sim_max_reward_100664": 1.0, "test/sim_max_reward_100665": 0.725068245106743, "test/sim_max_reward_100666": 1.0, "test/sim_max_reward_100667": 0.22106641532914753, "test/sim_max_reward_100668": 1.0, "test/sim_max_reward_100669": 1.0, "test/sim_max_reward_100670": 1.0, "test/sim_max_reward_100671": 1.0, "test/sim_max_reward_100672": 0.9803708933775173, "test/sim_max_reward_100673": 1.0, "test/sim_max_reward_100674": 0.9931098608520859, "test/sim_max_reward_100450": 0.9919029459733606, "test/sim_max_reward_100451": 0.0, "test/sim_max_reward_100452": 0.24206373370792003, "test/sim_max_reward_100453": 1.0, "test/sim_max_reward_100454": 1.0, "test/sim_max_reward_100455": 1.0, "test/sim_max_reward_100456": 0.0, "test/sim_max_reward_100457": 0.9844193517054219, "test/sim_max_reward_100458": 0.4843978861954368, "test/sim_max_reward_100459": 0.6319069163829951, "test/sim_max_reward_100460": 0.9846004487985124, "test/sim_max_reward_100461": 1.0, "test/sim_max_reward_100462": 0.962269107478234, "test/sim_max_reward_100463": 1.0, "test/sim_max_reward_100464": 1.0, "test/sim_max_reward_100465": 0.0, "test/sim_max_reward_100466": 0.4755535971647512, "test/sim_max_reward_100467": 0.6401438416501674, "test/sim_max_reward_100468": 1.0, "test/sim_max_reward_100469": 0.9998291223721207, "test/sim_max_reward_100470": 0.6485025649276396, "test/sim_max_reward_100471": 0.0, "test/sim_max_reward_100472": 0.988054356224632, "test/sim_max_reward_100473": 0.9647860346838609, "test/sim_max_reward_100474": 1.0, "test/sim_max_reward_100200": 1.0, "test/sim_max_reward_100201": 0.9999635054844798, "test/sim_max_reward_100202": 0.9955696374708086, "test/sim_max_reward_100203": 1.0, "test/sim_max_reward_100204": 0.9551376183790002, "test/sim_max_reward_100205": 1.0, "test/sim_max_reward_100206": 0.9957963523729236, "test/sim_max_reward_100207": 1.0, "test/sim_max_reward_100208": 1.0, "test/sim_max_reward_100209": 1.0, "test/sim_max_reward_100210": 0.15586047142432483, "test/sim_max_reward_100211": 1.0, "test/sim_max_reward_100212": 1.0, "test/sim_max_reward_100213": 0.9661915862186127, "test/sim_max_reward_100214": 0.0, "test/sim_max_reward_100215": 1.0, "test/sim_max_reward_100216": 0.94861301560252, "test/sim_max_reward_100217": 1.0, "test/sim_max_reward_100218": 1.0, "test/sim_max_reward_100219": 0.9869500671313967, "test/sim_max_reward_100220": 0.6815226246018647, "test/sim_max_reward_100221": 0.2507500883938842, "test/sim_max_reward_100222": 0.9808780456254489, "test/sim_max_reward_100223": 0.5546086514456113, "test/sim_max_reward_100224": 0.9912603867334581, "test/sim_max_reward_100075": 1.0, "test/sim_max_reward_100076": 1.0, "test/sim_max_reward_100077": 1.0, "test/sim_max_reward_100078": 0.9850151661656724, "test/sim_max_reward_100079": 1.0, "test/sim_max_reward_100080": 0.9852808457132028, "test/sim_max_reward_100081": 1.0, "test/sim_max_reward_100082": 1.0, "test/sim_max_reward_100083": 1.0, "test/sim_max_reward_100084": 0.5308496628928177, "test/sim_max_reward_100085": 1.0, "test/sim_max_reward_100086": 1.0, "test/sim_max_reward_100087": 0.8254560956431363, "test/sim_max_reward_100088": 1.0, "test/sim_max_reward_100089": 1.0, "test/sim_max_reward_100090": 1.0, "test/sim_max_reward_100091": 0.38763476587975193, "test/sim_max_reward_100092": 0.1259478749515575, "test/sim_max_reward_100093": 0.0, "test/sim_max_reward_100094": 0.7230364055041981, "test/sim_max_reward_100095": 0.9943380431943764, "test/sim_max_reward_100096": 1.0, "test/sim_max_reward_100097": 1.0, "test/sim_max_reward_100098": 0.721867636301957, "test/sim_max_reward_100099": 1.0, "test/sim_max_reward_100325": 0.9663586115018615, "test/sim_max_reward_100326": 1.0, "test/sim_max_reward_100327": 0.5231106001822893, "test/sim_max_reward_100328": 0.6642666586999407, "test/sim_max_reward_100329": 1.0, "test/sim_max_reward_100330": 0.4919848487094767, "test/sim_max_reward_100331": 0.5255893780414201, "test/sim_max_reward_100332": 1.0, "test/sim_max_reward_100333": 0.0, "test/sim_max_reward_100334": 0.9912726088094925, "test/sim_max_reward_100335": 1.0, "test/sim_max_reward_100336": 1.0, "test/sim_max_reward_100337": 0.0, "test/sim_max_reward_100338": 1.0, "test/sim_max_reward_100339": 0.5690801944522402, "test/sim_max_reward_100340": 1.0, "test/sim_max_reward_100341": 0.26495715530866043, "test/sim_max_reward_100342": 1.0, "test/sim_max_reward_100343": 0.9393132256678725, "test/sim_max_reward_100344": 0.7170947251322198, "test/sim_max_reward_100345": 0.7282626086858525, "test/sim_max_reward_100346": 0.9525979226194662, "test/sim_max_reward_100347": 0.9890070728630901, "test/sim_max_reward_100348": 0.5883447879148069, "test/sim_max_reward_100349": 0.9807851347959082, "test/sim_max_reward_100375": 0.6900363004830679, "test/sim_max_reward_100376": 1.0, "test/sim_max_reward_100377": 0.7178844957976743, "test/sim_max_reward_100378": 1.0, "test/sim_max_reward_100379": 1.0, "test/sim_max_reward_100380": 1.0, "test/sim_max_reward_100381": 1.0, "test/sim_max_reward_100382": 0.4534510914004395, "test/sim_max_reward_100383": 0.6652344152780414, "test/sim_max_reward_100384": 1.0, "test/sim_max_reward_100385": 1.0, "test/sim_max_reward_100386": 0.9710927109156954, "test/sim_max_reward_100387": 1.0, "test/sim_max_reward_100388": 1.0, "test/sim_max_reward_100389": 0.9055468169948054, "test/sim_max_reward_100390": 0.9898770511095365, "test/sim_max_reward_100391": 0.6852364263097003, "test/sim_max_reward_100392": 0.5075570998799126, "test/sim_max_reward_100393": 1.0, "test/sim_max_reward_100394": 0.6986157355784163, "test/sim_max_reward_100395": 0.9931576227834222, "test/sim_max_reward_100396": 1.0, "test/sim_max_reward_100397": 1.0, "test/sim_max_reward_100398": 1.0, "test/sim_max_reward_100399": 0.9926451869641156, "test/sim_max_reward_100150": 0.8170756447884853, "test/sim_max_reward_100151": 0.9851348295086126, "test/sim_max_reward_100152": 0.33403999756212255, "test/sim_max_reward_100153": 0.9699455968774913, "test/sim_max_reward_100154": 0.9798202558887613, "test/sim_max_reward_100155": 0.29490923858404006, "test/sim_max_reward_100156": 1.0, "test/sim_max_reward_100157": 0.9932971389741195, "test/sim_max_reward_100158": 1.0, "test/sim_max_reward_100159": 1.0, "test/sim_max_reward_100160": 0.9907023226763706, "test/sim_max_reward_100161": 0.0, "test/sim_max_reward_100162": 1.0, "test/sim_max_reward_100163": 0.9977527168139654, "test/sim_max_reward_100164": 1.0, "test/sim_max_reward_100165": 0.7210482108197053, "test/sim_max_reward_100166": 1.0, "test/sim_max_reward_100167": 0.19597639164956804, "test/sim_max_reward_100168": 1.0, "test/sim_max_reward_100169": 0.2842539051081466, "test/sim_max_reward_100170": 0.8963467096705136, "test/sim_max_reward_100171": 0.22002151719504137, "test/sim_max_reward_100172": 0.9994724096551441, "test/sim_max_reward_100173": 0.48222889169147914, "test/sim_max_reward_100174": 1.0, "test/sim_max_reward_100925": 0.607315393713649, "test/sim_max_reward_100926": 0.32290818433231466, "test/sim_max_reward_100927": 1.0, "test/sim_max_reward_100928": 0.7067975466009282, "test/sim_max_reward_100929": 1.0, "test/sim_max_reward_100930": 1.0, "test/sim_max_reward_100931": 1.0, "test/sim_max_reward_100932": 0.0, "test/sim_max_reward_100933": 0.9949582223156729, "test/sim_max_reward_100934": 0.6671520454676798, "test/sim_max_reward_100935": 1.0, "test/sim_max_reward_100936": 0.9706447481412397, "test/sim_max_reward_100937": 1.0, "test/sim_max_reward_100938": 0.9756196220394154, "test/sim_max_reward_100939": 0.37325173551174207, "test/sim_max_reward_100940": 1.0, "test/sim_max_reward_100941": 0.9707904826981838, "test/sim_max_reward_100942": 1.0, "test/sim_max_reward_100943": 1.0, "test/sim_max_reward_100944": 0.990454227587822, "test/sim_max_reward_100945": 0.9380555971708141, "test/sim_max_reward_100946": 1.0, "test/sim_max_reward_100947": 1.0, "test/sim_max_reward_100948": 0.9962495400868426, "test/sim_max_reward_100949": 0.0, "test/sim_max_reward_100775": 0.9686175263958058, "test/sim_max_reward_100776": 0.0, "test/sim_max_reward_100777": 0.9948741217923174, "test/sim_max_reward_100778": 1.0, "test/sim_max_reward_100779": 1.0, "test/sim_max_reward_100780": 1.0, "test/sim_max_reward_100781": 0.23483742454056888, "test/sim_max_reward_100782": 0.7879789559562442, "test/sim_max_reward_100783": 1.0, "test/sim_max_reward_100784": 1.0, "test/sim_max_reward_100785": 0.9625470132473175, "test/sim_max_reward_100786": 0.9943324373985125, "test/sim_max_reward_100787": 0.9908434972407175, "test/sim_max_reward_100788": 0.0, "test/sim_max_reward_100789": 1.0, "test/sim_max_reward_100790": 0.20598215072925669, "test/sim_max_reward_100791": 1.0, "test/sim_max_reward_100792": 0.9977468126148364, "test/sim_max_reward_100793": 0.9851245429444448, "test/sim_max_reward_100794": 0.9733353057002673, "test/sim_max_reward_100795": 1.0, "test/sim_max_reward_100796": 1.0, "test/sim_max_reward_100797": 1.0, "test/sim_max_reward_100798": 0.07613417224278962, "test/sim_max_reward_100799": 1.0, "test/sim_max_reward_100175": 1.0, "test/sim_max_reward_100176": 1.0, "test/sim_max_reward_100177": 0.02933957042270729, "test/sim_max_reward_100178": 1.0, "test/sim_max_reward_100179": 0.9642307952520492, "test/sim_max_reward_100180": 0.9864185845678496, "test/sim_max_reward_100181": 0.6273631682076903, "test/sim_max_reward_100182": 0.9666529156551665, "test/sim_max_reward_100183": 0.9878789245169014, "test/sim_max_reward_100184": 1.0, "test/sim_max_reward_100185": 0.5230551994938692, "test/sim_max_reward_100186": 1.0, "test/sim_max_reward_100187": 1.0, "test/sim_max_reward_100188": 1.0, "test/sim_max_reward_100189": 0.724948399177713, "test/sim_max_reward_100190": 1.0, "test/sim_max_reward_100191": 0.9940267724255434, "test/sim_max_reward_100192": 0.5981655173646161, "test/sim_max_reward_100193": 0.6863798030405555, "test/sim_max_reward_100194": 0.5398036712193292, "test/sim_max_reward_100195": 0.24767593264507204, "test/sim_max_reward_100196": 0.9793470216493734, "test/sim_max_reward_100197": 0.5692890443079605, "test/sim_max_reward_100198": 1.0, "test/sim_max_reward_100199": 0.9959798332276449, "test/sim_max_reward_100100": 1.0, "test/sim_max_reward_100101": 1.0, "test/sim_max_reward_100102": 0.7225887585347117, "test/sim_max_reward_100103": 1.0, "test/sim_max_reward_100104": 1.0, "test/sim_max_reward_100105": 1.0, "test/sim_max_reward_100106": 0.7151688513080411, "test/sim_max_reward_100107": 1.0, "test/sim_max_reward_100108": 0.9822213146676875, "test/sim_max_reward_100109": 0.702200691008055, "test/sim_max_reward_100110": 0.5085301246178349, "test/sim_max_reward_100111": 0.9991068700869299, "test/sim_max_reward_100112": 1.0, "test/sim_max_reward_100113": 0.9957423133214728, "test/sim_max_reward_100114": 1.0, "test/sim_max_reward_100115": 0.7182089886783773, "test/sim_max_reward_100116": 0.9759904149969384, "test/sim_max_reward_100117": 1.0, "test/sim_max_reward_100118": 1.0, "test/sim_max_reward_100119": 1.0, "test/sim_max_reward_100120": 1.0, "test/sim_max_reward_100121": 1.0, "test/sim_max_reward_100122": 1.0, "test/sim_max_reward_100123": 0.4877472590343483, "test/sim_max_reward_100124": 0.9336901393370906, "test/sim_max_reward_100350": 0.9175454139117166, "test/sim_max_reward_100351": 1.0, "test/sim_max_reward_100352": 1.0, "test/sim_max_reward_100353": 0.9994557441625372, "test/sim_max_reward_100354": 1.0, "test/sim_max_reward_100355": 0.9667042577154455, "test/sim_max_reward_100356": 0.6899999176866632, "test/sim_max_reward_100357": 0.7160142183354826, "test/sim_max_reward_100358": 1.0, "test/sim_max_reward_100359": 0.9742213912476448, "test/sim_max_reward_100360": 1.0, "test/sim_max_reward_100361": 1.0, "test/sim_max_reward_100362": 0.6127663176929823, "test/sim_max_reward_100363": 1.0, "test/sim_max_reward_100364": 0.7288853390008053, "test/sim_max_reward_100365": 0.9554747701106797, "test/sim_max_reward_100366": 1.0, "test/sim_max_reward_100367": 0.0, "test/sim_max_reward_100368": 0.9908701837135674, "test/sim_max_reward_100369": 0.8674035040401985, "test/sim_max_reward_100370": 0.17920370349676124, "test/sim_max_reward_100371": 0.0, "test/sim_max_reward_100372": 0.9251226691001598, "test/sim_max_reward_100373": 0.8756782896040832, "test/sim_max_reward_100374": 1.0, "test/sim_max_reward_100975": 1.0, "test/sim_max_reward_100976": 0.7370302403644253, "test/sim_max_reward_100977": 1.0, "test/sim_max_reward_100978": 0.7017969054659985, "test/sim_max_reward_100979": 1.0, "test/sim_max_reward_100980": 0.9560984786656771, "test/sim_max_reward_100981": 0.9961098029004755, "test/sim_max_reward_100982": 0.9607153483591752, "test/sim_max_reward_100983": 0.97410729771006, "test/sim_max_reward_100984": 1.0, "test/sim_max_reward_100985": 1.0, "test/sim_max_reward_100986": 1.0, "test/sim_max_reward_100987": 1.0, "test/sim_max_reward_100988": 0.9981427691430418, "test/sim_max_reward_100989": 1.0, "test/sim_max_reward_100990": 1.0, "test/sim_max_reward_100991": 1.0, "test/sim_max_reward_100992": 1.0, "test/sim_max_reward_100993": 1.0, "test/sim_max_reward_100994": 1.0, "test/sim_max_reward_100995": 0.9956082866786868, "test/sim_max_reward_100996": 1.0, "test/sim_max_reward_100997": 0.7258287718179045, "test/sim_max_reward_100998": 0.9840981569000606, "test/sim_max_reward_100999": 0.9922583665706955, "test/sim_max_reward_100800": 1.0, "test/sim_max_reward_100801": 0.99313437070546, "test/sim_max_reward_100802": 0.9944295856148649, "test/sim_max_reward_100803": 0.9653217929836162, "test/sim_max_reward_100804": 0.9800207485622735, "test/sim_max_reward_100805": 0.6485630173905996, "test/sim_max_reward_100806": 0.0, "test/sim_max_reward_100807": 1.0, "test/sim_max_reward_100808": 1.0, "test/sim_max_reward_100809": 0.9784125083639388, "test/sim_max_reward_100810": 0.986186457272048, "test/sim_max_reward_100811": 1.0, "test/sim_max_reward_100812": 0.9688207192084661, "test/sim_max_reward_100813": 0.9744930606778395, "test/sim_max_reward_100814": 1.0, "test/sim_max_reward_100815": 1.0, "test/sim_max_reward_100816": 1.0, "test/sim_max_reward_100817": 0.0, "test/sim_max_reward_100818": 1.0, "test/sim_max_reward_100819": 1.0, "test/sim_max_reward_100820": 0.9605891644181005, "test/sim_max_reward_100821": 0.5457920538174492, "test/sim_max_reward_100822": 1.0, "test/sim_max_reward_100823": 0.6041486377310438, "test/sim_max_reward_100824": 1.0, "test/sim_max_reward_100625": 0.7067799409940081, "test/sim_max_reward_100626": 0.989393417089876, "test/sim_max_reward_100627": 1.0, "test/sim_max_reward_100628": 1.0, "test/sim_max_reward_100629": 0.0, "test/sim_max_reward_100630": 1.0, "test/sim_max_reward_100631": 1.0, "test/sim_max_reward_100632": 0.9768833369508468, "test/sim_max_reward_100633": 1.0, "test/sim_max_reward_100634": 0.0, "test/sim_max_reward_100635": 0.9856709052551006, "test/sim_max_reward_100636": 0.6800291852310281, "test/sim_max_reward_100637": 0.8872890291465975, "test/sim_max_reward_100638": 0.9933455180159476, "test/sim_max_reward_100639": 0.989927903085088, "test/sim_max_reward_100640": 0.998790859335771, "test/sim_max_reward_100641": 1.0, "test/sim_max_reward_100642": 0.9968556346199109, "test/sim_max_reward_100643": 0.9956959985014171, "test/sim_max_reward_100644": 1.0, "test/sim_max_reward_100645": 1.0, "test/sim_max_reward_100646": 1.0, "test/sim_max_reward_100647": 1.0, "test/sim_max_reward_100648": 1.0, "test/sim_max_reward_100649": 0.996209530816789, "test/sim_max_reward_100050": 0.996596287641588, "test/sim_max_reward_100051": 0.8831943378435408, "test/sim_max_reward_100052": 0.9768397070642932, "test/sim_max_reward_100053": 0.721380176295159, "test/sim_max_reward_100054": 1.0, "test/sim_max_reward_100055": 0.15218962419549573, "test/sim_max_reward_100056": 1.0, "test/sim_max_reward_100057": 0.6180667650678929, "test/sim_max_reward_100058": 1.0, "test/sim_max_reward_100059": 0.9807479100114068, "test/sim_max_reward_100060": 0.9569820490577864, "test/sim_max_reward_100061": 0.8965684155448576, "test/sim_max_reward_100062": 0.9404039355201222, "test/sim_max_reward_100063": 0.9970707519835172, "test/sim_max_reward_100064": 1.0, "test/sim_max_reward_100065": 0.46293813238193915, "test/sim_max_reward_100066": 1.0, "test/sim_max_reward_100067": 0.7183367551361161, "test/sim_max_reward_100068": 0.7216792860581339, "test/sim_max_reward_100069": 0.5836906972350795, "test/sim_max_reward_100070": 0.6595936214474484, "test/sim_max_reward_100071": 0.5482069572811578, "test/sim_max_reward_100072": 0.45294098350142387, "test/sim_max_reward_100073": 0.9045584183523702, "test/sim_max_reward_100074": 1.0, "test/sim_max_reward_100225": 0.9735841292205049, "test/sim_max_reward_100226": 0.4581848554010335, "test/sim_max_reward_100227": 0.9867667678658524, "test/sim_max_reward_100228": 1.0, "test/sim_max_reward_100229": 1.0, "test/sim_max_reward_100230": 0.9908223234170833, "test/sim_max_reward_100231": 0.9824160874287698, "test/sim_max_reward_100232": 0.5658074553002722, "test/sim_max_reward_100233": 0.9969712347061116, "test/sim_max_reward_100234": 0.9926613953927571, "test/sim_max_reward_100235": 0.993621856432211, "test/sim_max_reward_100236": 0.979981195067095, "test/sim_max_reward_100237": 0.986103913655203, "test/sim_max_reward_100238": 0.9987542571128213, "test/sim_max_reward_100239": 0.9926102848140504, "test/sim_max_reward_100240": 1.0, "test/sim_max_reward_100241": 1.0, "test/sim_max_reward_100242": 1.0, "test/sim_max_reward_100243": 0.48307203740342824, "test/sim_max_reward_100244": 0.9911241127095717, "test/sim_max_reward_100245": 0.9932059293124329, "test/sim_max_reward_100246": 0.9929441067530157, "test/sim_max_reward_100247": 0.9975586179659158, "test/sim_max_reward_100248": 1.0, "test/sim_max_reward_100249": 0.6259976628543575, "test/sim_max_reward_100825": 0.9819167470530762, "test/sim_max_reward_100826": 0.6168800850298304, "test/sim_max_reward_100827": 0.24779714215256005, "test/sim_max_reward_100828": 0.4735838840822256, "test/sim_max_reward_100829": 0.9709178400753111, "test/sim_max_reward_100830": 1.0, "test/sim_max_reward_100831": 1.0, "test/sim_max_reward_100832": 0.9948252956691693, "test/sim_max_reward_100833": 0.9356852005510657, "test/sim_max_reward_100834": 0.7026484804617786, "test/sim_max_reward_100835": 1.0, "test/sim_max_reward_100836": 1.0, "test/sim_max_reward_100837": 0.9094100648989248, "test/sim_max_reward_100838": 1.0, "test/sim_max_reward_100839": 0.9857901492565336, "test/sim_max_reward_100840": 0.5376880845843511, "test/sim_max_reward_100841": 0.5180206397745696, "test/sim_max_reward_100842": 1.0, "test/sim_max_reward_100843": 1.0, "test/sim_max_reward_100844": 1.0, "test/sim_max_reward_100845": 0.7142064049368292, "test/sim_max_reward_100846": 0.9241872880400138, "test/sim_max_reward_100847": 1.0, "test/sim_max_reward_100848": 0.9809596982395168, "test/sim_max_reward_100849": 0.8992525470455712, "test/sim_max_reward_100900": 1.0, "test/sim_max_reward_100901": 0.7272555629272026, "test/sim_max_reward_100902": 0.2843544199877123, "test/sim_max_reward_100903": 1.0, "test/sim_max_reward_100904": 0.9549349848873877, "test/sim_max_reward_100905": 0.9946362258987173, "test/sim_max_reward_100906": 0.6867065853678895, "test/sim_max_reward_100907": 0.9991350510951928, "test/sim_max_reward_100908": 1.0, "test/sim_max_reward_100909": 0.7175105200591363, "test/sim_max_reward_100910": 1.0, "test/sim_max_reward_100911": 1.0, "test/sim_max_reward_100912": 0.9931737960676275, "test/sim_max_reward_100913": 1.0, "test/sim_max_reward_100914": 0.7992824208575305, "test/sim_max_reward_100915": 0.6288126199419043, "test/sim_max_reward_100916": 0.6651214949266425, "test/sim_max_reward_100917": 0.6696079465579261, "test/sim_max_reward_100918": 1.0, "test/sim_max_reward_100919": 0.9825178876480642, "test/sim_max_reward_100920": 1.0, "test/sim_max_reward_100921": 0.9933799702947378, "test/sim_max_reward_100922": 0.6725133534895913, "test/sim_max_reward_100923": 0.9753188649478107, "test/sim_max_reward_100924": 0.8789541513359993, "test/sim_max_reward_100700": 0.9649224001630957, "test/sim_max_reward_100701": 0.9743352250710658, "test/sim_max_reward_100702": 1.0, "test/sim_max_reward_100703": 0.1649292845300129, "test/sim_max_reward_100704": 0.034243579862043926, "test/sim_max_reward_100705": 1.0, "test/sim_max_reward_100706": 0.6246086613803663, "test/sim_max_reward_100707": 0.9448243647248709, "test/sim_max_reward_100708": 0.9806612013828793, "test/sim_max_reward_100709": 1.0, "test/sim_max_reward_100710": 0.8869806806206006, "test/sim_max_reward_100711": 0.9971005368424358, "test/sim_max_reward_100712": 1.0, "test/sim_max_reward_100713": 1.0, "test/sim_max_reward_100714": 1.0, "test/sim_max_reward_100715": 0.9757978777551659, "test/sim_max_reward_100716": 0.9944772202407532, "test/sim_max_reward_100717": 1.0, "test/sim_max_reward_100718": 0.8578806017696724, "test/sim_max_reward_100719": 1.0, "test/sim_max_reward_100720": 1.0, "test/sim_max_reward_100721": 0.994459339476519, "test/sim_max_reward_100722": 1.0, "test/sim_max_reward_100723": 1.0, "test/sim_max_reward_100724": 0.9489108928038109, "test/sim_max_reward_100000": 1.0, "test/sim_max_reward_100001": 0.8860776071445418, "test/sim_max_reward_100002": 0.9848742970545953, "test/sim_max_reward_100003": 0.6725808419032093, "test/sim_max_reward_100004": 1.0, "test/sim_max_reward_100005": 1.0, "test/sim_max_reward_100006": 0.6876645853929398, "test/sim_max_reward_100007": 1.0, "test/sim_max_reward_100008": 1.0, "test/sim_max_reward_100009": 0.6630266533115264, "test/sim_max_reward_100010": 1.0, "test/sim_max_reward_100011": 0.8729820954535515, "test/sim_max_reward_100012": 1.0, "test/sim_max_reward_100013": 0.9952408449014896, "test/sim_max_reward_100014": 0.9918995372348649, "test/sim_max_reward_100015": 0.675532594643955, "test/sim_max_reward_100016": 0.9725464131181504, "test/sim_max_reward_100017": 0.9428342549143132, "test/sim_max_reward_100018": 1.0, "test/sim_max_reward_100019": 1.0, "test/sim_max_reward_100020": 1.0, "test/sim_max_reward_100021": 1.0, "test/sim_max_reward_100022": 1.0, "test/sim_max_reward_100023": 1.0, "test/sim_max_reward_100024": 0.571683286543568, "test/sim_max_reward_100425": 1.0, "test/sim_max_reward_100426": 0.4098702062022917, "test/sim_max_reward_100427": 0.5990542198859902, "test/sim_max_reward_100428": 0.7233999919962742, "test/sim_max_reward_100429": 1.0, "test/sim_max_reward_100430": 1.0, "test/sim_max_reward_100431": 0.7281277954845945, "test/sim_max_reward_100432": 0.024883496163835003, "test/sim_max_reward_100433": 0.05570529935541475, "test/sim_max_reward_100434": 1.0, "test/sim_max_reward_100435": 0.9756315535177488, "test/sim_max_reward_100436": 0.49841891549094003, "test/sim_max_reward_100437": 0.5964303737009878, "test/sim_max_reward_100438": 0.9814958140477064, "test/sim_max_reward_100439": 0.5727575674288298, "test/sim_max_reward_100440": 1.0, "test/sim_max_reward_100441": 0.6632372397263134, "test/sim_max_reward_100442": 0.992517780390376, "test/sim_max_reward_100443": 0.45485664380812696, "test/sim_max_reward_100444": 1.0, "test/sim_max_reward_100445": 0.7039559406120864, "test/sim_max_reward_100446": 1.0, "test/sim_max_reward_100447": 0.9930891846765251, "test/sim_max_reward_100448": 0.0, "test/sim_max_reward_100449": 0.981034421556519, "test/sim_max_reward_100550": 1.0, "test/sim_max_reward_100551": 1.0, "test/sim_max_reward_100552": 1.0, "test/sim_max_reward_100553": 0.6115847791306067, "test/sim_max_reward_100554": 1.0, "test/sim_max_reward_100555": 1.0, "test/sim_max_reward_100556": 0.6489463977005546, "test/sim_max_reward_100557": 0.41514125930298973, "test/sim_max_reward_100558": 1.0, "test/sim_max_reward_100559": 1.0, "test/sim_max_reward_100560": 1.0, "test/sim_max_reward_100561": 0.9729589956409751, "test/sim_max_reward_100562": 0.8205531049489102, "test/sim_max_reward_100563": 0.9905518317156957, "test/sim_max_reward_100564": 1.0, "test/sim_max_reward_100565": 0.9808739916903888, "test/sim_max_reward_100566": 0.7061748403387857, "test/sim_max_reward_100567": 0.5107104143674389, "test/sim_max_reward_100568": 0.9868090294583195, "test/sim_max_reward_100569": 1.0, "test/sim_max_reward_100570": 0.6496075769360148, "test/sim_max_reward_100571": 0.9958316482481921, "test/sim_max_reward_100572": 1.0, "test/sim_max_reward_100573": 0.946419240120128, "test/sim_max_reward_100574": 1.0, "test/sim_max_reward_100500": 0.08544741300407577, "test/sim_max_reward_100501": 0.9055291192877889, "test/sim_max_reward_100502": 0.43003962157225695, "test/sim_max_reward_100503": 0.009772987843080816, "test/sim_max_reward_100504": 0.7146203790063141, "test/sim_max_reward_100505": 0.9454455321223607, "test/sim_max_reward_100506": 1.0, "test/sim_max_reward_100507": 1.0, "test/sim_max_reward_100508": 0.9925632940724258, "test/sim_max_reward_100509": 0.9928275367535978, "test/sim_max_reward_100510": 0.9847545805207982, "test/sim_max_reward_100511": 1.0, "test/sim_max_reward_100512": 0.9782321139799751, "test/sim_max_reward_100513": 1.0, "test/sim_max_reward_100514": 1.0, "test/sim_max_reward_100515": 1.0, "test/sim_max_reward_100516": 0.6461472240847297, "test/sim_max_reward_100517": 0.7037925424222886, "test/sim_max_reward_100518": 0.9308706227705165, "test/sim_max_reward_100519": 1.0, "test/sim_max_reward_100520": 1.0, "test/sim_max_reward_100521": 0.9590992807997574, "test/sim_max_reward_100522": 0.0, "test/sim_max_reward_100523": 0.62005086938911, "test/sim_max_reward_100524": 1.0, "test/sim_max_reward_100850": 1.0, "test/sim_max_reward_100851": 1.0, "test/sim_max_reward_100852": 0.0, "test/sim_max_reward_100853": 0.16157351865827485, "test/sim_max_reward_100854": 1.0, "test/sim_max_reward_100855": 0.4688304165732199, "test/sim_max_reward_100856": 1.0, "test/sim_max_reward_100857": 1.0, "test/sim_max_reward_100858": 1.0, "test/sim_max_reward_100859": 1.0, "test/sim_max_reward_100860": 0.7733525372208864, "test/sim_max_reward_100861": 1.0, "test/sim_max_reward_100862": 0.6884609094797888, "test/sim_max_reward_100863": 0.7175917975454768, "test/sim_max_reward_100864": 1.0, "test/sim_max_reward_100865": 0.6492622155788053, "test/sim_max_reward_100866": 1.0, "test/sim_max_reward_100867": 1.0, "test/sim_max_reward_100868": 1.0, "test/sim_max_reward_100869": 0.03576611749983982, "test/sim_max_reward_100870": 0.9832945069523817, "test/sim_max_reward_100871": 0.9366937689491834, "test/sim_max_reward_100872": 1.0, "test/sim_max_reward_100873": 0.9939452397889982, "test/sim_max_reward_100874": 1.0, "test/sim_max_reward_100475": 1.0, "test/sim_max_reward_100476": 1.0, "test/sim_max_reward_100477": 0.6389050021462187, "test/sim_max_reward_100478": 1.0, "test/sim_max_reward_100479": 0.9964509542523309, "test/sim_max_reward_100480": 1.0, "test/sim_max_reward_100481": 1.0, "test/sim_max_reward_100482": 1.0, "test/sim_max_reward_100483": 1.0, "test/sim_max_reward_100484": 0.1492957047209275, "test/sim_max_reward_100485": 0.6885693371935075, "test/sim_max_reward_100486": 1.0, "test/sim_max_reward_100487": 0.5321563090794329, "test/sim_max_reward_100488": 0.9831893211442309, "test/sim_max_reward_100489": 0.43935136088569304, "test/sim_max_reward_100490": 1.0, "test/sim_max_reward_100491": 0.9907383555718159, "test/sim_max_reward_100492": 0.9941770808442402, "test/sim_max_reward_100493": 0.7246686681461574, "test/sim_max_reward_100494": 0.9990617149963087, "test/sim_max_reward_100495": 1.0, "test/sim_max_reward_100496": 1.0, "test/sim_max_reward_100497": 0.9944254417993066, "test/sim_max_reward_100498": 1.0, "test/sim_max_reward_100499": 0.5750623214535996, "test/sim_max_reward_100575": 0.9799516223258569, "test/sim_max_reward_100576": 0.9450257038729568, "test/sim_max_reward_100577": 0.694862314739952, "test/sim_max_reward_100578": 0.9979960810204123, "test/sim_max_reward_100579": 1.0, "test/sim_max_reward_100580": 0.0, "test/sim_max_reward_100581": 0.9957659271659377, "test/sim_max_reward_100582": 1.0, "test/sim_max_reward_100583": 1.0, "test/sim_max_reward_100584": 0.9897407652132596, "test/sim_max_reward_100585": 0.8289753594688748, "test/sim_max_reward_100586": 0.974904828833674, "test/sim_max_reward_100587": 1.0, "test/sim_max_reward_100588": 1.0, "test/sim_max_reward_100589": 0.7229199952204445, "test/sim_max_reward_100590": 1.0, "test/sim_max_reward_100591": 0.4284006111351296, "test/sim_max_reward_100592": 0.6972269963584091, "test/sim_max_reward_100593": 1.0, "test/sim_max_reward_100594": 0.9901406868805991, "test/sim_max_reward_100595": 0.5952834401225311, "test/sim_max_reward_100596": 0.9963163028590512, "test/sim_max_reward_100597": 1.0, "test/sim_max_reward_100598": 0.9809302624433472, "test/sim_max_reward_100599": 1.0, "test/sim_max_reward_100725": 0.9683260816839514, "test/sim_max_reward_100726": 0.7251682557873365, "test/sim_max_reward_100727": 1.0, "test/sim_max_reward_100728": 1.0, "test/sim_max_reward_100729": 0.6132905052230548, "test/sim_max_reward_100730": 0.6415788254409367, "test/sim_max_reward_100731": 1.0, "test/sim_max_reward_100732": 1.0, "test/sim_max_reward_100733": 0.5455946064935092, "test/sim_max_reward_100734": 1.0, "test/sim_max_reward_100735": 1.0, "test/sim_max_reward_100736": 0.9876406514053349, "test/sim_max_reward_100737": 1.0, "test/sim_max_reward_100738": 1.0, "test/sim_max_reward_100739": 0.9382600751757871, "test/sim_max_reward_100740": 0.6560497349401438, "test/sim_max_reward_100741": 1.0, "test/sim_max_reward_100742": 0.9740177834044896, "test/sim_max_reward_100743": 1.0, "test/sim_max_reward_100744": 1.0, "test/sim_max_reward_100745": 0.9919648100718815, "test/sim_max_reward_100746": 1.0, "test/sim_max_reward_100747": 1.0, "test/sim_max_reward_100748": 1.0, "test/sim_max_reward_100749": 0.698801005109317, "test/sim_max_reward_100125": 0.7197871100828904, "test/sim_max_reward_100126": 1.0, "test/sim_max_reward_100127": 0.9946074585885923, "test/sim_max_reward_100128": 0.9835081615019168, "test/sim_max_reward_100129": 1.0, "test/sim_max_reward_100130": 0.0, "test/sim_max_reward_100131": 0.982070979507591, "test/sim_max_reward_100132": 0.0, "test/sim_max_reward_100133": 1.0, "test/sim_max_reward_100134": 1.0, "test/sim_max_reward_100135": 0.9954142283075605, "test/sim_max_reward_100136": 1.0, "test/sim_max_reward_100137": 1.0, "test/sim_max_reward_100138": 0.9868229692277871, "test/sim_max_reward_100139": 1.0, "test/sim_max_reward_100140": 0.9574676472694543, "test/sim_max_reward_100141": 0.9669801269778776, "test/sim_max_reward_100142": 0.992959453315668, "test/sim_max_reward_100143": 1.0, "test/sim_max_reward_100144": 1.0, "test/sim_max_reward_100145": 0.9876479436963355, "test/sim_max_reward_100146": 0.9936810110703287, "test/sim_max_reward_100147": 1.0, "test/sim_max_reward_100148": 0.0, "test/sim_max_reward_100149": 1.0, "test/sim_max_reward_100950": 1.0, "test/sim_max_reward_100951": 1.0, "test/sim_max_reward_100952": 0.9471564014597394, "test/sim_max_reward_100953": 0.9422547039131632, "test/sim_max_reward_100954": 1.0, "test/sim_max_reward_100955": 0.5742941967718058, "test/sim_max_reward_100956": 1.0, "test/sim_max_reward_100957": 0.7117246772784865, "test/sim_max_reward_100958": 1.0, "test/sim_max_reward_100959": 1.0, "test/sim_max_reward_100960": 1.0, "test/sim_max_reward_100961": 0.6818049055131494, "test/sim_max_reward_100962": 0.9930190595073668, "test/sim_max_reward_100963": 0.9872562699700824, "test/sim_max_reward_100964": 0.7277686287576384, "test/sim_max_reward_100965": 1.0, "test/sim_max_reward_100966": 0.7267589933422299, "test/sim_max_reward_100967": 1.0, "test/sim_max_reward_100968": 1.0, "test/sim_max_reward_100969": 0.9874108188082423, "test/sim_max_reward_100970": 1.0, "test/sim_max_reward_100971": 1.0, "test/sim_max_reward_100972": 0.6664409163253112, "test/sim_max_reward_100973": 0.6226827194580673, "test/sim_max_reward_100974": 1.0, "test/sim_max_reward_100875": 1.0, "test/sim_max_reward_100876": 0.983272331316513, "test/sim_max_reward_100877": 0.9672945415971566, "test/sim_max_reward_100878": 1.0, "test/sim_max_reward_100879": 1.0, "test/sim_max_reward_100880": 0.9481015926754199, "test/sim_max_reward_100881": 0.6745267549333412, "test/sim_max_reward_100882": 1.0, "test/sim_max_reward_100883": 0.6428606560537554, "test/sim_max_reward_100884": 1.0, "test/sim_max_reward_100885": 0.9892825063396486, "test/sim_max_reward_100886": 0.6153623610105787, "test/sim_max_reward_100887": 0.672904852475914, "test/sim_max_reward_100888": 1.0, "test/sim_max_reward_100889": 1.0, "test/sim_max_reward_100890": 1.0, "test/sim_max_reward_100891": 1.0, "test/sim_max_reward_100892": 0.9850704071553169, "test/sim_max_reward_100893": 0.6804018575427364, "test/sim_max_reward_100894": 0.9945692407772937, "test/sim_max_reward_100895": 0.9930878902316634, "test/sim_max_reward_100896": 1.0, "test/sim_max_reward_100897": 0.3175525766764698, "test/sim_max_reward_100898": 0.8459231532028472, "test/sim_max_reward_100899": 1.0, "test/sim_max_reward_100275": 0.984060938266468, "test/sim_max_reward_100276": 0.996831531225126, "test/sim_max_reward_100277": 0.24369421906050426, "test/sim_max_reward_100278": 0.9825462784696241, "test/sim_max_reward_100279": 0.6275017193203499, "test/sim_max_reward_100280": 1.0, "test/sim_max_reward_100281": 0.9547678015341857, "test/sim_max_reward_100282": 0.9517525368454548, "test/sim_max_reward_100283": 0.9363150147403605, "test/sim_max_reward_100284": 0.9662034614768209, "test/sim_max_reward_100285": 1.0, "test/sim_max_reward_100286": 1.0, "test/sim_max_reward_100287": 0.8639364606347201, "test/sim_max_reward_100288": 1.0, "test/sim_max_reward_100289": 1.0, "test/sim_max_reward_100290": 0.5466797645613323, "test/sim_max_reward_100291": 1.0, "test/sim_max_reward_100292": 0.9224426944357462, "test/sim_max_reward_100293": 1.0, "test/sim_max_reward_100294": 1.0, "test/sim_max_reward_100295": 1.0, "test/sim_max_reward_100296": 0.6284263187406789, "test/sim_max_reward_100297": 0.421658310767922, "test/sim_max_reward_100298": 1.0, "test/sim_max_reward_100299": 1.0, "test/sim_max_reward_100025": 0.9885411496596627, "test/sim_max_reward_100026": 0.9671881283223862, "test/sim_max_reward_100027": 0.9780545836988936, "test/sim_max_reward_100028": 1.0, "test/sim_max_reward_100029": 1.0, "test/sim_max_reward_100030": 0.9961329225847846, "test/sim_max_reward_100031": 1.0, "test/sim_max_reward_100032": 1.0, "test/sim_max_reward_100033": 1.0, "test/sim_max_reward_100034": 0.6071949727828858, "test/sim_max_reward_100035": 0.6428527107500349, "test/sim_max_reward_100036": 0.5137520263722845, "test/sim_max_reward_100037": 1.0, "test/sim_max_reward_100038": 0.9628955569476347, "test/sim_max_reward_100039": 1.0, "test/sim_max_reward_100040": 1.0, "test/sim_max_reward_100041": 1.0, "test/sim_max_reward_100042": 1.0, "test/sim_max_reward_100043": 0.525629399378483, "test/sim_max_reward_100044": 1.0, "test/sim_max_reward_100045": 1.0, "test/sim_max_reward_100046": 0.7059281787960106, "test/sim_max_reward_100047": 1.0, "test/sim_max_reward_100048": 1.0, "test/sim_max_reward_100049": 0.0, "test/sim_max_reward_100250": 0.8303991197001669, "test/sim_max_reward_100251": 1.0, "test/sim_max_reward_100252": 1.0, "test/sim_max_reward_100253": 1.0, "test/sim_max_reward_100254": 1.0, "test/sim_max_reward_100255": 1.0, "test/sim_max_reward_100256": 1.0, "test/sim_max_reward_100257": 0.9661398952349883, "test/sim_max_reward_100258": 0.0, "test/sim_max_reward_100259": 1.0, "test/sim_max_reward_100260": 0.9584945515187037, "test/sim_max_reward_100261": 0.9558023943720491, "test/sim_max_reward_100262": 0.974425434015766, "test/sim_max_reward_100263": 0.9679686482546094, "test/sim_max_reward_100264": 0.9050245693376728, "test/sim_max_reward_100265": 1.0, "test/sim_max_reward_100266": 0.7204140063544631, "test/sim_max_reward_100267": 0.9826899692858179, "test/sim_max_reward_100268": 1.0, "test/sim_max_reward_100269": 1.0, "test/sim_max_reward_100270": 0.0, "test/sim_max_reward_100271": 1.0, "test/sim_max_reward_100272": 1.0, "test/sim_max_reward_100273": 0.9765270539203529, "test/sim_max_reward_100274": 1.0, "test/sim_max_reward_100300": 0.47158306666193206, "test/sim_max_reward_100301": 0.11575626880589691, "test/sim_max_reward_100302": 0.7062328400591971, "test/sim_max_reward_100303": 0.7141039862274707, "test/sim_max_reward_100304": 0.9069076840878941, "test/sim_max_reward_100305": 0.9918065142596556, "test/sim_max_reward_100306": 0.97188702201679, "test/sim_max_reward_100307": 0.7156215254149833, "test/sim_max_reward_100308": 0.7265361921402822, "test/sim_max_reward_100309": 0.983223557759286, "test/sim_max_reward_100310": 0.997121522995627, "test/sim_max_reward_100311": 0.72512594263006, "test/sim_max_reward_100312": 1.0, "test/sim_max_reward_100313": 1.0, "test/sim_max_reward_100314": 0.9725047563153849, "test/sim_max_reward_100315": 0.36935624628866254, "test/sim_max_reward_100316": 0.9931596670104414, "test/sim_max_reward_100317": 0.6946987520251854, "test/sim_max_reward_100318": 1.0, "test/sim_max_reward_100319": 1.0, "test/sim_max_reward_100320": 1.0, "test/sim_max_reward_100321": 1.0, "test/sim_max_reward_100322": 0.6215415663002578, "test/sim_max_reward_100323": 0.6276007699951771, "test/sim_max_reward_100324": 0.5641888167440811, "test/sim_max_reward_100675": 1.0, "test/sim_max_reward_100676": 0.5286073651920475, "test/sim_max_reward_100677": 0.9918485187817249, "test/sim_max_reward_100678": 0.7042939145983119, "test/sim_max_reward_100679": 0.6486225695163466, "test/sim_max_reward_100680": 0.9840627151387897, "test/sim_max_reward_100681": 0.992024185751194, "test/sim_max_reward_100682": 0.8923127616724483, "test/sim_max_reward_100683": 0.8137962633014622, "test/sim_max_reward_100684": 0.46652136868363986, "test/sim_max_reward_100685": 0.9775160852481605, "test/sim_max_reward_100686": 1.0, "test/sim_max_reward_100687": 0.9992486095303165, "test/sim_max_reward_100688": 1.0, "test/sim_max_reward_100689": 0.980520542115558, "test/sim_max_reward_100690": 0.9930701172205038, "test/sim_max_reward_100691": 0.6552902321582635, "test/sim_max_reward_100692": 1.0, "test/sim_max_reward_100693": 0.975300385336388, "test/sim_max_reward_100694": 1.0, "test/sim_max_reward_100695": 0.5876039497182919, "test/sim_max_reward_100696": 1.0, "test/sim_max_reward_100697": 1.0, "test/sim_max_reward_100698": 1.0, "test/sim_max_reward_100699": 1.0, "test/sim_max_reward_100750": 1.0, "test/sim_max_reward_100751": 0.9243989864975627, "test/sim_max_reward_100752": 0.990729873130719, "test/sim_max_reward_100753": 1.0, "test/sim_max_reward_100754": 0.9692100116269463, "test/sim_max_reward_100755": 0.673662195994639, "test/sim_max_reward_100756": 1.0, "test/sim_max_reward_100757": 1.0, "test/sim_max_reward_100758": 1.0, "test/sim_max_reward_100759": 1.0, "test/sim_max_reward_100760": 0.9807386580157113, "test/sim_max_reward_100761": 1.0, "test/sim_max_reward_100762": 0.4439960694061506, "test/sim_max_reward_100763": 0.9872020343630136, "test/sim_max_reward_100764": 0.47214411587723143, "test/sim_max_reward_100765": 1.0, "test/sim_max_reward_100766": 0.9539832263292758, "test/sim_max_reward_100767": 1.0, "test/sim_max_reward_100768": 1.0, "test/sim_max_reward_100769": 0.47777009793018876, "test/sim_max_reward_100770": 0.9715891543755096, "test/sim_max_reward_100771": 0.9999367734493768, "test/sim_max_reward_100772": 1.0, "test/sim_max_reward_100773": 0.9735124688910173, "test/sim_max_reward_100774": 1.0, "test/sim_max_reward_100600": 1.0, "test/sim_max_reward_100601": 0.9922025561530784, "test/sim_max_reward_100602": 1.0, "test/sim_max_reward_100603": 0.999378997079747, "test/sim_max_reward_100604": 1.0, "test/sim_max_reward_100605": 0.9817313411636185, "test/sim_max_reward_100606": 0.15406562526207762, "test/sim_max_reward_100607": 1.0, "test/sim_max_reward_100608": 0.39190217939530525, "test/sim_max_reward_100609": 0.7291573465823317, "test/sim_max_reward_100610": 0.33395954015283574, "test/sim_max_reward_100611": 1.0, "test/sim_max_reward_100612": 0.6514028091479889, "test/sim_max_reward_100613": 0.725679723670453, "test/sim_max_reward_100614": 0.9865594760100893, "test/sim_max_reward_100615": 1.0, "test/sim_max_reward_100616": 1.0, "test/sim_max_reward_100617": 1.0, "test/sim_max_reward_100618": 1.0, "test/sim_max_reward_100619": 1.0, "test/sim_max_reward_100620": 0.0, "test/sim_max_reward_100621": 0.5797156997512823, "test/sim_max_reward_100622": 1.0, "test/sim_max_reward_100623": 1.0, "test/sim_max_reward_100624": 0.9799430749151392, "test/sim_max_reward_100525": 0.47016886297180754, "test/sim_max_reward_100526": 0.9928958213204557, "test/sim_max_reward_100527": 0.5325054622431848, "test/sim_max_reward_100528": 0.9854106935989169, "test/sim_max_reward_100529": 0.41036078970565326, "test/sim_max_reward_100530": 1.0, "test/sim_max_reward_100531": 0.0, "test/sim_max_reward_100532": 0.33555391995146544, "test/sim_max_reward_100533": 0.9835632223809714, "test/sim_max_reward_100534": 1.0, "test/sim_max_reward_100535": 0.9848416091362154, "test/sim_max_reward_100536": 1.0, "test/sim_max_reward_100537": 0.9843535561660863, "test/sim_max_reward_100538": 0.9676889512870822, "test/sim_max_reward_100539": 1.0, "test/sim_max_reward_100540": 0.5895829419434802, "test/sim_max_reward_100541": 0.9998685308178469, "test/sim_max_reward_100542": 0.9915279228071661, "test/sim_max_reward_100543": 0.674430182630744, "test/sim_max_reward_100544": 0.9889165385522729, "test/sim_max_reward_100545": 0.9878509135277169, "test/sim_max_reward_100546": 0.7210470977740637, "test/sim_max_reward_100547": 1.0, "test/sim_max_reward_100548": 0.4654094373836408, "test/sim_max_reward_100549": 1.0, "test/sim_max_reward_100400": 1.0, "test/sim_max_reward_100401": 1.0, "test/sim_max_reward_100402": 1.0, "test/sim_max_reward_100403": 1.0, "test/sim_max_reward_100404": 0.9953227305673954, "test/sim_max_reward_100405": 1.0, "test/sim_max_reward_100406": 0.2513665496763762, "test/sim_max_reward_100407": 1.0, "test/sim_max_reward_100408": 1.0, "test/sim_max_reward_100409": 1.0, "test/sim_max_reward_100410": 1.0, "test/sim_max_reward_100411": 0.13511493985298093, "test/sim_max_reward_100412": 0.6897496898687686, "test/sim_max_reward_100413": 0.5106062486816247, "test/sim_max_reward_100414": 1.0, "test/sim_max_reward_100415": 1.0, "test/sim_max_reward_100416": 1.0, "test/sim_max_reward_100417": 1.0, "test/sim_max_reward_100418": 1.0, "test/sim_max_reward_100419": 1.0, "test/sim_max_reward_100420": 1.0, "test/sim_max_reward_100421": 0.5817763288443969, "test/sim_max_reward_100422": 0.5200873772154714, "test/sim_max_reward_100423": 1.0, "test/sim_max_reward_100424": 0.5250796433045463, "test/mean_score": 0.8533580608655396} |