{"entities":{"Q2810778":{"pageid":2821516,"ns":120,"title":"Item:Q2810778","lastrevid":52547549,"modified":"2026-01-22T22:41:32Z","type":"item","id":"Q2810778","labels":{"en":{"language":"en","value":"Learning the variance of the reward-to-go"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 6589427"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810778$6F1AD361-A767-401B-B38D-A7365A9A126A","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"7f7f5ac32fc41b60a5acc00d347ed0097e6c4265","datavalue":{"value":"1360.68713","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2810778$2EC45B21-4A84-4E71-B309-FDDA8382B2B4","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"f11c5697a9ccf1965dc19e39f2d7ba27d39071ff","datavalue":{"value":{"entity-type":"item","numeric-id":2809804,"id":"Q2809804"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810778$5F0FEAB7-F929-4A1F-9186-FF8C04626020","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"ef5dc96dd0e09fffb51f89eabdb0e9cf1004c393","datavalue":{"value":{"entity-type":"item","numeric-id":2810777,"id":"Q2810777"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810778$E7408629-6B3B-46D0-8DA6-24F5B2F33EFE","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"e6cce64b73fbb0ca1868d7800b99b549c19bea0a","datavalue":{"value":{"entity-type":"item","numeric-id":239358,"id":"Q239358"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810778$629D0182-24D9-42F4-907B-352901BE1930","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"d066e43a0d378deda532184f86b234184fe2275a","datavalue":{"value":{"time":"+2016-06-06T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q2810778$28D5A889-02CE-46B9-9B68-882C3DF601DB","rank":"normal"}],"P205":[{"mainsnak":{"snaktype":"value","property":"P205","hash":"3f7d336c369da4024dcd4ab69e7477919f884899","datavalue":{"value":"http://jmlr.csail.mit.edu/papers/v17/14-335.html","type":"string"},"datatype":"url"},"type":"statement","id":"Q2810778$11E47436-4BD8-42CE-893B-108F735CE112","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"cfe779e91fe9c53ee133568259955801965765ae","datavalue":{"value":"68T05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2810778$66B4ECB2-3B24-4D19-8743-389065CA6BC2","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"377d3ab03372cff12915e0de0374438ff70c3716","datavalue":{"value":"90C40","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2810778$CB6C2131-7993-41A5-85C3-80DEDD1E2A5E","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"8a3d15a65244e163303bb93327e17ec1de02764d","datavalue":{"value":"6589427","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2810778$9DD34031-06F8-468D-BC7A-860F77ABD0DA","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"ab31482eee8f34fa99c5284980862acac4a0b6b4","datavalue":{"value":"reinforcement learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810778$CEEA842D-6BA8-47B2-9F25-776E78D4C118","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"fbd1f99995fb6a13da62a377ba6327166316e976","datavalue":{"value":"Markov decision processes","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810778$D0DF4157-16BB-49B4-B7C1-F9CF0D355040","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"b0d56083670d24287f246c347eccb78847c2e9ae","datavalue":{"value":"variance estimation","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810778$12D45DC8-A991-4E98-BDAD-7E1B82CDAC70","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"f828563fee5a57e5f16da87a79378ac587cea3ac","datavalue":{"value":"simulation","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810778$4058C1C4-7512-4231-9EAA-3CC3626C3994","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"31fb876438beb36d0d63f67a2b366860d5cad0c2","datavalue":{"value":"temporal differences","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810778$4C6741A7-2E4B-479A-A0A8-C77C1DAE40DB","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810778$900FF45C-D741-4AE2-B3BF-267E49BF513C","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"a00d1561f3c803a7be96aa3ee90121ff6d4b61d8","datavalue":{"value":{"text":"Learning the variance of the reward-to-go","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q2810778$AADF32ED-9949-426A-9DB0-1B073C4783F7","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"05810dfd27f2b8a246f7d0a5b34fbcc72e448b7a","datavalue":{"value":{"entity-type":"item","numeric-id":6582882,"id":"Q6582882"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810778$1821A9F5-C10D-41A0-8AA0-6F1276E19BD4","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"740084bc5efaa56cf3cfde88cbb26fa4d3c0f602","datavalue":{"value":{"entity-type":"item","numeric-id":1745941,"id":"Q1745941"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"5212e77a193126a88e5b33b4f77b61cda2ee9faf","datavalue":{"value":{"amount":"+0.7897273898124695","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810778$EDEFF082-C808-41C5-AA14-D37891311A80","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"bd4339c343c787e7b47e7e46bba4d617005846d5","datavalue":{"value":{"entity-type":"item","numeric-id":1689603,"id":"Q1689603"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"01d4c9110b57718846aa1466dbcbf987c33a831b","datavalue":{"value":{"amount":"+0.7869522571563721","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810778$13089FB3-C07D-4351-96F8-F1038626CB89","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"89d24c97fd5a46dc4abe5308930875eff1428ef9","datavalue":{"value":{"entity-type":"item","numeric-id":3832356,"id":"Q3832356"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"36609db2a388f057e9ab2021fdc84c736f097af4","datavalue":{"value":{"amount":"+0.7598598003387451","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810778$B1C000AE-E02F-49D7-A786-72C58A197195","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"e639d6734eb671cc3d200d71bcc5d05699120881","datavalue":{"value":{"entity-type":"item","numeric-id":2931706,"id":"Q2931706"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"ef2b02e88f68048b3521b959c8e40f75df1f5fe5","datavalue":{"value":{"amount":"+0.7573934197425842","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810778$0409B151-9F30-4315-A33C-B912FFC328F1","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"604a13bcc31889179e026b259e836323bf641089","datavalue":{"value":{"entity-type":"item","numeric-id":2409311,"id":"Q2409311"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"b4b55a4396134957cde91971548370f636d90598","datavalue":{"value":{"amount":"+0.7517201900482178","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810778$CC9EFCEF-D74F-4451-9B68-A129F42C41C1","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"Publication:2810778","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/Publication:2810778"}}}}}