{"entities":{"Q2810840":{"pageid":2821578,"ns":120,"title":"Item:Q2810840","lastrevid":42158855,"modified":"2025-05-26T17:35:01Z","type":"item","id":"Q2810840","labels":{"en":{"language":"en","value":"Addressing environment non-stationarity by repeating Q-learning updates"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 6589460"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810840$7879E91C-704B-4ED7-A3C8-1DC8D15F89CA","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"efc87b531ddfad45dd06c0ff7d1172706ab1c975","datavalue":{"value":"1360.68661","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2810840$9B344A3C-DB7A-483E-86FD-B3E27FBE3C40","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"903ee3c51ddd731b2255dc6dfb5ae1442e9774a6","datavalue":{"value":{"entity-type":"item","numeric-id":2810838,"id":"Q2810838"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810840$01E27BBD-5687-4C76-AED4-B756606F3F8A","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"84ab324f4439f0aaf790a5539632ba28180fd75c","datavalue":{"value":{"entity-type":"item","numeric-id":2810839,"id":"Q2810839"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810840$1DA328C6-A3DE-43F9-8835-629CBE01F223","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"d066e43a0d378deda532184f86b234184fe2275a","datavalue":{"value":{"time":"+2016-06-06T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q2810840$CB13AAF9-C30E-44B7-9F0E-4B8C6251719F","rank":"normal"}],"P205":[{"mainsnak":{"snaktype":"value","property":"P205","hash":"fe482898a58f4bf934d343eed041560f33b5ec25","datavalue":{"value":"http://jmlr.csail.mit.edu/papers/v17/14-037.html","type":"string"},"datatype":"url"},"type":"statement","id":"Q2810840$97DBB97F-8BF4-42E5-B835-43FFBCDD9B69","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"cfe779e91fe9c53ee133568259955801965765ae","datavalue":{"value":"68T05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2810840$C6C8DC2C-D913-4BAA-A5F4-B4C5818A3994","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"51e2dcec2972780f88f2fb350b87f687c147c73c","datavalue":{"value":"6589460","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2810840$D8E409E6-A5DB-4BA1-BB15-FF096ED93933","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"ab31482eee8f34fa99c5284980862acac4a0b6b4","datavalue":{"value":"reinforcement learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810840$48763BD6-C54C-4329-8B15-8ED23C8B3642","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"9c5166404b8821726545f8a3a9ab53c350e2fe2b","datavalue":{"value":"Q-learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810840$192DA642-906C-4BD1-83C9-7F795825FD8A","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"cdd9970ae13dcb01d7caee11b790ac5b25adb5f1","datavalue":{"value":"multi-agent learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810840$EA4DBD87-513D-45CE-ADB3-F279D2A9E13F","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"edb3d26fb7ad67b4825f1f570866d5feb784e7d6","datavalue":{"value":"non-stationary environments","type":"string"},"datatype":"string"},"type":"statement","id":"Q2810840$B8B41F2C-70E1-48A2-8E85-84589DC69051","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810840$2B6DC03E-E6CC-4860-A785-DC752803C230","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"2ddf5e1d8acdef309c4aa020a850e61c946945ae","datavalue":{"value":{"entity-type":"item","numeric-id":4861477,"id":"Q4861477"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"eb63ac598b49f576b1e35337ff0faa03b3a10505","datavalue":{"value":{"amount":"+0.84284604","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810840$A17271FC-F817-4DEF-B644-BA3E3D1EB520","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"f0a20b2680f4562ecb00702560aadf739abf6089","datavalue":{"value":{"entity-type":"item","numeric-id":1604822,"id":"Q1604822"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"8979ea1c01785b48594967b4a60bd1446d77c8f9","datavalue":{"value":{"amount":"+0.8413856","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810840$4ADCB4DB-90FE-4583-AAC1-C14369B36343","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"ee7576c3b31bbd0e88857b199d49a13aa1ed2023","datavalue":{"value":{"entity-type":"item","numeric-id":5706509,"id":"Q5706509"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"bdfbda0e2cd7d0dfb841e86995e11f66d1892029","datavalue":{"value":{"amount":"+0.8313009","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810840$C609DD38-D300-46D1-AFE7-ADA7220C1F2E","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"c0f6e6b6e78a94f497bd28c4be79bc2988c3a42e","datavalue":{"value":{"entity-type":"item","numeric-id":5499684,"id":"Q5499684"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"d914aaf78ff76fbec079c18cae5afd6e3c6933b6","datavalue":{"value":{"amount":"+0.8281231","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2810840$F7E445A7-33E3-4E03-8CCA-773591C33A9D","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"b7b25042b2c50716e1f9f27dc6e123a609f793dc","datavalue":{"value":{"text":"Addressing environment non-stationarity by repeating Q-learning updates","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q2810840$40DE1A1E-CE68-4C75-A2F5-96174C4158F8","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"05810dfd27f2b8a246f7d0a5b34fbcc72e448b7a","datavalue":{"value":{"entity-type":"item","numeric-id":6582882,"id":"Q6582882"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2810840$7DA2C7E3-56AC-442C-93B0-2A8331EE1F54","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"Publication:2810840","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/Publication:2810840"}}}}}