{"entities":{"Q1568533":{"pageid":1579273,"ns":120,"title":"Item:Q1568533","lastrevid":70728012,"modified":"2026-04-13T16:22:10Z","type":"item","id":"Q1568533","labels":{"en":{"language":"en","value":"Convergence results for single-step on-policy reinforcement-learning algorithms"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 1462817"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1568533$C5E39042-19A9-4125-8189-EB4E775BF58F","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"3d806ca1d16ddda91af53b6e97559f1e2ec7a442","datavalue":{"value":{"text":"Convergence results for single-step on-policy reinforcement-learning algorithms","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q1568533$A62016A1-1D1B-450D-9466-D3C87DFE520F","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"9e797bb0ea87826e6dfe0275600ede97ed112830","datavalue":{"value":"0954.68127","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1568533$09DC4EF9-BB3D-4E57-B144-227820174C64","rank":"normal"}],"P27":[{"mainsnak":{"snaktype":"value","property":"P27","hash":"065d1c9b0f7f8a9e13187d8f96f6f3f0ac42147f","datavalue":{"value":"10.1023/A:1007678930559","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1568533$57704F8D-EA58-4737-B201-1B82744D3995","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"92953e4586e720c3bdd013770f6ffbe01a60f284","datavalue":{"value":{"entity-type":"item","numeric-id":230823,"id":"Q230823"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1568533$566280D1-3653-432C-A1D7-584FC72A8601","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"0649807087cac19cbfe8dfd49f717d51cbdc5c68","datavalue":{"value":{"entity-type":"item","numeric-id":399885,"id":"Q399885"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1568533$0D7BE535-ECC3-41C1-BEB7-6AC954E7192E","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"8773625a020b53e52e05beeecf07c19f6aa5cadc","datavalue":{"value":{"entity-type":"item","numeric-id":1812932,"id":"Q1812932"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1568533$7B5B63EC-5D7A-4CB6-84F4-6D679A54348F","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"fa130ed0c3acdff19df21f2746eb8f529daf1ba5","datavalue":{"value":{"entity-type":"item","numeric-id":1964685,"id":"Q1964685"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1568533$D3E00D0F-8A47-4AF8-867E-FDD34D818D8C","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"2500bd7472785bf7f3577cddf9bbcc323031858b","datavalue":{"value":{"entity-type":"item","numeric-id":65106,"id":"Q65106"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1568533$4FAC3F41-3C4E-46C5-AC7C-10E70303492F","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"ce7843932412e0d5c566f14bc25dfa7a3675a659","datavalue":{"value":{"time":"+2000-06-21T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q1568533$E6E84F09-38A3-4449-9D2B-0B369E8F6AD9","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"cfe779e91fe9c53ee133568259955801965765ae","datavalue":{"value":"68T05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1568533$AAE3F927-7DAB-45B8-B3A8-0464E500456B","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"79b3bc872b6637176b35f9e46ac855febbf884f5","datavalue":{"value":"68W05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1568533$DA4057D2-7C78-4532-AA18-51EF3CF71080","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"f1e2160f572fcade0186086484da4b179ee21fca","datavalue":{"value":"1462817","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1568533$32005EC2-B39B-4ED7-81D7-D51A189CA874","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"ab31482eee8f34fa99c5284980862acac4a0b6b4","datavalue":{"value":"reinforcement learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q1568533$DD6D96C3-9112-407D-A43C-4E3E412F6935","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1568533$CB534BDB-DF1D-4ED3-B454-F053C49D6133","rank":"normal"}],"P205":[{"mainsnak":{"snaktype":"value","property":"P205","hash":"a1d6df2df0486024423768708a8680ffe37bc980","datavalue":{"value":"https://doi.org/10.1023/a:1007678930559","type":"string"},"datatype":"url"},"type":"statement","id":"Q1568533$99238B70-C364-4B89-8035-B91BE7962ABB","rank":"normal"}],"P388":[{"mainsnak":{"snaktype":"value","property":"P388","hash":"1cbeb0054c57af74fbcc57700c2f6abf8a7008d8","datavalue":{"value":"W2150339816","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1568533$13A2464C-7E6A-4CC6-8BDC-1D4CD43212E9","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"66b88b82084ddd656ce6ff348d0dc0148ae13bd9","datavalue":{"value":{"entity-type":"item","numeric-id":2665181,"id":"Q2665181"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"9fe74d0613dccccb87712eacde2337fbcd4ebe71","datavalue":{"value":{"amount":"+0.7585216164588928","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1568533$E7800946-158E-44B4-9C88-4C3E03A69B10","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"427e8903fe5e9cf359884f00a1124549187fc7dd","datavalue":{"value":{"entity-type":"item","numeric-id":1812931,"id":"Q1812931"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"fa3de17cc9e26d2f8faf2dd37deb078629858378","datavalue":{"value":{"amount":"+0.7544193863868713","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1568533$95144FC9-9BF7-4D09-99FB-300563B1FBE1","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"d87063bd93d3d0fb42281fb78b2ece361ea40693","datavalue":{"value":{"entity-type":"item","numeric-id":4323346,"id":"Q4323346"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"d1a5ced33efdfcb6acd8c417b7d7eea1bfe7141f","datavalue":{"value":{"amount":"+0.753777265548706","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1568533$0310354F-13FB-4DDA-813F-6DA8E0D220B9","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"512d4c4a45f72cf314f74017a6cf3df2fa523246","datavalue":{"value":{"entity-type":"item","numeric-id":1604817,"id":"Q1604817"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"5eb6e438378c308dd964c043d9ccb74420138e5d","datavalue":{"value":{"amount":"+0.7506934404373169","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1568533$747DC602-EF75-4740-B5E1-A0BCB29ACA21","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"74ff4f14d4b48f3efe127860a08301f5112ab204","datavalue":{"value":{"entity-type":"item","numeric-id":3044133,"id":"Q3044133"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"f8e702661896c8d459916415e80bdbbe442c80c9","datavalue":{"value":{"amount":"+0.7463492751121521","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1568533$C4DF124F-3E28-4390-8C5E-70971D3816EB","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"Convergence results for single-step on-policy reinforcement-learning algorithms","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/Convergence_results_for_single-step_on-policy_reinforcement-learning_algorithms"}}}}}