{"entities":{"Q1870309":{"pageid":1881051,"ns":120,"title":"Item:Q1870309","lastrevid":73823052,"modified":"2026-04-14T17:23:20Z","type":"item","id":"Q1870309","labels":{"en":{"language":"en","value":"From perturbation analysis to Markov decision processes and reinforcement learning"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 1908596"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1870309$32288C65-60CA-47D0-BFAE-832E185A50C4","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"7ab8b007f2243492de436a4d0a15de29a6849040","datavalue":{"value":{"text":"From perturbation analysis to Markov decision processes and reinforcement learning","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q1870309$23C2E408-C0B0-490D-8A6D-D350CA99FCEA","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"c0d7ec3de279747798be80e17f0ee1598dab7396","datavalue":{"value":"1031.93166","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$67F2DCE6-92FB-4F8F-ABE7-D79C3D8F2011","rank":"normal"}],"P27":[{"mainsnak":{"snaktype":"value","property":"P27","hash":"a5a403c856463ee31b3677285ce8a08cfa87bd3b","datavalue":{"value":"10.1023/A:1022188803039","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$D108E1CF-ECBB-46AB-9F4A-7F0A6E1CA575","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"646c4b950adcc2747e9b6d91c4105f879f76be24","datavalue":{"value":{"entity-type":"item","numeric-id":243740,"id":"Q243740"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1870309$04A3E693-983B-4A61-8095-47ADABFA162B","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"0f7c04b6b94cf13c193d472c226068c28e7c8f04","datavalue":{"value":{"entity-type":"item","numeric-id":169421,"id":"Q169421"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1870309$89E20E53-0631-4258-85AA-0CB8E5A5DD5F","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"947c49c6dc991ad4ccf38c0cba49a099db39b9c3","datavalue":{"value":{"time":"+2003-05-11T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q1870309$45872672-B1EE-4F90-B118-E4D17DE99CC8","rank":"normal"}],"P1448":[{"mainsnak":{"snaktype":"value","property":"P1448","hash":"153ea172c43940c1a62b7505582ea241697c91ab","datavalue":{"value":"There are various ways, such as perturbation analysis (PA), Markov decision processes (MDPs) and reinforcement learning (RL) etc., to achieve performance optimization of a dynamical system.    Here, the author studies the relationships among these closely related fields. The author shows that performance potentials play a crucial role in PA, MDPs and other optimization approaches. RL, neuro-dynamic programming, etc. are sample-path-based efficient ways of estimating the performance potentials and \\(Q\\)-factors. It is pointed out here that the potential-based approach is practically important due to its on-line application to real systems, which is discussed through an example.","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$2E74239D-2A68-44CE-B77B-878BACDF38E8","rank":"normal"}],"P1447":[{"mainsnak":{"snaktype":"value","property":"P1447","hash":"45e6fadf5dc208a7e2a9945e966efc6b55109061","datavalue":{"value":{"entity-type":"item","numeric-id":758008,"id":"Q758008"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1870309$9D28A01E-E804-4D78-9947-7750D3FAE820","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"4fd8d49a375e8786d86b39f94e9773f56a9b1c4e","datavalue":{"value":"93E35","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$9283D5C3-2C44-4BC7-B41B-111E7BA69040","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"4c15fc5b552da2164fcbae119962e97168cbc3a1","datavalue":{"value":"93E25","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$F40D8DB7-4C6F-473D-86DD-A1460744E6ED","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"62b95b6f7919542f12b1e12b0279617ef6dfa9f9","datavalue":{"value":"93C73","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$DDC6590B-36C2-449B-8110-56E318B16E2F","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"377d3ab03372cff12915e0de0374438ff70c3716","datavalue":{"value":"90C40","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$922DBDDB-5E72-4200-8645-81D9A961E07D","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"cfe779e91fe9c53ee133568259955801965765ae","datavalue":{"value":"68T05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$8E25577A-D764-4B41-8CD5-056D43DF0080","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"c1141154b7c417d99b766d154236bb5d4e9f304c","datavalue":{"value":"1908596","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1870309$25F868E1-2481-4447-9419-E50EB44232B5","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"be09917c8b117d2a659118ad2b48f63fb5690a50","datavalue":{"value":"on-line algorithms","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$3CB11BF9-76BB-4007-AA2A-480F9DC25A13","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"13ccc6cceb577fe3b611c89782f027ab6f966fa4","datavalue":{"value":"Poisson equations","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$3D8F4AE1-084B-4613-8131-15C871B1C4C2","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"b9fb32900ab50f323984eb24225d5c0577bad711","datavalue":{"value":"gradient-based policy iteration","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$8A2D0085-CC97-48B5-BA54-4F72A87AF22B","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"460dbe17f7ec805bf9cf37b0e6152f4f871c2b85","datavalue":{"value":"perturbation analysis","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$B68B572A-5A41-45FE-A21E-4D424E5306BC","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"9c5166404b8821726545f8a3a9ab53c350e2fe2b","datavalue":{"value":"Q-learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$BB86A18B-D58C-4766-8CC7-D5A1E0D892DC","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"7d8efb657da32da3fb13593c89714c3abf05071e","datavalue":{"value":"TD(\\(\\lambda\\))","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$998C4E0F-E7A1-4F60-992C-26263500B7E2","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"fbd1f99995fb6a13da62a377ba6327166316e976","datavalue":{"value":"Markov decision processes","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$DD889700-8C2C-47A6-B6AA-852B6525EDED","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"ab31482eee8f34fa99c5284980862acac4a0b6b4","datavalue":{"value":"reinforcement learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$991B2604-804C-47E4-803E-37A9BB11EBDA","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"7acfdc35aa76c43ed9f0615384fa93057940238e","datavalue":{"value":"performance potentials","type":"string"},"datatype":"string"},"type":"statement","id":"Q1870309$4FE72FCB-1B64-4B09-AFDE-69A51BE45530","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1870309$E747FCDD-C42E-480D-951C-C01ED951A087","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"b8c9600c83099dfba2d50196d73a051388b66c4f","datavalue":{"value":{"entity-type":"item","numeric-id":1041680,"id":"Q1041680"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"dcc0b0ddb96c0ebce64d2dc142af3f249c77ef58","datavalue":{"value":{"amount":"+0.8891481","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$426457D4-24A5-4E95-B1D7-CB023F4D7DD5","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"8f98a5bd240b8ac0ec91fda27205cb2d77876fa4","datavalue":{"value":{"entity-type":"item","numeric-id":2833106,"id":"Q2833106"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"9b222897155af552d5db3dff808eb56f4732656e","datavalue":{"value":{"amount":"+0.8845279","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$DF4732A4-17B4-4357-BAF5-393B28C10B40","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"c03e6cce8375d250c27e82c3839d4271bfa343dd","datavalue":{"value":{"entity-type":"item","numeric-id":4668597,"id":"Q4668597"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"88b1c9d6e89b5f2ece736c663c4da2591082da54","datavalue":{"value":{"amount":"+0.88275784","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$41AAABCF-3DB4-4E27-A4D8-C4EB4CD600C2","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"acb3dec47261d4569a2797788e47eba5761d0610","datavalue":{"value":{"entity-type":"item","numeric-id":1093563,"id":"Q1093563"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"df474a25b5f336e1ef2ffc1a986d9e401f71808a","datavalue":{"value":{"amount":"+0.8817865","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$AF03076A-17D5-44B0-AA4A-B2DA2E5B58FC","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"ce0edc8f346ff9bb1e507068642c8823d6759090","datavalue":{"value":{"entity-type":"item","numeric-id":5166474,"id":"Q5166474"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"04502828234e459584a728e3966aec2f7036ae73","datavalue":{"value":{"amount":"+0.8796505","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$17B9B7B3-74DB-4C14-8329-0A0D70BF92AA","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"512fab3a84c105d76dad5052d6c26271047da99b","datavalue":{"value":{"entity-type":"item","numeric-id":524243,"id":"Q524243"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"5d8a7ca3aec3ad429335cee49592e11be1fbc759","datavalue":{"value":{"amount":"+0.8793912","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$F75C8775-D3F4-4528-9BCB-09A62F5F0CD6","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"a9389e267d7251b5d341a045f83b06566072c0f2","datavalue":{"value":{"entity-type":"item","numeric-id":2465202,"id":"Q2465202"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"c0a751dd09407ea8012d4c6c1ecf1c4b02c2c14c","datavalue":{"value":{"amount":"+0.87878","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$6ABD3EDC-6052-4F17-8261-302C97E29802","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"73c8675d939d92cf5e1c6aac57bd4f8930cbc5b0","datavalue":{"value":{"entity-type":"item","numeric-id":2739190,"id":"Q2739190"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"40164cf9d11472dc0be5d559dccb4df568c2fc2d","datavalue":{"value":{"amount":"+0.87803507","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$EDBE1AA1-D801-4731-94E2-20D1B18DAE88","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"e99d2899949f2e71661af2bb987944a00586e8c3","datavalue":{"value":{"entity-type":"item","numeric-id":2675282,"id":"Q2675282"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"589cc49a1c03eee6f0f7aa9b5d4d018b9fe151f2","datavalue":{"value":{"amount":"+0.87453115","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$F6240189-D548-46F4-9938-D1FB4ABB6C39","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"79e8c0662814983bd4f306659c2a2e56aef00099","datavalue":{"value":{"entity-type":"item","numeric-id":3340525,"id":"Q3340525"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"5a4f082ab11fdcf7e07842e8102955218d6fbf6a","datavalue":{"value":{"amount":"+0.8744919","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1870309$4AD24DC7-FD37-43B0-A343-25E291CEF84F","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"From perturbation analysis to Markov decision processes and reinforcement learning","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/From_perturbation_analysis_to_Markov_decision_processes_and_reinforcement_learning"}}}}}