{"entities":{"Q2896181":{"pageid":2906906,"ns":120,"title":"Item:Q2896181","lastrevid":51510479,"modified":"2026-01-18T13:56:26Z","type":"item","id":"Q2896181","labels":{"en":{"language":"en","value":"A generalized path integral control approach to reinforcement learning"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 6055590"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896181$8DB621D4-8AF5-4F1E-92D0-58528939E55D","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"9b4c048b068c2d6e0d9c54bec0aa9f8a8b955a51","datavalue":{"value":"1242.68254","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896181$48EF452C-61C6-404D-B366-D2BC488C1B59","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"d130fcd398e50450e04ad173be138f9c088ce7ea","datavalue":{"value":{"entity-type":"item","numeric-id":680512,"id":"Q680512"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896181$20CE3E60-8A35-4585-B46A-62E72AF97DA6","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"27268cb2b3b8cc060a6d6773e000d9d546566680","datavalue":{"value":{"entity-type":"item","numeric-id":937304,"id":"Q937304"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896181$AB62D136-456B-4916-B553-38BF6116193D","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"f8426f5f8731e5f776213932e3183d92ea91a926","datavalue":{"value":{"entity-type":"item","numeric-id":553248,"id":"Q553248"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896181$F8E6EE59-D944-4F7A-BAF0-37679B19756E","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"b8169782b0c1573ab69940e37078f3a0c71cae46","datavalue":{"value":{"time":"+2012-07-13T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q2896181$9FBF849C-D367-49E9-93A2-D475ED107E79","rank":"normal"}],"P205":[{"mainsnak":{"snaktype":"value","property":"P205","hash":"8245a1fe716e544654a9edd9f2e8c6e029a51be6","datavalue":{"value":"http://www.jmlr.org/papers/v11/theodorou10a.html","type":"string"},"datatype":"url"},"type":"statement","id":"Q2896181$1705B636-02F4-4AA6-9EA8-14DBD877B760","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"cfe779e91fe9c53ee133568259955801965765ae","datavalue":{"value":"68T05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896181$B6737A90-19E4-40FF-9FF0-1BF453AD2924","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"48a59f52dcfcc38cd6697e0ef07319031311895b","datavalue":{"value":"62H30","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896181$EB1A2770-E459-416A-847F-9024BD4ACBC0","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"e3bc6c7cda8279d6ad2b578e7a7e4967447c3cc4","datavalue":{"value":"93E20","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896181$F2BAD277-E199-420E-AEF3-418419A2BA42","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"39fc15ff87ddc9f4e6f797d14b3f6fab7e9f6bdb","datavalue":{"value":"6055590","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896181$11997F83-F041-4E34-8FAF-3DD84C9F85B6","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"6d35e880ae23fd41bbf85e0798dfd54bb17d4ffe","datavalue":{"value":"stochastic optimal control","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896181$554A7513-2815-4973-BF33-EE4AEB05A837","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"ab31482eee8f34fa99c5284980862acac4a0b6b4","datavalue":{"value":"reinforcement learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896181$9DA45C3C-50C4-46C7-BEBD-4B3B26A1D9FF","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"113048813ceefeb27927b0547f456e58460219fd","datavalue":{"value":"parameterized policies","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896181$9E13E74E-CD8C-4139-BB01-629FD945E46F","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896181$209438C2-C080-484A-B6AD-C2076B98230C","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"8a673b197d69a20f3db4b3803a4b0dc86a0aca4e","datavalue":{"value":{"text":"A generalized path integral control approach to reinforcement learning","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q2896181$88529BF1-7857-4427-B5DD-A71623E4A31D","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"05810dfd27f2b8a246f7d0a5b34fbcc72e448b7a","datavalue":{"value":{"entity-type":"item","numeric-id":6582882,"id":"Q6582882"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896181$7122FB18-923A-4637-8FAE-A71394640080","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"b9e35d8683a495bfd010d8c5174f3a45a98f2295","datavalue":{"value":{"entity-type":"item","numeric-id":2804092,"id":"Q2804092"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"68113ebef32c3948d841e52f3e47efd7d35c9901","datavalue":{"value":{"amount":"+0.7674137949943542","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896181$ECE9D86A-651B-436A-8873-286EDE234704","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"34e5d18b5cb53bbbaa05bda5f30b64906dc8e1e2","datavalue":{"value":{"entity-type":"item","numeric-id":290478,"id":"Q290478"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"110caae2fb6eac3c9404950805f7ef6b264bf71f","datavalue":{"value":{"amount":"+0.7606939673423767","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896181$F58E8BDA-D35F-4EC8-91BE-D36DC7CCCF57","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"8f400a63cfede0dd6482dff336d356090715fe38","datavalue":{"value":{"entity-type":"item","numeric-id":413874,"id":"Q413874"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"dd099683bd2558ee437ddf276f0916b197745797","datavalue":{"value":{"amount":"+0.7593355178833008","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896181$83B4C970-19BF-4307-ADA6-A31FE0D1F07A","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"2019e98818d30fa59546a65dfe28c08b7ce70b06","datavalue":{"value":{"entity-type":"item","numeric-id":5378202,"id":"Q5378202"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"be05860ca62b0703291c0fef4c93401e66c3aa58","datavalue":{"value":{"amount":"+0.7514338493347168","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896181$5CDD1804-C612-4CBC-8229-B2491BCE8F50","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"d3e8da1ef484f98317bded28ae36afe4a8ad8ec6","datavalue":{"value":{"entity-type":"item","numeric-id":5045345,"id":"Q5045345"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"f8c8ccb7feb8af051a0f85d09a362d2d2bd281ba","datavalue":{"value":{"amount":"+0.747637152671814","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896181$50CC1B58-12CB-4C54-AE6F-450240AF99B0","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"Publication:2896181","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/Publication:2896181"}}}}}