{"entities":{"Q1068009":{"pageid":1078761,"ns":120,"title":"Item:Q1068009","lastrevid":69557307,"modified":"2026-04-13T07:49:37Z","type":"item","id":"Q1068009","labels":{"en":{"language":"en","value":"The variational calculus and approximation in policy space for Markovian decision processes"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 3928751"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$2E3FB484-5F00-4C80-B53F-95472D8BF958","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"f5f0386ef4fe7eea57175e760a0b163d08e65b96","datavalue":{"value":{"text":"The variational calculus and approximation in policy space for Markovian decision processes","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q1068009$1865FDB7-B616-4269-9E69-B3868BAC1E4D","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"f853bd5e8e110d2dfd337a3ee61180ee4d550ad2","datavalue":{"value":"0579.90097","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1068009$C9A8BF04-2EC4-41D9-97F5-623B9A5FFB19","rank":"normal"}],"P27":[{"mainsnak":{"snaktype":"value","property":"P27","hash":"b12d7ac411d0a1091d665663b49be433bfe992b4","datavalue":{"value":"10.1016/0022-247X(85)90197-0","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1068009$29E5AA21-543F-47FC-9352-48EEB5FCF702","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"71b5c36a12101ad151aa449ad72c4af9ce8afa01","datavalue":{"value":{"entity-type":"item","numeric-id":1066820,"id":"Q1066820"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$7F1F750B-8EE1-405C-8300-E87566650181","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"c5ad7b9baf8e531c6b1ad954eb5f2899cc8fe5e5","datavalue":{"value":{"entity-type":"item","numeric-id":85344,"id":"Q85344"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$441E7BB3-C9B2-48D1-AE3C-FED2D3BF4789","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"3c94df5c9af0ede578c52141befd29044de13172","datavalue":{"value":{"time":"+1985-00-00T00:00:00Z","timezone":0,"before":0,"after":0,"precision":9,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q1068009$D5D434E1-6D30-457E-BD2C-5BEFE820264D","rank":"normal"}],"P1448":[{"mainsnak":{"snaktype":"value","property":"P1448","hash":"68a24b5850df906b9422873e5963ddba5e6f1f2c","datavalue":{"value":"The functional equations of Markovian decision processes yield the state values (and gain rate in the undiscounted case). Variational expressions are exhibited here for these state values (and gain rate); these expressions are stationary when evaluated at the correct values. When guesses for the values (and gain rate) are inserted into these variational expressions, a superior guess is usually obtained. Repetition of this procedure is shown to be equivalent to the method of successive approximations in policy space. Two other unusual features of this procedure are these: when the linear equations determining the Lagrange multipliers are non-singular, the variational expressions for the state variables are precisely one Newton-Raphson iteration; when applied to a linear objective function and piecewise-linear constraints, which arises for the functional equations of Markovian decision processes, the variational test quantity is piecewise constant, i.e., its first variation and higher variations all vanish. The latter explains its good performance (one-step convergence) if good estimates are available.","type":"string"},"datatype":"string"},"type":"statement","id":"Q1068009$7243CF37-08E7-4000-AE5D-7A3DFB670E34","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"377d3ab03372cff12915e0de0374438ff70c3716","datavalue":{"value":"90C40","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1068009$1FCF0857-BD8E-45CD-B9B8-EE1D7407FBCB","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"843de71235f44a800ae389e1734df6bb7650efec","datavalue":{"value":"65K10","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1068009$95596C08-C74C-485F-A24A-8D62130B99FA","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"a61c612a94030169833b84ef9445f9b9a30bb15b","datavalue":{"value":"3928751","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q1068009$9D122B78-5A93-440E-8A41-3D6E6E8F6D6E","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"acd8a1b407c9409ea36f73fd5e8609b735b6d755","datavalue":{"value":"variational calculus","type":"string"},"datatype":"string"},"type":"statement","id":"Q1068009$BC4C123B-707E-47EF-93DD-16C17E3EE3D4","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"acc3eafd95f2899772f7f5860f12c624d96e8ce8","datavalue":{"value":"state values","type":"string"},"datatype":"string"},"type":"statement","id":"Q1068009$B1089A56-29E3-455A-87BA-1EA1C0775E97","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"a56d2d5c44b266787afe76f87beea08d36d815aa","datavalue":{"value":"gain rate","type":"string"},"datatype":"string"},"type":"statement","id":"Q1068009$6FB205EF-60A9-4ABB-B795-CF5B939AA87B","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"e4d5ca8e01cdde63ae2661882f48518641f2ef0c","datavalue":{"value":"successive approximations in policy space","type":"string"},"datatype":"string"},"type":"statement","id":"Q1068009$1266A437-35FE-4C01-ADC7-FDFCD38EB27E","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$FBA4D195-108C-4A8C-961D-CBE1F3E5F682","rank":"normal"}],"P223":[{"mainsnak":{"snaktype":"value","property":"P223","hash":"44ab46dac833bf59c74428cd3d09602f12ec3326","datavalue":{"value":{"entity-type":"item","numeric-id":5643407,"id":"Q5643407"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$C0AF66BD-08D5-441A-BB36-96AED55C8ED4","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"78f14459f67d301da6c539c2f758151b1da5d94a","datavalue":{"value":{"entity-type":"item","numeric-id":5822308,"id":"Q5822308"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$E885ABBA-751D-444A-BD8C-DAD490411A2D","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"f4a69e345c85a98bc0fecc0cd7fdd530afc62b23","datavalue":{"value":{"entity-type":"item","numeric-id":5561219,"id":"Q5561219"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$2AAC7FEC-9D27-451B-A420-66C73DFB78F1","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"b67f20914ba831be848adc3bbc57b97ae9d39e77","datavalue":{"value":{"entity-type":"item","numeric-id":5335719,"id":"Q5335719"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$51579D35-71C6-4906-B8C0-75651F91F9E5","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"98f3a5feeef33ac4f8adb51df617c82e6740453b","datavalue":{"value":{"entity-type":"item","numeric-id":5332971,"id":"Q5332971"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$E1A9D8E9-5C1A-4A9C-8127-0E7CE900FAB3","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"2fcd1ee8ac759d0b53271ab98fbce055d727d780","datavalue":{"value":{"entity-type":"item","numeric-id":5652137,"id":"Q5652137"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$02B15C0F-D878-4E66-9784-E947B9581C54","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"4ad2dfdc017105e926b94e19944eaa0d35c45a54","datavalue":{"value":{"entity-type":"item","numeric-id":5572845,"id":"Q5572845"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$B8D1A8DA-DFF2-4166-A1EE-2480C04D5C64","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"01ba2238c50e5df0fc7ad85b98af27609c70fdf5","datavalue":{"value":{"entity-type":"item","numeric-id":3908787,"id":"Q3908787"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$40DD0A44-0206-4960-95F6-0833F876B2FF","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"dcfe52bbe8796f97ec9bb2194b3d6f6fd1ed9df7","datavalue":{"value":{"entity-type":"item","numeric-id":4198357,"id":"Q4198357"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$8C99893C-FA12-430E-ABF2-E23D37BD0CD1","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"bd0a22b037e67081b98ef905dc772d8ffa56e366","datavalue":{"value":{"entity-type":"item","numeric-id":5592699,"id":"Q5592699"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$042FBFCB-06E9-44AE-B2EB-4EFC3F2B5592","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"abe1e3778427003588e1997f510b35a201dc0cca","datavalue":{"value":{"entity-type":"item","numeric-id":5568938,"id":"Q5568938"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$8F28AFE3-F020-4FBC-9585-3E0D3DD54B16","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"d5f8b0e6788eb4dfc8b21baff6a31308328d8064","datavalue":{"value":{"entity-type":"item","numeric-id":4170547,"id":"Q4170547"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$C6DDBC57-9A16-454B-8906-9CEEFCCFAE59","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"46e0ac584158283c71edd2fd126246cb670270d4","datavalue":{"value":{"entity-type":"item","numeric-id":5528345,"id":"Q5528345"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$845326CE-D9F0-44AD-A726-6CCE7B5BBAB4","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"6f860969172b94eb1443288826d5ba14740228f6","datavalue":{"value":{"entity-type":"item","numeric-id":5575236,"id":"Q5575236"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q1068009$482294B7-78A7-4A42-BDF4-5D303D4F941D","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"6913d5d777edce170169a9fac625761fcdb96f1d","datavalue":{"value":{"entity-type":"item","numeric-id":1077334,"id":"Q1077334"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"cea5cc4fe9da82efd45b60597e18aeec8f8ff44e","datavalue":{"value":{"amount":"+0.9255669","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$967E6A74-CB14-4EEA-B5FF-6D9D55C66EC3","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"f5f80257f36671a6cf059b4807f83393a4037818","datavalue":{"value":{"entity-type":"item","numeric-id":4667111,"id":"Q4667111"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"292be4546e11a810620779b39f1eebcc82126330","datavalue":{"value":{"amount":"+0.9033594","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$D56D1B63-199E-4FF5-8F8D-042825922371","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"740084bc5efaa56cf3cfde88cbb26fa4d3c0f602","datavalue":{"value":{"entity-type":"item","numeric-id":1745941,"id":"Q1745941"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"b376fbfe44afcf7b8058bba48b4d31b9037d27f8","datavalue":{"value":{"amount":"+0.9019618","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$E43E3352-6E4F-4531-A108-9275C7AF8009","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"372c27f4c56ed03809ffa7c3f6fb09c9165b9a53","datavalue":{"value":{"entity-type":"item","numeric-id":3446961,"id":"Q3446961"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"c86034edab8888d38b552c0a2cc2bd643ba474c7","datavalue":{"value":{"amount":"+0.8994534","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$E789A320-2B34-45AC-9751-D220288C216C","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"604a13bcc31889179e026b259e836323bf641089","datavalue":{"value":{"entity-type":"item","numeric-id":2409311,"id":"Q2409311"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"874687cffc35887ec76125906385b8621985e3b7","datavalue":{"value":{"amount":"+0.8993524","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$10700EA6-4582-4F43-9CDF-37CEA8331535","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"0e21e9b55aafeac45795796f49fd5efdddd4a8db","datavalue":{"value":{"entity-type":"item","numeric-id":716529,"id":"Q716529"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"880689ba9b6a8db66ac68ba26cf10be26e77b68a","datavalue":{"value":{"amount":"+0.8988668","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$4EE6CFDF-7D34-4CF6-B760-17BB144C379E","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"bc4f4f295ea5d30c43dbafd02714f29f0bb63a28","datavalue":{"value":{"entity-type":"item","numeric-id":4302596,"id":"Q4302596"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"1191b1df8b9a3af45b54999602b59349eda29dbd","datavalue":{"value":{"amount":"+0.898448","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$7F8B3E19-EE0C-4B79-95D7-C90D1E2509CB","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"99f3d97eb78b2779313961bdd9b7e68c062a48c4","datavalue":{"value":{"entity-type":"item","numeric-id":3777825,"id":"Q3777825"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"7e522e982b38242c649bb50f7f5c942e05ba0772","datavalue":{"value":{"amount":"+0.89585316","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$F8D99DA3-7D04-4A28-B0E4-34112079FADE","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"bf26f3b6fadc090de0cfef69208cc1b12e612c51","datavalue":{"value":{"entity-type":"item","numeric-id":3374820,"id":"Q3374820"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"85c39be35d6043f01749bdd1fc627b6722af7f9c","datavalue":{"value":{"amount":"+0.8926705","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$4285E99A-C3DF-4CB9-9B27-0A71117414E4","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"bbbf5d7c72c755e2222385b384e4208ad3081d74","datavalue":{"value":{"entity-type":"item","numeric-id":1066821,"id":"Q1066821"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"b56eae3ff004ad0333162e1de538cfbc30d8ccb1","datavalue":{"value":{"amount":"+0.89108753","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"ac3c626774dcd0d16f89557f66586245841a01db","datavalue":{"value":{"entity-type":"item","numeric-id":6767936,"id":"Q6767936"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q1068009$8B01F057-A3D0-4DE7-86ED-AAB6AF8181AA","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"The variational calculus and approximation in policy space for Markovian decision processes","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/The_variational_calculus_and_approximation_in_policy_space_for_Markovian_decision_processes"}}}}}