{"entities":{"Q5405224":{"pageid":7434798,"ns":120,"title":"Item:Q5405224","lastrevid":75720865,"modified":"2026-04-20T18:49:20Z","type":"item","id":"Q5405224","labels":{"en":{"language":"en","value":"Dynamic policy programming"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 6276212"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q5405224$744D7950-8064-4DE9-B12E-412974462881","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"7d9d9d2bb3e137523ef9ade2d74441873026bd97","datavalue":{"value":"1436.90148","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q5405224$F5D68739-F2EC-43F0-AFFF-B7E3E3B77E9F","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"c8bddd1d55c488ec5e6676691780dc4ae42bf5f1","datavalue":{"value":{"entity-type":"item","numeric-id":399888,"id":"Q399888"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q5405224$470EBE99-3D85-45A8-8A10-D8351C46A8BC","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"954d484c3d12df82ccf045903f2e657ea9889ea3","datavalue":{"value":{"entity-type":"item","numeric-id":420937,"id":"Q420937"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q5405224$B55C260B-0078-4F24-89EE-A90E9F06E517","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"59547204bd980ed31b2f0836037cbf5fed9979b0","datavalue":{"value":{"entity-type":"item","numeric-id":399889,"id":"Q399889"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q5405224$91B77FF2-6C86-474A-A0B3-E38B47FF0B4C","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"1832e2b8d11d1c115bb49a23d134e9ef7371fd03","datavalue":{"value":{"time":"+2014-04-01T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q5405224$B07DFA0F-6949-48C4-B903-525E63874E59","rank":"normal"}],"P205":[{"mainsnak":{"snaktype":"value","property":"P205","hash":"9f6fb4596c40abf834a9a3bea21de186024f7250","datavalue":{"value":"http://www.jmlr.org/papers/v13/azar12a.html","type":"string"},"datatype":"url"},"type":"statement","id":"Q5405224$85B58923-62EC-494E-883A-00342DE4D9F1","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"aa3ca91474fff28e420d9cace433f8447ec799b0","datavalue":{"value":"90C39","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q5405224$73992714-BB00-4B9F-B4FC-8A0D18533449","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"377d3ab03372cff12915e0de0374438ff70c3716","datavalue":{"value":"90C40","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q5405224$5DF58B24-524B-41EA-BEEC-1ACA4C8C004C","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"2acc045853514fe6a32ca0150ffaab6097f2ccf5","datavalue":{"value":"6276212","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q5405224$D6B0BC87-D541-4AAB-AA01-3D97299C3D3B","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"ccc50d18cd76d03749bf5066c9cd1ba8681cc30f","datavalue":{"value":"approximate dynamic programming","type":"string"},"datatype":"string"},"type":"statement","id":"Q5405224$95576CC9-07EB-4F7D-9806-4846D29B382A","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"ab31482eee8f34fa99c5284980862acac4a0b6b4","datavalue":{"value":"reinforcement learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q5405224$3C947588-1E99-4480-9225-2F80EE74CEEB","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"fbd1f99995fb6a13da62a377ba6327166316e976","datavalue":{"value":"Markov decision processes","type":"string"},"datatype":"string"},"type":"statement","id":"Q5405224$E1A58F74-7580-47D3-AD3A-29722A259E64","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"e0f10ed43c622fc62cfada175a917db8ff083e88","datavalue":{"value":"Monte-Carlo methods","type":"string"},"datatype":"string"},"type":"statement","id":"Q5405224$74D9C536-2535-4F17-9E4E-52D904BFA9DC","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"552a0fbf62290d4861ca327f137adb07a4cc5e11","datavalue":{"value":"function approximation","type":"string"},"datatype":"string"},"type":"statement","id":"Q5405224$54B36852-8557-48D8-9474-5EF01B49C835","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q5405224$6332C80A-CC96-4363-9340-90666F00A442","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"321bf2eafddabd1476c5c7a68f2c87d454714238","datavalue":{"value":{"entity-type":"item","numeric-id":2806811,"id":"Q2806811"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"7ffb766e6f277f310aa237c718a091fafc67fc6e","datavalue":{"value":{"amount":"+0.7982197999954224","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q5405224$F4EE0496-8E96-4AA0-8FAD-C8A46887EB64","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"3e0d3ef632e83b0f7e49cddae362ec492d4338cc","datavalue":{"value":{"entity-type":"item","numeric-id":2887629,"id":"Q2887629"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"9b619bd728e7df16c4df6d21c31c905b9b86cbb4","datavalue":{"value":{"amount":"+0.7861943244934082","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q5405224$611D11CD-BA29-4CEB-B467-E694B21840BD","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"739d59389b2782417fed4c14d7d1a4110edbb87e","datavalue":{"value":{"entity-type":"item","numeric-id":3755250,"id":"Q3755250"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"c283931ce1e60685de7067f4fefd2e6c430c12f9","datavalue":{"value":{"amount":"+0.7752578854560852","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q5405224$D7A11956-C6F9-4568-8E66-02E8BC54BFAC","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"0bb4b180ae01ee68a5083c32db1975f7b676e79e","datavalue":{"value":{"entity-type":"item","numeric-id":1990495,"id":"Q1990495"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"2b232f9117d74044720fe1b91df91f726bb118f5","datavalue":{"value":{"amount":"+0.7745881080627441","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q5405224$B30D6A6A-2F7D-41F2-93BD-332752718EAA","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"2f2e03a81bb9a955b9ab3df3f9d65f33443e474e","datavalue":{"value":{"entity-type":"item","numeric-id":928140,"id":"Q928140"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"4854ebe7654301c79dc3dd97fa16c20653ca86b1","datavalue":{"value":{"amount":"+0.7731862664222717","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q5405224$20DD6852-B23C-4691-8D6D-4CE72E72AE56","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"Dynamic policy programming","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/Dynamic_policy_programming"}}}}}