{"entities":{"Q2896090":{"pageid":2906815,"ns":120,"title":"Item:Q2896090","lastrevid":51510353,"modified":"2026-01-18T13:56:22Z","type":"item","id":"Q2896090","labels":{"en":{"language":"en","value":"Near-optimal regret bounds for reinforcement learning"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 6055537"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896090$645977EC-D389-4B46-ADDE-7E512E246E06","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"f9817f073ed02565fa3804c19c08d87ca9af9f91","datavalue":{"value":"1242.68229","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896090$1A78742A-F04B-42F9-9548-31D2A19A00EA","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"8e2f795c42e5be228a6afe31d18a6093a1e00032","datavalue":{"value":{"entity-type":"item","numeric-id":2896089,"id":"Q2896089"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896090$5D50C0EC-1695-4B59-A3C5-004053F6EE89","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"5628914a0499277e4ad11bfbf842d89efca1f2c1","datavalue":{"value":{"entity-type":"item","numeric-id":378752,"id":"Q378752"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896090$EDAEA583-A546-448B-8D7E-95EA26AA5551","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P16","hash":"ee8883d7619b99d8980e310084b3469a731d9307","datavalue":{"value":{"entity-type":"item","numeric-id":239426,"id":"Q239426"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896090$537EA522-C4A4-4954-B28C-3A46911EFE09","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"b8169782b0c1573ab69940e37078f3a0c71cae46","datavalue":{"value":{"time":"+2012-07-13T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q2896090$14AB8875-7672-46B8-8365-B98A91085158","rank":"normal"}],"P205":[{"mainsnak":{"snaktype":"value","property":"P205","hash":"9f20285dfa6c9e110341f7c0644c0cfef30e4577","datavalue":{"value":"http://www.jmlr.org/papers/v11/jaksch10a.html","type":"string"},"datatype":"url"},"type":"statement","id":"Q2896090$9EE69FC0-48CD-4DDF-9619-032BE3FE9BA1","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"cfe779e91fe9c53ee133568259955801965765ae","datavalue":{"value":"68T05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896090$412FFB42-AF12-4E30-8B44-F507D5E2886F","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"377d3ab03372cff12915e0de0374438ff70c3716","datavalue":{"value":"90C40","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896090$CA230557-ECC1-4752-9613-A9B37A3C29B9","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"e0155daac2ce47983d0607a424acae0d1d4a9c1b","datavalue":{"value":"6055537","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2896090$DC0ABE44-A98D-4B08-B97A-0F1A32142860","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"cd0d3b7eac266d6a4e502d1cd5a51047616fb81c","datavalue":{"value":"undiscounted reinforcement learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896090$B80D8F9B-E6D8-43EF-81A5-742BBF6368B9","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"a8cfb635100bcc8a85463e6beac1ce534f15033d","datavalue":{"value":"Markov decision process","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896090$0532774E-6AC5-4371-B41A-5560FEE02BB5","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"af637498c021118a08b6b4f4d04cef45ea88a21b","datavalue":{"value":"regret","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896090$07EE564A-D368-49D1-BE78-8CE12F6BB245","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"6ff3a87d2a1ef11672d22dcfbd650d697545a268","datavalue":{"value":"online learning","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896090$813BEAEA-1E2E-4989-BD81-8C7AD1DB0F36","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"069723b5518c531a3e45ceb3a7ca0ae760d0fab9","datavalue":{"value":"sample complexity","type":"string"},"datatype":"string"},"type":"statement","id":"Q2896090$A7DC0B0A-CBFF-49FF-8333-199F52A7AAB0","rank":"normal"}],"P1463":[{"mainsnak":{"snaktype":"value","property":"P1463","hash":"43217cc7921c31b6bc194c63fa0ab19b7fe52f4c","datavalue":{"value":{"entity-type":"item","numeric-id":15078,"id":"Q15078"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896090$76B4FB8C-854B-4F46-BFD1-7E74F30D385C","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896090$481EC56E-EA63-431B-BCC1-1099F727803F","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"6c8933294521d7f04bcdbe90acf82616715089dc","datavalue":{"value":{"text":"Near-optimal regret bounds for reinforcement learning","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q2896090$B8E3394B-F0D0-4EBA-80AE-07B07D411084","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"05810dfd27f2b8a246f7d0a5b34fbcc72e448b7a","datavalue":{"value":{"entity-type":"item","numeric-id":6582882,"id":"Q6582882"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2896090$0622DF8B-1178-4EE0-933F-742E0CDE58E3","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"277e199efeb2dce09dfc627db600b267fa004957","datavalue":{"value":{"entity-type":"item","numeric-id":4617639,"id":"Q4617639"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"c96fa24e43e6e5a653173dd227bc6debd3334d55","datavalue":{"value":{"amount":"+0.8324500322341919","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896090$EA24873D-E557-49EE-AD93-1021B4C97545","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"1863e9b0ebf39a4467e6603c79317024e91f8fc7","datavalue":{"value":{"entity-type":"item","numeric-id":465258,"id":"Q465258"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"b8c223367640ccc10d64a8a95c2435697eeebdcb","datavalue":{"value":{"amount":"+0.8222609162330627","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896090$C8CCDA4F-D637-4BD0-BC5A-4043EA5608E4","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"fec0a6613d187b17c77c9f19a83365dac637d836","datavalue":{"value":{"entity-type":"item","numeric-id":5214808,"id":"Q5214808"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"b64d593255d6073e9048aa2df177c44fb5a35c87","datavalue":{"value":{"amount":"+0.8211166262626648","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896090$954933EC-6C1D-4F18-9A38-D2F1826F6E0D","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"512d4c4a45f72cf314f74017a6cf3df2fa523246","datavalue":{"value":{"entity-type":"item","numeric-id":1604817,"id":"Q1604817"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"b43382e79735da28b5e9ddc2167cf4ad34732003","datavalue":{"value":{"amount":"+0.8152390122413635","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896090$D58A3DE3-D052-43C9-BEE2-C0861538FE93","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"04e2e1267eb6bbc170977aa45a566bac751c8b91","datavalue":{"value":{"entity-type":"item","numeric-id":3164829,"id":"Q3164829"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"0b98a5dc06cc4f2dc1db84d5ef7ed7119328f506","datavalue":{"value":{"amount":"+0.8134222626686096","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2896090$87FBBA3D-8329-43EE-93B5-101792C6D27A","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"Publication:2896090","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/Publication:2896090"}}}}}