{"entities":{"Q2176624":{"pageid":2187367,"ns":120,"title":"Item:Q2176624","lastrevid":73553529,"modified":"2026-04-14T16:26:23Z","type":"item","id":"Q2176624","labels":{"en":{"language":"en","value":"The multi-armed bandit problem: an efficient nonparametric solution"}},"descriptions":{"en":{"language":"en","value":"scientific article; zbMATH DE number 7196542"}},"aliases":{},"claims":{"P31":[{"mainsnak":{"snaktype":"value","property":"P31","hash":"fd5912e4dab4b881a8eb0eb27e7893fef55176ad","datavalue":{"value":{"entity-type":"item","numeric-id":56887,"id":"Q56887"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$6615AF65-6B6E-4DAF-A671-EF95ED0063F8","rank":"normal"}],"P159":[{"mainsnak":{"snaktype":"value","property":"P159","hash":"0db878fcfdedcd334802e59cb3c4ecbd48a02097","datavalue":{"value":{"text":"The multi-armed bandit problem: an efficient nonparametric solution","language":"en"},"type":"monolingualtext"},"datatype":"monolingualtext"},"type":"statement","id":"Q2176624$72C6CB21-B36A-4995-AF42-B7BAA0871BC7","rank":"normal"}],"P225":[{"mainsnak":{"snaktype":"value","property":"P225","hash":"19946eb63d9d4d0b54b19af54021ab0fa2e5abab","datavalue":{"value":"1442.62180","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$0F98AA66-6746-4834-B6AB-BA0D5F6338A2","rank":"normal"}],"P27":[{"mainsnak":{"snaktype":"value","property":"P27","hash":"bfe653b39b60e8a98433c3e27577e91eb5eebf53","datavalue":{"value":"10.1214/19-AOS1809","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$A9EC8614-F619-4336-883F-CC3ECCFF7C12","rank":"normal"}],"P16":[{"mainsnak":{"snaktype":"value","property":"P16","hash":"3ee5a67b8818bb1dbbdfdb5e5d2909489bb1acbf","datavalue":{"value":{"entity-type":"item","numeric-id":558685,"id":"Q558685"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$3D959BAC-1EC9-44A6-82E2-22ED83328382","rank":"normal"}],"P200":[{"mainsnak":{"snaktype":"value","property":"P200","hash":"0b73f6da78562727d9e1c290db85e0053cdeb667","datavalue":{"value":{"entity-type":"item","numeric-id":60819,"id":"Q60819"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$4939D686-1B23-401A-B43C-2419DECEE262","rank":"normal"}],"P28":[{"mainsnak":{"snaktype":"value","property":"P28","hash":"2ffa913ad058323c97cdd62b11ad32d016ae0804","datavalue":{"value":{"time":"+2020-05-05T00:00:00Z","timezone":0,"before":0,"after":0,"precision":11,"calendarmodel":"http://www.wikidata.org/entity/Q1985727"},"type":"time"},"datatype":"time"},"type":"statement","id":"Q2176624$EEDFA98A-AA49-4E33-8429-7AF3A687C6EC","rank":"normal"}],"P205":[{"mainsnak":{"snaktype":"value","property":"P205","hash":"250b2f4596e7e31c3631ec08f08a369c53bbe672","datavalue":{"value":"https://arxiv.org/abs/1703.08285","type":"string"},"datatype":"url"},"type":"statement","id":"Q2176624$6A3E93C4-86B8-45B4-929C-B8A06AE5519B","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P205","hash":"b410550e839e38d0f7408f48316ed7a66a8ee560","datavalue":{"value":"https://projecteuclid.org/euclid.aos/1581930138","type":"string"},"datatype":"url"},"type":"statement","id":"Q2176624$20629F17-B476-4358-B2E9-71F28E62BF02","rank":"normal"}],"P1448":[{"mainsnak":{"snaktype":"value","property":"P1448","hash":"2759fc85e60037743e0b35a40dc0438d9906960c","datavalue":{"value":"The author treats the multi-armed bandit problem in the formulation which can be found in [\\textit{T. L. Lai} and \\textit{H. Robbins}, Adv. Appl. Math. 6, 4--22 (1985; Zbl 0568.62074)]. \\textit{T. L. Lai} [Ann. Stat. 15, 1091--1114 (1987; Zbl 0643.62054)] provided efficient parametric solutions to the multi-armed bandit problem, showing that arm allocation via upper confidence bounds (UCB) achieves minimum regret. These bounds are constructed from the Kullback-Leibler information of the reward distributions, estimated from specified parametric families. The subject of this paper is a new nonparametric an arm allocation procedure subsample-mean comparison (SSMC) which is efficient when the reward distributions are from an unspecified one-dimensional exponential family. It achieves this by comparing subsample means of the leading arm with the sample means of its competitors. It is empirical in its approach, using more informative subsample means rather than full-sample means alone, for better decision-making.","type":"string"},"datatype":"string"},"type":"statement","id":"Q2176624$5A731683-0B59-4F98-B6C3-290C21E4A2BF","rank":"normal"}],"P226":[{"mainsnak":{"snaktype":"value","property":"P226","hash":"2c0c09d2caba66ba44b1be99e80b2f2867b9bbb8","datavalue":{"value":"62L05","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$DDD1B0BD-6AD9-46FE-A7E4-DEF7830E18F4","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"3d0e7b322622d5e8df8bd4a7f15a34940eb62cd4","datavalue":{"value":"62L15","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$E45C92B9-78C5-4A7E-B8C7-36E1D640548C","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"41500ce50b5ca65fdee8ff163694334bc7f157ae","datavalue":{"value":"62G15","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$AF3F5107-31CE-4B49-B87B-2CD79951D0C9","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P226","hash":"648e65de343c7ed1bbc81380c6f67e618373580b","datavalue":{"value":"62C25","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$5BB9F03D-1B6B-4C1D-BFB7-2B5D235C3921","rank":"normal"}],"P1451":[{"mainsnak":{"snaktype":"value","property":"P1451","hash":"110b7ec77f54fee82d98d019b213cf01616f9b8f","datavalue":{"value":"7196542","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$39B94D88-8852-4973-AB1B-D29A9BE09C5B","rank":"normal"}],"P1450":[{"mainsnak":{"snaktype":"value","property":"P1450","hash":"75f7fe19f725521885c5a40b8a361664ab1a2991","datavalue":{"value":"efficiency","type":"string"},"datatype":"string"},"type":"statement","id":"Q2176624$104B56D3-F13A-4E96-B5C6-7682A659C966","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"d49a2438df9002fffa0409de228442705f35227c","datavalue":{"value":"KL-UCB","type":"string"},"datatype":"string"},"type":"statement","id":"Q2176624$4BBA20B7-D103-4C35-92BF-8E579EBDE0AB","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"e44ec383080eca19f7f5f7d73841dae9eb8e8223","datavalue":{"value":"subsampling","type":"string"},"datatype":"string"},"type":"statement","id":"Q2176624$8B716B50-81E1-4E03-81E0-C7F9D3EAEA2B","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"61fa22f8c69ffa2a2530f1d63c330f11b2c5fef4","datavalue":{"value":"Thompson sampling","type":"string"},"datatype":"string"},"type":"statement","id":"Q2176624$413FF579-71E3-4C34-9B77-548081CDF0D0","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1450","hash":"c0aa27eb9c3dc2ee01371e09ca4f7a6708002c83","datavalue":{"value":"upper confidence bound (UCB)","type":"string"},"datatype":"string"},"type":"statement","id":"Q2176624$D6943769-04F3-41E6-A2B1-36C6C23373FE","rank":"normal"}],"P1447":[{"mainsnak":{"snaktype":"value","property":"P1447","hash":"ec3e05d98779d46740c66c09531c060d978b1d6d","datavalue":{"value":{"entity-type":"item","numeric-id":1656863,"id":"Q1656863"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$80F06555-DD7F-478F-A4D6-33BB99E11D3C","rank":"normal"}],"P1460":[{"mainsnak":{"snaktype":"value","property":"P1460","hash":"57f7fea50d2ce1b39b695c4a1313582eed405e38","datavalue":{"value":{"entity-type":"item","numeric-id":5976449,"id":"Q5976449"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$6A746983-B93C-4DB9-AAA6-A2D8265E0FFC","rank":"normal"}],"P223":[{"mainsnak":{"snaktype":"value","property":"P223","hash":"58e0063881e0b91efbf4cf474d5c5a121f0b0cf3","datavalue":{"value":{"entity-type":"item","numeric-id":4862097,"id":"Q4862097"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$26EF5395-B456-4402-89FF-5C8C704DED39","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"e756665fb763d9311868dc201db16f8188ebccce","datavalue":{"value":{"entity-type":"item","numeric-id":3032153,"id":"Q3032153"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$8B643732-A147-4B1D-8EB4-0A7C6A361A6A","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"e5314db28cbe3eb7bfca044b623c4acedcac4a8c","datavalue":{"value":{"entity-type":"item","numeric-id":5959973,"id":"Q5959973"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$1A05BDB6-4E8E-4A28-9423-415AC1615049","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"321f4d325c75f8a6ca0573c48ce45aa4fc8c7d5f","datavalue":{"value":{"entity-type":"item","numeric-id":5674229,"id":"Q5674229"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$514A178C-2310-4DE2-92C1-E5B83FCDE2E2","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"d2fdb39dbb52b1ef7a73d5a2e0bbb2c2081efaa1","datavalue":{"value":{"entity-type":"item","numeric-id":3809068,"id":"Q3809068"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$4A8DED93-CE2A-4BFD-BA40-62B3A223CEB0","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"ee1898a92b3124c26a0e2b8b506737e1f0ba15c2","datavalue":{"value":{"entity-type":"item","numeric-id":1614793,"id":"Q1614793"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$19F7393B-EBB9-401F-A5E0-A7DEE9CF4120","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"16fb9b209b6f507645a1f045e4e3992b973269de","datavalue":{"value":{"entity-type":"item","numeric-id":1922542,"id":"Q1922542"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$30E2E373-5F58-4899-BABC-8C528F508CB2","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"608486c3ef4b6517e63adc205f056f0ba6d1a32f","datavalue":{"value":{"entity-type":"item","numeric-id":366995,"id":"Q366995"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$54C786CB-1795-42A4-8D64-89D83F5BCE4C","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"99160d2264a7d98d006dd17102ddf33ce059217c","datavalue":{"value":{"entity-type":"item","numeric-id":3779527,"id":"Q3779527"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$8CC01C53-031A-4584-9A66-06AC7A9684DF","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"b5d8b8ca9589c9bc53097c65c619b041b2b309b5","datavalue":{"value":{"entity-type":"item","numeric-id":5627499,"id":"Q5627499"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$D033B2B0-B0F4-464D-86D2-E5CCE428EF2B","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"72ac173876e3ad53e523042bc23f91ca926212b5","datavalue":{"value":{"entity-type":"item","numeric-id":4197923,"id":"Q4197923"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$94E3FF45-74D6-489B-ACD4-5963FB6312B8","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"3285a4d6a81e75b9f90b01804ba4feeaff9367ef","datavalue":{"value":{"entity-type":"item","numeric-id":4337732,"id":"Q4337732"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$763CBEDF-58C6-4666-94EF-9BEA9D25A329","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"5fb2c1a9570efe9f1d0182f2ce61a27670a5b736","datavalue":{"value":{"entity-type":"item","numeric-id":2723273,"id":"Q2723273"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$493C24A7-C023-4F9C-85AE-0661E0963510","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"d7fddd87a0160591eb77e404a7d2b9d3f7a7fdf1","datavalue":{"value":{"entity-type":"item","numeric-id":1102059,"id":"Q1102059"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$BAA367A4-435C-4270-A782-5DB9ECA5AAF4","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"d0b556d51b5e676c221d0327f63920155af2c236","datavalue":{"value":{"entity-type":"item","numeric-id":1060517,"id":"Q1060517"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$42455109-43D1-413C-AE9A-C8C2C89996CB","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"6d3bd02791f3fd6f2c39b3ae9244b7d656a93c72","datavalue":{"value":{"entity-type":"item","numeric-id":4626283,"id":"Q4626283"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$699C085A-1DFF-47E8-84E9-4280F903D20D","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"ed922887106fcc2b705a88e87edcc74d26102c1a","datavalue":{"value":{"entity-type":"item","numeric-id":3690233,"id":"Q3690233"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$2FF118F8-1F39-4FB8-8FF9-F2A7881E275D","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P223","hash":"cecf733ca3a41740cc26b62643013d0b79ee3850","datavalue":{"value":{"entity-type":"item","numeric-id":806690,"id":"Q806690"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","id":"Q2176624$FA17CA8E-3DC2-4DBB-98FC-1D18C69CD1AD","rank":"normal"}],"P388":[{"mainsnak":{"snaktype":"value","property":"P388","hash":"3f510e6adafdae8488b6fc095c0a20945c52660b","datavalue":{"value":"W3007054292","type":"string"},"datatype":"external-id"},"type":"statement","id":"Q2176624$A75B2170-5BB0-4F4D-B333-EDD98C11DCE6","rank":"normal"}],"P1643":[{"mainsnak":{"snaktype":"value","property":"P1643","hash":"170e25028faeb692c58cde884d0d3e18b3a9834b","datavalue":{"value":{"entity-type":"item","numeric-id":806690,"id":"Q806690"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"2a729123aa451d9e8ba7385c62f477a41aa68bbd","datavalue":{"value":{"amount":"+0.8320726156234741","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2176624$43D6394F-4B49-49D4-BF98-5C4F170237A0","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"1f695fb1d4b9bbc1e27ae3115285260843b8ce25","datavalue":{"value":{"entity-type":"item","numeric-id":3798561,"id":"Q3798561"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"048cfbf4330c11b7f92a770f8704768454558b32","datavalue":{"value":{"amount":"+0.8070183992385864","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2176624$6AE144EF-9B7F-4C1C-9E94-DCDA132F23AE","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"0a189116474a5f28b8ae9d73ce2d6a71ffc870bb","datavalue":{"value":{"entity-type":"item","numeric-id":1102059,"id":"Q1102059"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"c3b6e2364d4e2155c67be27925184337dfde4590","datavalue":{"value":{"amount":"+0.8067863583564758","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2176624$B78B7F13-6AEB-4A76-ADE8-A1B2DCB2A9A7","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"672a0d87ba406eeb0b9df7ad0070c301831a3071","datavalue":{"value":{"entity-type":"item","numeric-id":4785631,"id":"Q4785631"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"761861dbc2d88233cc3ed5c72ad456b82eb38c65","datavalue":{"value":{"amount":"+0.8013803958892822","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2176624$21D9D816-02D8-4E21-9762-43C128D3DE21","rank":"normal"},{"mainsnak":{"snaktype":"value","property":"P1643","hash":"1f992dd29efcbba43103b5aa70a308dafb66acee","datavalue":{"value":{"entity-type":"item","numeric-id":366995,"id":"Q366995"},"type":"wikibase-entityid"},"datatype":"wikibase-item"},"type":"statement","qualifiers":{"P1659":[{"snaktype":"value","property":"P1659","hash":"7c2c803bb51df582484ea69ebd8af3ab0670dc57","datavalue":{"value":{"amount":"+0.8010877966880798","unit":"1"},"type":"quantity"},"datatype":"quantity"}],"P1660":[{"snaktype":"value","property":"P1660","hash":"a327a09ea0305e98d5cf33bd4036320e19f2aed0","datavalue":{"value":{"entity-type":"item","numeric-id":6821328,"id":"Q6821328"},"type":"wikibase-entityid"},"datatype":"wikibase-item"}]},"qualifiers-order":["P1659","P1660"],"id":"Q2176624$6E5D1F1F-6352-409F-B945-2719BFAA8BB7","rank":"normal"}]},"sitelinks":{"mardi":{"site":"mardi","title":"The multi-armed bandit problem: an efficient nonparametric solution","badges":[],"url":"https://portal.mardi4nfdi.de/wiki/The_multi-armed_bandit_problem:_an_efficient_nonparametric_solution"}}}}}