Files in contextual
Simulation and Analysis of Contextual Multi-Armed Bandit Policies

MD5
NEWS.md
DESCRIPTION
README.md
NAMESPACE
inst/doc/offline_depaul_movies.R inst/doc/introduction.R inst/doc/sutton_barto.R
inst/doc/mabs.html
inst/doc/sutton_barto.html
inst/doc/introduction.Rmd inst/doc/cmabsoffline.R
inst/doc/website_optimization.html
inst/doc/replication.R inst/doc/eckles_kaptein.Rmd inst/doc/website_optimization.R inst/doc/epsilongreedy.Rmd inst/doc/cmabs.R
inst/doc/ml10m.html
inst/doc/replication.Rmd
inst/doc/cmabs.html
inst/doc/mabs.R
inst/doc/cmabsoffline.html
inst/doc/mabs.Rmd inst/doc/website_optimization.Rmd
inst/doc/epsilongreedy.html
inst/doc/sutton_barto.Rmd
inst/doc/simpsons.html
inst/doc/simpsons.R inst/doc/offline_depaul_movies.Rmd inst/doc/eckles_kaptein.R inst/doc/ml10m.Rmd
inst/doc/replication.html
inst/doc/cmabsoffline.Rmd
inst/doc/offline_depaul_movies.html
inst/doc/eckles_kaptein.html
inst/doc/epsilongreedy.R inst/doc/cmabs.Rmd inst/doc/simpsons.Rmd inst/doc/ml10m.R
inst/doc/introduction.html
vignettes/compare.png
vignettes/mabs.png
vignettes/sutton_gradient.png
vignettes/cmabs.png
vignettes/ucb_cumulative_reward.png
vignettes/replication-fig-2.png
vignettes/sutton_optimistic.png
vignettes/replication-fig-1.png
vignettes/introduction.Rmd
vignettes/eg_incorrect.png
vignettes/sutton_eg_1.png
vignettes/ucb_optimal_action.png
vignettes/ml10m.png
vignettes/sutton_eg_2.png
vignettes/eckles_kaptein.Rmd vignettes/epsilongreedy.Rmd
vignettes/eckles_kaptein_1.png
vignettes/replication.Rmd
vignettes/eg_optimal_action.png
vignettes/linucboffline.png
vignettes/mabs.Rmd vignettes/website_optimization.Rmd
vignettes/eckles_kaptein_0.png
vignettes/softmax_optimal_action.png
vignettes/sutton_barto.Rmd
vignettes/contextual-fig-1.png
vignettes/eg_average_reward.png
vignettes/offline_depaul_movies.Rmd vignettes/ml10m.Rmd
vignettes/softmax_average_reward.png
vignettes/softmax_cumulative_reward.png
vignettes/cmabsoffline.Rmd
vignettes/1.png
vignettes/ucb_average_reward.png
vignettes/carskit_depaul.png
vignettes/eg_cumulative_reward.png
vignettes/basic_epsilon_greedy.png
vignettes/cmabs.Rmd vignettes/simpsons.Rmd
vignettes/Rplot.png
vignettes/sutton_ucb.png
vignettes/sutton_violin.png
vignettes/contextual-fig-2.png
vignettes/introduction_cache/html/__packages
vignettes/introduction_cache/html/setup_423d3c22bc5d12b7b7998aec18aaa96c.rdb
vignettes/introduction_cache/html/setup_423d3c22bc5d12b7b7998aec18aaa96c.RData
vignettes/introduction_cache/html/setup_423d3c22bc5d12b7b7998aec18aaa96c.rdx
vignettes/mabs_cache/html/__packages
vignettes/mabs_cache/html/setup_96a5e4564f97204fe7c59f806f37e175.RData
vignettes/mabs_cache/html/setup_96a5e4564f97204fe7c59f806f37e175.rdb
vignettes/mabs_cache/html/setup_96a5e4564f97204fe7c59f806f37e175.rdx
vignettes/epsilongreedy_cache/html/__packages
vignettes/epsilongreedy_cache/html/setup_40c4b1deea165e9edb69c3e04e0fcbbb.rdx
vignettes/epsilongreedy_cache/html/setup_40c4b1deea165e9edb69c3e04e0fcbbb.rdb
vignettes/epsilongreedy_cache/html/setup_40c4b1deea165e9edb69c3e04e0fcbbb.RData
vignettes/sutton_barto_cache/html/__packages
vignettes/sutton_barto_cache/html/setup_066a1bd36d291cf703be2d20d6d0854e.rdb
vignettes/sutton_barto_cache/html/setup_066a1bd36d291cf703be2d20d6d0854e.RData
vignettes/sutton_barto_cache/html/setup_066a1bd36d291cf703be2d20d6d0854e.rdx
vignettes/simpsons_cache/html/__packages
vignettes/simpsons_cache/html/setup_0141f6ab740f28d6236343eee15de3dc.rdx
vignettes/simpsons_cache/html/setup_0141f6ab740f28d6236343eee15de3dc.RData
vignettes/simpsons_cache/html/setup_0141f6ab740f28d6236343eee15de3dc.rdb
vignettes/offline_depaul_movies_cache/html/__packages
vignettes/offline_depaul_movies_cache/html/setup_94753f3f3f5a048cc0df4f6f86d05b29.RData
vignettes/offline_depaul_movies_cache/html/setup_94753f3f3f5a048cc0df4f6f86d05b29.rdb
vignettes/offline_depaul_movies_cache/html/setup_94753f3f3f5a048cc0df4f6f86d05b29.rdx
vignettes/replication_cache/html/__packages
vignettes/replication_cache/html/setup_73927c9da22ce3c8c4ecdd73f02b1941.rdb
vignettes/replication_cache/html/setup_73927c9da22ce3c8c4ecdd73f02b1941.RData
vignettes/replication_cache/html/setup_73927c9da22ce3c8c4ecdd73f02b1941.rdx
vignettes/website_optimization_cache/html/__packages
vignettes/website_optimization_cache/html/setup_19bf55e18eb38b25f5aa62a3bd0c2716.rdx
vignettes/website_optimization_cache/html/setup_19bf55e18eb38b25f5aa62a3bd0c2716.RData
vignettes/website_optimization_cache/html/setup_19bf55e18eb38b25f5aa62a3bd0c2716.rdb
vignettes/cmabs_cache/html/__packages
vignettes/cmabs_cache/html/setup_a3c2dacd1ece1f4bd648ec373f0022bd.RData
vignettes/cmabs_cache/html/setup_a3c2dacd1ece1f4bd648ec373f0022bd.rdb
vignettes/cmabs_cache/html/setup_a3c2dacd1ece1f4bd648ec373f0022bd.rdx
vignettes/cmabsoffline_cache/html/__packages
vignettes/cmabsoffline_cache/html/setup_478ba5a5109d58a29d2e0e29acbef5c7.RData
vignettes/cmabsoffline_cache/html/setup_478ba5a5109d58a29d2e0e29acbef5c7.rdb
vignettes/cmabsoffline_cache/html/setup_478ba5a5109d58a29d2e0e29acbef5c7.rdx
vignettes/ml10m_cache/html/__packages
vignettes/ml10m_cache/html/setup_234cc75546d1e3a521d603561c7fe9a3.RData
vignettes/ml10m_cache/html/setup_234cc75546d1e3a521d603561c7fe9a3.rdx
vignettes/ml10m_cache/html/setup_234cc75546d1e3a521d603561c7fe9a3.rdb
vignettes/eckles_kaptein_cache/html/setup_97c042ef7ccb57f2041f9440d86d74a1.rdb
vignettes/eckles_kaptein_cache/html/__packages
vignettes/eckles_kaptein_cache/html/setup_97c042ef7ccb57f2041f9440d86d74a1.RData
vignettes/eckles_kaptein_cache/html/setup_97c042ef7ccb57f2041f9440d86d74a1.rdx
demo/demo_offline_cmab_alpha_linucb_direct_method.R demo/demo_offline_direct_method.R demo/demo_simpsons_paradox_propensity.R demo/demo_epsilon_greedy_policy.R demo/demo_cmab_policy_comparison_weight_bandit.R demo/demo_subsubclass.R demo/demo_mab_policy_comparison.R demo/demo_lif_bandit.R demo/demo_offline_cmab_alpha_linucb_replay.R demo/demo_sutton_barto.R demo/demo_offline_propensity_score.R demo/demo_cmab_policy_comparison_linear_bandit.R demo/demo_sine_bandit.R demo/demo_bandit_algorithms_for_website_optimization.R demo/demo_offline_doubly_robust.R
demo/00Index
demo/replication_li_2010/2_run_simulation.R demo/replication_li_2010/4_plotter.R demo/replication_li_2010/3_plotter.R demo/replication_li_2010/1_import_yahoo_to_monetdb.R demo/replication_li_2010/demo_yahoo_classes/yahoo_policy_epsilon_greedy_seg.R demo/replication_li_2010/demo_yahoo_classes/yahoo_bandit.R demo/replication_li_2010/demo_yahoo_classes/yahoo_policy_ucb1_alpha_seg.R demo/replication_li_2010/demo_yahoo_classes/yahoo_policy_linucb_disjoint.R demo/replication_li_2010/demo_yahoo_classes/yahoo_policy_epsilon_greedy.R demo/replication_li_2010/demo_yahoo_classes/yahoo_policy_linucb_hybrid.R demo/replication_li_2010/demo_yahoo_classes/yahoo_policy_random.R demo/replication_li_2010/demo_yahoo_classes/yahoo_policy_ucb1_alpha.R demo/replication_li_2010/alternative_db_scripts/1_import_yahoo_data_to_monetdb_lite.R demo/replication_li_2010/alternative_db_scripts/2_run_the_simulation_on_monetdb_lite.R demo/replication_li_2010/alternative_db_scripts/2_run_the_simulation_on_monetdb.R demo/replication_li_2010/alternative_db_scripts/yahoo_to_mysql.R demo/replication_li_2010/alternative_db_scripts/yahoo_to_sqlite.R demo/replication_li_2010/alternative_db_scripts/yahoo_to_postgresql.R demo/replication_li_2010/demo_yahoo_exploration/plots.R demo/replication_li_2010/demo_yahoo_exploration/exploration.R demo/replication_eckles_kaptein_2014/demo_bootstrap_fig_3.R demo/replication_eckles_kaptein_2014/demo_bootstrap_fig_2.R demo/replication_van_emden_2018/section_5_2.R demo/replication_van_emden_2018/section_4_2_plot.R demo/replication_van_emden_2018/section_5_4.R demo/replication_van_emden_2018/section_3_2_2.R demo/replication_van_emden_2018/section_3_2_1.R demo/replication_van_emden_2018/section_7.R demo/replication_van_emden_2018/section_6.R demo/replication_van_emden_2018/section_2_3.R demo/replication_van_emden_2018/section_8.R demo/replication_van_emden_2018/section_5_3.R demo/replication_kruijswijk_2018/bandit_bernoulli.R demo/replication_kruijswijk_2018/policy_pooled_egreedy.R demo/replication_kruijswijk_2018/2a_offline_replay_persuasion.R demo/replication_kruijswijk_2018/policy_pooled_thompson.R demo/replication_kruijswijk_2018/bandit_bootstrapped_replay.R
demo/replication_kruijswijk_2018/beta_binom_hier_model.stan
demo/replication_kruijswijk_2018/4a_main_synthetic_evaluation.R demo/replication_kruijswijk_2018/2b_offline_bootstrapped_persuasion.R demo/replication_kruijswijk_2018/bandit_replay.R demo/replication_kruijswijk_2018/3_offline_replay_movielens.R
demo/replication_kruijswijk_2018/beta_binom_hier_model.rds
demo/replication_kruijswijk_2018/4b_dependent_observations_plot_bar.R demo/replication_kruijswijk_2018/1_basic_synthetic_evaluation.R demo/replication_kruijswijk_2018/policy_pooled_ucb.R demo/evaluations_on_public_datasets/demo_movielens_100k.R demo/evaluations_on_public_datasets/demo_movielens_10m.R demo/evaluations_on_public_datasets/demo_carskit_depaul.R demo/alternative_parallel_backends/rmpi/test_rmpi_connection.R demo/alternative_parallel_backends/rmpi/simulator_rmpi.R demo/alternative_parallel_backends/rmpi/demo_rmpi.R demo/alternative_parallel_backends/redis/demo_redis.R demo/alternative_parallel_backends/redis/simulator_redis.R demo/alternative_parallel_backends/azure/test_azure_connection.R demo/alternative_parallel_backends/azure/demo_azure.R
demo/alternative_parallel_backends/azure/credentials-sample.json
demo/alternative_parallel_backends/azure/cluster.json
demo/alternative_parallel_backends/azure/simulator_azure.R R/policy_cmab_lin_ucb_hybrid_optimized.R R/bandit_offline_direct_method.R R/bandit_cmab_binary.R R/policy_cmab_lin_ucb_disjoint_optimized.R R/agent.R R/bandit_cmab_logit.R R/policy_cmab_logit_ts_bootstrap.R R/policy_mab_ucb2.R R/policy_fixed.R R/simulator.R R/policy_cmab_lin_ucb_general.R R/policy_cmab_lin_epsilon_greedy.R R/bandit_cmab_precaching.R R/bandit_basic_gaussian.R R/functions_utility.R R/policy_mab_epsilon_first.R R/plot.R R/policy_random.R R/policy_cmab_probit_ts.R R/bandit_cmab_linear.R R/policy_cmab_lin_ucb_disjoint.R R/bandit_offline_doubly_robust.R R/policy_mab_ucb1.R R/bandit_cmab_hybrid.R R/policy_mab_gradient.R R/bandit_cmab_wheel.R R/bandit.R R/policy_mab_ts_bootstrap.R R/history.R R/bandit_offline_replay_evaluator_lookup.R R/policy_cmab_lin_ucb_hybrid.R R/policy_oracle.R R/policy_cont_lif.R R/bandit_cmab_bernoulli.R R/policy_cmab_lin_epoch_greedy.R R/policy_mab_ts.R R/policy.R R/bandit_continuum_function.R R/policy_mab_exp3.R R/policy_cmab_lin_ts_disjoint.R R/bandit_offline_replay_evaluator.R R/bandit_basic_bernoulli.R R/policy_mab_epsilon_greedy.R R/policy_mab_gittins_bl.R R/bandit_offline_bootstrapped_replay.R R/functions_generic.R R/policy_mab_softmax.R R/bandit_offline_propensity_weighting.R man/ones_in_zeroes.Rd man/Policy.Rd man/LifPolicy.Rd man/UCB1Policy.Rd man/OfflinePropensityWeightingBandit.Rd man/ContextualBinaryBandit.Rd man/ContextualLogitBTSPolicy.Rd man/sample_one_of.Rd man/OfflineDoublyRobustBandit.Rd man/RandomPolicy.Rd man/Plot.Rd man/var_welford.Rd man/BootstrapTSPolicy.Rd man/which_max_tied.Rd man/value_remaining.Rd man/LinUCBDisjointPolicy.Rd man/LinUCBHybridOptimizedPolicy.Rd man/ContextualPrecachingBandit.Rd man/ContextualEpochGreedyPolicy.Rd man/GittinsBrezziLaiPolicy.Rd man/ContextualHybridBandit.Rd man/ContextualTSProbitPolicy.Rd man/sim_post.Rd man/prob_winner.Rd man/ContextualWheelBandit.Rd man/inc-set.Rd man/LinUCBGeneralPolicy.Rd man/ContextualBernoulliBandit.Rd man/formatted_difftime.Rd man/OfflineLookupReplayEvaluatorBandit.Rd man/plot.history.Rd man/ContinuumBandit.Rd man/Bandit.Rd man/EpsilonGreedyPolicy.Rd man/EpsilonFirstPolicy.Rd man/sum_of.Rd man/data_table_factors_to_numeric.Rd man/summary.history.Rd man/BasicBernoulliBandit.Rd man/GradientPolicy.Rd man/ContextualLogitBandit.Rd man/LinUCBHybridPolicy.Rd man/Agent.Rd man/ThompsonSamplingPolicy.Rd man/OfflineBootstrappedReplayBandit.Rd man/BasicGaussianBandit.Rd man/UCB2Policy.Rd man/ContextualLinTSPolicy.Rd man/ind.Rd man/OraclePolicy.Rd man/which_max_list.Rd man/OfflineDirectMethodBandit.Rd man/LinUCBDisjointOptimizedPolicy.Rd man/sherman_morrisson.Rd man/History.Rd man/Exp3Policy.Rd man/dec-set.Rd man/invgamma.Rd man/get_arm_context.Rd man/clipr.Rd man/ContextualLinearBandit.Rd man/FixedPolicy.Rd man/is_rstudio.Rd man/get_full_context.Rd man/inv.Rd man/ContextualEpsilonGreedyPolicy.Rd man/Simulator.Rd man/mvrnorm.Rd man/print.history.Rd man/set_external.Rd man/SoftmaxPolicy.Rd man/invlogit.Rd man/one_hot.Rd man/OfflineReplayEvaluatorBandit.Rd
man/figures/algoepsilonfirst.jpg
man/figures/3cbandit.jpeg
man/figures/cmab_all_large.jpg
man/figures/cmab_all_medium.jpg
man/figures/3bpolicy.jpeg
man/figures/cmab_all.jpeg
man/figures/3dpolicy.jpeg
man/figures/3abandit.jpeg
man/figures/1simulator.jpeg
man/figures/2agent.jpeg
build/vignette.rds
tests/testthat.R
tests/testthat/logdiv.rds
tests/testthat/test_agent.R tests/testthat/setup_tests.R tests/testthat/test_utility_functions.R tests/testthat/test_history.R
tests/testthat/history_context_theta_test.ref
tests/testthat/history_context_test.ref
tests/testthat/history_test.ref
tests/testthat/teardown_tests.R
tests/testthat/history_theta_test.ref
tests/testthat/test_policies.R
tests/testthat/summary_history_limit.rds
tests/testthat/test_policy.R tests/testthat/test_plot.R
tests/testthat/dinvgamma1.rds
tests/testthat/summary_history.rds
tests/testthat/test_bandits.R
tests/testthat/dinvgamma2.rds
tests/figs/deps.txt
tests/figs/plot/average-regret-plot.svg
tests/figs/plot/color-and-lty-stepping.svg
tests/figs/plot/arms-color.svg
tests/figs/plot/arms-lims.svg
tests/figs/plot/traces-plot-smooth.svg
tests/figs/plot/average-reward-plot.svg
tests/figs/plot/cumulative-sd-plot.svg
tests/figs/plot/cumulative-traces-plot.svg
tests/figs/plot/ylim-plot.svg
tests/figs/plot/lwd-pot.svg
tests/figs/plot/basic-cumulative-plot.svg
tests/figs/plot/arm-plot.svg
tests/figs/plot/limits-plot.svg
tests/figs/plot/only-sd-plot.svg
tests/figs/plot/plot-inc-var-no-color.svg
tests/figs/plot/traces-alpha-and-max-plot.svg
tests/figs/plot/legend-title-and-labels-plot.svg
contextual documentation built on March 17, 2019, 5:05 p.m.