obp
latest
Introduction:
About
Related Resources
Off-Policy Evaluation (OPE):
Overview
Estimators
Evaluation of OPE
Getting Started:
Installation
Quickstart
Package Reference:
OBP Package Reference
Others:
Github
Dataset
Google Group
LICENSE
References
obp
Docs
»
Index
Edit on GitHub
Index
B
|
C
|
D
|
E
|
F
|
G
|
I
|
L
|
M
|
N
|
O
|
P
|
R
|
S
|
U
|
V
B
BaseContextFreePolicy (class in obp.policy.base)
BaseContextualPolicy (class in obp.policy.base)
BaseOfflinePolicyLearner (class in obp.policy.base)
BaseOffPolicyEstimator (class in obp.ope.estimators)
BaseRealBanditDataset (class in obp.dataset.base)
BaseSyntheticBanditDataset (class in obp.dataset.base)
BernoulliTS (class in obp.policy.contextfree)
C
calc_ground_truth_policy_value() (obp.dataset.multiclass.MultiClassToBanditReduction method)
calc_on_policy_policy_value_estimate() (obp.dataset.real.OpenBanditDataset class method)
check_bandit_feedback_inputs() (in module obp.utils)
check_is_fitted() (in module obp.utils)
compute_batch_action_dist() (obp.policy.contextfree.BernoulliTS method)
(obp.policy.contextfree.Random method)
convert_to_action_dist() (in module obp.utils)
D
dim_context() (obp.dataset.real.OpenBanditDataset property)
DirectMethod (class in obp.ope.estimators)
DoublyRobust (class in obp.ope.estimators)
DoublyRobustWithShrinkage (class in obp.ope.estimators)
E
EpsilonGreedy (class in obp.policy.contextfree)
estimate_confidence_interval_by_bootstrap() (in module obp.utils)
estimate_interval() (obp.ope.estimators.BaseOffPolicyEstimator method)
(obp.ope.estimators.DirectMethod method)
(obp.ope.estimators.DoublyRobust method)
(obp.ope.estimators.DoublyRobustWithShrinkage method)
(obp.ope.estimators.InverseProbabilityWeighting method)
(obp.ope.estimators.ReplayMethod method)
(obp.ope.estimators.SelfNormalizedDoublyRobust method)
(obp.ope.estimators.SelfNormalizedInverseProbabilityWeighting method)
(obp.ope.estimators.SwitchDoublyRobust method)
(obp.ope.estimators.SwitchInverseProbabilityWeighting method)
estimate_intervals() (obp.ope.meta.OffPolicyEvaluation method)
estimate_policy_value() (obp.ope.estimators.BaseOffPolicyEstimator method)
(obp.ope.estimators.DirectMethod method)
(obp.ope.estimators.DoublyRobust method)
(obp.ope.estimators.DoublyRobustWithShrinkage method)
(obp.ope.estimators.InverseProbabilityWeighting method)
(obp.ope.estimators.ReplayMethod method)
(obp.ope.estimators.SelfNormalizedDoublyRobust method)
(obp.ope.estimators.SelfNormalizedInverseProbabilityWeighting method)
(obp.ope.estimators.SwitchDoublyRobust method)
(obp.ope.estimators.SwitchInverseProbabilityWeighting method)
estimate_policy_values() (obp.ope.meta.OffPolicyEvaluation method)
evaluate_performance_of_estimators() (obp.ope.meta.OffPolicyEvaluation method)
F
fit() (obp.ope.regression_model.RegressionModel method)
(obp.policy.base.BaseOfflinePolicyLearner method)
(obp.policy.logistic.MiniBatchLogisticRegression method)
(obp.policy.offline.IPWLearner method)
fit_predict() (obp.ope.regression_model.RegressionModel method)
G
get_params() (obp.ope.regression_model.RegressionModel method)
grad() (obp.policy.logistic.MiniBatchLogisticRegression method)
I
initialize() (obp.policy.base.BaseContextFreePolicy method)
(obp.policy.base.BaseContextualPolicy method)
(obp.policy.contextfree.BernoulliTS method)
(obp.policy.contextfree.EpsilonGreedy method)
(obp.policy.contextfree.Random method)
(obp.policy.linear.LinEpsilonGreedy method)
(obp.policy.linear.LinTS method)
(obp.policy.linear.LinUCB method)
(obp.policy.logistic.LogisticEpsilonGreedy method)
(obp.policy.logistic.LogisticTS method)
(obp.policy.logistic.LogisticUCB method)
InverseProbabilityWeighting (class in obp.ope.estimators)
IPWLearner (class in obp.policy.offline)
L
len_list() (obp.dataset.multiclass.MultiClassToBanditReduction property)
(obp.dataset.real.OpenBanditDataset property)
(obp.dataset.synthetic.SyntheticBanditDataset property)
linear_behavior_policy() (in module obp.dataset.synthetic)
linear_reward_function() (in module obp.dataset.synthetic)
LinEpsilonGreedy (class in obp.policy.linear)
LinTS (class in obp.policy.linear)
LinUCB (class in obp.policy.linear)
load_raw_data() (obp.dataset.base.BaseRealBanditDataset method)
(obp.dataset.real.OpenBanditDataset method)
logistic_reward_function() (in module obp.dataset.synthetic)
LogisticEpsilonGreedy (class in obp.policy.logistic)
LogisticTS (class in obp.policy.logistic)
LogisticUCB (class in obp.policy.logistic)
loss() (obp.policy.logistic.MiniBatchLogisticRegression method)
M
MiniBatchLogisticRegression (class in obp.policy.logistic)
module
obp.dataset.base
obp.dataset.multiclass
obp.dataset.real
obp.dataset.synthetic
obp.ope.estimators
obp.ope.meta
obp.ope.regression_model
obp.policy.base
obp.policy.contextfree
obp.policy.linear
obp.policy.logistic
obp.policy.offline
obp.simulator.simulator
obp.utils
MultiClassToBanditReduction (class in obp.dataset.multiclass)
N
n_actions() (obp.dataset.multiclass.MultiClassToBanditReduction property)
(obp.dataset.real.OpenBanditDataset property)
n_rounds() (obp.dataset.multiclass.MultiClassToBanditReduction property)
(obp.dataset.real.OpenBanditDataset property)
O
obp.dataset.base
module
obp.dataset.multiclass
module
obp.dataset.real
module
obp.dataset.synthetic
module
obp.ope.estimators
module
obp.ope.meta
module
obp.ope.regression_model
module
obp.policy.base
module
obp.policy.contextfree
module
obp.policy.linear
module
obp.policy.logistic
module
obp.policy.offline
module
obp.simulator.simulator
module
obp.utils
module
obtain_action_dist_by_eval_policy() (obp.dataset.multiclass.MultiClassToBanditReduction method)
obtain_batch_bandit_feedback() (obp.dataset.base.BaseRealBanditDataset method)
(obp.dataset.base.BaseSyntheticBanditDataset method)
(obp.dataset.multiclass.MultiClassToBanditReduction method)
(obp.dataset.real.OpenBanditDataset method)
(obp.dataset.synthetic.SyntheticBanditDataset method)
OffPolicyEvaluation (class in obp.ope.meta)
OpenBanditDataset (class in obp.dataset.real)
P
policy_type() (obp.policy.base.BaseContextFreePolicy property)
(obp.policy.base.BaseContextualPolicy property)
(obp.policy.base.BaseOfflinePolicyLearner property)
(obp.policy.contextfree.BernoulliTS property)
(obp.policy.contextfree.EpsilonGreedy property)
(obp.policy.contextfree.Random property)
(obp.policy.linear.LinEpsilonGreedy property)
(obp.policy.linear.LinTS property)
(obp.policy.linear.LinUCB property)
(obp.policy.logistic.LogisticEpsilonGreedy property)
(obp.policy.logistic.LogisticTS property)
(obp.policy.logistic.LogisticUCB property)
(obp.policy.offline.IPWLearner property)
pre_process() (obp.dataset.base.BaseRealBanditDataset method)
(obp.dataset.real.OpenBanditDataset method)
predict() (obp.ope.regression_model.RegressionModel method)
(obp.policy.base.BaseOfflinePolicyLearner method)
(obp.policy.offline.IPWLearner method)
predict_proba() (obp.policy.logistic.MiniBatchLogisticRegression method)
(obp.policy.offline.IPWLearner method)
predict_proba_with_sampling() (obp.policy.logistic.MiniBatchLogisticRegression method)
predict_score() (obp.policy.offline.IPWLearner method)
R
Random (class in obp.policy.contextfree)
RegressionModel (class in obp.ope.regression_model)
ReplayMethod (class in obp.ope.estimators)
run_bandit_simulation() (in module obp.simulator.simulator)
S
sample() (obp.policy.logistic.MiniBatchLogisticRegression method)
sample_action() (obp.policy.offline.IPWLearner method)
sample_bootstrap_bandit_feedback() (obp.dataset.real.OpenBanditDataset method)
sample_contextfree_expected_reward() (obp.dataset.synthetic.SyntheticBanditDataset method)
sd() (obp.policy.logistic.MiniBatchLogisticRegression method)
select_action() (obp.policy.base.BaseContextFreePolicy method)
(obp.policy.base.BaseContextualPolicy method)
(obp.policy.contextfree.BernoulliTS method)
(obp.policy.contextfree.EpsilonGreedy method)
(obp.policy.contextfree.Random method)
(obp.policy.linear.LinEpsilonGreedy method)
(obp.policy.linear.LinTS method)
(obp.policy.linear.LinUCB method)
(obp.policy.logistic.LogisticEpsilonGreedy method)
(obp.policy.logistic.LogisticTS method)
(obp.policy.logistic.LogisticUCB method)
SelfNormalizedDoublyRobust (class in obp.ope.estimators)
SelfNormalizedInverseProbabilityWeighting (class in obp.ope.estimators)
set_params() (obp.ope.regression_model.RegressionModel method)
sigmoid() (in module obp.utils)
softmax() (in module obp.utils)
split_train_eval() (obp.dataset.multiclass.MultiClassToBanditReduction method)
summarize_estimators_comparison() (obp.ope.meta.OffPolicyEvaluation method)
summarize_off_policy_estimates() (obp.ope.meta.OffPolicyEvaluation method)
SwitchDoublyRobust (class in obp.ope.estimators)
SwitchInverseProbabilityWeighting (class in obp.ope.estimators)
SyntheticBanditDataset (class in obp.dataset.synthetic)
U
update_params() (obp.policy.base.BaseContextFreePolicy method)
(obp.policy.base.BaseContextualPolicy method)
(obp.policy.contextfree.BernoulliTS method)
(obp.policy.contextfree.EpsilonGreedy method)
(obp.policy.contextfree.Random method)
(obp.policy.linear.LinEpsilonGreedy method)
(obp.policy.linear.LinTS method)
(obp.policy.linear.LinUCB method)
(obp.policy.logistic.LogisticEpsilonGreedy method)
(obp.policy.logistic.LogisticTS method)
(obp.policy.logistic.LogisticUCB method)
V
visualize_off_policy_estimates() (obp.ope.meta.OffPolicyEvaluation method)
Read the Docs
v: latest
Versions
latest
stable
Downloads
pdf
html
epub
On Read the Docs
Project Home
Builds
Free document hosting provided by
Read the Docs
.