jubatus_core  0.1.2
Jubatus: Online machine learning framework for distributed environment
Public Member Functions | Private Member Functions | Private Attributes | List of all members
jubatus::core::bandit::exp3 Class Reference

#include <exp3.hpp>

Inheritance diagram for jubatus::core::bandit::exp3:
Inheritance graph
Collaboration diagram for jubatus::core::bandit::exp3:
Collaboration graph

Public Member Functions

void clear ()
 
bool delete_arm (const std::string &arm_id)
 
 exp3 (bool assume_unrewarded, double gamma)
 
arm_info_map get_arm_info (const std::string &player_id) const
 
void get_diff (diff_t &diff) const
 
storage::version get_version () const
 
void mix (const diff_t &lhs, diff_t &rhs) const
 
std::string name () const
 
void pack (framework::packer &pk) const
 
bool put_diff (const diff_t &diff)
 
bool register_arm (const std::string &arm_id)
 
bool register_reward (const std::string &player_id, const std::string &arm_id, double reward)
 
bool reset (const std::string &player_id)
 
std::string select_arm (const std::string &player_id)
 
void unpack (msgpack::object o)
 
- Public Member Functions inherited from jubatus::core::bandit::bandit_base
 bandit_base ()
 
virtual ~bandit_base ()
 

Private Member Functions

void calc_weights_ (const std::string &player_id, std::vector< double > &weights) const
 

Private Attributes

double gamma_
 
jubatus::util::math::random::mtrand rand_
 
summation_storage s_
 

Additional Inherited Members

- Public Types inherited from jubatus::core::bandit::bandit_base
typedef jubatus::util::data::unordered_map< std::string, arm_info_map > diff_t
 

Detailed Description

Definition at line 31 of file exp3.hpp.

Constructor & Destructor Documentation

jubatus::core::bandit::exp3::exp3 ( bool  assume_unrewarded,
double  gamma 
)

Definition at line 30 of file exp3.cpp.

References JUBATUS_EXCEPTION.

31  : gamma_(gamma), s_(assume_unrewarded) {
32  if (gamma < 0 || 1 < gamma) {
33  throw JUBATUS_EXCEPTION(
34  common::invalid_parameter("0 <= gamma <= 1"));
35  }
36 }
summation_storage s_
Definition: exp3.hpp:64
#define JUBATUS_EXCEPTION(e)
Definition: exception.hpp:79

Member Function Documentation

void jubatus::core::bandit::exp3::calc_weights_ ( const std::string &  player_id,
std::vector< double > &  weights 
) const
private

Definition at line 38 of file exp3.cpp.

References gamma_, jubatus::core::bandit::summation_storage::get_arm_ids(), jubatus::core::bandit::summation_storage::get_arm_info(), JUBATUS_EXCEPTION, s_, and jubatus::core::bandit::arm_info::weight.

Referenced by register_reward(), and select_arm().

39  {
40  const std::vector<std::string>& arms = s_.get_arm_ids();
41  if (arms.empty()) {
42  throw JUBATUS_EXCEPTION(
43  common::exception::runtime_error("arm is not registered"));
44  }
45 
46  const size_t n = arms.size();
47  weights.clear();
48  weights.reserve(n);
49  double total_weight = 0;
50  for (size_t i = 0; i < n; ++i) {
51  const double weight = std::exp(s_.get_arm_info(player_id, arms[i]).weight);
52  weights.push_back(weight);
53  total_weight += weight;
54  }
55  for (size_t i = 0; i < n; ++i) {
56  weights[i] = (1.0 - gamma_) * weights[i] / total_weight + gamma_ * n;
57  }
58 }
summation_storage s_
Definition: exp3.hpp:64
#define JUBATUS_EXCEPTION(e)
Definition: exception.hpp:79
const std::vector< std::string > & get_arm_ids() const
arm_info get_arm_info(const std::string &player_id, const std::string &arm_id) const

Here is the call graph for this function:

Here is the caller graph for this function:

void jubatus::core::bandit::exp3::clear ( )
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 102 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::clear(), and s_.

102  {
103  s_.clear();
104 }
summation_storage s_
Definition: exp3.hpp:64

Here is the call graph for this function:

bool jubatus::core::bandit::exp3::delete_arm ( const std::string &  arm_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 77 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::delete_arm(), and s_.

77  {
78  return s_.delete_arm(arm_id);
79 }
summation_storage s_
Definition: exp3.hpp:64
bool delete_arm(const std::string &arm_id)

Here is the call graph for this function:

arm_info_map jubatus::core::bandit::exp3::get_arm_info ( const std::string &  player_id) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 95 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::get_arm_info_map(), and s_.

95  {
96  return s_.get_arm_info_map(player_id);
97 }
summation_storage s_
Definition: exp3.hpp:64
arm_info_map get_arm_info_map(const std::string &player_id) const

Here is the call graph for this function:

void jubatus::core::bandit::exp3::get_diff ( diff_t &  diff) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 113 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::get_diff(), and s_.

113  {
114  s_.get_diff(diff);
115 }
summation_storage s_
Definition: exp3.hpp:64

Here is the call graph for this function:

storage::version jubatus::core::bandit::exp3::get_version ( ) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 123 of file exp3.cpp.

123  {
124  return storage::version();
125 }
void jubatus::core::bandit::exp3::mix ( const diff_t &  lhs,
diff_t &  rhs 
) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 119 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::mix(), and s_.

119  {
120  s_.mix(lhs, rhs);
121 }
summation_storage s_
Definition: exp3.hpp:64
static void mix(const table_t &lhs, table_t &rhs)

Here is the call graph for this function:

std::string jubatus::core::bandit::exp3::name ( ) const
inline virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 49 of file exp3.hpp.

49  {
50  return "exp3";
51  }
void jubatus::core::bandit::exp3::pack ( framework::packer &  pk) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 106 of file exp3.cpp.

References s_.

106  {
107  pk.pack(s_);
108 }
summation_storage s_
Definition: exp3.hpp:64
bool jubatus::core::bandit::exp3::put_diff ( const diff_t &  diff)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 116 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::put_diff(), and s_.

116  {
117  return s_.put_diff(diff);
118 }
summation_storage s_
Definition: exp3.hpp:64

Here is the call graph for this function:

bool jubatus::core::bandit::exp3::register_arm ( const std::string &  arm_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 74 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::register_arm(), and s_.

74  {
75  return s_.register_arm(arm_id);
76 }
summation_storage s_
Definition: exp3.hpp:64
bool register_arm(const std::string &arm_id)

Here is the call graph for this function:

bool jubatus::core::bandit::exp3::register_reward ( const std::string &  player_id,
const std::string &  arm_id,
double  reward 
)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 81 of file exp3.cpp.

References calc_weights_(), gamma_, jubatus::core::bandit::summation_storage::get_arm_ids(), jubatus::core::bandit::summation_storage::register_reward(), and s_.

83  {
84  const std::vector<std::string>& arms = s_.get_arm_ids();
85  size_t i = std::find(arms.begin(), arms.end(), arm_id) - arms.begin();
86  if (i >= arms.size()) {
87  return false;
88  }
89  std::vector<double> weights;
90  calc_weights_(player_id, weights);
91  return s_.register_reward(player_id, arm_id,
92  reward * weights[i] * gamma_ / arms.size());
93 }
summation_storage s_
Definition: exp3.hpp:64
bool register_reward(const std::string &player_id, const std::string &arm_id, double reward)
const std::vector< std::string > & get_arm_ids() const
void calc_weights_(const std::string &player_id, std::vector< double > &weights) const
Definition: exp3.cpp:38

Here is the call graph for this function:

bool jubatus::core::bandit::exp3::reset ( const std::string &  player_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 99 of file exp3.cpp.

References jubatus::core::bandit::summation_storage::reset(), and s_.

99  {
100  return s_.reset(player_id);
101 }
summation_storage s_
Definition: exp3.hpp:64
bool reset(const std::string &player_id)

Here is the call graph for this function:

std::string jubatus::core::bandit::exp3::select_arm ( const std::string &  player_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 60 of file exp3.cpp.

References calc_weights_(), jubatus::core::bandit::summation_storage::get_arm_ids(), JUBATUS_EXCEPTION, jubatus::core::bandit::summation_storage::notify_selected(), rand_, s_, and jubatus::core::bandit::select_by_weights().

60  {
61  const std::vector<std::string>& arms = s_.get_arm_ids();
62  if (arms.empty()) {
63  throw JUBATUS_EXCEPTION(
64  common::exception::runtime_error("arm is not registered"));
65  }
66 
67  std::vector<double> weights;
68  calc_weights_(player_id, weights);
69  std::string result = arms[select_by_weights(weights, rand_)];
70  s_.notify_selected(player_id, result);
71  return result;
72 }
summation_storage s_
Definition: exp3.hpp:64
int select_by_weights(const std::vector< double > &weights, mtrand &rand)
#define JUBATUS_EXCEPTION(e)
Definition: exception.hpp:79
const std::vector< std::string > & get_arm_ids() const
void notify_selected(const std::string &player_id, const std::string &arm_id)
void calc_weights_(const std::string &player_id, std::vector< double > &weights) const
Definition: exp3.cpp:38
jubatus::util::math::random::mtrand rand_
Definition: exp3.hpp:63

Here is the call graph for this function:

void jubatus::core::bandit::exp3::unpack ( msgpack::object  o)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 109 of file exp3.cpp.

References s_.

109  {
110  o.convert(&s_);
111 }
summation_storage s_
Definition: exp3.hpp:64

Member Data Documentation

double jubatus::core::bandit::exp3::gamma_
private

Definition at line 62 of file exp3.hpp.

Referenced by calc_weights_(), and register_reward().

jubatus::util::math::random::mtrand jubatus::core::bandit::exp3::rand_
private

Definition at line 63 of file exp3.hpp.

Referenced by select_arm().

summation_storage jubatus::core::bandit::exp3::s_
private

The documentation for this class was generated from the following files: