jubatus_core  0.1.2
Jubatus: Online machine learning framework for distributed environment
Public Member Functions | Private Attributes | List of all members
jubatus::core::bandit::softmax Class Reference

#include <softmax.hpp>

Inheritance diagram for jubatus::core::bandit::softmax:
Inheritance graph
Collaboration diagram for jubatus::core::bandit::softmax:
Collaboration graph

Public Member Functions

void clear ()
 
bool delete_arm (const std::string &arm_id)
 
arm_info_map get_arm_info (const std::string &player_id) const
 
void get_diff (diff_t &diff) const
 
storage::version get_version () const
 
void mix (const diff_t &lhs, diff_t &rhs) const
 
std::string name () const
 
void pack (framework::packer &pk) const
 
bool put_diff (const diff_t &diff)
 
bool register_arm (const std::string &arm_id)
 
bool register_reward (const std::string &player_id, const std::string &arm_id, double reward)
 
bool reset (const std::string &player_id)
 
std::string select_arm (const std::string &player_id)
 
 softmax (bool assume_unrewarded, double tau)
 
void unpack (msgpack::object o)
 
- Public Member Functions inherited from jubatus::core::bandit::bandit_base
 bandit_base ()
 
virtual ~bandit_base ()
 

Private Attributes

jubatus::util::math::random::mtrand rand_
 
summation_storage s_
 
double tau_
 

Additional Inherited Members

- Public Types inherited from jubatus::core::bandit::bandit_base
typedef jubatus::util::data::unordered_map< std::string, arm_info_map > diff_t
 

Detailed Description

Definition at line 30 of file softmax.hpp.

Constructor & Destructor Documentation

jubatus::core::bandit::softmax::softmax ( bool  assume_unrewarded,
double  tau 
)

Definition at line 32 of file softmax.cpp.

References JUBATUS_EXCEPTION.

33  : tau_(tau), s_(assume_unrewarded) {
34  if (tau <= 0) {
35  throw JUBATUS_EXCEPTION(
36  common::invalid_parameter("0 < tau"));
37  }
38 }
#define JUBATUS_EXCEPTION(e)
Definition: exception.hpp:79
summation_storage s_
Definition: softmax.hpp:63

Member Function Documentation

void jubatus::core::bandit::softmax::clear ( )
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 79 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::clear(), and s_.

Here is the call graph for this function:

bool jubatus::core::bandit::softmax::delete_arm ( const std::string &  arm_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 62 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::delete_arm(), and s_.

62  {
63  return s_.delete_arm(arm_id);
64 }
summation_storage s_
Definition: softmax.hpp:63
bool delete_arm(const std::string &arm_id)

Here is the call graph for this function:

arm_info_map jubatus::core::bandit::softmax::get_arm_info ( const std::string &  player_id) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 72 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::get_arm_info_map(), and s_.

72  {
73  return s_.get_arm_info_map(player_id);
74 }
arm_info_map get_arm_info_map(const std::string &player_id) const
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

void jubatus::core::bandit::softmax::get_diff ( diff_t &  diff) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 90 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::get_diff(), and s_.

90  {
91  s_.get_diff(diff);
92 }
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

storage::version jubatus::core::bandit::softmax::get_version ( ) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 100 of file softmax.cpp.

100  {
101  return storage::version();
102 }
void jubatus::core::bandit::softmax::mix ( const diff_t &  lhs,
diff_t &  rhs 
) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 96 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::mix(), and s_.

96  {
97  s_.mix(lhs, rhs);
98 }
static void mix(const table_t &lhs, table_t &rhs)
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

std::string jubatus::core::bandit::softmax::name ( ) const
inlinevirtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 48 of file softmax.hpp.

48  {
49  return "softmax";
50  }
void jubatus::core::bandit::softmax::pack ( framework::packer &  pk) const
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 83 of file softmax.cpp.

References s_.

83  {
84  pk.pack(s_);
85 }
summation_storage s_
Definition: softmax.hpp:63
bool jubatus::core::bandit::softmax::put_diff ( const diff_t &  diff)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 93 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::put_diff(), and s_.

93  {
94  return s_.put_diff(diff);
95 }
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

bool jubatus::core::bandit::softmax::register_arm ( const std::string &  arm_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 59 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::register_arm(), and s_.

59  {
60  return s_.register_arm(arm_id);
61 }
bool register_arm(const std::string &arm_id)
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

bool jubatus::core::bandit::softmax::register_reward ( const std::string &  player_id,
const std::string &  arm_id,
double  reward 
)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 66 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::register_reward(), and s_.

68  {
69  return s_.register_reward(player_id, arm_id, reward);
70 }
bool register_reward(const std::string &player_id, const std::string &arm_id, double reward)
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

bool jubatus::core::bandit::softmax::reset ( const std::string &  player_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 76 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::reset(), and s_.

76  {
77  return s_.reset(player_id);
78 }
bool reset(const std::string &player_id)
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

std::string jubatus::core::bandit::softmax::select_arm ( const std::string &  player_id)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 40 of file softmax.cpp.

References jubatus::core::bandit::summation_storage::get_arm_ids(), jubatus::core::bandit::summation_storage::get_expectation(), JUBATUS_EXCEPTION, jubatus::core::bandit::summation_storage::notify_selected(), rand_, s_, jubatus::core::bandit::select_by_weights(), and tau_.

40  {
41  const std::vector<std::string>& arms = s_.get_arm_ids();
42  if (arms.empty()) {
43  throw JUBATUS_EXCEPTION(
44  common::exception::runtime_error("arm is not registered"));
45  }
46 
47  std::vector<double> weights;
48  weights.reserve(arms.size());
49 
50  for (size_t i = 0; i < arms.size(); ++i) {
51  double expectation = s_.get_expectation(player_id, arms[i]);
52  weights.push_back(std::exp(expectation / tau_));
53  }
54  std::string result = arms[select_by_weights(weights, rand_)];
55  s_.notify_selected(player_id, result);
56  return result;
57 }
jubatus::util::math::random::mtrand rand_
Definition: softmax.hpp:62
int select_by_weights(const std::vector< double > &weights, mtrand &rand)
#define JUBATUS_EXCEPTION(e)
Definition: exception.hpp:79
double get_expectation(const std::string &player_id, const std::string &arm_id) const
const std::vector< std::string > & get_arm_ids() const
void notify_selected(const std::string &player_id, const std::string &arm_id)
summation_storage s_
Definition: softmax.hpp:63

Here is the call graph for this function:

void jubatus::core::bandit::softmax::unpack ( msgpack::object  o)
virtual

Implements jubatus::core::bandit::bandit_base.

Definition at line 86 of file softmax.cpp.

References s_.

86  {
87  o.convert(&s_);
88 }
summation_storage s_
Definition: softmax.hpp:63

Member Data Documentation

jubatus::util::math::random::mtrand jubatus::core::bandit::softmax::rand_
private

Definition at line 62 of file softmax.hpp.

Referenced by select_arm().

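summation_storage jubatus::core::bandit::softmax::s_
private

Definition at line 63 of file softmax.hpp.

Referenced by clear(), delete_arm(), get_arm_info(), get_diff(), mix(), pack(), put_diff(), register_arm(), register_reward(), reset(), select_arm(), and unpack().
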
double jubatus::core::bandit::softmax::tau_
private

Definition at line 61 of file softmax.hpp.

Referenced by select_arm().


The documentation for this class was generated from the following files: