17 #ifndef JUBATUS_CORE_BANDIT_SOFTMAX_HPP_
18 #define JUBATUS_CORE_BANDIT_SOFTMAX_HPP_
22 #include "jubatus/util/math/random.h"
32 softmax(
bool assume_unrewarded,
double tau);
34 std::string
select_arm(
const std::string& player_id);
40 const std::string& arm_id,
45 bool reset(
const std::string& player_id);
53 void unpack(msgpack::object o);
62 jubatus::util::math::random::mtrand
rand_;
70 #endif // JUBATUS_CORE_BANDIT_SOFTMAX_HPP_
bool put_diff(const diff_t &diff)
jubatus::util::math::random::mtrand rand_
bool reset(const std::string &player_id)
void get_diff(diff_t &diff) const
bool register_arm(const std::string &arm_id)
void pack(framework::packer &pk) const
jubatus::util::data::unordered_map< std::string, arm_info_map > diff_t
storage::version get_version() const
softmax(bool assume_unrewarded, double tau)
jubatus::util::data::unordered_map< std::string, arm_info > arm_info_map
void unpack(msgpack::object o)
std::string select_arm(const std::string &player_id)
bool delete_arm(const std::string &arm_id)
void mix(const diff_t &lhs, diff_t &rhs) const
bool register_reward(const std::string &player_id, const std::string &arm_id, double reward)
arm_info_map get_arm_info(const std::string &player_id) const