jubatus_core  0.1.2
Jubatus: Online machine learning framework for distributed environment
re2_splitter.hpp
Go to the documentation of this file.
1 // Jubatus: Online machine learning framework for distributed environment
2 // Copyright (C) 2012 Preferred Networks and Nippon Telegraph and Telephone Corporation.
3 //
4 // This library is free software; you can redistribute it and/or
5 // modify it under the terms of the GNU Lesser General Public
6 // License version 2.1 as published by the Free Software Foundation.
7 //
8 // This library is distributed in the hope that it will be useful,
9 // but WITHOUT ANY WARRANTY; without even the implied warranty of
10 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 // Lesser General Public License for more details.
12 //
13 // You should have received a copy of the GNU Lesser General Public
14 // License along with this library; if not, write to the Free Software
15 // Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
16 
17 #ifndef JUBATUS_CORE_FV_CONVERTER_RE2_SPLITTER_HPP_
18 #define JUBATUS_CORE_FV_CONVERTER_RE2_SPLITTER_HPP_
19 
20 #include <map>
21 #include <string>
22 #include <utility>
23 #include <vector>
24 #include <re2/re2.h>
25 #include "jubatus/util/lang/scoped_ptr.h"
26 #include "word_splitter.hpp"
27 
28 namespace jubatus {
29 namespace core {
30 namespace fv_converter {
31 
// word_splitter implementation backed by an RE2 regular expression object.
// Only declarations appear in this header; the member definitions live
// elsewhere, so behavioural notes below are marked where they are assumptions.
32 class regexp_splitter : public word_splitter {
33  public:
// Constructs a splitter from a pattern string and an integer group selector.
//   regexp: regular expression text.
//   group:  NOTE(review): presumably the capture-group index whose match is
//           reported (0 = whole match) and is stored in group_ -- confirm
//           against the definition, including how invalid values are handled.
34  regexp_splitter(const std::string& regexp, int group);
// Splits `str` and reports the results through the output parameter `bounds`.
//   str:    input text to scan; taken by const reference.
//   bounds: receives one (size_t, size_t) pair per reported piece.
//           NOTE(review): presumably (begin offset, length) in bytes, and it
//           is not visible here whether existing contents are cleared first
//           -- verify against the definition / word_splitter contract.
// Declared const: the call does not modify the splitter's own members.
35  void split(
36  const std::string& str,
37  std::vector<std::pair<size_t, size_t> >& bounds) const;
38 
39  private:
// RE2 pattern object held by value.
// NOTE(review): presumably compiled from the constructor's `regexp` argument.
40  re2::RE2 re_;
// Group selector; NOTE(review): presumably the constructor's `group` argument.
41  int group_;
42 };
43 
44 } // namespace fv_converter
45 } // namespace core
46 } // namespace jubatus
47 
48 #endif // JUBATUS_CORE_FV_CONVERTER_RE2_SPLITTER_HPP_
regexp_splitter(const std::string &regexp, int group)
void split(const std::string &str, std::vector< std::pair< size_t, size_t > > &bounds) const