jubatus_core  0.1.2
Jubatus: Online machine learning framework for distributed environment
space_splitter.cpp
Go to the documentation of this file.
1 // Jubatus: Online machine learning framework for distributed environment
2 // Copyright (C) 2011 Preferred Networks and Nippon Telegraph and Telephone Corporation.
3 //
4 // This library is free software; you can redistribute it and/or
5 // modify it under the terms of the GNU Lesser General Public
6 // License version 2.1 as published by the Free Software Foundation.
7 //
8 // This library is distributed in the hope that it will be useful,
9 // but WITHOUT ANY WARRANTY; without even the implied warranty of
10 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 // Lesser General Public License for more details.
12 //
13 // You should have received a copy of the GNU Lesser General Public
14 // License along with this library; if not, write to the Free Software
15 // Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
16 
17 #include "space_splitter.hpp"
18 
19 #include <string>
20 #include <utility>
21 #include <vector>
22 
23 namespace jubatus {
24 namespace core {
25 namespace fv_converter {
26 
27 namespace {
28 
29 const char* SPACES = " \t\f\n\r\v";  // token delimiters: space, tab, form feed, newline, carriage return, vertical tab
30 
31 } // namespace
32 
33 void space_splitter::split(  // NOTE(review): header line restored; class name inferred from the file name -- confirm against space_splitter.hpp
34  const std::string& string,  // text to scan for tokens separated by SPACES characters
35  std::vector<std::pair<size_t, size_t> >& ret_boundaries) const {  // receives one (start offset, length) pair per token
36  std::vector<std::pair<size_t, size_t> > bounds;  // built locally; handed to the caller only at the very end
37 
38  size_t last = 0;  // offset at which the next search starts
39  while (true) {
40  size_t begin = string.find_first_not_of(SPACES, last);  // skip delimiters in front of the next token
41  if (begin == std::string::npos) {
42  break;  // nothing but delimiters (or nothing at all) remains
43  }
44 
45  size_t end = string.find_first_of(SPACES, begin);  // first delimiter after the token
46  if (end == std::string::npos) {
47  size_t len = string.size() - begin;  // last token runs to the end of the string
48  bounds.push_back(std::make_pair(begin, len));
49  break;
50  } else {
51  size_t len = end - begin;
52  bounds.push_back(std::make_pair(begin, len));
53  last = end;  // resume at the delimiter that ended this token
54  }
55  }
56 
57  bounds.swap(ret_boundaries);  // replaces whatever ret_boundaries held before the call
58 }
59 
60 } // namespace fv_converter
61 } // namespace core
62 } // namespace jubatus
void split(const std::string &string, std::vector< std::pair< size_t, size_t > > &ret_boundaries) const