split.cc revision 0ae28bd5885b5daa526898fcf7c323dc2c3e1963
1// Ceres Solver - A fast non-linear least squares minimizer
2// Copyright 2010, 2011, 2012 Google Inc. All rights reserved.
3// http://code.google.com/p/ceres-solver/
4//
5// Redistribution and use in source and binary forms, with or without
6// modification, are permitted provided that the following conditions are met:
7//
8// * Redistributions of source code must retain the above copyright notice,
9//   this list of conditions and the following disclaimer.
10// * Redistributions in binary form must reproduce the above copyright notice,
11//   this list of conditions and the following disclaimer in the documentation
12//   and/or other materials provided with the distribution.
13// * Neither the name of Google Inc. nor the names of its contributors may be
14//   used to endorse or promote products derived from this software without
15//   specific prior written permission.
16//
17// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27// POSSIBILITY OF SUCH DAMAGE.
28//
29// Author: keir@google.com (Keir Mierle)
30
31#include <string>
32#include <vector>
33#include <iterator>
34#include "ceres/internal/port.h"
35
36namespace ceres {
37
38// If we know how much to allocate for a vector of strings, we can allocate the
39// vector<string> only once and directly to the right size. This saves in
40// between 33-66 % of memory space needed for the result, and runs faster in the
41// microbenchmarks.
42//
43// The reserve is only implemented for the single character delim.
44//
45// The implementation for counting is cut-and-pasted from
46// SplitStringToIteratorUsing. I could have written my own counting iterator,
47// and use the existing template function, but probably this is more clear and
48// more sure to get optimized to reasonable code.
static int CalculateReserveForVector(const string& full, const char* delim) {
  // Counting is only done when delim consists of exactly one character; an
  // empty or multi-character delim yields 0 (i.e. no reservation hint).
  const bool single_char_delim = delim[0] != '\0' && delim[1] == '\0';
  if (!single_char_delim) {
    return 0;
  }

  const char separator = delim[0];
  const char* cursor = full.data();
  const char* const limit = cursor + full.size();

  // A token is a maximal run of non-separator characters. Walk the buffer
  // once and count each position where such a run begins.
  int num_tokens = 0;
  bool inside_token = false;
  for (; cursor != limit; ++cursor) {
    const bool is_separator = (*cursor == separator);
    if (!is_separator && !inside_token) {
      ++num_tokens;
    }
    inside_token = !is_separator;
  }
  return num_tokens;
}
69
// Splits |full| into its non-empty tokens and writes each one through the
// output iterator |result|. Every character in |delim| acts as a separator;
// consecutive separators never produce empty tokens.
template <typename StringType, typename ITR>
static inline
void SplitStringToIteratorUsing(const StringType& full,
                                const char* delim,
                                ITR& result) {
  const bool single_char_delim = delim[0] != '\0' && delim[1] == '\0';
  if (single_char_delim) {
    // Fast path: a single separator character lets us scan the raw buffer
    // directly instead of going through the string search functions.
    const char separator = delim[0];
    const char* cursor = full.data();
    const char* const limit = cursor + full.size();
    while (cursor != limit) {
      if (*cursor == separator) {
        ++cursor;
        continue;
      }
      // cursor sits on the first character of a token; advance it to the
      // next occurrence of the separator (or to the end of the input).
      const char* const token_begin = cursor;
      do {
        ++cursor;
      } while (cursor != limit && *cursor != separator);
      *result++ = StringType(token_begin, cursor - token_begin);
    }
    return;
  }

  // General path: |delim| is a set of separator characters (possibly empty).
  string::size_type token_begin = full.find_first_not_of(delim);
  while (token_begin != string::npos) {
    const string::size_type token_end = full.find_first_of(delim, token_begin);
    if (token_end == string::npos) {
      // The last token runs to the end of the input.
      *result++ = full.substr(token_begin);
      break;
    }
    *result++ = full.substr(token_begin, token_end - token_begin);
    token_begin = full.find_first_not_of(delim, token_end);
  }
}
106
107void SplitStringUsing(const string& full,
108                      const char* delim,
109                      vector<string>* result) {
110  result->reserve(result->size() + CalculateReserveForVector(full, delim));
111  back_insert_iterator< vector<string> > it(*result);
112  SplitStringToIteratorUsing(full, delim, it);
113}
114
115}  // namespace ceres
116