stringpiece.h revision c73f511526464f8e56c242df80552e9b0d94ae3d
1// Copyright (C) 2009-2013, International Business Machines
2// Corporation and others. All Rights Reserved.
3//
4// Copyright 2001 and onwards Google Inc.
5// Author: Sanjay Ghemawat
6
7// This code is a contribution of Google code, and the style used here is
8// a compromise between the original Google code and the ICU coding guidelines.
9// For example, data types are ICU-ified (size_t,int->int32_t),
10// and API comments doxygen-ified, but function names and behavior are
11// as in the original, if possible.
12// Assertion-style error handling, not available in ICU, was changed to
13// parameter "pinning" similar to UnicodeString.
14//
15// In addition, this is only a partial port of the original Google code,
16// limited to what was needed so far. The (nearly) complete original code
17// is in the ICU svn repository at icuhtml/trunk/design/strings/contrib
18// (see ICU ticket 6765, r25517).
19
20#ifndef __STRINGPIECE_H__
21#define __STRINGPIECE_H__
22
23/**
24 * \file
25 * \brief C++ API: StringPiece: Read-only byte string wrapper class.
26 */
27
28#include "unicode/utypes.h"
29#include "unicode/uobject.h"
30#include "unicode/std_string.h"
31
32// Arghh!  I wish C++ literals were "string".
33
34U_NAMESPACE_BEGIN
35
36/**
37 * A string-like object that points to a sized piece of memory.
38 *
39 * We provide non-explicit singleton constructors so users can pass
40 * in a "const char*" or a "string" wherever a "StringPiece" is
41 * expected.
42 *
43 * Functions or methods may use const StringPiece& parameters to accept either
44 * a "const char*" or a "string" value that will be implicitly converted to
45 * a StringPiece.
46 *
47 * Systematic usage of StringPiece is encouraged as it will reduce unnecessary
48 * conversions from "const char*" to "string" and back again.
49 *
50 * @stable ICU 4.2
51 */
52class U_COMMON_API StringPiece : public UMemory {
53 private:
54  const char*   ptr_;
55  int32_t       length_;
56
57 public:
58  /**
59   * Default constructor, creates an empty StringPiece.
60   * @stable ICU 4.2
61   */
62  StringPiece() : ptr_(NULL), length_(0) { }
63  /**
64   * Constructs from a NUL-terminated const char * pointer.
65   * @param str a NUL-terminated const char * pointer
66   * @stable ICU 4.2
67   */
68  StringPiece(const char* str);
69#if U_HAVE_STD_STRING
70  /**
71   * Constructs from a std::string.
72   * @stable ICU 4.2
73   */
74  StringPiece(const std::string& str)
75    : ptr_(str.data()), length_(static_cast<int32_t>(str.size())) { }
76#endif
77  /**
78   * Constructs from a const char * pointer and a specified length.
79   * @param offset a const char * pointer (need not be terminated)
80   * @param len the length of the string; must be non-negative
81   * @stable ICU 4.2
82   */
83  StringPiece(const char* offset, int32_t len) : ptr_(offset), length_(len) { }
84  /**
85   * Substring of another StringPiece.
86   * @param x the other StringPiece
87   * @param pos start position in x; must be non-negative and <= x.length().
88   * @stable ICU 4.2
89   */
90  StringPiece(const StringPiece& x, int32_t pos);
91  /**
92   * Substring of another StringPiece.
93   * @param x the other StringPiece
94   * @param pos start position in x; must be non-negative and <= x.length().
95   * @param len length of the substring;
96   *            must be non-negative and will be pinned to at most x.length() - pos.
97   * @stable ICU 4.2
98   */
99  StringPiece(const StringPiece& x, int32_t pos, int32_t len);
100
101  /**
102   * Returns the string pointer. May be NULL if it is empty.
103   *
104   * data() may return a pointer to a buffer with embedded NULs, and the
105   * returned buffer may or may not be null terminated.  Therefore it is
106   * typically a mistake to pass data() to a routine that expects a NUL
107   * terminated string.
108   * @return the string pointer
109   * @stable ICU 4.2
110   */
111  const char* data() const { return ptr_; }
112  /**
113   * Returns the string length. Same as length().
114   * @return the string length
115   * @stable ICU 4.2
116   */
117  int32_t size() const { return length_; }
118  /**
119   * Returns the string length. Same as size().
120   * @return the string length
121   * @stable ICU 4.2
122   */
123  int32_t length() const { return length_; }
124  /**
125   * Returns whether the string is empty.
126   * @return TRUE if the string is empty
127   * @stable ICU 4.2
128   */
129  UBool empty() const { return length_ == 0; }
130
131  /**
132   * Sets to an empty string.
133   * @stable ICU 4.2
134   */
135  void clear() { ptr_ = NULL; length_ = 0; }
136
137  /**
138   * Reset the stringpiece to refer to new data.
139   * @param xdata pointer the new string data.  Need not be nul terminated.
140   * @param len the length of the new data
141   * @stable ICU 4.8
142   */
143  void set(const char* xdata, int32_t len) { ptr_ = xdata; length_ = len; }
144
145  /**
146   * Reset the stringpiece to refer to new data.
147   * @param str a pointer to a NUL-terminated string.
148   * @stable ICU 4.8
149   */
150  void set(const char* str);
151
152  /**
153   * Removes the first n string units.
154   * @param n prefix length, must be non-negative and <=length()
155   * @stable ICU 4.2
156   */
157  void remove_prefix(int32_t n) {
158    if (n >= 0) {
159      if (n > length_) {
160        n = length_;
161      }
162      ptr_ += n;
163      length_ -= n;
164    }
165  }
166
167  /**
168   * Removes the last n string units.
169   * @param n suffix length, must be non-negative and <=length()
170   * @stable ICU 4.2
171   */
172  void remove_suffix(int32_t n) {
173    if (n >= 0) {
174      if (n <= length_) {
175        length_ -= n;
176      } else {
177        length_ = 0;
178      }
179    }
180  }
181
182  /**
183   * Maximum integer, used as a default value for substring methods.
184   * @stable ICU 4.2
185   */
186  static const int32_t npos; // = 0x7fffffff;
187
188  /**
189   * Returns a substring of this StringPiece.
190   * @param pos start position; must be non-negative and <= length().
191   * @param len length of the substring;
192   *            must be non-negative and will be pinned to at most length() - pos.
193   * @return the substring StringPiece
194   * @stable ICU 4.2
195   */
196  StringPiece substr(int32_t pos, int32_t len = npos) const {
197    return StringPiece(*this, pos, len);
198  }
199};
200
201/**
202 * Global operator == for StringPiece
203 * @param x The first StringPiece to compare.
204 * @param y The second StringPiece to compare.
205 * @return TRUE if the string data is equal
206 * @stable ICU 4.8
207 */
208U_EXPORT UBool U_EXPORT2
209operator==(const StringPiece& x, const StringPiece& y);
210
211/**
212 * Global operator != for StringPiece
213 * @param x The first StringPiece to compare.
214 * @param y The second StringPiece to compare.
215 * @return TRUE if the string data is not equal
216 * @stable ICU 4.8
217 */
218inline UBool operator!=(const StringPiece& x, const StringPiece& y) {
219  return !(x == y);
220}
221
222U_NAMESPACE_END
223
224#endif  // __STRINGPIECE_H__
225