// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

// Author: kenton@google.com (Kenton Varda)
//  Based on original Protocol Buffers design by
//  Sanjay Ghemawat, Jeff Dean, and others.
//
// Utility class for writing text to a ZeroCopyOutputStream.
36 37#ifndef GOOGLE_PROTOBUF_IO_PRINTER_H__ 38#define GOOGLE_PROTOBUF_IO_PRINTER_H__ 39 40#include <string> 41#include <map> 42#include <vector> 43#include <google/protobuf/stubs/common.h> 44 45namespace google { 46namespace protobuf { 47namespace io { 48 49class ZeroCopyOutputStream; // zero_copy_stream.h 50 51// Records annotations about a Printer's output. 52class LIBPROTOBUF_EXPORT AnnotationCollector { 53 public: 54 // Records that the bytes in file_path beginning with begin_offset and ending 55 // before end_offset are associated with the SourceCodeInfo-style path. 56 virtual void AddAnnotation(size_t begin_offset, size_t end_offset, 57 const string& file_path, 58 const vector<int>& path) = 0; 59 60 virtual ~AnnotationCollector() {} 61}; 62 63// Records annotations about a Printer's output to the given protocol buffer, 64// assuming that the buffer has an ::Annotation message exposing path, 65// source_file, begin and end fields. 66template <typename AnnotationProto> 67class AnnotationProtoCollector : public AnnotationCollector { 68 public: 69 // annotation_proto is the protocol buffer to which new Annotations should be 70 // added. It is not owned by the AnnotationProtoCollector. 71 explicit AnnotationProtoCollector(AnnotationProto* annotation_proto) 72 : annotation_proto_(annotation_proto) {} 73 74 // Override for AnnotationCollector::AddAnnotation. 75 virtual void AddAnnotation(size_t begin_offset, size_t end_offset, 76 const string& file_path, const vector<int>& path) { 77 typename AnnotationProto::Annotation* annotation = 78 annotation_proto_->add_annotation(); 79 for (int i = 0; i < path.size(); ++i) { 80 annotation->add_path(path[i]); 81 } 82 annotation->set_source_file(file_path); 83 annotation->set_begin(begin_offset); 84 annotation->set_end(end_offset); 85 } 86 87 private: 88 // The protocol buffer to which new annotations should be added. 89 AnnotationProto* const annotation_proto_; 90}; 91 92// This simple utility class assists in code generation. 
It basically 93// allows the caller to define a set of variables and then output some 94// text with variable substitutions. Example usage: 95// 96// Printer printer(output, '$'); 97// map<string, string> vars; 98// vars["name"] = "Bob"; 99// printer.Print(vars, "My name is $name$."); 100// 101// The above writes "My name is Bob." to the output stream. 102// 103// Printer aggressively enforces correct usage, crashing (with assert failures) 104// in the case of undefined variables in debug builds. This helps greatly in 105// debugging code which uses it. 106// 107// If a Printer is constructed with an AnnotationCollector, it will provide it 108// with annotations that connect the Printer's output to paths that can identify 109// various descriptors. In the above example, if person_ is a descriptor that 110// identifies Bob, we can associate the output string "My name is Bob." with 111// a source path pointing to that descriptor with: 112// 113// printer.Annotate("name", person_); 114// 115// The AnnotationCollector will be sent an annotation linking the output range 116// covering "Bob" to the logical path provided by person_. Tools may use 117// this association to (for example) link "Bob" in the output back to the 118// source file that defined the person_ descriptor identifying Bob. 119// 120// Annotate can only examine variables substituted during the last call to 121// Print. It is invalid to refer to a variable that was used multiple times 122// in a single Print call. 123// 124// In full generality, one may specify a range of output text using a beginning 125// substitution variable and an ending variable. The resulting annotation will 126// span from the first character of the substituted value for the beginning 127// variable to the last character of the substituted value for the ending 128// variable. 
For example, the Annotate call above is equivalent to this one: 129// 130// printer.Annotate("name", "name", person_); 131// 132// This is useful if multiple variables combine to form a single span of output 133// that should be annotated with the same source path. For example: 134// 135// Printer printer(output, '$'); 136// map<string, string> vars; 137// vars["first"] = "Alice"; 138// vars["last"] = "Smith"; 139// printer.Print(vars, "My name is $first$ $last$."); 140// printer.Annotate("first", "last", person_); 141// 142// This code would associate the span covering "Alice Smith" in the output with 143// the person_ descriptor. 144// 145// Note that the beginning variable must come before (or overlap with, in the 146// case of zero-sized substitution values) the ending variable. 147// 148// It is also sometimes useful to use variables with zero-sized values as 149// markers. This avoids issues with multiple references to the same variable 150// and also allows annotation ranges to span literal text from the Print 151// templates: 152// 153// Printer printer(output, '$'); 154// map<string, string> vars; 155// vars["foo"] = "bar"; 156// vars["function"] = "call"; 157// vars["mark"] = ""; 158// printer.Print(vars, "$function$($foo$,$foo$)$mark$"); 159// printer.Annotate("function", "rmark", call_); 160// 161// This code associates the span covering "call(bar,bar)" in the output with the 162// call_ descriptor. 163 164class LIBPROTOBUF_EXPORT Printer { 165 public: 166 // Create a printer that writes text to the given output stream. Use the 167 // given character as the delimiter for variables. 168 Printer(ZeroCopyOutputStream* output, char variable_delimiter); 169 170 // Create a printer that writes text to the given output stream. Use the 171 // given character as the delimiter for variables. If annotation_collector 172 // is not null, Printer will provide it with annotations about code written 173 // to the stream. annotation_collector is not owned by Printer. 
174 Printer(ZeroCopyOutputStream* output, char variable_delimiter, 175 AnnotationCollector* annotation_collector); 176 177 ~Printer(); 178 179 // Link a subsitution variable emitted by the last call to Print to the object 180 // described by descriptor. 181 template <typename SomeDescriptor> 182 void Annotate(const char* varname, const SomeDescriptor* descriptor) { 183 Annotate(varname, varname, descriptor); 184 } 185 186 // Link the output range defined by the substitution variables as emitted by 187 // the last call to Print to the object described by descriptor. The range 188 // begins at begin_varname's value and ends after the last character of the 189 // value substituted for end_varname. 190 template <typename SomeDescriptor> 191 void Annotate(const char* begin_varname, const char* end_varname, 192 const SomeDescriptor* descriptor) { 193 if (annotation_collector_ == NULL) { 194 // Annotations aren't turned on for this Printer, so don't pay the cost 195 // of building the location path. 196 return; 197 } 198 vector<int> path; 199 descriptor->GetLocationPath(&path); 200 Annotate(begin_varname, end_varname, descriptor->file()->name(), path); 201 } 202 203 // Print some text after applying variable substitutions. If a particular 204 // variable in the text is not defined, this will crash. Variables to be 205 // substituted are identified by their names surrounded by delimiter 206 // characters (as given to the constructor). The variable bindings are 207 // defined by the given map. 208 void Print(const map<string, string>& variables, const char* text); 209 210 // Like the first Print(), except the substitutions are given as parameters. 211 void Print(const char* text); 212 // Like the first Print(), except the substitutions are given as parameters. 213 void Print(const char* text, const char* variable, const string& value); 214 // Like the first Print(), except the substitutions are given as parameters. 
215 void Print(const char* text, const char* variable1, const string& value1, 216 const char* variable2, const string& value2); 217 // Like the first Print(), except the substitutions are given as parameters. 218 void Print(const char* text, const char* variable1, const string& value1, 219 const char* variable2, const string& value2, 220 const char* variable3, const string& value3); 221 // Like the first Print(), except the substitutions are given as parameters. 222 void Print(const char* text, const char* variable1, const string& value1, 223 const char* variable2, const string& value2, 224 const char* variable3, const string& value3, 225 const char* variable4, const string& value4); 226 // Like the first Print(), except the substitutions are given as parameters. 227 void Print(const char* text, const char* variable1, const string& value1, 228 const char* variable2, const string& value2, 229 const char* variable3, const string& value3, 230 const char* variable4, const string& value4, 231 const char* variable5, const string& value5); 232 // Like the first Print(), except the substitutions are given as parameters. 233 void Print(const char* text, const char* variable1, const string& value1, 234 const char* variable2, const string& value2, 235 const char* variable3, const string& value3, 236 const char* variable4, const string& value4, 237 const char* variable5, const string& value5, 238 const char* variable6, const string& value6); 239 // Like the first Print(), except the substitutions are given as parameters. 240 void Print(const char* text, const char* variable1, const string& value1, 241 const char* variable2, const string& value2, 242 const char* variable3, const string& value3, 243 const char* variable4, const string& value4, 244 const char* variable5, const string& value5, 245 const char* variable6, const string& value6, 246 const char* variable7, const string& value7); 247 // Like the first Print(), except the substitutions are given as parameters. 
248 void Print(const char* text, const char* variable1, const string& value1, 249 const char* variable2, const string& value2, 250 const char* variable3, const string& value3, 251 const char* variable4, const string& value4, 252 const char* variable5, const string& value5, 253 const char* variable6, const string& value6, 254 const char* variable7, const string& value7, 255 const char* variable8, const string& value8); 256 257 // Indent text by two spaces. After calling Indent(), two spaces will be 258 // inserted at the beginning of each line of text. Indent() may be called 259 // multiple times to produce deeper indents. 260 void Indent(); 261 262 // Reduces the current indent level by two spaces, or crashes if the indent 263 // level is zero. 264 void Outdent(); 265 266 // Write a string to the output buffer. 267 // This method does not look for newlines to add indentation. 268 void PrintRaw(const string& data); 269 270 // Write a zero-delimited string to output buffer. 271 // This method does not look for newlines to add indentation. 272 void PrintRaw(const char* data); 273 274 // Write some bytes to the output buffer. 275 // This method does not look for newlines to add indentation. 276 void WriteRaw(const char* data, int size); 277 278 // True if any write to the underlying stream failed. (We don't just 279 // crash in this case because this is an I/O failure, not a programming 280 // error.) 281 bool failed() const { return failed_; } 282 283 private: 284 // Link the output range defined by the substitution variables as emitted by 285 // the last call to Print to the object found at the SourceCodeInfo-style path 286 // in a file with path file_path. The range begins at the start of 287 // begin_varname's value and ends after the last character of the value 288 // substituted for end_varname. Note that begin_varname and end_varname 289 // may refer to the same variable. 
290 void Annotate(const char* begin_varname, const char* end_varname, 291 const string& file_path, const vector<int>& path); 292 293 const char variable_delimiter_; 294 295 ZeroCopyOutputStream* const output_; 296 char* buffer_; 297 int buffer_size_; 298 // The current position, in bytes, in the output stream. This is equivalent 299 // to the total number of bytes that have been written so far. This value is 300 // used to calculate annotation ranges in the substitutions_ map below. 301 size_t offset_; 302 303 string indent_; 304 bool at_start_of_line_; 305 bool failed_; 306 307 // A map from variable name to [start, end) offsets in the output buffer. 308 // These refer to the offsets used for a variable after the last call to 309 // Print. If a variable was used more than once, the entry used in 310 // this map is set to a negative-length span. For singly-used variables, the 311 // start offset is the beginning of the substitution; the end offset is the 312 // last byte of the substitution plus one (such that (end - start) is the 313 // length of the substituted string). 314 map<string, pair<size_t, size_t> > substitutions_; 315 316 // Returns true and sets range to the substitution range in the output for 317 // varname if varname was used once in the last call to Print. If varname 318 // was not used, or if it was used multiple times, returns false (and 319 // fails a debug assertion). 320 bool GetSubstitutionRange(const char* varname, pair<size_t, size_t>* range); 321 322 // If non-null, annotation_collector_ is used to store annotations about 323 // generated code. 324 AnnotationCollector* const annotation_collector_; 325 326 GOOGLE_DISALLOW_EVIL_CONSTRUCTORS(Printer); 327}; 328 329} // namespace io 330} // namespace protobuf 331 332} // namespace google 333#endif // GOOGLE_PROTOBUF_IO_PRINTER_H__ 334