1324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver#!/usr/bin/ruby
2324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver# encoding: utf-8
3324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
4324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver=begin LICENSE
5324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
6324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver[The "BSD licence"]
7324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverCopyright (c) 2009-2010 Kyle Yetter
8324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverAll rights reserved.
9324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
10324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverRedistribution and use in source and binary forms, with or without
11324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruvermodification, are permitted provided that the following conditions
12324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruverare met:
13324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
14324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver 1. Redistributions of source code must retain the above copyright
15324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver    notice, this list of conditions and the following disclaimer.
16324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver 2. Redistributions in binary form must reproduce the above copyright
17324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver    notice, this list of conditions and the following disclaimer in the
18324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver    documentation and/or other materials provided with the distribution.
19324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver 3. The name of the author may not be used to endorse or promote products
20324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver    derived from this software without specific prior written permission.
21324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
22324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverTHIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
23324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverIMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
24324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverOF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
25324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverIN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
26324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverINCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
27324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverNOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverDATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverTHEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
31324c4644fee44b9898524c09511bd33c3f12e2dfBen GruverTHIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
33324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver=end
34324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
35324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruvermodule ANTLR3
36324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruvermodule Profile
=begin rdoc ANTLR3::Profile::ParserEvents

ANTLR3::Profile::ParserEvents expands basic debugging events for use by
recognition code generated by ANTLR when called with the <tt>-profile</tt>
switch.

=end
module ParserEvents
  include ANTLR3::Debug::ParserEvents

  # Mix-in hook. After the inherited hook has run, a class (but not a
  # module) that includes ParserEvents gains a +profile?+ class method
  # that returns true.
  def self.included( klass )
    super
    if klass.is_a?( ::Class )
      def klass.profile?
        true
      end
    end
  end

  # Installs a Profiler bound to this recognizer as the debug listener
  # unless the caller already supplied one in
  # <tt>options[ :debug_listener ]</tt>, then hands both arguments to the
  # inherited initializer.
  #
  # Note that the default listener is stored in the caller's +options+
  # hash itself.
  def initialize( stream, options = {} )
    options[ :debug_listener ] ||= Profiler.new( self )
    super( stream, options )
  end

  # Lets the listener record a memoization cache hit or miss for +rule+
  # before deferring to the inherited check.
  # NOTE(review): @debug_listener is presumably assigned by the inherited
  # initializer from options[ :debug_listener ] -- confirm.
  def already_parsed_rule?( rule )
    @debug_listener.examine_rule_memoization( rule )
    super
  end

  # The profile object currently held by the debug listener.
  def profile
    @debug_listener.profile
  end

  # Notifies the listener that a memoization entry is being recorded and
  # then performs the inherited memoization with the same arguments.
  def memoize( rule, start_index, success )
    # forward this method's own arguments; the previous code referenced
    # undefined names here and raised NameError on every call
    @debug_listener.memoize( rule, start_index, success )
    super
  end
end
75324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
# An Array of numeric samples with a few descriptive statistics.
class DataSet < ::Array
  include ::Math

  # Sum of all samples; 0 when the set is empty.
  def total
    inject( 0 ) { |sum, sample| sum + sample }
  end

  # Arithmetic mean of the samples as a Float; 0.0 when the set is empty.
  def average
    empty? ? 0.0 : total.to_f / length
  end

  # Sample variance (sum of squared deviations divided by n - 1).
  #
  # Sets with fewer than two samples have no spread to measure, so 0.0 is
  # returned instead of dividing by zero (which would produce NaN for a
  # single sample).
  def variance
    length < 2 and return( 0.0 )
    mean = average
    inject( 0.0 ) { |sum, sample| sum + ( sample - mean ) ** 2 } / ( length - 1 )
  end

  # Square root of #variance.
  def standard_deviation
    sqrt( variance )
  end
end
93324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
94324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
# Profile is the record of statistics collected for one profiled parse.
# The Struct is only built when the constant does not exist yet, so an
# existing definition is never replaced.
unless const_defined?( :Profile )
  profile_fields = [
    :grammar_file,
    :parser_class,
    :top_rule,
    :rule_invocations,
    :guessing_rule_invocations,
    :rule_invocation_depth,
    :fixed_looks,
    :cyclic_looks,
    :syntactic_predicate_looks,
    :memoization_cache_entries,
    :memoization_cache_hits,
    :memoization_cache_misses,
    :tokens,
    :hidden_tokens,
    :characters_matched,
    :hidden_characters_matched,
    :semantic_predicates,
    :syntactic_predicates,
    :reported_errors
  ]
  Profile = Struct.new( *profile_fields )
end
106324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
class Profile
  # Builds a profile with every counter set to 0, the three identifying
  # fields (grammar file, parser class, top rule) set to nil and the three
  # lookahead collections set to empty DataSet instances.
  def initialize
    init_values = Array.new( self.class.members.length, 0 )
    super( *init_values )
    self.top_rule = self.parser_class = self.grammar_file = nil
    self.fixed_looks = DataSet.new
    self.cyclic_looks = DataSet.new
    self.syntactic_predicate_looks = DataSet.new
  end

  # Number of fixed-lookahead decisions recorded.
  def fixed_decisions
    fixed_looks.length
  end

  # Number of cyclic (arbitrary lookahead) decisions recorded.
  def cyclic_decisions
    cyclic_looks.length
  end

  # Number of backtracking (syntactic predicate) decisions recorded.
  def backtracking_decisions
    syntactic_predicate_looks.length
  end

  # Renders the collected statistics as an 80-column ASCII table and
  # returns it as a String.
  #
  # A lookahead category with no samples reports 0 for its minimum and
  # maximum k, and a profile without a parser class prints an empty class
  # name, so a report can always be produced.
  def generate_report
    wide_rule  = '+' + '-' * 78 + "+\n"
    split_rule = '+' + '-' * 68 + '+' + '-' * 9 + "+\n"
    heading    = lambda { |title| '| ' + title.center( 76 ) + " |\n" }
    banner     = lambda { |text| "| #{ text }".ljust( 78 ) + " |\n" }
    int_row    = lambda { |label, value| "| %-66s | %7i |\n" % [ label, value ] }
    text_row   = lambda { |label, value| "| %-66s | %7s |\n" % [ label, value ] }

    # parser_class stays nil until a profiler fills it in
    parser_name = parser_class ? parser_class.name : nil

    counter_sections = [
      [ "Rule Invocations", [
        [ "Total Invocations", rule_invocations ],
        [ "``Guessing'' Invocations", guessing_rule_invocations ],
        [ "Deepest Level of Invocation", rule_invocation_depth ]
      ] ],
      [ "Execution Events", [
        [ "Semantic Predicates Evaluated", semantic_predicates ],
        [ "Syntactic Predicates Evaluated", syntactic_predicates ],
        [ "Errors Reported", reported_errors ]
      ] ],
      [ "Token and Character Data", [
        [ "Tokens Consumed", tokens ],
        [ "Hidden Tokens Consumed", hidden_tokens ],
        [ "Characters Matched", characters_matched ],
        [ "Hidden Characters Matched", hidden_characters_matched ]
      ] ],
      [ "Memoization", [
        [ "Cache Entries", memoization_cache_entries ],
        [ "Cache Hits", memoization_cache_hits ],
        [ "Cache Misses", memoization_cache_misses ]
      ] ]
    ]

    lookahead_sections = [
      [ 'Fixed Lookahead (k)', fixed_looks ],
      [ 'Arbitrary Lookahead (k)', cyclic_looks ],
      [ 'Backtracking (Syntactic Predicate)', syntactic_predicate_looks ]
    ]

    report = [ wide_rule, heading.call( "ANTLR Rule Profile" ), wide_rule ]
    report << banner.call( "Generated at #{ Time.now }" )
    report << banner.call( "Profiled #{ parser_name }##{ top_rule }" )
    report << banner.call( "Rule source generated from grammar file #{ grammar_file }" )
    report << wide_rule

    counter_sections.each do |title, rows|
      report << heading.call( title ) << split_rule
      rows.each { |label, value| report << int_row.call( label, value ) }
      report << split_rule
    end

    lookahead_sections.each do |name, set|
      mean  = '%4.2f' % set.average
      stdev = '%4.2f' % set.standard_deviation
      report << heading.call( "#{ name } Decisions" ) << split_rule
      report << int_row.call( "Count", set.length )
      # min and max are nil for an empty set, which %i cannot format
      report << int_row.call( "Minimum k", set.min || 0 )
      report << int_row.call( "Maximum k", set.max || 0 )
      report << text_row.call( "Average k", mean )
      report << text_row.call( "Standard Deviation of k", stdev )
      report << split_rule
    end

    return( report.join( '' ) )
  end
end
185324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruver
=begin rdoc ANTLR3::Profile::Profiler

When ANTLR is run with the <tt>-profile</tt> switch, it generates recognition
code that keeps statistics about the decision logic performed while parsing
any given input. This information can be used to help refactor a slow grammar.
Profiler is an event listener that performs all of the profiling accounting and
builds a simple report to present the various statistics.

=end
class Profiler
  include Debug::EventListener
  include Constants

  PROTOCOL_VERSION = 2

  # the recognizer whose activity is being profiled
  attr_accessor :parser

  # current rule nesting depth and decision nesting depth
  attr_reader :rule_level
  attr_reader :decision_level

  # tracks the maximum look value for the current decision
  # (maxLookaheadInCurrentDecision in java Profiler)
  attr_reader :decision_look

  # the last token consumed
  # (lastTokenConsumed in java Profiler)
  attr_reader :last_token

  # input indexes at which the currently open decisions started
  attr_reader :look_stack

  # the Profile being filled in; nil until the first rule is entered
  attr_reader :profile

  # object the report is appended to with << when profiling terminates;
  # nil disables report output
  attr_accessor :output

  # parser:: the recognizer to observe
  # output:: optional sink for the final report
  def initialize( parser = nil, output = nil )
    @parser = parser
    @profile = nil
    @rule_level = 0
    @decision_level = 0
    @decision_look = 0
    @last_token = nil
    @look_stack = []
    @output = output
  end

  # Starts a fresh profiling session: a new Profile and zeroed state.
  def commence
    @profile = Profile.new
    @rule_level = 0
    @decision_level = 0
    @decision_look = 0
    @last_token = nil
    @look_stack = []
  end

  # Counts a rule invocation and tracks the deepest nesting level seen.
  # Entering a rule at nesting level 0 begins a new session and records
  # the grammar file, parser class and rule name on the new profile.
  def enter_rule( grammar_file_name, rule_name )
    if @rule_level.zero?
      commence
      @profile.grammar_file = grammar_file_name
      @profile.parser_class = @parser.class
      @profile.top_rule = rule_name
    end
    @rule_level += 1
    @profile.rule_invocations += 1
    @profile.rule_invocation_depth < @rule_level and
      @profile.rule_invocation_depth = @rule_level
  end

  def exit_rule( grammar_file_name, rule_name )
    @rule_level -= 1
  end

  # Records a memoization cache miss (plus a guessing rule invocation)
  # when the parser has no memoized result for +rule+ at the current
  # input index, and a cache hit otherwise.
  def examine_rule_memoization( rule )
    stop_index = @parser.rule_memoization( rule, @parser.input.index )
    if stop_index == MEMO_RULE_UNKNOWN
      @profile.memoization_cache_misses += 1
      @profile.guessing_rule_invocations += 1
    else
      @profile.memoization_cache_hits += 1
    end
  end

  # Counts a new memoization cache entry; the arguments are not used.
  def memoize( rule, start_index, success )
    @profile.memoization_cache_entries += 1
  end

  # Opens a decision and remembers the input index at which it started.
  def enter_decision( decision_number )
    @decision_level += 1
    @look_stack << @parser.input.index
  end

  # Closes the innermost decision, filing its maximum lookahead under the
  # cyclic or the fixed collection depending on the parser's
  # cyclic-decision flag, then resets that flag and the lookahead tracker.
  def exit_decision( decision_number )
    @look_stack.pop
    @decision_level -= 1
    if @parser.cyclic_decision?
      @profile.cyclic_looks << @decision_look
    else
      @profile.fixed_looks << @decision_look
    end

    @parser.cyclic_decision = false
    @decision_look = 0
  end

  def consume_token( token )
    @last_token = token
  end

  # true while at least one decision is open
  def in_decision?
    return( @decision_level > 0 )
  end

  def consume_hidden_token( token )
    @last_token = token
  end

  # Updates the maximum lookahead depth of the current decision. The depth
  # is the lookahead offset +i+ plus the distance travelled since the
  # decision started, not counting hidden tokens in between. Ignored
  # outside of a decision.
  def look( i, token )
    in_decision? or return
    starting_index = look_stack.last
    input = @parser.input
    this_ref_index = input.index
    num_hidden = input.tokens( starting_index, this_ref_index ).count { |t| t.hidden? }
    depth = i + this_ref_index - starting_index - num_hidden
    @decision_look = depth if depth > @decision_look
  end

  def end_backtrack( level, successful )
    @profile.syntactic_predicate_looks << @decision_look
  end

  def recognition_exception( error )
    @profile.reported_errors += 1
  end

  # Semantic predicates are only counted while a decision is open.
  def semantic_predicate( result, predicate )
    in_decision? and @profile.semantic_predicates += 1
  end

  # Finalizes the token and character totals from the parser's input and
  # writes the report to the configured output. Does nothing when no rule
  # was ever entered, since there is then no profile to finalize.
  def terminate
    @profile or return
    input = @parser.input
    hidden_tokens = input.select { |token| token.hidden? }
    @profile.hidden_tokens = hidden_tokens.length
    @profile.tokens = input.tokens.length
    # best effort: a token whose text length cannot be read adds nothing
    @profile.hidden_characters_matched = hidden_tokens.inject( 0 ) do |count, token|
      count + token.text.length rescue count
    end
    # best effort: falls back to 0 when no usable token is available
    @profile.characters_matched = ( @last_token || input.tokens.last ).stop + 1 rescue 0
    write_report
  end

  # Appends the generated report to the output object, if there is one.
  # An output that does not respond to << or that raises an IOError
  # produces a warning instead of an exception.
  def write_report
    ( @output.nil? or @profile.nil? ) and return
    @output << @profile.generate_report
  rescue NoMethodError => error
    if error.name.to_s == '<<'
      message = "[%s @ %s]: failed to write report to %p as it does not respond to :<<"
      warn( message % [ __FILE__, __LINE__, @output ] )
    else raise
    end
  rescue IOError => error
    $stderr.puts( Util.tidy( <<-END ) % [ __FILE__, __LINE__, @output, error.class, error.message ] )
    | [%s @ %s]: failed to write profile report to %p due to an IO Error:
    |   %s: %s
    END
    $stderr.puts( error.backtrace.map { |call| "  - #{ call }" }.join( "\n" ) )
  end

  # The formatted report for the current profile, or an empty string when
  # nothing has been profiled yet.
  def report
    @profile ? @profile.generate_report : ''
  end

  alias to_s report
end
359324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruverend
360324c4644fee44b9898524c09511bd33c3f12e2dfBen Gruverend
361