ccc-analyzer revision 6e53137f447a455ccddc2cae5aa000d56fe4b50b
1#!/usr/bin/env perl
2#
3#                     The LLVM Compiler Infrastructure
4#
5# This file is distributed under the University of Illinois Open Source
6# License. See LICENSE.TXT for details.
7#
8##===----------------------------------------------------------------------===##
9#
10#  A script designed to interpose between the build system and gcc.  It invokes
11#  both gcc and the static analyzer.
12#
13##===----------------------------------------------------------------------===##
14
15use strict;
16use warnings;
17use FindBin;
18use Cwd qw/ getcwd abs_path /;
19use File::Temp qw/ tempfile /;
20use File::Path qw / mkpath /;
21use File::Basename;
22use Text::ParseWords;
23
24##===----------------------------------------------------------------------===##
25# Compiler command setup.
26##===----------------------------------------------------------------------===##
27
# $Compiler is the native compiler every invocation is forwarded to; $Clang is
# the clang driver used for the analysis.  Both can be overridden through the
# environment (CCC_CC / CLANG, or CCC_CXX / CLANG_CXX when this script is
# invoked under a name containing "c++-analyzer").
my $Compiler;
my $Clang;
my $DefaultCCompiler;
my $DefaultCXXCompiler;

# Decide on the platform from Perl's own OS name instead of matching the
# output of `uname -a`: that output also contains the host name, so a
# non-Darwin machine whose host name contains "Darwin" was misdetected, and
# every single compile paid for an extra process.
if ($^O eq 'darwin') {
  $DefaultCCompiler = 'clang';
  $DefaultCXXCompiler = 'clang++';
}
else {
  $DefaultCCompiler = 'gcc';
  $DefaultCXXCompiler = 'g++';
}

if ($FindBin::Script =~ /c\+\+-analyzer/) {
  # C++ mode.
  $Compiler = $ENV{'CCC_CXX'};
  if (!defined $Compiler) { $Compiler = $DefaultCXXCompiler; }

  $Clang = $ENV{'CLANG_CXX'};
  if (!defined $Clang) { $Clang = 'clang++'; }
}
else {
  # C mode.
  $Compiler = $ENV{'CCC_CC'};
  if (!defined $Compiler) { $Compiler = $DefaultCCompiler; }

  $Clang = $ENV{'CLANG'};
  if (!defined $Clang) { $Clang = 'clang'; }
}
55
56##===----------------------------------------------------------------------===##
57# Cleanup.
58##===----------------------------------------------------------------------===##
59
# Failure reporting is on unless CCC_REPORT_FAILURES says otherwise.
my $ReportFailures = $ENV{'CCC_REPORT_FAILURES'};
if (!defined $ReportFailures) { $ReportFailures = 1; }

# Paths of the report files created by this run; they stay undefined unless
# the main logic sets them.
my $CleanupFile;
my $ResultFile;

# Remove any stale files at exit.
END {
  # Use unlink rather than `rm -f`: inside END, $? holds the status the
  # script is about to exit with, and running an external command overwrites
  # it.  unlink also avoids passing an unquoted path through the shell.
  if (defined $ResultFile && -z $ResultFile) {
    unlink $ResultFile;
  }
  if (defined $CleanupFile) {
    unlink $CleanupFile;
  }
}
75
76##----------------------------------------------------------------------------##
77#  Process Clang Crashes.
78##----------------------------------------------------------------------------##
79
# Map a language name to the file suffix used for its preprocessed output.
# The patterns are tried in order, most specific first; anything that matches
# none of them gets ".i".
sub GetPPExt {
  my ($Language) = @_;

  my @SuffixByPattern = (
    [ qr/objective-c\+\+/, ".mii" ],
    [ qr/objective-c/,     ".mi"  ],
    [ qr/c\+\+/,           ".ii"  ],
  );

  foreach my $Entry (@SuffixByPattern) {
    my ($Pattern, $Suffix) = @$Entry;
    return $Suffix if ($Language =~ $Pattern);
  }
  return ".i";
}
87
# Change this to 1 to have 'parser rejects' files included.
my $IncludeParserRejects = 0;

# Names of the failure categories written into failure reports.
my ($ParserRejects, $AttributeIgnored, $OtherError) =
  ("Parser Rejects", "Attribute Ignored", "Other Error");
93
# Run @Cmd without a shell and append its stdout and stderr to $LogFile.
# Best effort: nothing is reported if the command cannot be started.
sub AppendCommandOutput {
  my ($LogFile, @Cmd) = @_;

  require POSIX;
  my $pid = fork();
  return if (!defined $pid);
  if ($pid == 0) {
    # Child: point both output streams at the log, then become the command.
    # Leave with _exit so the script's END block does not run in the child.
    open(STDOUT, ">>", $LogFile) or POSIX::_exit(127);
    open(STDERR, ">&", \*STDOUT) or POSIX::_exit(127);
    { exec { $Cmd[0] } @Cmd; }
    POSIX::_exit(127);
  }
  waitpid($pid, 0);
  return;
}

# Record a clang failure for $file under "$HtmlDir/failures".
#
# Arguments:
#   $Clang     - clang executable used to produce the preprocessed source.
#   $Lang      - language name; selects the suffix of the preprocessed file.
#   $file      - source file that triggered the failure.
#   $Args      - array ref of clang arguments; "-E -o <file>" is appended.
#   $HtmlDir   - report directory; output goes to its "failures" subdirectory.
#   $ErrorType - failure category; selects the file name prefix
#                ("clang_crash" unless it is one of the known categories).
#   $ofile     - file with clang's captured output; it is moved next to the
#                preprocessed file as "<name>.stderr.txt".
#
# Besides the preprocessed file this writes "<name>.info.txt" holding the
# absolute source path, the category, the arguments, `uname -a` and the
# output of "$Compiler -v".
#
# Returns the base name of the preprocessed file.  Dies if the info file
# cannot be created.
sub ProcessClangFailure {
  my ($Clang, $Lang, $file, $Args, $HtmlDir, $ErrorType, $ofile) = @_;
  my $Dir = "$HtmlDir/failures";
  mkpath $Dir;

  my $prefix = "clang_crash";
  if ($ErrorType eq $ParserRejects) {
    $prefix = "clang_parser_rejects";
  }
  elsif ($ErrorType eq $AttributeIgnored) {
    $prefix = "clang_attribute_ignored";
  }
  elsif ($ErrorType eq $OtherError) {
    $prefix = "clang_other_error";
  }

  # Generate the preprocessed file with Clang.
  my ($PPH, $PPFile) = tempfile( $prefix . "_XXXXXX",
                                 SUFFIX => GetPPExt($Lang),
                                 DIR => $Dir);
  system $Clang, @$Args, "-E", "-o", $PPFile;
  close ($PPH);

  # Create the info file.
  my $InfoFile = "$PPFile.info.txt";
  open (my $Info, ">", $InfoFile) or die "Cannot open $PPFile.info.txt\n";
  print $Info abs_path($file), "\n";
  print $Info "$ErrorType\n";
  print $Info "@$Args\n";
  close $Info;

  # Append the platform and compiler identification.  The commands are run
  # without a shell so that a report directory containing spaces or shell
  # metacharacters cannot break (or alter) the command line.
  AppendCommandOutput($InfoFile, 'uname', '-a');
  AppendCommandOutput($InfoFile, $Compiler, '-v');

  system 'mv',$ofile,"$PPFile.stderr.txt";
  return (basename $PPFile);
}
128
129##----------------------------------------------------------------------------##
130#  Running the analyzer.
131##----------------------------------------------------------------------------##
132
# Ask the clang driver which "-cc1" command it would run.
#
# Arguments:
#   $mode - driver mode flag placed right after "-###"
#           (the callers pass "-fsyntax-only" or "--analyze").
#   $Args - array ref of the remaining driver arguments.
#
# Runs "$Clang -### $mode @$Args", keeps the last output line containing
# "-cc1", splits it into shell words and returns an array ref of those words
# without the leading program name.
#
# Dies if the pipe or the fork fails, if no "-cc1" line is printed, or if the
# first word of that line does not contain "clang".
sub GetCCArgs {
  my $mode = shift;
  my $Args = shift;

  require POSIX;
  pipe (my $FromChild, my $ToParent) or die "cannot create pipe: $!\n";
  my $pid = fork();
  # fork returns undef on failure; comparing that with 0 would send the
  # parent down the child branch.
  die "cannot fork: $!\n" if (!defined $pid);
  if ($pid == 0) {
    close $FromChild;
    open(STDOUT,">&", $ToParent);
    open(STDERR,">&", $ToParent);
    { exec { $Clang } $Clang, "-###", $mode, @$Args; }
    # exec returns only on failure.  Leave right away, without running END
    # blocks, so the child never continues with the parent's code.
    print STDERR "cannot execute '$Clang': $!\n";
    POSIX::_exit(127);
  }
  close($ToParent);

  my $line;
  while (my $Reply = <$FromChild>) {
    next if ($Reply !~ /-cc1/);
    $line = $Reply;
  }

  waitpid($pid,0);
  close($FromChild);

  die "could not find clang line\n" if (!defined $line);
  # Strip the newline and initial whitespace.
  chomp $line;
  $line =~ s/^\s+//;
  my @items = quotewords('\s+', 0, $line);
  my $cmd = shift @items;
  die "cannot find 'clang' in 'clang' command\n" if (!($cmd =~ /clang/));
  return \@items;
}
164
# Run the analyzer on one input (or copy it, for header inputs) and record
# any failure through ProcessClangFailure.
#
# Arguments:
#   $Clang        - clang driver to query and to run.
#   $OriginalArgs - array ref of driver arguments for this input.
#   $AnalyzeArgs  - array ref of analyzer options; each is passed via -Xclang.
#   $Lang         - language of the input.  If it matches /header/ the file is
#                   copied to $Output (minus a trailing ".gch") instead of
#                   being analyzed; with no $Output the script exits 0.
#   $Output       - value of the build's -o option, may be undef.
#   $Verbose      - 0: quiet, 1: echo the command, 2: echo it as a "#SHELL"
#                   line.  Any true value also prints the working directory.
#   $HtmlDir      - report directory, may be undef.
#   $file         - path of the input file.
#
# The command's stdout and stderr are echoed to this script's STDERR and
# saved in a temporary file, which is handed to ProcessClangFailure on
# failure and removed otherwise.  Dies if the pipe or the fork fails.
sub Analyze {
  my ($Clang, $OriginalArgs, $AnalyzeArgs, $Lang, $Output, $Verbose, $HtmlDir,
      $file) = @_;

  my @Args = @$OriginalArgs;
  my $Cmd;
  my @CmdArgs;
  my @CmdArgsSansAnalyses;

  if ($Lang =~ /header/) {
    exit 0 if (!defined ($Output));
    $Cmd = 'cp';
    push @CmdArgs, $file;
    # Remove the PCH extension.
    $Output =~ s/[.]gch$//;
    push @CmdArgs, $Output;
    @CmdArgsSansAnalyses = @CmdArgs;
  }
  else {
    $Cmd = $Clang;

    # Create arguments for doing regular parsing.
    my $SyntaxArgs = GetCCArgs("-fsyntax-only", \@Args);
    @CmdArgsSansAnalyses = @$SyntaxArgs;

    # Create arguments for doing static analysis.
    if (defined $ResultFile) {
      push @Args, '-o', $ResultFile;
    }
    elsif (defined $HtmlDir) {
      push @Args, '-o', $HtmlDir;
    }
    if ($Verbose) {
      push @Args, "-Xclang", "-analyzer-display-progress";
    }

    foreach my $arg (@$AnalyzeArgs) {
      push @Args, "-Xclang", $arg;
    }

    # Display Ubiviz graph?
    if (defined $ENV{'CCC_UBI'}) {
      push @Args, "-Xclang", "-analyzer-viz-egraph-ubigraph";
    }

    my $AnalysisArgs = GetCCArgs("--analyze", \@Args);
    @CmdArgs = @$AnalysisArgs;
  }

  my @PrintArgs;
  my $dir;

  if ($Verbose) {
    $dir = getcwd();
    print STDERR "\n[LOCATION]: $dir\n";
    push @PrintArgs,"'$Cmd'";
    foreach my $arg (@CmdArgs) {
        push @PrintArgs,"\'$arg\'";
    }
  }
  if ($Verbose == 1) {
    # We MUST print to stderr.  Some clients use the stdout output of
    # gcc for various purposes.
    print STDERR join(' ', @PrintArgs);
    print STDERR "\n";
  }
  elsif ($Verbose == 2) {
    print STDERR "#SHELL (cd '$dir' && @PrintArgs)\n";
  }

  # Capture the STDERR of clang and send it to a temporary file.
  # Capture the STDOUT of clang and reroute it to ccc-analyzer's STDERR.
  # We save the output file in the 'crashes' directory if clang encounters
  # any problems with the file.
  require POSIX;
  pipe (my $FromChild, my $ToParent) or die "cannot create pipe: $!\n";
  my $pid = fork();
  # fork returns undef on failure; comparing that with 0 would send the
  # parent down the child branch.
  die "cannot fork: $!\n" if (!defined $pid);
  if ($pid == 0) {
    close $FromChild;
    open(STDOUT,">&", $ToParent);
    open(STDERR,">&", $ToParent);
    { exec { $Cmd } $Cmd, @CmdArgs; }
    # exec returns only on failure.  Leave right away, without running END
    # blocks, so the child never continues with the parent's code.
    print STDERR "cannot execute '$Cmd': $!\n";
    POSIX::_exit(127);
  }

  close $ToParent;
  my ($ofh, $ofile) = tempfile("clang_output_XXXXXX", DIR => $HtmlDir);

  while (my $Captured = <$FromChild>) {
    print $ofh $Captured;
    print STDERR $Captured;
  }
  # Flush the capture to disk before it is re-read or moved below; while the
  # handle stays open, buffered output is not visible through the file name.
  close $ofh;

  waitpid($pid,0);
  my $Result = $?;
  close($FromChild);

  # Did the command die because of a signal?
  if ($ReportFailures) {
    if ($Result & 127 and $Cmd eq $Clang and defined $HtmlDir) {
      ProcessClangFailure($Clang, $Lang, $file, \@CmdArgsSansAnalyses,
                          $HtmlDir, "Crash", $ofile);
    }
    elsif ($Result) {
      if ($IncludeParserRejects && !($file =~/conftest/)) {
        ProcessClangFailure($Clang, $Lang, $file, \@CmdArgsSansAnalyses,
                            $HtmlDir, $ParserRejects, $ofile);
      } else {
        ProcessClangFailure($Clang, $Lang, $file, \@CmdArgsSansAnalyses,
                            $HtmlDir, $OtherError, $ofile);
      }
    }
    else {
      # Check if there were any unhandled attributes.
      if (open(my $CapturedFH, '<', $ofile)) {
        my %attributes_not_handled;

        # Don't flag warnings about the following attributes that we
        # know are currently not supported by Clang.
        $attributes_not_handled{"cdecl"} = 1;

        my $ppfile;
        while (my $Warning = <$CapturedFH>) {
          next if ($Warning !~ /warning: '([^\']+)' attribute ignored/);
          # Copy the capture right away; $1 does not survive a later match.
          my $Attribute = $1;

          # Have we already spotted this unhandled attribute?
          next if (defined $attributes_not_handled{$Attribute});
          $attributes_not_handled{$Attribute} = 1;

          # Get the name of the attribute file.
          my $FailuresDir = "$HtmlDir/failures";
          my $afile = "$FailuresDir/attribute_ignored_$Attribute.txt";

          # Only create another preprocessed file if the attribute file
          # doesn't exist yet.
          next if (-e $afile);

          # Add this file to the list of files that contained this attribute.
          # Generate a preprocessed file if we haven't already.
          if (!(defined $ppfile)) {
            $ppfile = ProcessClangFailure($Clang, $Lang, $file,
                                          \@CmdArgsSansAnalyses,
                                          $HtmlDir, $AttributeIgnored, $ofile);
          }

          mkpath $FailuresDir;
          # Best effort: skip the attribute file if it cannot be created.
          if (open(my $AttributeFH, ">", $afile)) {
            print $AttributeFH "$ppfile\n";
            close($AttributeFH);
          }
        }
        close $CapturedFH;
      }
    }
  }

  unlink($ofile);
}
320
321##----------------------------------------------------------------------------##
322#  Lookup tables.
323##----------------------------------------------------------------------------##
324
# In the option tables below each key is an option name and each value is the
# number of separate command-line words that follow it.

# Options recorded as compile options.
my %CompileOptionMap = (
  (map { $_ => 0 } qw(-nostdinc -fblocks -fno-builtin -fobjc-gc-only
                      -fobjc-gc -ffreestanding)),
  (map { $_ => 1 } qw(-include -idirafter -imacros -iprefix -iquote
                      -isystem -iwithprefix -iwithprefixbefore)),
);

# Options recorded as link options.
my %LinkerOptionMap = (
  '-fobjc-link-runtime' => 0,
  '-framework'          => 1,
);

# Options recorded as both compile and link options.  The entries marked
# "(=)" really take one argument, but it is always attached with '='.
my %CompilerLinkerOptionMap = (
  '-fobjc-arc'                  => 0,
  '-fobjc-legacy-dispatch'      => 0,
  '-m32'                        => 0,
  '-m64'                        => 0,
  '-v'                          => 0,
  '-fpascal-strings'            => 0,
  '-fobjc-abi-version'          => 0,   # (=)
  '-mios-simulator-version-min' => 0,   # (=)
  '-mmacosx-version-min'        => 0,   # (=)
  '-miphoneos-version-min'      => 0,   # (=)
  '-isysroot'                   => 1,
  '-arch'                       => 1,
);

# Options that are dropped together with their arguments.
my %IgnoredOptionMap = (
  # Ignore these preprocessor options.
  (map { $_ => 1 } qw(-MT -MF)),

  (map { $_ => 0 } qw(-fsyntax-only -save-temps)),
  (map { $_ => 1 } qw(-install_name -exported_symbols_list -current_version
                      -compatibility_version -init -e -seg1addr
                      -bundle_loader -multiply_defined --param -u
                      --serialize-diagnostics)),
  '-sectorder' => 3,
);

# File extension => language name.
my %LangMap = (
  'c'  => 'c',
  (map { $_ => 'c++' } qw(cp cpp cxx txx cc ii)),
  'i'  => 'c-cpp-output',
  'm'  => 'objective-c',
  'mi' => 'objective-c-cpp-output',
  'mm' => 'objective-c++',
);

my %UniqueOptions = ('-isysroot' => 0);

##----------------------------------------------------------------------------##
# Languages accepted.
##----------------------------------------------------------------------------##

my %LangsAccepted =
  map { $_ => 1 } ("objective-c", "c", "c++", "objective-c++");
411
412##----------------------------------------------------------------------------##
413#  Main Logic.
414##----------------------------------------------------------------------------##
415
# State filled in while the command line is processed.
my $Action = 'link';
my @CompileOpts;
my @LinkOpts;
my @Files;
my $Lang;
my $Output;
my %Uniqued;

# Forward arguments to gcc.
my $Status = system($Compiler,@ARGV);
if  (defined $ENV{'CCC_ANALYZER_LOG'}) {
  print "$Compiler @ARGV\n";
}
if ($Status) {
  # The compiler could not be started at all.
  exit(255) if ($Status == -1);
  # The low seven bits hold the signal that killed the compiler.  Shifting
  # them away would report success to the build system, so use the usual
  # 128 + signal convention instead.
  exit(128 + ($Status & 127)) if ($Status & 127);
  # Otherwise pass the compiler's own exit code through.
  exit($Status >> 8);
}

# Get the analysis options.
my $Analyses = $ENV{'CCC_ANALYZER_ANALYSIS'};

# Get the plugins to load.
my $Plugins = $ENV{'CCC_ANALYZER_PLUGINS'};

# Get the store model.
my $StoreModel = $ENV{'CCC_ANALYZER_STORE_MODEL'};

# Get the constraints engine.
my $ConstraintsModel = $ENV{'CCC_ANALYZER_CONSTRAINTS_MODEL'};

# Get the internal stats setting.
my $InternalStats = $ENV{'CCC_ANALYZER_INTERNAL_STATS'};

# Get the output format.
my $OutputFormat = $ENV{'CCC_ANALYZER_OUTPUT_FORMAT'};
if (!defined $OutputFormat) { $OutputFormat = "html"; }

# Determine the level of verbosity: CCC_ANALYZER_LOG wins over
# CCC_ANALYZER_VERBOSE when both are set.
my $Verbose = 0;
if (defined $ENV{CCC_ANALYZER_VERBOSE}) { $Verbose = 1; }
if (defined $ENV{CCC_ANALYZER_LOG}) { $Verbose = 2; }

# Get the HTML output directory.
my $HtmlDir = $ENV{'CCC_ANALYZER_HTML'};

# Architectures that are never analyzed, and the ones requested via -arch.
my %DisabledArchs = ('ppc' => 1, 'ppc64' => 1);
my %ArchsSeen;
my $HadArch = 0;
461
# Process the arguments.  Each one is sorted into compile options, link
# options, input files, or dropped; options that take separate arguments
# advance $i past them.  Lookahead never reads beyond the end of @ARGV.
for (my $i = 0; $i < scalar(@ARGV); ++$i) {
  my $Arg = $ARGV[$i];
  # The table lookups use the part before any '=', e.g. "-fobjc-abi-version"
  # for "-fobjc-abi-version=2".
  my ($ArgKey) = split /=/,$Arg,2;
  $ArgKey = $Arg if (!defined $ArgKey);   # empty argument

  # Modes ccc-analyzer supports
  if ($Arg =~ /^-(E|MM?)$/) { $Action = 'preprocess'; }
  elsif ($Arg eq '-c') { $Action = 'compile'; }
  elsif ($Arg =~ /^-print-prog-name/) { exit 0; }

  # Specially handle duplicate cases of -arch
  if ($Arg eq "-arch") {
    my $arch = $ARGV[$i+1];
    # We don't want to process 'ppc' because of Clang's lack of support
    # for Altivec (also some #defines won't likely be defined correctly, etc.)
    if (defined $arch && !(defined $DisabledArchs{$arch})) {
      $ArchsSeen{$arch} = 1;
    }
    $HadArch = 1;
    ++$i;
    next;
  }

  # Options with possible arguments that should pass through to compiler.
  if (defined $CompileOptionMap{$ArgKey}) {
    my $Cnt = $CompileOptionMap{$ArgKey};
    push @CompileOpts,$Arg;
    while ($Cnt > 0 && $i + 1 < scalar(@ARGV)) {
      ++$i; --$Cnt;
      push @CompileOpts, $ARGV[$i];
    }
    next;
  }

  # Options with possible arguments that should pass through to linker.
  if (defined $LinkerOptionMap{$ArgKey}) {
    my $Cnt = $LinkerOptionMap{$ArgKey};
    push @LinkOpts,$Arg;
    while ($Cnt > 0 && $i + 1 < scalar(@ARGV)) {
      ++$i; --$Cnt;
      push @LinkOpts, $ARGV[$i];
    }
    next;
  }

  # Options with possible arguments that should pass through to both compiler
  # and the linker.
  if (defined $CompilerLinkerOptionMap{$ArgKey}) {
    my $Cnt = $CompilerLinkerOptionMap{$ArgKey};

    # Check if this is an option that should have a unique value, and if so
    # determine if the value was checked before.  Membership is what counts:
    # the value stored in %UniqueOptions is 0, so testing it for truth would
    # never enable this check.
    if (exists $UniqueOptions{$Arg}) {
      if (defined $Uniqued{$Arg}) {
        $i += $Cnt;
        next;
      }
      $Uniqued{$Arg} = 1;
    }

    push @CompileOpts,$Arg;
    push @LinkOpts,$Arg;

    while ($Cnt > 0 && $i + 1 < scalar(@ARGV)) {
      ++$i; --$Cnt;
      push @CompileOpts, $ARGV[$i];
      push @LinkOpts, $ARGV[$i];
    }
    next;
  }

  # Ignored options.
  if (defined $IgnoredOptionMap{$ArgKey}) {
    $i += $IgnoredOptionMap{$ArgKey};
    next;
  }

  # Compile mode flags.  (No commas in the character class: they would make
  # an argument starting with "-," match as well.)
  if ($Arg =~ /^-[DIU](.*)$/) {
    my $Tmp = $Arg;
    if ($1 eq '' && $i + 1 < scalar(@ARGV)) {
      # The value is the next word; glue it onto the flag.
      ++$i;
      $Tmp = $Arg . $ARGV[$i];
    }
    push @CompileOpts,$Tmp;
    next;
  }

  # Language.
  if ($Arg eq '-x') {
    $Lang = $ARGV[$i+1];
    ++$i; next;
  }

  # Output file.
  if ($Arg eq '-o') {
    ++$i;
    $Output = $ARGV[$i];
    next;
  }

  # Get the link mode.
  if ($Arg =~ /^-[lLO]/) {
    if ($Arg eq '-O') { push @LinkOpts,'-O1'; }
    elsif ($Arg eq '-Os') { push @LinkOpts,'-O2'; }
    else { push @LinkOpts,$Arg; }
    next;
  }

  if ($Arg =~ /^-std=/) {
    push @CompileOpts,$Arg;
    next;
  }

#  if ($Arg =~ /^-f/) {
#    # FIXME: Not sure if the remaining -fxxxx options have no arguments.
#    push @CompileOpts,$Arg;
#    push @LinkOpts,$Arg;  # FIXME: Not sure if these are link opts.
#  }

  # Get the compiler/link mode.  The directory may be attached ("-Fdir") or
  # given as the next word ("-F dir"); the pattern must accept a bare "-F"
  # for the second form to be recognized.
  if ($Arg =~ /^-F(.*)$/) {
    my $Tmp = $Arg;
    if ($1 eq '' && $i + 1 < scalar(@ARGV)) {
      ++$i;
      $Tmp = $Arg . $ARGV[$i];
    }
    push @CompileOpts,$Tmp;
    push @LinkOpts,$Tmp;
    next;
  }

  # Input files.
  if ($Arg eq '-filelist') {
    if ($i + 1 < scalar(@ARGV)) {
      my $ListName = $ARGV[$i+1];
      if (open(my $ListFH, '<', $ListName)) {
        while (my $Entry = <$ListFH>) {
          $Entry =~ s/\015?\012//;
          push @Files,$Entry;
        }
        close($ListFH);
      }
      else {
        warn "ccc-analyzer: cannot read file list '$ListName': $!\n";
      }
    }
    ++$i;
    next;
  }

  # Handle -Wno-.  We don't care about extra warnings, but
  # we should suppress ones that we don't want to see.
  if ($Arg =~ /^-Wno-/) {
    push @CompileOpts, $Arg;
    next;
  }

  if (!($Arg =~ /^-/)) {
    push @Files, $Arg;
    next;
  }
}
613
# Analyze every input file whose language is accepted, once per requested
# architecture (or once, when no -arch was given).  Nothing is analyzed in
# preprocess mode.
if ($Action eq 'compile' or $Action eq 'link') {
  my @Archs = keys %ArchsSeen;
  # Skip the file if we don't support the architectures specified.
  exit 0 if ($HadArch && scalar(@Archs) == 0);

  foreach my $file (@Files) {
    # Determine the language for the file.
    my $FileLang = $Lang;

    if (!defined($FileLang)) {
      # Infer the language from the extension.
      if ($file =~ /[.]([^.]+)$/) {
        $FileLang = $LangMap{$1};
      }
    }

    # FileLang still not defined?  Skip the file.
    next if (!defined $FileLang);

    # Language not accepted?
    next if (!defined $LangsAccepted{$FileLang});

    my @CmdArgs;
    my @AnalyzeArgs;

    if ($FileLang ne 'unknown') {
      push @CmdArgs, '-x', $FileLang;
    }

    if (defined $StoreModel) {
      push @AnalyzeArgs, "-analyzer-store=$StoreModel";
    }

    if (defined $ConstraintsModel) {
      push @AnalyzeArgs, "-analyzer-constraints=$ConstraintsModel";
    }

    if (defined $InternalStats) {
      push @AnalyzeArgs, "-analyzer-stats";
    }

    # split ' ' (unlike a /\s+/ pattern) ignores leading whitespace, so a
    # value that starts with a blank does not produce an empty argument.
    if (defined $Analyses) {
      push @AnalyzeArgs, split ' ', $Analyses;
    }

    if (defined $Plugins) {
      push @AnalyzeArgs, split ' ', $Plugins;
    }

    if (defined $OutputFormat) {
      push @AnalyzeArgs, "-analyzer-output=" . $OutputFormat;
      if ($OutputFormat =~ /plist/) {
        # The END block only knows about the most recent report file, so
        # apply its clean-up rules to the previous input's file before the
        # variables are overwritten.
        if (defined $ResultFile && -z $ResultFile) { unlink $ResultFile; }
        if (defined $CleanupFile) { unlink $CleanupFile; }

        # Change "Output" to be a file.
        my ($h, $f) = tempfile("report-XXXXXX", SUFFIX => ".plist",
                               DIR => $HtmlDir);
        close($h);
        $ResultFile = $f;
        # If the HtmlDir is not set, we should clean up the plist files.
        # (An empty string counts as "not set"; -z would test the size of a
        # file named by $HtmlDir instead.)
        if (!defined $HtmlDir || $HtmlDir eq '') {
          $CleanupFile = $f;
        }
      }
    }

    push @CmdArgs, @CompileOpts;
    push @CmdArgs, $file;

    if (scalar @Archs) {
      foreach my $arch (@Archs) {
        my @NewArgs;
        push @NewArgs, '-arch', $arch;
        push @NewArgs, @CmdArgs;
        Analyze($Clang, \@NewArgs, \@AnalyzeArgs, $FileLang, $Output,
                $Verbose, $HtmlDir, $file);
      }
    }
    else {
      Analyze($Clang, \@CmdArgs, \@AnalyzeArgs, $FileLang, $Output,
              $Verbose, $HtmlDir, $file);
    }
  }
}

exit($Status >> 8);
697
698