2011-01-26 02:59:19 +01:00
#!/usr/bin/perl
# use warnings;
use strict ;
2012-09-01 07:20:01 +02:00
use feature "switch" ;
2011-01-26 02:59:19 +01:00
use IPC::Open2 ;
2011-02-04 03:50:52 +01:00
use Text::Balanced qw( extract_bracketed extract_delimited ) ;
2011-01-26 02:59:19 +01:00
use IO::Socket ;
use LWP::UserAgent ;
2011-02-08 02:24:12 +01:00
my $ debug = 0 ;
2011-02-01 01:41:51 +01:00
my $ USE_LOCAL = defined $ ENV { 'CC_LOCAL' } ;
2012-01-28 08:39:13 +01:00
my $ MAX_UNDO_HISTORY = 1000000 ;
2011-01-26 02:59:19 +01:00
my $ output = "" ;
my $ nooutput = 'No output.' ;
2012-11-21 20:01:10 +01:00
my $ warn_unterminated_define = 0 ;
2011-01-26 02:59:19 +01:00
my % languages = (
2012-01-28 08:39:13 +01:00
'C11' = > "gcc -std=c11 -pedantic -Wall -Wextra (default)" ,
'C99' = > "gcc -std=c99 -pedantic -Wall -Wextra" ,
'C89' = > "gcc -std=c89 -pedantic -Wall -Wextra" ,
2011-01-26 02:59:19 +01:00
) ;
my % preludes = (
2012-08-18 05:28:10 +02:00
'C99' = > "#define _XOPEN_SOURCE 9001\n#define __USE_XOPEN\n#include <stdio.h>\n#include <stdlib.h>\n#include <string.h>\n#include <unistd.h>\n#include <math.h>\n#include <limits.h>\n#include <sys/types.h>\n#include <stdint.h>\n#include <stdbool.h>\n#include <stddef.h>\n#include <stdarg.h>\n#include <ctype.h>\n#include <inttypes.h>\n#include <float.h>\n#include <errno.h>\n#include <time.h>\n#include <assert.h>\n#include <prelude.h>\n\n" ,
'C11' = > "#define _XOPEN_SOURCE 9001\n#define __USE_XOPEN\n#include <stdio.h>\n#include <stdlib.h>\n#include <string.h>\n#include <unistd.h>\n#include <math.h>\n#include <limits.h>\n#include <sys/types.h>\n#include <stdint.h>\n#include <stdbool.h>\n#include <stddef.h>\n#include <stdarg.h>\n#include <stdnoreturn.h>\n#include <stdalign.h>\n#include <ctype.h>\n#include <inttypes.h>\n#include <float.h>\n#include <errno.h>\n#include <time.h>\n#include <assert.h>\n#include <complex.h>\n#include <prelude.h>\n\n" ,
2012-11-21 20:01:10 +01:00
'C89' = > "#define _XOPEN_SOURCE 9001\n#define __USE_XOPEN\n#include <stdio.h>\n#include <stdlib.h>\n#include <string.h>\n#include <unistd.h>\n#include <math.h>\n#include <limits.h>\n#include <sys/types.h>\n#include <stdint.h>\n#include <errno.h>\n#include <ctype.h>\n#include <assert.h>\n#include <prelude.h>\n\n" ,
2011-02-08 02:27:45 +01:00
) ;
2011-01-26 02:59:19 +01:00
# pretty(@fragments) -> $formatted
#
# Joins its arguments into one string, writes that string to prog.c in the
# current directory, runs the external `astyle` formatter on the file in
# place, and returns whatever prog.c contains afterwards.
#
# Dies when prog.c cannot be opened (for writing or reading) or when the
# written data cannot be flushed. The exit status of astyle is deliberately
# not inspected: if the formatter is missing or fails, the file is simply
# read back as it was written.
sub pretty {
    my $code = join '', @_;

    # Three-argument open keeps the mode separate from the file name.
    open my $out, '>', 'prog.c' or die "Couldn't write prog.c: $!";
    print {$out} $code;
    # Buffered write errors only surface at close, so check it.
    close $out or die "Couldn't write prog.c: $!";

    # List form: no shell is involved.
    system("astyle", "-UHfenq", "prog.c");

    open my $in, '<', 'prog.c' or die "Couldn't read prog.c: $!";
    my $result = join '', <$in>;
    close $in;

    return $result;
}
# paste_codepad(@text) -> $uri_or_status
#
# Joins the arguments with single spaces, breaks the text after every run of
# 120 characters that is followed by whitespace, and POSTs it as a private
# C paste to codepad.org. POST redirects are followed.
#
# Returns the URI of the final request on success, or the HTTP status line
# when the request was not successful.
sub paste_codepad {
    my $body = join ' ', @_;
    $body =~ s/(.{120})\s/$1\n/g;

    my $agent = LWP::UserAgent->new();
    $agent->agent("Mozilla/5.0");

    # Allow the user agent to follow redirects issued in reply to a POST.
    push @{ $agent->requests_redirectable }, 'POST';

    my %form = (
        'lang'    => 'C',
        'code'    => $body,
        'private' => 'True',
        'submit'  => 'Submit',
    );

    my $reply = $agent->post("http://codepad.org", \%form);

    return $reply->status_line unless $reply->is_success;
    return $reply->request->uri;
}
2012-02-02 05:14:38 +01:00
2012-02-15 23:00:58 +01:00
# paste_sprunge(@text) -> $url_or_status
#
# Joins the arguments with single spaces, breaks the text after every run of
# 120 characters that is followed by whitespace, and POSTs it to sprunge.us
# with redirect-following disabled.
#
# Returns the HTTP status line when the request was not successful.
# Otherwise returns the response body with surrounding whitespace removed
# and "?c" appended. An empty body is returned as an empty string.
sub paste_sprunge {
    my $text = join ' ', @_;
    $text =~ s/(.{120})\s/$1\n/g;

    my $ua = LWP::UserAgent->new();
    $ua->agent("Mozilla/5.0");
    $ua->requests_redirectable([]);    # follow no redirects at all

    my %post = ('sprunge' => $text, 'submit' => 'Submit');
    my $response = $ua->post("http://sprunge.us", \%post);

    if (not $response->is_success) {
        return $response->status_line;
    }

    my $result = $response->content;
    $result =~ s/^\s+//;
    $result =~ s/\s+$//;

    # The suffix used to be added by replacing trailing whitespace, so a
    # reply without a trailing newline silently lost it. Append it whenever
    # there is something to append it to.
    $result .= '?c' if length $result;

    return $result;
}
2011-01-26 02:59:19 +01:00
# compile($lang, $code, $args, $input, $local) -> $result
#
# Sends one compile request to the compiler back end and returns the text it
# answers with.
#
#   $lang, $args, $input  are interpolated into the "compile:" header line
#                         together with the current epoch time
#   $code                 is sent after the header, followed by "compile:end"
#   $local                when defined and non-zero, ./compiler_vm_server.pl
#                         is spawned via open2 and spoken to over pipes;
#                         otherwise a TCP connection to 127.0.0.1:3333 is used
#
# Reply parsing: lines are read until "result:end". The first "result:" line
# contributes its remainder without a newline; every later line is appended
# with a trailing newline. Lines seen before any "result:" line are ignored.
#
# Dies when the socket cannot be created.
sub compile {
    my ($lang, $code, $args, $input, $local) = @_;
    my ($compiler, $compiler_output, $pid);

    if (defined $local and $local != 0) {
        print "Using local compiler instead of virtual machine\n";
        $pid = open2($compiler_output, $compiler, './compiler_vm_server.pl') || die "repl failed: $@\n";
        print "Started compiler, pid: $pid\n";
    } else {
        $compiler = IO::Socket::INET->new(
            PeerAddr => '127.0.0.1',
            PeerPort => '3333',
            Proto    => 'tcp',
            Type     => SOCK_STREAM,
        );
        die "Could not create socket: $!" unless $compiler;

        # A socket is bidirectional: read the reply from the same handle.
        $compiler_output = $compiler;
    }

    my $date = time;
    print $compiler "compile:$lang:$args:$input:$date\n";
    print $compiler "$code\n";
    print $compiler "compile:end\n";

    my $result     = "";
    my $got_result = 0;

    while (my $line = <$compiler_output>) {
        $line =~ s/[\r\n]+$//;
        last if $line =~ /^result:end$/;

        if ($line =~ /^result:/) {
            $line =~ s/^result://;
            $result .= $line;
            $got_result = 1;
            next;
        }

        if ($got_result) {
            $result .= $line . "\n";
        }
    }

    close $compiler;

    # In local mode the read side is a separate pipe and must be closed too.
    # (This used to attempt to close the file-level $output string, which is
    # not a handle, leaving the pipe open.) In socket mode both names refer
    # to the handle that was just closed.
    close $compiler_output if defined $pid;

    waitpid($pid, 0) if defined $pid;

    return $result;
}
# ---- command-line intake -------------------------------------------------
# At least two arguments are required: the requesting nick followed by the
# words that make up the code or command.
if (scalar(@ARGV) < 2) {
    print "Usage: cc [-compiler -options] <code> [-stdin=input]\n";
    exit 0;
}

my $nick = shift @ARGV;
my $code = join ' ', @ARGV;

# Most-recent-first history of submitted code; filled from last_code.txt.
my @last_code;

print " code: [$code]\n" if $debug;

# -lang=NAME may appear anywhere in the text; it is removed and upper-cased.
my $lang = "C11";
if ($code =~ s/-lang=([^\b\s]+)//i) {
    $lang = uc $1;
}

# -input=... / -stdin=... consumes everything up to the end of the text.
my $input = "";
if ($code =~ s/-(?:input|stdin)=(.*)$//i) {
    $input = $1;
}

# Boolean switches: removed from the text, recorded as 1 or left undefined.
my $got_paste  = ($code =~ s/\s*-paste\s*//i)  ? 1 : undef;
my $got_nomain = ($code =~ s/\s*-nomain\s*//i) ? 1 : undef;

# Any remaining leading "-word" tokens are collected as compiler arguments.
my $args = "";
while ($code =~ s/^\s*(-[^ ]+)\s*//) {
    $args .= "$1 ";
}
$args =~ s/\s+$//;
# Load the code history (one entry per line, most recent first). A missing
# or unreadable last_code.txt simply leaves the history empty.
# A lexical handle with three-argument open is used so the mode cannot be
# confused with the file name and no global FILE handle is touched here.
if (open my $history, '<', 'last_code.txt') {
    while (my $line = <$history>) {
        chomp $line;
        push @last_code, $line;
    }
    close $history;
}

# "show" prints the most recent history entry and stops.
if ($code =~ m/^\s*show\s*$/i) {
    if (defined $last_code[0]) {
        print "$nick: $last_code[0]\n";
    } else {
        print "$nick: No recent code to show.\n";
    }
    exit 0;
}
my $ got_run = undef ;
if ( $ code =~ m/^\s*(run|paste)\s*$/i ) {
$ got_run = lc $ 1 ;
if ( defined $ last_code [ 0 ] ) {
$ code = $ last_code [ 0 ] ;
} else {
print "$nick: No recent code to $got_run.\n" ;
exit 0 ;
}
} else {
my $ subcode = $ code ;
my $ got_undo = 0 ;
my $ got_sub = 0 ;
while ( $ subcode =~ s/^\s*(and)?\s*undo// ) {
splice @ last_code , 0 , 1 ;
if ( not defined $ last_code [ 0 ] ) {
print "$nick: No more undos remaining.\n" ;
exit 0 ;
} else {
$ code = $ last_code [ 0 ] ;
$ got_undo = 1 ;
}
}
my @ replacements ;
my $ prevchange = $ last_code [ 0 ] ;
my $ got_changes = 0 ;
while ( 1 ) {
$ got_sub = 0 ;
$ got_changes = 0 ;
if ( $ subcode =~ m/^\s*(and)?\s*remove \s*([^']+)?\s*'/ ) {
my $ modifier = 'first' ;
$ subcode =~ s/^\s*(and)?\s*// ;
$ subcode =~ s/remove\s*([^']+)?\s*//i ;
$ modifier = $ 1 if defined $ 1 ;
$ modifier =~ s/\s+$// ;
my ( $ e , $ r ) = extract_delimited ( $ subcode , "'" ) ;
my $ text ;
if ( defined $ e ) {
$ text = $ e ;
$ text =~ s/^'// ;
$ text =~ s/'$// ;
$ subcode = "replace $modifier '$text' with ''$r" ;
} else {
print "$nick: Unbalanced single quotes. Usage: !cc remove [all, first, .., tenth, last] 'text' [and ...]\n" ;
exit 0 ;
}
next ;
}
if ( $ subcode =~ s/^\s*(and)?\s*prepend '// ) {
$ subcode = "'$subcode" ;
my ( $ e , $ r ) = extract_delimited ( $ subcode , "'" ) ;
my $ text ;
if ( defined $ e ) {
$ text = $ e ;
$ text =~ s/^'// ;
$ text =~ s/'$// ;
$ subcode = $ r ;
$ got_sub = 1 ;
$ got_changes = 1 ;
if ( not defined $ prevchange ) {
print "$nick: No recent code to prepend to.\n" ;
exit 0 ;
}
$ code = $ prevchange ;
$ code =~ s/^/$text / ;
$ prevchange = $ code ;
} else {
print "$nick: Unbalanced single quotes. Usage: !cc prepend 'text' [and ...]\n" ;
exit 0 ;
}
next ;
}
if ( $ subcode =~ s/^\s*(and)?\s*append '// ) {
$ subcode = "'$subcode" ;
my ( $ e , $ r ) = extract_delimited ( $ subcode , "'" ) ;
my $ text ;
if ( defined $ e ) {
$ text = $ e ;
$ text =~ s/^'// ;
$ text =~ s/'$// ;
$ subcode = $ r ;
$ got_sub = 1 ;
$ got_changes = 1 ;
if ( not defined $ prevchange ) {
print "$nick: No recent code to append to.\n" ;
exit 0 ;
}
$ code = $ prevchange ;
$ code =~ s/$/ $text/ ;
$ prevchange = $ code ;
} else {
print "$nick: Unbalanced single quotes. Usage: !cc append 'text' [and ...]\n" ;
exit 0 ;
}
next ;
}
if ( $ subcode =~ m/^\s*(and)?\s*replace\s*([^']+)?\s*'.*'\s*with\s*'.*'/i ) {
$ got_sub = 1 ;
my $ modifier = 'first' ;
$ subcode =~ s/^\s*(and)?\s*// ;
$ subcode =~ s/replace\s*([^']+)?\s*//i ;
$ modifier = $ 1 if defined $ 1 ;
$ modifier =~ s/\s+$// ;
my ( $ from , $ to ) ;
my ( $ e , $ r ) = extract_delimited ( $ subcode , "'" ) ;
if ( defined $ e ) {
$ from = $ e ;
$ from =~ s/^'// ;
$ from =~ s/'$// ;
$ from = quotemeta $ from ;
$ subcode = $ r ;
$ subcode =~ s/\s*with\s*//i ;
} else {
print "$nick: Unbalanced single quotes. Usage: !cc replace 'from' with 'to' [and ...]\n" ;
exit 0 ;
}
( $ e , $ r ) = extract_delimited ( $ subcode , "'" ) ;
if ( defined $ e ) {
$ to = $ e ;
$ to =~ s/^'// ;
$ to =~ s/'$// ;
$ subcode = $ r ;
} else {
print "$nick: Unbalanced single quotes. Usage: !cc replace 'from' with 'to' [and replace ... with ... [and ...]]\n" ;
exit 0 ;
}
# Translate an ordinal modifier into its occurrence number. 'all' and 'last'
# are kept as words; anything else is rejected.
# The correct spelling 'ninth' is accepted; the historical misspelling
# 'nineth' keeps working for existing users.
my %occurrence_for = (
    'first'   => 1,
    'second'  => 2,
    'third'   => 3,
    'fourth'  => 4,
    'fifth'   => 5,
    'sixth'   => 6,
    'seventh' => 7,
    'eighth'  => 8,
    'ninth'   => 9,
    'nineth'  => 9,
    'tenth'   => 10,
);

if (exists $occurrence_for{$modifier}) {
    $modifier = $occurrence_for{$modifier};
} elsif ($modifier ne 'all' and $modifier ne 'last') {
    print "$nick: Bad replacement modifier '$modifier'; valid modifiers are 'all', 'first', 'second', ..., 'tenth', 'last'\n";
    exit 0;
}
my $ replacement = { } ;
$ replacement - > { 'from' } = $ from ;
$ replacement - > { 'to' } = $ to ;
$ replacement - > { 'modifier' } = $ modifier ;
push @ replacements , $ replacement ;
next ;
}
if ( $ subcode =~ m/^\s*(and)?\s*s\/.*\// ) {
$ got_sub = 1 ;
$ subcode =~ s/^\s*(and)?\s*s// ;
my ( $ regex , $ to ) ;
my ( $ e , $ r ) = extract_delimited ( $ subcode , '/' ) ;
if ( defined $ e ) {
$ regex = $ e ;
$ regex =~ s/^\/// ;
$ regex =~ s/\/$// ;
$ subcode = "/$r" ;
} else {
print "$nick: Unbalanced slashes. Usage: !cc s/regex/substitution/[gi] [and s/.../.../ [and ...]]\n" ;
exit 0 ;
}
( $ e , $ r ) = extract_delimited ( $ subcode , '/' ) ;
if ( defined $ e ) {
$ to = $ e ;
$ to =~ s/^\/// ;
$ to =~ s/\/$// ;
$ subcode = $ r ;
} else {
print "$nick: Unbalanced slashes. Usage: !cc s/regex/substitution/[gi] [and s/.../.../ [and ...]]\n" ;
exit 0 ;
}
my $ suffix ;
$ suffix = $ 1 if $ subcode =~ s/^([^ ]+)// ;
if ( length $ suffix and $ suffix =~ m/[^gi]/ ) {
print "$nick: Bad regex modifier '$suffix'. Only 'i' and 'g' are allowed.\n" ;
exit 0 ;
}
if ( defined $ prevchange ) {
$ code = $ prevchange ;
} else {
print "$nick: No recent code to change.\n" ;
exit 0 ;
}
my $ ret = eval {
my ( $ ret , $ a , $ b , $ c , $ d , $ e , $ f , $ g , $ h , $ i , $ before , $ after ) ;
2011-02-08 02:27:45 +01:00
2011-01-26 02:59:19 +01:00
if ( not length $ suffix ) {
$ ret = $ code =~ s | $ regex | $ to | ;
( $ a , $ b , $ c , $ d , $ e , $ f , $ g , $ h , $ i ) = ( $ 1 , $ 2 , $ 3 , $ 4 , $ 5 , $ 6 , $ 7 , $ 8 , $ 9 ) ;
$ before = $` ;
$ after = $' ;
} elsif ( $ suffix =~ /^i$/ ) {
$ ret = $ code =~ s | $ regex | $ to | i ;
( $ a , $ b , $ c , $ d , $ e , $ f , $ g , $ h , $ i ) = ( $ 1 , $ 2 , $ 3 , $ 4 , $ 5 , $ 6 , $ 7 , $ 8 , $ 9 ) ;
$ before = $` ;
$ after = $' ;
} elsif ( $ suffix =~ /^g$/ ) {
$ ret = $ code =~ s | $ regex | $ to | g ;
( $ a , $ b , $ c , $ d , $ e , $ f , $ g , $ h , $ i ) = ( $ 1 , $ 2 , $ 3 , $ 4 , $ 5 , $ 6 , $ 7 , $ 8 , $ 9 ) ;
$ before = $` ;
$ after = $' ;
} elsif ( $ suffix =~ /^ig$/ or $ suffix =~ /^gi$/ ) {
$ ret = $ code =~ s | $ regex | $ to | gi ;
( $ a , $ b , $ c , $ d , $ e , $ f , $ g , $ h , $ i ) = ( $ 1 , $ 2 , $ 3 , $ 4 , $ 5 , $ 6 , $ 7 , $ 8 , $ 9 ) ;
$ before = $` ;
$ after = $' ;
}
if ( $ ret ) {
$ code =~ s/\$1/$a/g ;
$ code =~ s/\$2/$b/g ;
$ code =~ s/\$3/$c/g ;
$ code =~ s/\$4/$d/g ;
$ code =~ s/\$5/$e/g ;
$ code =~ s/\$6/$f/g ;
$ code =~ s/\$7/$g/g ;
$ code =~ s/\$8/$h/g ;
$ code =~ s/\$9/$i/g ;
$ code =~ s/\$`/$before/g ;
$ code =~ s/\$'/$after/g ;
}
return $ ret ;
} ;
if ( $@ ) {
print "$nick: $@\n" ;
exit 0 ;
}
if ( $ ret ) {
$ got_changes = 1 ;
}
$ prevchange = $ code ;
}
if ( $ got_sub and not $ got_changes ) {
print "$nick: No substitutions made.\n" ;
exit 0 ;
} elsif ( $ got_sub and $ got_changes ) {
next ;
}
last ;
}
if ( $# replacements > - 1 ) {
@ replacements = sort { $ a - > { 'from' } cmp $ b - > { 'from' } or $ a - > { 'modifier' } <=> $ b - > { 'modifier' } } @ replacements ;
my ( $ previous_from , $ previous_modifier ) ;
foreach my $ replacement ( @ replacements ) {
my $ from = $ replacement - > { 'from' } ;
my $ to = $ replacement - > { 'to' } ;
my $ modifier = $ replacement - > { 'modifier' } ;
# Consecutive replacements of the same text: once the previous numbered
# occurrence has been replaced, the occurrence wanted now has moved into its
# slot, so reuse the previous (already adjusted) number.
# This is the same value the former "$modifier -= $modifier - $previous_modifier"
# produced.
if (    defined $previous_from
    and $previous_from eq $from
    and $previous_modifier =~ /^\d+$/)
{
    $modifier = $previous_modifier;
}
if ( defined $ prevchange ) {
$ code = $ prevchange ;
} else {
print "$nick: No recent code to change.\n" ;
exit 0 ;
}
my $ ret = eval {
my $ got_change ;
my ( $ first_char , $ last_char , $ first_bound , $ last_bound ) ;
$ first_char = $ 1 if $ from =~ m/^(.)/ ;
$ last_char = $ 1 if $ from =~ m/(.)$/ ;
if ( $ first_char =~ /\W/ ) {
$ first_bound = '.' ;
} else {
$ first_bound = '\b' ;
}
if ( $ last_char =~ /\W/ ) {
$ last_bound = '\B' ;
} else {
$ last_bound = '\b' ;
}
if ( $ modifier eq 'all' ) {
while ( $ code =~ s/($first_bound)$from($last_bound)/$1$to$2/ ) {
$ got_change = 1 ;
}
} elsif ( $ modifier eq 'last' ) {
if ( $ code =~ s/(.*)($first_bound)$from($last_bound)/$1$2$to$3/ ) {
$ got_change = 1 ;
}
} else {
my $ count = 0 ;
my $ unescaped = $ from ;
$ unescaped =~ s/\\//g ;
if ( $ code =~ s/($first_bound)$from($last_bound)/if(++$count == $modifier) { "$1$to$2"; } else { "$1$unescaped$2"; }/gex ) {
$ got_change = 1 ;
}
}
return $ got_change ;
} ;
if ( $@ ) {
print "$nick: $@\n" ;
exit 0 ;
}
if ( $ ret ) {
$ got_sub = 1 ;
$ got_changes = 1 ;
}
$ prevchange = $ code ;
$ previous_from = $ from ;
$ previous_modifier = $ modifier ;
}
if ( $ got_sub and not $ got_changes ) {
print "$nick: No replacements made.\n" ;
exit 0 ;
}
}
# Record the new code at the front of the history, unless this command was
# a plain undo with no edits on top of it.
unless ($got_undo and not $got_sub) {
    unshift @last_code, $code;
}

# Rewrite last_code.txt with at most $MAX_UNDO_HISTORY entries, one per line.
# A failure to open or flush the file is reported on STDERR instead of being
# silently ignored; the command itself still proceeds.
if (open my $history, '>', 'last_code.txt') {
    my $written = 0;
    foreach my $line (@last_code) {
        last if ++$written > $MAX_UNDO_HISTORY;
        print {$history} "$line\n";
    }
    close $history or warn "Couldn't finish writing last_code.txt: $!\n";
} else {
    warn "Couldn't write last_code.txt: $!\n";
}
if ( $ got_undo and not $ got_sub ) {
print "$nick: $code\n" ;
exit 0 ;
}
}
# check to see if -flags were added by replacements
if ($code =~ s/-lang=([^\b\s]+)//i) {
    $lang = uc $1;
}
if ($code =~ s/-(?:input|stdin)=(.*)$//i) {
    $input = $1;
}

# $args had its trailing whitespace stripped after the first pass, so each
# newly found flag needs its own separator; otherwise it would be glued onto
# the previous one (e.g. "-O2-g").
while ($code =~ s/^\s*(-[^ ]+)\s*//) {
    $args .= ' ' if length $args;
    $args .= $1;
}
$args =~ s/\s+$//;
unless ( $ got_run ) {
open FILE , ">> log.txt" ;
2012-02-02 05:14:38 +01:00
print FILE "------------------------------------------------------------------------\n" ;
2011-01-26 02:59:19 +01:00
print FILE localtime ( ) . "\n" ;
print FILE "$nick: $code\n" ;
}
# Match the requested language case-insensitively against the supported
# ones. On a match $lang is normalised to the key's own spelling. The
# "name => description" list is built along the way for the error message.
my $found = 0;
my @langs;

for my $name (sort { uc $a cmp uc $b } keys %languages) {
    push @langs, sprintf("%s => %s", $name, $languages{$name});

    next unless uc $lang eq uc $name;
    $lang  = $name;
    $found = 1;
}

unless ($found) {
    print "$nick: Invalid language '$lang'. Supported languages are:\n", (join ",\n", @langs), "\n; For additional languages try the cc2 command.";
    exit 0;
}
2012-02-11 06:05:49 +01:00
print "code before: [$code]\n" if $ debug ;
2011-01-26 02:59:19 +01:00
$ code =~ s/#include <([^>]+)>/#include <$1>\n/g ;
2012-09-01 07:20:01 +02:00
# replace \n outside of quotes with literal newline
#
# Character-by-character scan with a small state machine. A backslash is
# held back (not emitted) until the following character is seen:
#   - outside quotes, backslash + 'n' becomes a real newline
#   - in every other case the held backslash is emitted unchanged
# Written as a plain if/elsif chain instead of the experimental given/when.
# Each arm corresponds to one former `when`, and at most one arm runs per
# character, as before.
my $new_code = "";

use constant {
    NORMAL        => 0,
    DOUBLE_QUOTED => 1,
    SINGLE_QUOTED => 2,
};

my $state   = NORMAL;
my $escaped = 0;

while ($code =~ m/(.)/gs) {
    my $ch = $1;

    if ($ch eq '\\') {
        if ($escaped == 0) {
            # First backslash: remember it and look at the next character.
            $escaped = 1;
            next;
        }
        # Second backslash of a pair: falls through and is emitted below,
        # preceded by the held one.
    }
    elsif ($state == NORMAL) {
        if ($ch eq '"' and not $escaped) {
            $state = DOUBLE_QUOTED;
        }
        elsif ($ch eq "'" and not $escaped) {
            $state = SINGLE_QUOTED;
        }
        elsif ($ch eq 'n' and $escaped == 1) {
            # \n outside of any quotes: emit a newline, drop the backslash.
            $ch      = "\n";
            $escaped = 0;
        }
    }
    elsif ($state == DOUBLE_QUOTED) {
        $state = NORMAL if $ch eq '"' and not $escaped;
    }
    elsif ($state == SINGLE_QUOTED) {
        $state = NORMAL if $ch eq "'" and not $escaped;
    }

    # Emit a backslash that was held back and not consumed above.
    if ($escaped) {
        $new_code .= '\\';
        $escaped = 0;
    }
    $new_code .= $ch;
}

$code = $new_code;
2011-01-26 02:59:19 +01:00
2012-09-17 09:12:16 +02:00
print "code after \\n replacement: [$code]\n" if $ debug ;
# Walk the code once and insert a newline after ';', '{' and '}' when they
# occur outside quotes and outside preprocessor lines (and, for ';', outside
# parentheses), unless a line break already follows. A backslash-n pair that
# is still present outside quotes is turned into a newline and ends a
# preprocessor line.
my $single_quote = 0;
my $double_quote = 0;
my $parens       = 0;
my $cpp          = 0;    # preprocessor

# $escaped is already declared by the preceding pass; reset it here instead
# of declaring a second variable of the same name in the same scope.
$escaped = 0;

while ($code =~ m/(.)/msg) {
    my $ch  = $1;
    my $pos = pos $code;
    print "adding newlines, ch = [$ch], parens: $parens, cpp: $cpp, single: $single_quote, double: $double_quote, escaped: $escaped, pos: $pos\n" if $debug >= 10;

    # True while the scan is not inside a quoted literal.
    my $unquoted = (!$single_quote && !$double_quote);

    if ($ch eq '\\') {
        $escaped = !$escaped;
    }
    elsif ($ch eq '#' and not $cpp and not $escaped and $unquoted) {
        $cpp = 1;
    }
    elsif ($ch eq '"') {
        $double_quote = !$double_quote unless $escaped;
        $escaped = 0;
    }
    elsif ($ch eq '(' and $unquoted) {
        $parens++;
    }
    elsif ($ch eq ')' and $unquoted) {
        $parens--;
        $parens = 0 if $parens < 0;
    }
    elsif ($ch eq ';' and not $cpp and $unquoted and $parens == 0) {
        if (substr($code, $pos, 1) !~ m/[\n\r]/) {
            substr($code, $pos, 0) = "\n";
            # Modifying the string resets pos(); continue after the insert.
            pos $code = $pos + 1;
        }
    }
    elsif ($ch eq "'") {
        $single_quote = !$single_quote unless $escaped;
        $escaped = 0;
    }
    elsif ($ch eq 'n' and $escaped) {
        if ($unquoted) {
            print "added newline\n" if $debug >= 10;
            # Replace the two characters "\" and "n" with one newline.
            substr($code, $pos - 2, 2) = "\n";
            pos $code = $pos;
            $cpp = 0;
        }
        $escaped = 0;
    }
    elsif ($ch eq '{' and not $cpp and $unquoted) {
        if (substr($code, $pos, 1) !~ m/[\n\r]/) {
            substr($code, $pos, 0) = "\n";
            pos $code = $pos + 1;
        }
    }
    elsif ($ch eq '}' and not $cpp and $unquoted) {
        # A ';' directly after '}' is left attached to the brace.
        if (substr($code, $pos, 1) !~ m/[\n\r;]/) {
            substr($code, $pos, 0) = "\n";
            pos $code = $pos + 1;
        }
    }
    elsif ($ch eq "\n" and $cpp and $unquoted) {
        $cpp = 0;
    }
    else {
        $escaped = 0;
    }
}
print "code after \\n additions: [$code]\n" if $ debug ;
2012-02-11 06:05:49 +01:00
2011-01-29 21:50:44 +01:00
my $ precode ;
if ( $ code =~ m/#include/ ) {
2012-07-22 21:22:30 +02:00
$ precode = $ code ;
2011-01-29 21:50:44 +01:00
} else {
$ precode = $ preludes { $ lang } . $ code ;
}
2011-01-26 02:59:19 +01:00
$ code = '' ;
2012-09-03 20:48:47 +02:00
print "--- precode: [$precode]\n" if $ debug ;
2012-11-21 20:01:10 +01:00
if ( $ lang eq 'C89' or $ lang eq 'C99' or $ lang eq 'C11' or $ lang eq 'C++' ) {
2011-01-26 02:59:19 +01:00
my $ has_main = 0 ;
2011-02-08 02:27:45 +01:00
2011-01-26 02:59:19 +01:00
my $ prelude = '' ;
2012-09-03 20:48:47 +02:00
while ( $ precode =~ s/^\s*(#.*\n)//g ) {
$ prelude . = $ 1 ;
}
2012-11-21 20:01:10 +01:00
if ( $ precode =~ m/^\s*(#.*)/m ) {
my $ line = $ 1 ;
if ( $ line !~ m/\n/ ) {
$ warn_unterminated_define = 1 ;
}
}
2012-03-21 16:58:07 +01:00
print "*** prelude: [$prelude]\n precode: [$precode]\n" if $ debug ;
2011-01-26 02:59:19 +01:00
2011-02-08 02:24:12 +01:00
# strip C and C++ style comments
2012-10-24 14:26:18 +02:00
$ precode =~ s #/\*[^*]*\*+([^/*][^*]*\*+)*/|//([^\\]|[^\n][\n]?)*?\n|("(\\.|[^"\\])*"|'(\\.|[^'\\])*'|.[^/"'\\]*)#defined $3 ? $3 : " "#gse;
2011-02-08 02:24:12 +01:00
print " precode: [$precode]\n" if $ debug ;
2011-01-26 02:59:19 +01:00
my $ preprecode = $ precode ;
2011-02-08 02:24:12 +01:00
# white-out contents of quoted literals
$ preprecode =~ s/(?:\"((?:\\\"|(?!\").)*)\")/'"' . ('-' x length $1) . '"'/ge ;
$ preprecode =~ s/(?:\'((?:\\\'|(?!\').)*)\')/"'" . ('-' x length $1) . "'"/ge ;
print "preprecode: [$preprecode]\n" if $ debug ;
2012-02-11 06:05:49 +01:00
print "looking for functions, has main: $has_main\n" if $ debug >= 2 ;
2013-02-02 00:35:11 +01:00
my $ func_regex = qr/^([ *\w]+)\s+([*\w]+)\s*\(([^;]*)\s*\)\s*({.*)/ ims ;
2012-03-21 16:58:07 +01:00
2011-02-08 02:24:12 +01:00
# look for potential functions to extract
2012-09-03 20:48:47 +02:00
while ( $ preprecode =~ /$func_regex/ms ) {
2011-02-08 02:24:12 +01:00
my ( $ pre_ret , $ pre_ident , $ pre_params , $ pre_potential_body ) = ( $ 1 , $ 2 , $ 3 , $ 4 ) ;
2012-11-18 20:18:56 +01:00
print "looking for functions, found [$pre_ret][$pre_ident][$pre_params][$pre_potential_body], has main: $has_main\n" if $ debug >= 1 ;
2012-02-11 06:05:49 +01:00
2011-02-08 02:24:12 +01:00
# find the pos at which this function lives, for extracting from precode
$ preprecode =~ m/(\Q$pre_ret\E\s+\Q$pre_ident\E\s*\(\s*\Q$pre_params\E\s*\)\s*\Q$pre_potential_body\E)/g ;
my $ extract_pos = ( pos $ preprecode ) - ( length $ 1 ) ;
# now that we have the pos, substitute out the extracted potential function from preprecode
2012-09-03 20:48:47 +02:00
$ preprecode =~ s/$func_regex//ms ;
2011-02-08 02:24:12 +01:00
# create tmpcode object that starts from extract pos, to skip any quoted code
my $ tmpcode = substr ( $ precode , $ extract_pos ) ;
2011-02-10 02:32:03 +01:00
print "tmpcode: [$tmpcode]\n" if $ debug ;
2011-02-08 02:24:12 +01:00
$ precode = substr ( $ precode , 0 , $ extract_pos ) ;
print "precode: [$precode]\n" if $ debug ;
2012-03-21 16:58:07 +01:00
$ tmpcode =~ m/$func_regex/ms ;
2011-01-26 02:59:19 +01:00
my ( $ ret , $ ident , $ params , $ potential_body ) = ( $ 1 , $ 2 , $ 3 , $ 4 ) ;
2012-09-03 20:48:47 +02:00
print "1st extract: [$ret][$ident][$params][$potential_body]\n" if $ debug ;
2011-02-08 02:24:12 +01:00
2011-01-26 02:59:19 +01:00
$ ret =~ s/^\s+// ;
$ ret =~ s/\s+$// ;
2012-02-29 02:10:12 +01:00
if ( not length $ ret or $ ret eq "else" or $ ret eq "while" or $ ret eq "if" or $ ret eq "for" or $ ident eq "for" or $ ident eq "while" or $ ident eq "if" ) {
2011-01-26 02:59:19 +01:00
$ precode . = "$ret $ident ($params) $potential_body" ;
next ;
} else {
2012-09-03 20:48:47 +02:00
$ tmpcode =~ s/$func_regex//ms ;
2011-01-26 02:59:19 +01:00
}
2011-02-04 03:50:52 +01:00
my @ extract = extract_bracketed ( $ potential_body , '{}' ) ;
2011-01-26 02:59:19 +01:00
my $ body ;
if ( not defined $ extract [ 0 ] ) {
2011-02-08 02:24:12 +01:00
print "error: unmatched brackets for function '$ident';\n" ;
2012-10-24 14:26:18 +02:00
print "body: [$potential_body]\n" ;
2011-02-08 02:24:12 +01:00
exit ;
2011-01-26 02:59:19 +01:00
} else {
$ body = $ extract [ 0 ] ;
$ preprecode . = $ extract [ 1 ] ;
$ precode . = $ extract [ 1 ] ;
}
2011-02-08 02:24:12 +01:00
2012-09-03 20:48:47 +02:00
print "final extract: [$ret][$ident][$params][$body]\n" if $ debug ;
2011-01-26 02:59:19 +01:00
$ code . = "$ret $ident($params) $body\n\n" ;
$ has_main = 1 if $ ident eq 'main' ;
}
$ precode =~ s/^\s+// ;
$ precode =~ s/\s+$// ;
2012-02-29 02:10:12 +01:00
$ precode =~ s/^{(.*)}$/$1/s ;
2012-12-30 09:14:27 +01:00
if ( not $ has_main and not $ got_nomain ) {
2012-10-05 03:59:04 +02:00
$ code = "$prelude\n\n$code\n\nint main(void) {\n$precode\n;\nreturn 0;\n}\n" ;
2011-02-08 02:24:12 +01:00
$ nooutput = "No warnings, errors or output." ;
2011-01-26 02:59:19 +01:00
} else {
2012-03-21 16:58:07 +01:00
print "code: [$code]; precode: [$precode]\n" if $ debug ;
2011-01-26 02:59:19 +01:00
$ code = "$prelude\n\n$precode\n\n$code\n" ;
2011-02-08 02:24:12 +01:00
$ nooutput = "No warnings, errors or output." ;
2011-01-26 02:59:19 +01:00
}
} else {
$ code = $ precode ;
}
2012-02-11 06:05:49 +01:00
print "after func extract, code: [$code]\n" if $ debug ;
2011-01-26 02:59:19 +01:00
$ code =~ s/\|n/\n/g ;
$ code =~ s/^\s+// ;
$ code =~ s/\s+$// ;
2012-09-17 09:12:16 +02:00
$ code =~ s/;\s*;\n/;\n/gs ;
2012-11-18 20:18:56 +01:00
$ code =~ s/({|})\n\s*;\n/$1\n/gs ;
2012-02-11 06:05:49 +01:00
$ code =~ s/(?:\n\n)+/\n\n/g ;
print "final code: [$code]\n" if $ debug ;
2011-01-26 02:59:19 +01:00
2012-11-02 23:08:20 +01:00
print FILE "$nick: [lang:$lang][args:$args][input:$input]\n" , pretty ( $ code ) , "\n" unless $ got_run ;
2011-01-26 02:59:19 +01:00
2012-02-15 23:00:58 +01:00
$ input = "Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet." if not length $ input ;
2011-02-01 01:41:51 +01:00
$ output = compile ( $ lang , pretty ( $ code ) , $ args , $ input , $ USE_LOCAL ) ;
2011-01-26 02:59:19 +01:00
2011-02-08 02:24:12 +01:00
if ( $ output =~ m/^\s*$/ ) {
2011-02-08 02:27:45 +01:00
$ output = $ nooutput
2011-02-08 02:24:12 +01:00
} else {
2012-02-02 05:14:38 +01:00
unless ( $ got_run ) {
print FILE localtime ( ) . "\n" ;
print FILE "$output\n" ;
}
2012-02-29 02:10:12 +01:00
2011-02-08 02:27:45 +01:00
$ output =~ s/cc1: warnings being treated as errors// ;
$ output =~ s/ Line \d+ ://g ;
$ output =~ s/ \(first use in this function\)//g ;
$ output =~ s/error: \(Each undeclared identifier is reported only once.*?\)//msg ;
$ output =~ s/prog\.c:[:\d]*//g ;
$ output =~ s/ld: warning: cannot find entry symbol _start; defaulting to [^ ]+// ;
$ output =~ s/error: (.*?) error/error: $1; error/msg ;
$ output =~ s/\/tmp\/.*\.o://g ;
$ output =~ s/collect2: ld returned \d+ exit status//g ;
$ output =~ s/\(\.text\+[^)]+\)://g ;
$ output =~ s/\[ In/[In/ ;
$ output =~ s/warning: Can't read pathname for load map: Input.output error.//g ;
my $ left_quote = chr ( 226 ) . chr ( 128 ) . chr ( 152 ) ;
my $ right_quote = chr ( 226 ) . chr ( 128 ) . chr ( 153 ) ;
$ output =~ s/$left_quote/'/g ;
$ output =~ s/$right_quote/'/g ;
2012-02-09 19:48:45 +01:00
$ output =~ s/\t/ /g ;
2011-12-31 00:20:29 +01:00
$ output =~ s/\s*In function 'main':\s*//g ;
2012-07-22 21:22:30 +02:00
$ output =~ s/warning: unknown conversion type character 'b' in format \[-Wformat\]\s+warning: too many arguments for format \[-Wformat-extra-args\]/info: %b is a candide extension/g ;
2012-01-28 08:39:13 +01:00
$ output =~ s/warning: unknown conversion type character 'b' in format \[-Wformat\]//g ;
$ output =~ s/\s\(core dumped\)/./ ;
2012-02-09 19:48:45 +01:00
# $output =~ s/\[\s+/[/g;
2012-01-28 08:39:13 +01:00
$ output =~ s/ \[enabled by default\]//g ;
$ output =~ s/initializer\s+warning: \(near/initializer (near/g ;
$ output =~ s/note: each undeclared identifier is reported only once for each function it appears in//g ;
$ output =~ s/\(gdb\)//g ;
2012-02-02 05:14:38 +01:00
$ output =~ s/", '\\(\d{3})' <repeats \d+ times>,? ?"/\\$1/g ;
$ output =~ s/, '\\(\d{3})' <repeats \d+ times>\s*//g ;
$ output =~ s/(\\000)+/\\0/g ;
2012-02-09 19:48:45 +01:00
$ output =~ s/\\0[^">']+/\\0/g ;
2012-09-03 09:02:17 +02:00
$ output =~ s/= (\d+) '\\0'/= $1/g ;
2012-02-02 05:14:38 +01:00
$ output =~ s/\\0"/"/g ;
$ output =~ s/"\\0/"/g ;
$ output =~ s/\.\.\.>/>/g ;
2012-02-04 07:02:52 +01:00
$ output =~ s/(\\\d{3})+//g ;
2012-02-09 19:48:45 +01:00
$ output =~ s/<\s*included at \/home\/compiler\/>\s*//g ;
$ output =~ s/\s*compilation terminated due to -Wfatal-errors\.//g ;
$ output =~ s/^======= Backtrace.*\[vsyscall\]\s*$//ms ;
$ output =~ s/glibc detected \*\*\* \/home\/compiler\/prog: // ;
$ output =~ s/: \/home\/compiler\/prog terminated// ;
2012-02-29 02:10:12 +01:00
$ output =~ s/<Defined at \/home\/compiler\/>/<Defined at \/home\/compiler\/prog.c:0>/g ;
$ output =~ s/\s*In file included from\s+\/usr\/include\/.*?:\d+:\d+:\s*/, /g ;
$ output =~ s/\s*collect2: error: ld returned 1 exit status//g ;
$ output =~ s/In function\s*`main':\s*\/home\/compiler\/ undefined reference to/error: undefined reference to/g ;
2012-07-22 21:22:30 +02:00
$ output =~ s/\/home\/compiler\///g ;
2012-03-12 04:33:54 +01:00
$ output =~ s/compilation terminated.// ;
2012-08-18 05:28:10 +02:00
$ output =~ s/<'(.)' = char>/<'$1' = int>/g ;
2012-10-24 14:26:18 +02:00
$ output =~ s/= (-?\d+) ''/= $1/g ;
2012-08-18 05:28:10 +02:00
$ output =~ s/, <incomplete sequence >//g ;
2012-09-01 07:20:01 +02:00
$ output =~ s/\s*warning: shadowed declaration is here \[-Wshadow\]//g ;
$ output =~ s/preprocessor macro>\s+<at\s+>/preprocessor macro>/g ;
2012-10-05 03:59:04 +02:00
$ output =~ s/<No symbol table is loaded. Use the "file" command.>\s*//g ;
$ output =~ s/cc1: all warnings being treated as; errors//g ;
2012-11-02 23:08:20 +01:00
$ output =~ s/, note: this is the location of the previous definition//g ;
2012-11-18 20:18:56 +01:00
2012-08-18 05:28:10 +02:00
# remove duplicate warnings/infos
2012-09-01 07:20:01 +02:00
$ output =~ s/(\[*.*warning:.*?\s*)\1/$1/g ;
2012-08-18 05:28:10 +02:00
$ output =~ s/(info: .*?\s)\1/$1/g ;
$ output =~ s/^\[\s+(warning:|info:)/[$1/ ; # remove leading spaces in first warning/info
2012-03-12 04:33:54 +01:00
# splint
$ output =~ s/Splint 3.1.2 --- 03 May 2009\s*// ;
$ output =~ s/Finished checking --- \d+ code warning\s*// ;
2012-11-02 23:08:20 +01:00
print FILE "splint: [$output]\n" unless $ got_run ;
2012-03-12 04:33:54 +01:00
$ output =~ s/\s*\(in function main\)\s*Fresh\s*storage\s*.*?\s*not\s*released.*?reference\s+to\s+it\s+is\s+lost.\s*//msg ;
$ output =~ s/\s*\(in function main\)\s*//g ;
$ output =~ s/\s*\(Use\s+.*?\s+to\s+inhibit\s+warning\)//msg ;
$ output =~ s/Suspect modification of observer/Suspect modification of string-literal/g ;
$ output =~ s/Storage\s*declared\s*with\s*observer\s*is\s*possibly\s*modified.\s*Observer\s*storage\s*may\s*not\s*be\s*modified./Such modification is undefined-behavior./gs ;
$ output =~ s/Storage\s*(.*?)?\s*becomes observer\s*//g ;
$ output =~ s/Fresh storage .*? created\s*//g ;
$ output =~ s/Storage .*? becomes null\s*//g ;
$ output =~ s/To\s*make\s*char\s*and\s*int\s*types\s*equivalent,\s*use\s*\+charint.\s*//gs ;
$ output =~ s/To\s*ignore\s*signs\s*in\s*type\s*comparisons\s*use\s*\+ignoresigns\s*//gs ;
$ output =~ s/Fresh storage/Allocated storage/g ;
$ output =~ s/derived\s*from\s*.*?\s*precondition:\s*requires\s*maxSet\(.*?\)\s*>=\s*maxRead\(.*?\)\s*//gs ;
$ output =~ s/\s*needed\s*to\s*satisfy\s*precondition:\s*requires\s*max.*?\(.*?\)\s*>=\s*\d+//gs ;
$ output =~ s/\s*needed\s*to\s*satisfy\s*precondition:\s*requires\s*max.*?\(.*?\)\s*>=\s*.*?@//gs ;
$ output =~ s/\s*To allow all numeric types to match, use \+relaxtypes.//g ;
$ output =~ s/\s*Corresponding format code//g ;
$ output =~ s/Command Line: Setting .*? redundant with current value\s*//g ;
# $output =~ s/maxSet\((.*?)\s*@\s*\)/$1/g;
$ output =~ s/\s*Unable to resolve constraint: requires .*? >= [^ \]]+//gs ;
$ output =~ s/\s*To\s*allow\s*arbitrary\s*integral\s*types\s*to\s*match\s*any\s*integral\s*type,\s*use\s*\+matchanyintegral.//gs ;
2012-12-29 17:19:51 +01:00
$ output =~ s/<Function "main" not defined.>\s+//g ;
$ output =~ s/Make breakpoint pending on future shared library load\? \(y or \[n\]\) \[answered N; input not from terminal\]//g ;
2012-03-12 04:33:54 +01:00
$ output =~ s/\s*Storage\s*.*?\s*becomes\s*static//gs ;
2012-03-21 16:54:43 +01:00
$ output =~ s/Possibly\s*null\s*storage\s*passed\s*as\s*non-null\s*param:/Possibly null storage passed to function:/g ;
2012-03-12 04:33:54 +01:00
$ output =~ s/A\s*possibly\s*null\s*pointer\s*is\s*passed\s*as\s*a\s*parameter\s*corresponding\s*to\s*a\s*formal\s*parameter\s*with\s*no\s*\/\*\@null\@\*\/\s*annotation.\s*If\s*NULL\s*may\s*be\s*used\s*for\s*this\s*parameter,\s*add\s*a\s*\/\*\@null\@\*\/\s*annotation\s*to\s*the\s*function\s*parameter\s*declaration./A possibly null pointer is passed as a parameter to a function./gs ;
2012-08-18 05:28:10 +02:00
$ output =~ s/ called by \?\? \(\)//g ;
2013-02-05 12:14:19 +01:00
$ output =~ s/\s*Copyright\s*\(C\)\s*\d+\s*Free\s*Software\s*Foundation,\s*Inc.\s*This\s*is\s*free\s*software;\s*see\s*the\s*source\s*for\s*copying\s*conditions.\s*\s*There\s*is\s*NO\s*warranty;\s*not\s*even\s*for\s*MERCHANTABILITY\s*or\s*FITNESS\s*FOR\s*A\s*PARTICULAR\s*PURPOSE.//gs ;
2011-02-08 02:24:12 +01:00
}
2011-01-26 02:59:19 +01:00
2012-11-21 20:01:10 +01:00
# Prefix a notice when a #define was found that is not terminated by a
# newline. If the output already opens with a bracketed warning/info, the
# notice is merged into that bracket; otherwise it gets a bracket of its own.
if ($warn_unterminated_define == 1) {
    if ($output !~ m/^\[(warning:|info:)/) {
        $output =~ s/^/[notice: #define not terminated by \\n, the remainder of the line will be part of this #define] /;
    } else {
        $output =~ s/^\[/[notice: #define not terminated by \\n, the remainder of the line will be part of this #define /;
    }
}

# Fresh submissions (anything but run/paste of old code) are logged.
if (not $got_run) {
    print FILE "$nick: $output\n";
    close FILE;
}

# Paste mode: upload the code with the output appended as a C comment and
# reply with the resulting link instead of the output itself.
my $wants_paste = defined $got_paste
    || (defined $got_run && $got_run eq "paste");

if ($wants_paste) {
    $output =~ s/[\r\n]+$//;
    $code .= "\n\n/************* OUTPUT *************\n$output\n************** OUTPUT **************/\n";

    my $uri = paste_sprunge(pretty($code));
    print "$nick: $uri\n";
    exit 0;
}

print "$nick: $output\n";