3
0
mirror of https://github.com/pragma-/pbot.git synced 2024-11-16 17:09:33 +01:00
pbot/applets/expand_macros.pl

333 lines
9.7 KiB
Perl
Raw Normal View History

2021-02-07 23:37:12 +01:00
#!/usr/bin/env perl
2013-11-28 06:11:54 +01:00
2021-07-11 00:00:22 +02:00
# SPDX-FileCopyrightText: 2021 Pragmatic Software <pragma78@gmail.com>
# SPDX-License-Identifier: MIT
License project under MPL2 This patch adds the file LICENSE which is the verbatim copy of the Mozilla Public License Version 2.0 as retreived from https://www.mozilla.org/media/MPL/2.0/index.815ca599c9df.txt on 2017-03-05. This patch also places license headers for the MPL2 type A variant of the license header in the following files: PBot/AntiFlood.pm PBot/BanTracker.pm PBot/BlackList.pm PBot/BotAdminCommands.pm PBot/BotAdmins.pm PBot/ChanOpCommands.pm PBot/ChanOps.pm PBot/Channels.pm PBot/Commands.pm PBot/DualIndexHashObject.pm PBot/EventDispatcher.pm PBot/FactoidCommands.pm PBot/FactoidModuleLauncher.pm PBot/Factoids.pm PBot/HashObject.pm PBot/IRCHandlers.pm PBot/IgnoreList.pm PBot/IgnoreListCommands.pm PBot/Interpreter.pm PBot/LagChecker.pm PBot/Logger.pm PBot/MessageHistory.pm PBot/MessageHistory_SQLite.pm PBot/NickList.pm PBot/PBot.pm PBot/Plugins.pm PBot/Plugins/AntiAway.pm PBot/Plugins/AntiKickAutoRejoin.pm PBot/Plugins/AntiRepeat.pm PBot/Plugins/AntiTwitter.pm PBot/Plugins/AutoRejoin.pm PBot/Plugins/Counter.pm PBot/Plugins/Quotegrabs.pm PBot/Plugins/Quotegrabs/Quotegrabs_Hashtable.pm PBot/Plugins/Quotegrabs/Quotegrabs_SQLite.pm PBot/Plugins/UrlTitles.pm PBot/Plugins/_Example.pm PBot/Refresher.pm PBot/Registerable.pm PBot/Registry.pm PBot/RegistryCommands.pm PBot/SQLiteLogger.pm PBot/SQLiteLoggerLayer.pm PBot/SelectHandler.pm PBot/StdinReader.pm PBot/Timer.pm PBot/Utils/ParseDate.pm PBot/VERSION.pm build/update-version.pl modules/acronym.pl modules/ago.pl modules/c11std.pl modules/c2english.pl modules/c2english/CGrammar.pm modules/c2english/c2eng.pl modules/c99std.pl modules/cdecl.pl modules/cfaq.pl modules/cjeopardy/IRCColors.pm modules/cjeopardy/QStatskeeper.pm modules/cjeopardy/Scorekeeper.pm modules/cjeopardy/cjeopardy.pl modules/cjeopardy/cjeopardy_answer.pl modules/cjeopardy/cjeopardy_filter.pl modules/cjeopardy/cjeopardy_hint.pl modules/cjeopardy/cjeopardy_qstats.pl modules/cjeopardy/cjeopardy_scores.pl modules/cjeopardy/cjeopardy_show.pl 
modules/codepad.pl modules/compiler_block.pl modules/compiler_client.pl modules/compiler_vm/Diff.pm modules/compiler_vm/cc modules/compiler_vm/compiler_client.pl modules/compiler_vm/compiler_server.pl modules/compiler_vm/compiler_server_vbox_win32.pl modules/compiler_vm/compiler_server_watchdog.pl modules/compiler_vm/compiler_vm_client.pl modules/compiler_vm/compiler_vm_server.pl modules/compiler_vm/compiler_watchdog.pl modules/compiler_vm/languages/_c_base.pm modules/compiler_vm/languages/_default.pm modules/compiler_vm/languages/bash.pm modules/compiler_vm/languages/bc.pm modules/compiler_vm/languages/bf.pm modules/compiler_vm/languages/c11.pm modules/compiler_vm/languages/c89.pm modules/compiler_vm/languages/c99.pm modules/compiler_vm/languages/clang.pm modules/compiler_vm/languages/clang11.pm modules/compiler_vm/languages/clang89.pm modules/compiler_vm/languages/clang99.pm modules/compiler_vm/languages/clangpp.pm modules/compiler_vm/languages/clisp.pm modules/compiler_vm/languages/cpp.pm modules/compiler_vm/languages/freebasic.pm modules/compiler_vm/languages/go.pm modules/compiler_vm/languages/haskell.pm modules/compiler_vm/languages/java.pm modules/compiler_vm/languages/javascript.pm modules/compiler_vm/languages/ksh.pm modules/compiler_vm/languages/lua.pm modules/compiler_vm/languages/perl.pm modules/compiler_vm/languages/python.pm modules/compiler_vm/languages/python3.pm modules/compiler_vm/languages/qbasic.pm modules/compiler_vm/languages/scheme.pm modules/compiler_vm/languages/server/_c_base.pm modules/compiler_vm/languages/server/_default.pm modules/compiler_vm/languages/server/c11.pm modules/compiler_vm/languages/server/c89.pm modules/compiler_vm/languages/server/c99.pm modules/compiler_vm/languages/server/clang.pm modules/compiler_vm/languages/server/clang11.pm modules/compiler_vm/languages/server/clang89.pm modules/compiler_vm/languages/server/clang99.pm modules/compiler_vm/languages/server/cpp.pm modules/compiler_vm/languages/server/freebasic.pm 
modules/compiler_vm/languages/server/haskell.pm modules/compiler_vm/languages/server/java.pm modules/compiler_vm/languages/server/qbasic.pm modules/compiler_vm/languages/server/tendra.pm modules/compiler_vm/languages/sh.pm modules/compiler_vm/languages/tendra.pm modules/compliment modules/cstd.pl modules/define.pl modules/dice_roll.pl modules/excuse.sh modules/expand_macros.pl modules/fnord.pl modules/funnyish_quote.pl modules/g.pl modules/gdefine.pl modules/gen_cfacts.pl modules/gencstd.pl modules/get_title.pl modules/getcfact.pl modules/google.pl modules/gspy.pl modules/gtop10.pl modules/gtop15.pl modules/headlines.pl modules/horoscope modules/horrorscope modules/ideone.pl modules/insult.pl modules/love_quote.pl modules/man.pl modules/map.pl modules/math.pl modules/prototype.pl modules/qalc.pl modules/random_quote.pl modules/seen.pl modules/urban modules/weather.pl modules/wikipedia.pl pbot.pl pbot.sh It is highly recommended that this list of files is reviewed to ensure that all files are the copyright of the sole maintainer of the repository. If any files with license headers contain the intellectual property of anyone else, it is recommended that a request is made to revise this patch or that the explicit permission of the co-author is gained to allow for the license of the work to be changed. I (Tomasz Kramkowski), the contributor, take no responsibility for any legal action taken against the maintainer of this repository for incorrectly claiming copyright to any work not owned by the maintainer of this repository.
2017-03-05 22:33:31 +01:00
use warnings;
2013-11-28 06:11:54 +01:00
use strict;
use feature "switch";
no if $] >= 5.018, warnings => 'experimental';
2013-11-28 06:11:54 +01:00
use IPC::Open2;
use Text::Balanced qw(extract_bracketed extract_delimited);
use IO::Socket;
use LWP::UserAgent;
# Diagnostic verbosity: 0 is silent; higher values enable more tracing
# (some traces below only appear at >= 1, >= 2 or >= 10).
my $debug = 0;

# True when the CC_LOCAL environment variable is set, whatever its value.
my $USE_LOCAL = defined $ENV{'CC_LOCAL'};

# $output is what finally gets printed; $nooutput is the fallback text used
# when preprocessing produced nothing.
my $output   = "";
my $nooutput = 'No output.';

# Without any arguments there is nothing to expand.
unless (@ARGV) {
    print "Usage: expand <code>\n";
    exit 0;
}

# All command-line arguments, joined by single spaces, form the C snippet.
my $code = join(' ', @ARGV);
my $lang = 'C89';
my $args = "";

if ($debug) {
    print " code: [$code]\n";
}
# replace \n outside of quotes with literal newline
#
# First pass over the snippet: a two-character "\n" sequence that appears
# outside of string and character literals becomes a real newline. Every
# other escape sequence is copied through unchanged, backslash included.
#
# This is a plain if/elsif state machine rather than the experimental
# given/when construct, so it does not depend on the "switch" feature or on
# silencing 'experimental' warnings.
my $new_code = "";

# Scanner states: outside any literal, inside "...", inside '...'.
use constant {
    NORMAL        => 0,
    DOUBLE_QUOTED => 1,
    SINGLE_QUOTED => 2,
};

my $state   = NORMAL;
my $escaped = 0;    # true when the previous character was an unescaped backslash

while ($code =~ m/(.)/gs) {
    my $ch = $1;

    # An unescaped backslash is held back: it only arms the escape flag and
    # is emitted (or dropped) once the following character is known.
    if ($ch eq '\\' and not $escaped) {
        $escaped = 1;
        next;
    }

    if ($ch eq '\\') {
        # Escaped backslash: no state change; written out as "\\" below.
    }
    elsif ($state == NORMAL) {
        if (not $escaped and $ch eq '"') {
            $state = DOUBLE_QUOTED;
        }
        elsif (not $escaped and $ch eq "'") {
            $state = SINGLE_QUOTED;
        }
        elsif ($escaped and $ch eq 'n') {
            # "\n" outside quotes: emit a real newline and swallow the
            # pending backslash.
            $ch      = "\n";
            $escaped = 0;
        }
    }
    elsif ($state == DOUBLE_QUOTED) {
        $state = NORMAL if $ch eq '"' and not $escaped;
    }
    elsif ($state == SINGLE_QUOTED) {
        $state = NORMAL if $ch eq "'" and not $escaped;
    }

    # Any escape that was not consumed above keeps its backslash.
    if ($escaped) {
        $new_code .= '\\';
        $escaped = 0;
    }

    $new_code .= $ch;
}

$code = $new_code;
print "code after \\n replacement: [$code]\n" if $debug;
# Second pass: walk the code one character at a time and insert line breaks
# after ';', '{', '}' and #include directives. Quote, parenthesis and
# preprocessor-line state is tracked so that nothing is inserted inside
# string/char literals, inside parentheses (for ';'), or on a '#' line.
my $single_quote = 0;
my $double_quote = 0;
my $parens       = 0;
my $cpp          = 0;    # preprocessor

$escaped = 0;

while ($code =~ m/(.)/msg) {
    my $ch  = $1;
    my $pos = pos $code;    # offset just past $ch

    print "adding newlines, ch = [$ch], parens: $parens, cpp: $cpp, single: $single_quote, double: $double_quote, escaped: $escaped, pos: $pos\n" if $debug >= 10;

    if ($ch eq '\\') { $escaped = not $escaped; }
    elsif ($ch eq '#' and not $cpp and not $escaped and not $single_quote and not $double_quote) {
        $cpp = 1;

        # NOTE(review): this search is not anchored at the '#', so it finds
        # the next "include <...>" anywhere later in the code and jumps the
        # scan position to it - confirm that this is intended.
        if ($code =~ m/include\s*[<"]([^>"]*)[>"]/msg) {
            # Put a newline right after the header name; the directive ends here.
            $pos = pos $code;
            substr($code, $pos, 0) = "\n";
            pos $code = $pos;
            $cpp = 0;
        } else {
            # A failed //g match resets pos; restore it to continue the scan.
            pos $code = $pos;
        }
    } elsif ($ch eq '"') {
        $double_quote = not $double_quote unless $escaped or $single_quote;
        $escaped = 0;
    } elsif ($ch eq '(' and not $single_quote and not $double_quote) {
        $parens++;
    } elsif ($ch eq ')' and not $single_quote and not $double_quote) {
        $parens--;
        $parens = 0 if $parens < 0;
    } elsif ($ch eq ';' and not $cpp and not $single_quote and not $double_quote and $parens == 0) {
        # End of statement: break the line unless one already follows.
        if (not substr($code, $pos, 1) =~ m/[\n\r]/) {
            substr($code, $pos, 0) = "\n";
            pos $code = $pos + 1;
        }
    } elsif ($ch eq "'") {
        $single_quote = not $single_quote unless $escaped or $double_quote;
        $escaped = 0;
    } elsif ($ch eq 'n' and $escaped) {
        if (not $single_quote and not $double_quote) {
            print "added newline\n" if $debug >= 10;

            # Replace the two characters "\n" with one real newline. The
            # string is now one character shorter, so the next unread
            # character sits at $pos - 1; resuming at $pos (as the code used
            # to) silently skipped the character following the "\n".
            substr($code, $pos - 2, 2) = "\n";
            pos $code = $pos - 1;
            $cpp = 0;
        }
        $escaped = 0;
    } elsif ($ch eq '{' and not $cpp and not $single_quote and not $double_quote) {
        if (not substr($code, $pos, 1) =~ m/[\n\r]/) {
            substr($code, $pos, 0) = "\n";
            pos $code = $pos + 1;
        }
    } elsif ($ch eq '}' and not $cpp and not $single_quote and not $double_quote) {
        # A '}' directly followed by ';' is left alone.
        if (not substr($code, $pos, 1) =~ m/[\n\r;]/) {
            substr($code, $pos, 0) = "\n";
            pos $code = $pos + 1;
        }
    } elsif ($ch eq "\n" and $cpp and not $single_quote and not $double_quote) {
        # A newline terminates the current preprocessor line.
        $cpp = 0;
    } else {
        $escaped = 0;
    }
}

print "code after \\n additions: [$code]\n" if $debug;
# Build the translation unit that is handed to the preprocessor:
#   - leading '#' lines of the snippet are moved into $prelude, after three
#     default #includes;
#   - anything that looks like a function definition is pulled out of the
#     snippet and collected in $code;
#   - whatever is left over ($precode) is wrapped in int main(void) { ... }
#     when no function named main was found, or placed before the extracted
#     functions otherwise.
# Include stripping is disabled; the debug line below is kept for tracing.
#$code =~ s/#include [<"'].*?['">]//gm;
print "code after include removal: [$code]\n" if $debug;
2013-11-28 06:11:54 +01:00
my $precode = $code;
$code = '';
print "--- precode: [$precode]\n" if $debug;
my $has_main = 0;
if ($lang eq 'C89' or $lang eq 'C99' or $lang eq 'C11' or $lang eq 'C++') {
my $prelude = "#include <stdio.h>\n#include <stddef.h>\n#include <stdlib.h>\n";
2020-02-15 23:38:32 +01:00
# Peel '#' lines off the front of $precode, one per iteration, and append
# them to the prelude.
while ($precode =~ s/^\s*(#.*\n{1,2})//g) { $prelude .= $1; }
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
print "*** prelude: [$prelude]\n precode: [$precode]\n" if $debug;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# $preprecode is a scratch copy used only for locating functions; offsets
# found in it are applied to $precode further down.
my $preprecode = $precode;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# white-out contents of quoted literals
# (each literal's contents are replaced by the same number of '-' characters,
# so the length of the string is unchanged)
$preprecode =~ s/(?:\"((?:\\\"|(?!\").)*)\")/'"' . ('-' x length $1) . '"'/ge;
$preprecode =~ s/(?:\'((?:\\\'|(?!\').)*)\')/"'" . ('-' x length $1) . "'"/ge;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# strip C and C++ style comments
# The two substitutions run in opposite order depending on the language.
# NOTE(review): the '//' pattern starts with '|', i.e. an empty first
# alternative, so it looks like it can only ever match the empty string and
# leaves '//' comments in place - confirm.
# NOTE(review): a '/* ... */' comment is replaced by a single space, which
# changes the length of $preprecode relative to $precode - confirm that the
# offsets computed below still line up when comments are present.
if ($lang eq 'C89' or $args =~ m/-std=(gnu89|c89)/i) {
$preprecode =~ s#/\*[^*]*\*+([^/*][^*]*\*+)*/# #gs;
$preprecode =~ s#|//([^\\]|[^\n][\n]?)*?\n|("(\\.|[^"\\])*"|'(\\.|[^'\\])*'|.[^/"'\\]*)#defined $2 ? $2 : ""#gse;
} else {
$preprecode =~ s#|//([^\\]|[^\n][\n]?)*?\n|("(\\.|[^"\\])*"|'(\\.|[^'\\])*'|.[^/"'\\]*)#defined $2 ? $2 : ""#gse;
$preprecode =~ s#/\*[^*]*\*+([^/*][^*]*\*+)*/# #gs;
}
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
print "preprecode: [$preprecode]\n" if $debug;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
print "looking for functions, has main: $has_main\n" if $debug >= 2;
2013-11-28 06:11:54 +01:00
# Captures: (1) return type, (2) identifier, (3) parameter list, (4) the rest
# of the text starting at the opening brace, which may be spelled '{', '<%'
# or '??<'.
my $func_regex = qr/^([ *\w]+)\s+([*\w]+)\s*\(([^;{]*)\s*\)\s*(\{.*|<%.*|\?\?<.*)/ims;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# look for potential functions to extract
while ($preprecode =~ /$func_regex/ms) {
my ($pre_ret, $pre_ident, $pre_params, $pre_potential_body) = ($1, $2, $3, $4);
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
print "looking for functions, found [$pre_ret][$pre_ident][$pre_params][$pre_potential_body], has main: $has_main\n" if $debug >= 1;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# find the pos at which this function lives, for extracting from precode
# NOTE(review): the result of this match is not checked; if it failed, pos
# and $1 would not describe this function.
$preprecode =~ m/(\Q$pre_ret\E\s+\Q$pre_ident\E\s*\(\s*\Q$pre_params\E\s*\)\s*\Q$pre_potential_body\E)/g;
my $extract_pos = (pos $preprecode) - (length $1);
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# now that we have the pos, substitute out the extracted potential function from preprecode
$preprecode =~ s/$func_regex//ms;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# create tmpcode object that starts from extract pos, to skip any quoted code
my $tmpcode = substr($precode, $extract_pos);
print "tmpcode: [$tmpcode]\n" if $debug;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# Keep only the text before the candidate function in $precode.
$precode = substr($precode, 0, $extract_pos);
print "precode: [$precode]\n" if $debug;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# Re-run the function pattern on the real (not whited-out) text.
$tmpcode =~ m/$func_regex/ms;
my ($ret, $ident, $params, $potential_body) = ($1, $2, $3, $4);
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
print "1st extract: [$ret][$ident][$params][$potential_body]\n" if $debug;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
$ret =~ s/^\s+//;
$ret =~ s/\s+$//;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# A missing return type, or a control-flow keyword in the return-type or
# identifier slot, means this is a statement and not a function definition:
# put the text back into $precode and look for the next candidate.
if (not length $ret or $ret eq "else" or $ret eq "while" or $ret eq "if" or $ret eq "for" or $ident eq "for" or $ident eq "while" or $ident eq "if") {
$precode .= "$ret $ident ($params) $potential_body";
next;
} else {
$tmpcode =~ s/$func_regex//ms;
}
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# Normalise the alternative brace spellings '<%' '%>' and '??<' '??>' at the
# ends of the body to plain '{' and '}'.
$potential_body =~ s/^\s*<%/{/ms;
$potential_body =~ s/%>\s*$/}/ms;
$potential_body =~ s/^\s*\?\?</{/ms;
$potential_body =~ s/\?\?>$/}/ms;
# $extract[0] is the balanced {...} block taken from the front of the text
# (undefined when the braces do not balance); $extract[1] is what follows it.
my @extract = extract_bracketed($potential_body, '{}');
my $body;
if (not defined $extract[0]) {
if ($debug == 0) { print "error: unmatched brackets\n"; }
else {
print "error: unmatched brackets for function '$ident';\n";
print "body: [$potential_body]\n";
}
exit;
2013-11-28 06:11:54 +01:00
} else {
2020-02-15 23:38:32 +01:00
$body = $extract[0];
# The text after the function body goes back into both working copies so
# that later iterations can examine it.
$preprecode .= $extract[1];
$precode .= $extract[1];
2013-11-28 06:11:54 +01:00
}
2020-02-15 23:38:32 +01:00
print "final extract: [$ret][$ident][$params][$body]\n" if $debug;
$code .= "$ret $ident($params) $body\n\n";
$has_main = 1 if $ident eq 'main';
}
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
$precode =~ s/^\s+//;
$precode =~ s/\s+$//;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
# If the leftover code is entirely wrapped in one pair of braces, drop them.
$precode =~ s/^{(.*)}$/$1/s;
2013-11-28 06:11:54 +01:00
2020-02-15 23:38:32 +01:00
if (not $has_main) {
# No main() supplied: the leftover statements become the body of main.
$code = "$prelude\n$code" . "int main(void) {\n$precode\n}\n";
$nooutput = "No warnings, errors or output.";
} else {
print "code: [$code]; precode: [$precode]\n" if $debug;
# main() supplied: leftover code goes before the extracted functions.
$code = "$prelude\n$precode\n\n$code\n";
$nooutput = "No warnings, errors or output.";
}
2013-11-28 06:11:54 +01:00
} else {
2020-02-15 23:38:32 +01:00
# Languages outside the C family are passed through unchanged.
$code = $precode;
2013-11-28 06:11:54 +01:00
}
print "after func extract, code: [$code]\n" if $debug;
# Final tidy-up of the generated source before it is written out.
$code =~ s/\|n/\n/g;                  # every "|n" becomes a newline
$code =~ s/^\s+//;                    # trim leading whitespace
$code =~ s/\s+$//;                    # trim trailing whitespace
$code =~ s/(\{|})\n\s*;\n/$1\n/gs;    # drop a lone ';' line that directly follows a brace
$code =~ s/(?:\n\n)+/\n\n/g;          # squeeze repeated pairs of newlines down to one pair
print "final code: [$code]\n" if $debug;

# Write the source for gcc. Three-argument open keeps the mode separate from
# the file name, and print/close are checked because buffered write errors
# (for example a full disk) only surface there; an unnoticed failure would
# hand gcc a truncated file.
open my $fh, '>', 'prog.c' or die "Couldn't write prog.c: $!";
print {$fh} $code or die "Couldn't write prog.c: $!";
close $fh or die "Couldn't write prog.c: $!";
# Run only the preprocessor (gcc -E) on prog.c, limited to 1 second of CPU
# time by ulimit and to 2 seconds by execute()'s timeout argument.
my ($ret, $result) = execute(2, "bash -c \"ulimit -t 1; gcc -E -ftrack-macro-expansion=0 prog.c\"");

# Reduce the preprocessor output to the expanded snippet on a single line.
for ($result) {
    s/.*# \d+ "prog.c"(\s+\d+)*//ms;    # discard everything up to the last prog.c line marker
    s/^#.*$//gm;                        # discard remaining '#' lines
    s/[\n\r]/ /gm;                      # line breaks become spaces
    s/\s+/ /gm;                         # collapse whitespace runs
}

if ($debug) {
    print "result: [$result]\n";
}

# When main() was generated by this script, strip that wrapper again.
unless ($has_main) {
    $result =~ s/\s*int main\(void\) \{//;
    $result =~ s/\s*\}\s*$//;
}

if (length $result) {
    $output = $result;
}
else {
    $output = $nooutput;
}

print "$output\n";
2013-11-28 06:11:54 +01:00
# execute($timeout, $cmdline)
#
# Runs $cmdline through the shell with stderr merged into stdout, collecting
# everything it prints, and gives up after $timeout seconds.
#
# Returns a two-element list ($ret, $result):
#   - normal completion: $ret is the command's exit status ($? >> 8) and
#     $result is its output;
#   - timeout: $ret is -1 and $result is the output read so far followed by
#     " [Timed-out]\n";
#   - the command could not be started, or any other error was raised while
#     reading: $ret is -1 and $result is the error message.
sub execute {
    my ($timeout, $cmdline) = @_;

    my ($ret, $result) = eval {
        print "eval\n" if $debug;

        my $captured = '';

        # A piped open returns the child's pid, or undef if it could not be
        # started; without this check the handler below would signal an
        # undefined pid and the read loop would run on an unopened handle.
        my $pid = open(my $fh, '-|', "$cmdline 2>&1")
          or die "Couldn't execute command: $!\n";

        local $SIG{ALRM} = sub {
            print "Time out\n" if $debug;
            kill 'TERM', $pid;
            die "$captured [Timed-out]\n";
        };
        alarm($timeout);

        while (my $line = <$fh>) { $captured .= $line; }

        # close waits for the child and sets $?.
        close $fh;
        my $status = $? >> 8;
        alarm 0;

        # This returns from the eval block, not from execute().
        return ($status, $captured);
    };

    # Capture $@ immediately, before anything else can overwrite it.
    my $error = $@;

    print "done eval\n" if $debug;
    alarm 0;    # make sure no alarm is left pending after a die

    # Timeouts and every other failure are reported the same way, so the
    # caller never receives undefined values.
    if ($error) { return (-1, $error); }

    print "[$ret, $result]\n" if $debug;
    return ($ret, $result);
}