mirror of
https://github.com/pragma-/pbot.git
synced 2025-01-21 01:24:42 +01:00
121 lines
2.8 KiB
Perl
121 lines
2.8 KiB
Perl
|
#!/usr/bin/env perl
|
||
|
|
||
|
package SplitLine;
|
||
|
|
||
|
use 5.020;
|
||
|
|
||
|
use warnings;
|
||
|
use strict;
|
||
|
|
||
|
use feature 'signatures';
|
||
|
no warnings 'experimental::signatures';
|
||
|
|
||
|
use parent qw(Exporter);
|
||
|
our @EXPORT = qw(split_line);
|
||
|
|
||
|
# Splits $line into a list of arguments separated by unquoted, unescaped
# spaces. Only the space character separates arguments; tabs and other
# whitespace are ordinary characters.
#
# Text inside matching single or double quotes stays within one argument.
# An unbalanced quote (no matching closing quote before the end of the line)
# is not treated as a quote: it becomes an ordinary character of the argument
# it was found within.
#
# A backslash escapes the character that follows it, so an escaped space does
# not separate arguments and an escaped quote does not open or close a quoted
# span. A backslash that is the last character of the line has nothing to
# escape and is dropped.
#
# Options (key => value pairs following $line):
#   strip_quotes     => 0   when true, balanced quote characters are left out
#                           of the returned arguments.
#   keep_spaces      => 0   when true, only the first space of a run ends the
#                           current argument; the remaining spaces are kept
#                           and start the next argument.
#   preserve_escapes => 1   when true, an escape is returned as backslash plus
#                           character; when false, only the character is kept.
#
# Returns the list of arguments; empty for an empty or undefined $line.
sub split_line ($line, %opts) {
    my %default_opts = (
        strip_quotes     => 0,
        keep_spaces      => 0,
        preserve_escapes => 1,
    );

    # caller-supplied options override the defaults
    %opts = (%default_opts, %opts);

    # an undefined line is treated as empty rather than warning inside split
    my @chars = split //, $line // '';

    my @args;
    my $escaped      = 0;    # previous character was an unescaped backslash
    my $quote;               # the currently open quote character, if any
    my $token        = '';   # the argument being accumulated
    my $last_token   = '';   # $token as it was just before the open quote
    my $i            = 0;    # index of the next character to read
    my $pos          = 0;    # index of the currently open quote character
    my $ignore_quote = 0;    # next quote character is literal (set on rewind)
    my $spaces       = 0;    # length of the current run of separator spaces

    while (1) {
        if ($i >= @chars) {
            if (defined $quote) {
                # reached end, but unbalanced quote... reset to beginning of
                # quote and rescan with that quote taken literally
                $i            = $pos;
                $ignore_quote = 1;
                $quote        = undef;
                $token        = $last_token;

                # a trailing backslash must not leak across the rewind;
                # otherwise the quote character itself would be consumed as
                # an escaped character and $ignore_quote would never be used
                $escaped = 0;
            } else {
                # add final token and exit
                push @args, $token if length $token;
                last;
            }
        }

        my $ch = $chars[$i++];

        $spaces = 0 if $ch ne ' ';

        if ($escaped) {
            # character following a backslash is always taken literally
            $token .= $opts{preserve_escapes} ? "\\$ch" : $ch;
            $escaped = 0;
            next;
        }

        if ($ch eq '\\') {
            $escaped = 1;
            next;
        }

        if (defined $quote) {
            if ($ch eq $quote) {
                # closing quote
                $token .= $ch unless $opts{strip_quotes};
                $quote = undef;
            } else {
                # still within quoted argument
                $token .= $ch;
            }
            next;
        }

        if ($ch eq "'" or $ch eq '"') {
            if ($ignore_quote) {
                # treat unbalanced quote as part of this argument
                $token .= $ch;
                $ignore_quote = 0;
            } else {
                # begin potential quoted argument; remember where it started
                # and what the token looked like in case it never closes
                $pos        = $i - 1;
                $quote      = $ch;
                $last_token = $token;
                $token .= $ch unless $opts{strip_quotes};
            }
            next;
        }

        if ($ch eq ' ') {
            if (++$spaces > 1 and $opts{keep_spaces}) {
                # second and later spaces of a run are kept verbatim
                $token .= $ch;
            } else {
                # separator: finish the current argument
                push @args, $token if length $token;
                $token = '';
            }
            next;
        }

        $token .= $ch;
    }

    return @args;
}
|
||
|
|
||
|
1;
|