3
0
mirror of https://github.com/pragma-/pbot.git synced 2025-01-25 19:44:26 +01:00
pbot/lib/PBot/Core/Storage/HashObject.pm

282 lines
8.8 KiB
Perl
Raw Normal View History

# File: HashObject.pm
#
2019-06-26 18:34:19 +02:00
# Purpose: Provides a hash-table object with an abstracted API that includes
# setting and deleting values, saving to and loading from files, etc. Provides
# case-insensitive access to the index key while preserving original case when
# displaying index key.
#
# Data is stored in working memory for lightning fast performance. If a filename
2021-07-24 04:22:25 +02:00
# is provided, data is written to the file after any modifications.
2023-02-21 06:31:52 +01:00
# SPDX-FileCopyrightText: 2010-2023 Pragmatic Software <pragma78@gmail.com>
2021-07-11 00:00:22 +02:00
# SPDX-License-Identifier: MIT
License project under MPL2 This patch adds the file LICENSE which is the verbatim copy of the Mozilla Public License Version 2.0 as retreived from https://www.mozilla.org/media/MPL/2.0/index.815ca599c9df.txt on 2017-03-05. This patch also places license headers for the MPL2 type A variant of the license header in the following files: PBot/AntiFlood.pm PBot/BanTracker.pm PBot/BlackList.pm PBot/BotAdminCommands.pm PBot/BotAdmins.pm PBot/ChanOpCommands.pm PBot/ChanOps.pm PBot/Channels.pm PBot/Commands.pm PBot/DualIndexHashObject.pm PBot/EventDispatcher.pm PBot/FactoidCommands.pm PBot/FactoidModuleLauncher.pm PBot/Factoids.pm PBot/HashObject.pm PBot/IRCHandlers.pm PBot/IgnoreList.pm PBot/IgnoreListCommands.pm PBot/Interpreter.pm PBot/LagChecker.pm PBot/Logger.pm PBot/MessageHistory.pm PBot/MessageHistory_SQLite.pm PBot/NickList.pm PBot/PBot.pm PBot/Plugins.pm PBot/Plugins/AntiAway.pm PBot/Plugins/AntiKickAutoRejoin.pm PBot/Plugins/AntiRepeat.pm PBot/Plugins/AntiTwitter.pm PBot/Plugins/AutoRejoin.pm PBot/Plugins/Counter.pm PBot/Plugins/Quotegrabs.pm PBot/Plugins/Quotegrabs/Quotegrabs_Hashtable.pm PBot/Plugins/Quotegrabs/Quotegrabs_SQLite.pm PBot/Plugins/UrlTitles.pm PBot/Plugins/_Example.pm PBot/Refresher.pm PBot/Registerable.pm PBot/Registry.pm PBot/RegistryCommands.pm PBot/SQLiteLogger.pm PBot/SQLiteLoggerLayer.pm PBot/SelectHandler.pm PBot/StdinReader.pm PBot/Timer.pm PBot/Utils/ParseDate.pm PBot/VERSION.pm build/update-version.pl modules/acronym.pl modules/ago.pl modules/c11std.pl modules/c2english.pl modules/c2english/CGrammar.pm modules/c2english/c2eng.pl modules/c99std.pl modules/cdecl.pl modules/cfaq.pl modules/cjeopardy/IRCColors.pm modules/cjeopardy/QStatskeeper.pm modules/cjeopardy/Scorekeeper.pm modules/cjeopardy/cjeopardy.pl modules/cjeopardy/cjeopardy_answer.pl modules/cjeopardy/cjeopardy_filter.pl modules/cjeopardy/cjeopardy_hint.pl modules/cjeopardy/cjeopardy_qstats.pl modules/cjeopardy/cjeopardy_scores.pl modules/cjeopardy/cjeopardy_show.pl 
modules/codepad.pl modules/compiler_block.pl modules/compiler_client.pl modules/compiler_vm/Diff.pm modules/compiler_vm/cc modules/compiler_vm/compiler_client.pl modules/compiler_vm/compiler_server.pl modules/compiler_vm/compiler_server_vbox_win32.pl modules/compiler_vm/compiler_server_watchdog.pl modules/compiler_vm/compiler_vm_client.pl modules/compiler_vm/compiler_vm_server.pl modules/compiler_vm/compiler_watchdog.pl modules/compiler_vm/languages/_c_base.pm modules/compiler_vm/languages/_default.pm modules/compiler_vm/languages/bash.pm modules/compiler_vm/languages/bc.pm modules/compiler_vm/languages/bf.pm modules/compiler_vm/languages/c11.pm modules/compiler_vm/languages/c89.pm modules/compiler_vm/languages/c99.pm modules/compiler_vm/languages/clang.pm modules/compiler_vm/languages/clang11.pm modules/compiler_vm/languages/clang89.pm modules/compiler_vm/languages/clang99.pm modules/compiler_vm/languages/clangpp.pm modules/compiler_vm/languages/clisp.pm modules/compiler_vm/languages/cpp.pm modules/compiler_vm/languages/freebasic.pm modules/compiler_vm/languages/go.pm modules/compiler_vm/languages/haskell.pm modules/compiler_vm/languages/java.pm modules/compiler_vm/languages/javascript.pm modules/compiler_vm/languages/ksh.pm modules/compiler_vm/languages/lua.pm modules/compiler_vm/languages/perl.pm modules/compiler_vm/languages/python.pm modules/compiler_vm/languages/python3.pm modules/compiler_vm/languages/qbasic.pm modules/compiler_vm/languages/scheme.pm modules/compiler_vm/languages/server/_c_base.pm modules/compiler_vm/languages/server/_default.pm modules/compiler_vm/languages/server/c11.pm modules/compiler_vm/languages/server/c89.pm modules/compiler_vm/languages/server/c99.pm modules/compiler_vm/languages/server/clang.pm modules/compiler_vm/languages/server/clang11.pm modules/compiler_vm/languages/server/clang89.pm modules/compiler_vm/languages/server/clang99.pm modules/compiler_vm/languages/server/cpp.pm modules/compiler_vm/languages/server/freebasic.pm 
modules/compiler_vm/languages/server/haskell.pm modules/compiler_vm/languages/server/java.pm modules/compiler_vm/languages/server/qbasic.pm modules/compiler_vm/languages/server/tendra.pm modules/compiler_vm/languages/sh.pm modules/compiler_vm/languages/tendra.pm modules/compliment modules/cstd.pl modules/define.pl modules/dice_roll.pl modules/excuse.sh modules/expand_macros.pl modules/fnord.pl modules/funnyish_quote.pl modules/g.pl modules/gdefine.pl modules/gen_cfacts.pl modules/gencstd.pl modules/get_title.pl modules/getcfact.pl modules/google.pl modules/gspy.pl modules/gtop10.pl modules/gtop15.pl modules/headlines.pl modules/horoscope modules/horrorscope modules/ideone.pl modules/insult.pl modules/love_quote.pl modules/man.pl modules/map.pl modules/math.pl modules/prototype.pl modules/qalc.pl modules/random_quote.pl modules/seen.pl modules/urban modules/weather.pl modules/wikipedia.pl pbot.pl pbot.sh It is highly recommended that this list of files is reviewed to ensure that all files are the copyright of the sole maintainer of the repository. If any files with license headers contain the intellectual property of anyone else, it is recommended that a request is made to revise this patch or that the explicit permission of the co-author is gained to allow for the license of the work to be changed. I (Tomasz Kramkowski), the contributor, take no responsibility for any legal action taken against the maintainer of this repository for incorrectly claiming copyright to any work not owned by the maintainer of this repository.
2017-03-05 22:33:31 +01:00
2021-07-24 04:22:25 +02:00
package PBot::Core::Storage::HashObject;
2021-06-19 06:23:34 +02:00
use PBot::Imports;
2019-07-11 03:40:53 +02:00
use Text::Levenshtein::XS qw(distance);
use JSON;
# Constructs a new HashObject.
#
# Named arguments:
#   pbot - required; stored in $self->{pbot}
#   all remaining arguments are forwarded unchanged to initialize()
#
# Croaks when no `pbot` argument is supplied.
sub new($class, %args) {
    my $self = bless {}, $class;

    if (not exists $args{pbot}) {
        Carp::croak("Missing pbot reference to " . __FILE__);
    }

    # take pbot out of %args so initialize() only sees the remaining options
    $self->{pbot} = delete $args{pbot};

    $self->initialize(%args);

    return $self;
}
# Sets up the object's fields from %conf.
#
# Recognized keys:
#   name     - label used in messages; a default label is used when undefined
#   filename - file used by load() and save(); may be undefined
#
# The internal hash always starts out empty. A warning is emitted (via
# Carp::carp) when no filename is given.
sub initialize($self, %conf) {
    my $name = defined $conf{name} ? $conf{name} : 'unnammed';

    $self->{name}     = $name;
    $self->{hash}     = {};
    $self->{filename} = $conf{filename};

    if (!defined $self->{filename}) {
        Carp::carp("Missing filename for $self->{name} HashObject, will not be able to save to or load from file.");
    }
}
# Loads JSON from a file into the in-memory hash, replacing its contents.
#
# Parameters:
#   $filename - optional; defaults to $self->{filename}
#
# Entries whose index contains uppercase characters and that have no `_name`
# field (e.g., added by hand-editing the file) are re-keyed under the
# lowercased index, with the original spelling kept in `_name`.
#
# Nothing is thrown to the caller: a missing filename produces a Carp warning,
# and open/parse/normalization failures are reported through the pbot logger.
# On any such failure the current in-memory hash is left untouched.
sub load($self, $filename = undef) {
    # allow overriding $self->{filename} with $filename parameter
    $filename //= $self->{filename};

    # no filename? nothing to load
    if (not defined $filename) {
        Carp::carp "No $self->{name} filename specified -- skipping loading from file";
        return;
    }

    $self->{pbot}->{logger}->log("Loading $self->{name} from $filename\n");

    # three-argument open with a lexical handle: the filename is taken
    # literally, never parsed for mode characters, pipes or whitespace
    my $fh;
    if (not open($fh, '<', $filename)) {
        $self->{pbot}->{logger}->log("Skipping loading from file: Couldn't open $filename: $!\n");
        return;
    }

    # slurp file into $contents
    my $contents = do {
        local $/;
        <$fh>;
    };

    close $fh;

    eval {
        # first try to decode json, throws exception on misparse/errors
        my $newhash = decode_json $contents;

        # normalize the freshly decoded data *before* touching $self->{hash},
        # so a failure part-way through cannot leave a half-updated store.
        #
        # update existing entries to use _name to preserve typographical casing
        # e.g., when someone edits a config file by hand, they might add an
        # entry with uppercase characters in its name.
        foreach my $index (keys %{$newhash}) {
            next if exists $newhash->{$index}->{_name};

            my $lc_index = lc $index;
            next if $index eq $lc_index;

            if (exists $newhash->{$lc_index}) {
                Carp::croak "Cannot update $self->{name} object $index; duplicate object found";
            }

            my $data = delete $newhash->{$index};
            $data->{_name} = $index;          # _name is original typographical case
            $newhash->{$lc_index} = $data;    # index key is lowercased
        }

        # decode and normalization succeeded: replace the current hash
        $self->clear;
        $self->{hash} = $newhash;
    };

    if ($@) {
        # json parse error or such
        $self->{pbot}->{logger}->log("Warning: failed to load $filename: $@\n");
    }
}
# Writes the in-memory hash to a file as pretty-printed, canonical
# (key-sorted), UTF-8 encoded JSON.
#
# Parameters:
#   $filename - optional; defaults to $self->{filename}
#
# Before encoding, the `$metadata$` entry is given an `update_version` (if it
# has none) and its `name` field is refreshed from $self->{name}.
#
# Emits a Carp warning and returns when no filename is available.
# Dies when the file cannot be opened, written, or closed.
sub save($self, $filename = undef) {
    # allow parameter overriding internal field
    $filename //= $self->{filename};

    # no filename? nothing to save
    if (not defined $filename) {
        Carp::carp "No $self->{name} filename specified -- skipping saving to file.\n";
        return;
    }

    $self->{pbot}->{logger}->log("Saving $self->{name} to $filename\n");

    # add update_version to metadata
    if (not $self->get_data('$metadata$', 'update_version')) {
        # pass $dont_save: add() saves by default, which would re-enter save()
        # and write $self->{filename} even when $filename was overridden
        $self->add('$metadata$', { update_version => PBot::VERSION::BUILD_REVISION }, 1);
    }

    # ensure `name` metadata is current
    $self->set('$metadata$', 'name', $self->{name}, 1);

    # encode hash as JSON
    my $json      = JSON->new;
    my $json_text = $json->pretty->canonical->utf8->encode($self->{hash});

    # print JSON to file; three-argument open takes the filename literally
    open(my $fh, '>', $filename) or die "Couldn't open $filename: $!\n";
    print {$fh} "$json_text\n" or die "Couldn't write to $filename: $!\n";

    # buffered write errors only surface at close, so check it too
    close($fh) or die "Couldn't close $filename: $!\n";
}
# Discards every entry by replacing the internal hash with a new empty one.
# Nothing is written to file.
sub clear($self) {
    return $self->{hash} = {};
}
# Returns a human-readable list of index keys that are similar to $keyword.
#
# Parameters:
#   $keyword - the name to look for; compared case-insensitively
#
# A key counts as similar when distance() returns a defined value and that
# value is less than half the length of the longer of the two strings.
#
# Returns 'none' when nothing is similar; otherwise the matching (lowercased)
# keys in sorted order, formatted as "a", "a or b", "a, b or c", ...
sub levenshtein_matches($self, $keyword) {
    # index keys are stored lowercased, so compare against a lowercased
    # keyword; otherwise mixed-case input inflates every distance
    my $lc_keyword = lc $keyword;

    my @matches;

    foreach my $index (sort keys %{$self->{hash}}) {
        my $distance = distance($lc_keyword, $index, 20);

        # distance() gave no result for this pair; skip it
        next if not defined $distance;

        my $length_a = length $lc_keyword;
        my $length_b = length $index;
        my $length   = $length_a > $length_b ? $length_a : $length_b;

        if ($length != 0 && $distance / $length < 0.50) {
            push @matches, $index;
        }
    }

    return 'none' if not @matches;

    my $result = join ', ', @matches;

    # "a, b, c, d" -> "a, b, c or d"
    $result =~ s/(.*), /$1 or /;

    return $result;
}
# Shows or updates the data stored under an index. Always returns a message
# string describing the outcome.
#
# Parameters:
#   $index     - entry to operate on (case-insensitive)
#   $key       - optional; when omitted, all keys and values of the entry are listed
#   $value     - optional; when omitted, the key's current value is reported
#   $dont_save - optional; when true, a changed value is not written to file
#
# When the index does not exist, the message lists similarly named entries.
sub set($self, $index, $key = undef, $value = undef, $dont_save = 0) {
    my $lc_index = lc $index;

    # unknown index: report it together with similarly named keys
    unless (exists $self->{hash}->{$lc_index}) {
        return "$self->{name}: $index not found; similar matches: " . $self->levenshtein_matches($index);
    }

    # no key provided: list every key and value except the internal _name
    if (not defined $key) {
        my $header = "[$self->{name}] " . $self->get_key_name($lc_index) . " keys: ";

        my @entries =
            map  { "$_: $self->{hash}->{$lc_index}->{$_}" }
            sort
            grep { $_ ne '_name' }
            keys %{$self->{hash}->{$lc_index}};

        return $header . (@entries ? join(";\n", @entries) : 'none');
    }

    if (defined $value) {
        # a value was provided: store it under the key
        $self->{hash}->{$lc_index}->{$key} = $value;
        $self->save unless $dont_save;
    }
    else {
        # no value provided: look up the key's current value to report it
        $value = $self->{hash}->{$lc_index}->{$key};
    }

    my $prefix = "[$self->{name}] " . $self->get_key_name($lc_index) . ": $key ";
    my $status = defined $value ? "set to $value" : "is not set.";

    return $prefix . $status;
}
# Removes a single key from the data stored under an index and saves.
# Always returns a message string describing the outcome.
#
# Parameters:
#   $index - entry to operate on (case-insensitive)
#   $key   - the key to remove from that entry
#
# When the index does not exist, the message lists similarly named entries.
# save() is only called when a key was actually removed.
sub unset($self, $index, $key = undef) {
    my $lc_index = lc $index;

    if (not exists $self->{hash}->{$lc_index}) {
        my $result = "$self->{name}: $index not found; similar matches: ";
        $result .= $self->levenshtein_matches($index);
        return $result;
    }

    my $name = $self->get_key_name($lc_index);

    # the signature allows omitting $key; don't let undef reach the hash lookup
    if (not defined $key) {
        return "[$self->{name}] $name: no key specified.";
    }

    # test with exists rather than the deleted value's definedness, so that a
    # key holding undef (e.g., JSON null) is still reported and saved as unset
    if (exists $self->{hash}->{$lc_index}->{$key}) {
        delete $self->{hash}->{$lc_index}->{$key};
        $self->save;
        return "[$self->{name}] $name: $key unset.";
    }

    return "[$self->{name}] $name: $key does not exist.";
}
# Tests for the presence of an entry, or of a key within an entry.
#
# Parameters:
#   $index      - entry to look for (case-insensitive)
#   $data_index - optional; when given, tests for this key inside the entry
#
# Returns true/false. This is a pure query: the store is never modified.
sub exists($self, $index, $data_index = undef) {
    my $lc_index = lc $index;

    return exists $self->{hash}->{$lc_index} if not defined $data_index;

    # check the entry first: a bare nested exists would autovivify an empty
    # entry for an unknown index, which would then show up as existing
    return exists $self->{hash}->{$lc_index}
        && exists $self->{hash}->{$lc_index}->{$data_index};
}
# Returns the display name for an index: the entry's `_name` field (its
# original typographical case) when the entry exists and has one, otherwise
# the lowercased index.
sub get_key_name($self, $index) {
    my $lc_index = lc $index;

    my $has_entry = exists $self->{hash}->{$lc_index};

    if ($has_entry && exists $self->{hash}->{$lc_index}->{_name}) {
        return $self->{hash}->{$lc_index}->{_name};
    }

    return $lc_index;
}
# Lists keys.
#
# Parameters:
#   $index - optional (case-insensitive)
#
# Without $index: returns all index keys except the `$metadata$` entry.
# With $index: returns the keys of that entry except `_name`; an unknown
# index yields an empty list. The store is never modified.
sub get_keys($self, $index = undef) {
    return grep { $_ ne '$metadata$' } keys %{$self->{hash}} if not defined $index;

    my $lc_index = lc $index;

    # keys() on a missing nested element would autovivify an empty entry;
    # substitute a throwaway hash for unknown indexes instead
    my $entry = exists $self->{hash}->{$lc_index} ? $self->{hash}->{$lc_index} : {};

    return grep { $_ ne '_name' } keys %{$entry};
}
# Fetches stored data.
#
# Parameters:
#   $index      - entry to fetch (case-insensitive)
#   $data_index - optional; when given, fetch only this key of the entry
#
# Returns undef when the index does not exist; otherwise the entry itself
# (the stored reference, not a copy) or the value of the requested key.
sub get_data($self, $index, $data_index = undef) {
    my $lc_index = lc $index;

    unless (exists $self->{hash}->{$lc_index}) {
        return undef;
    }

    return defined $data_index
        ? $self->{hash}->{$lc_index}->{$data_index}
        : $self->{hash}->{$lc_index};
}
# Stores $data under $index, replacing any entry already stored there.
#
# Parameters:
#   $index     - name of the entry; stored under its lowercased form
#   $data      - hash reference to store (stored as-is, not copied)
#   $dont_save - optional; when true, the change is not written to file
#
# When $index contains uppercase characters, its original spelling is
# recorded in $data->{_name}. Returns a confirmation message.
sub add($self, $index, $data, $dont_save = 0) {
    my $lc_index = lc $index;

    # preserve case of index
    $data->{_name} = $index unless $index eq $lc_index;

    $self->{hash}->{$lc_index} = $data;

    if (not $dont_save) {
        $self->save;
    }

    return "$index added to $self->{name}.";
}
# Removes an entry, or a single key from an entry. Always returns a message
# string describing the outcome.
#
# Parameters:
#   $index      - entry to operate on (case-insensitive)
#   $data_index - optional; when given, only this key is removed from the entry
#   $dont_save  - optional; when true, the change is not written to file
#
# When removing a key leaves the entry with nothing but its `_name` field,
# the entry itself is removed as well. When the index does not exist, the
# message lists similarly named entries.
sub remove($self, $index, $data_index = undef, $dont_save = 0) {
    my $lc_index = lc $index;

    if (not exists $self->{hash}->{$lc_index}) {
        my $result = "$self->{name}: $index not found; similar matches: ";
        $result .= $self->levenshtein_matches($lc_index);
        return $result;
    }

    # look up the display name now; the entry may be gone by the time the
    # message is built
    my $name = $self->get_key_name($lc_index);

    if (defined $data_index) {
        # test with exists so that a key holding undef can still be removed
        if (not exists $self->{hash}->{$lc_index}->{$data_index}) {
            return "$self->{name}: $name.$data_index does not exist.";
        }

        delete $self->{hash}->{$lc_index}->{$data_index};

        # drop the entry only when no real data is left. Counting keys is not
        # enough: all-lowercase entries have no _name, so a single remaining
        # key may be real data.
        my @remaining = grep { $_ ne '_name' } keys %{$self->{hash}->{$lc_index}};
        delete $self->{hash}->{$lc_index} if not @remaining;

        $self->save unless $dont_save;
        return "$name.$data_index removed from $self->{name}";
    }

    # no key given: remove the whole entry (known to exist at this point)
    delete $self->{hash}->{$lc_index};
    $self->save unless $dont_save;
    return "$name removed from $self->{name}.";
}
1;