mirror of
https://github.com/ergochat/ergo.git
synced 2025-01-22 10:14:07 +01:00
bd6c2117e8
History couldn't be enabled by rehash if autoresize-window was nonzero.
416 lines
9.7 KiB
Go
416 lines
9.7 KiB
Go
// Copyright (c) 2018 Shivaram Lingamneni <slingamn@cs.stanford.edu>
|
|
// released under the MIT license
|
|
|
|
package history
|
|
|
|
import (
|
|
"github.com/oragono/oragono/irc/utils"
|
|
"sync"
|
|
"sync/atomic"
|
|
"time"
|
|
)
|
|
|
|
type ItemType uint
|
|
|
|
const (
|
|
uninitializedItem ItemType = iota
|
|
Privmsg
|
|
Notice
|
|
Join
|
|
Part
|
|
Kick
|
|
Quit
|
|
Mode
|
|
Tagmsg
|
|
Nick
|
|
)
|
|
|
|
const (
|
|
initialAutoSize = 32
|
|
)
|
|
|
|
// a Tagmsg that consists entirely of transient tags is not stored
|
|
var transientTags = map[string]bool{
|
|
"+draft/typing": true,
|
|
"+typing": true, // future-proofing
|
|
}
|
|
|
|
// Item represents an event (e.g., a PRIVMSG or a JOIN) and its associated data
|
|
type Item struct {
|
|
Type ItemType
|
|
|
|
Nick string
|
|
// this is the uncasefolded account name, if there's no account it should be set to "*"
|
|
AccountName string
|
|
// for non-privmsg items, we may stuff some other data in here
|
|
Message utils.SplitMessage
|
|
Tags map[string]string
|
|
Params [1]string
|
|
}
|
|
|
|
// HasMsgid tests whether a message has the message id `msgid`.
|
|
func (item *Item) HasMsgid(msgid string) bool {
|
|
if item.Message.Msgid == msgid {
|
|
return true
|
|
}
|
|
for _, pair := range item.Message.Wrapped {
|
|
if pair.Msgid == msgid {
|
|
return true
|
|
}
|
|
}
|
|
return false
|
|
}
|
|
|
|
func (item *Item) isStorable() bool {
|
|
if item.Type == Tagmsg {
|
|
for name := range item.Tags {
|
|
if !transientTags[name] {
|
|
return true
|
|
}
|
|
}
|
|
return false // all tags were blacklisted
|
|
} else {
|
|
return true
|
|
}
|
|
}
|
|
|
|
type Predicate func(item Item) (matches bool)
|
|
|
|
// Buffer is a ring buffer holding message/event history for a channel or user
|
|
type Buffer struct {
|
|
sync.RWMutex
|
|
|
|
// ring buffer, see irc/whowas.go for conventions
|
|
buffer []Item
|
|
start int
|
|
end int
|
|
maximumSize int
|
|
window time.Duration
|
|
|
|
lastDiscarded time.Time
|
|
|
|
enabled uint32
|
|
|
|
nowFunc func() time.Time
|
|
}
|
|
|
|
func NewHistoryBuffer(size int, window time.Duration) (result *Buffer) {
|
|
result = new(Buffer)
|
|
result.Initialize(size, window)
|
|
return
|
|
}
|
|
|
|
func (hist *Buffer) Initialize(size int, window time.Duration) {
|
|
hist.buffer = make([]Item, hist.initialSize(size, window))
|
|
hist.start = -1
|
|
hist.end = -1
|
|
hist.window = window
|
|
hist.maximumSize = size
|
|
hist.nowFunc = time.Now
|
|
|
|
hist.setEnabled(size)
|
|
}
|
|
|
|
// compute the initial size for the buffer, taking into account autoresize
|
|
func (hist *Buffer) initialSize(size int, window time.Duration) (result int) {
|
|
result = size
|
|
if window != 0 {
|
|
result = initialAutoSize
|
|
if size < result {
|
|
result = size // min(initialAutoSize, size)
|
|
}
|
|
}
|
|
return
|
|
}
|
|
|
|
func (hist *Buffer) setEnabled(size int) {
|
|
var enabled uint32
|
|
if size != 0 {
|
|
enabled = 1
|
|
}
|
|
atomic.StoreUint32(&hist.enabled, enabled)
|
|
}
|
|
|
|
// Enabled returns whether the buffer is currently storing messages
|
|
// (a disabled buffer blackholes everything it sees)
|
|
func (list *Buffer) Enabled() bool {
|
|
return atomic.LoadUint32(&list.enabled) != 0
|
|
}
|
|
|
|
// Add adds a history item to the buffer
|
|
func (list *Buffer) Add(item Item) {
|
|
// fast path without a lock acquisition for when we are not storing history
|
|
if !list.Enabled() {
|
|
return
|
|
}
|
|
|
|
if !item.isStorable() {
|
|
return
|
|
}
|
|
|
|
if item.Message.Time.IsZero() {
|
|
item.Message.Time = time.Now().UTC()
|
|
}
|
|
|
|
list.Lock()
|
|
defer list.Unlock()
|
|
|
|
list.maybeExpand()
|
|
|
|
var pos int
|
|
if list.start == -1 { // empty
|
|
pos = 0
|
|
list.start = 0
|
|
list.end = 1 % len(list.buffer)
|
|
} else if list.start != list.end { // partially full
|
|
pos = list.end
|
|
list.end = (list.end + 1) % len(list.buffer)
|
|
} else if list.start == list.end { // full
|
|
pos = list.end
|
|
list.end = (list.end + 1) % len(list.buffer)
|
|
list.start = list.end // advance start as well, overwriting first entry
|
|
// record the timestamp of the overwritten item
|
|
if list.lastDiscarded.Before(list.buffer[pos].Message.Time) {
|
|
list.lastDiscarded = list.buffer[pos].Message.Time
|
|
}
|
|
}
|
|
|
|
list.buffer[pos] = item
|
|
}
|
|
|
|
// Reverse reverses an []Item, in-place.
|
|
func Reverse(results []Item) {
|
|
for i, j := 0, len(results)-1; i < j; i, j = i+1, j-1 {
|
|
results[i], results[j] = results[j], results[i]
|
|
}
|
|
}
|
|
|
|
// Between returns all history items with a time `after` <= time <= `before`,
|
|
// with an indication of whether the results are complete or are missing items
|
|
// because some of that period was discarded. A zero value of `before` is considered
|
|
// higher than all other times.
|
|
func (list *Buffer) Between(after, before time.Time, ascending bool, limit int) (results []Item, complete bool) {
|
|
if !list.Enabled() {
|
|
return
|
|
}
|
|
|
|
list.RLock()
|
|
defer list.RUnlock()
|
|
|
|
complete = after.Equal(list.lastDiscarded) || after.After(list.lastDiscarded)
|
|
|
|
satisfies := func(item Item) bool {
|
|
return (after.IsZero() || item.Message.Time.After(after)) && (before.IsZero() || item.Message.Time.Before(before))
|
|
}
|
|
|
|
return list.matchInternal(satisfies, ascending, limit), complete
|
|
}
|
|
|
|
// Match returns all history items such that `predicate` returns true for them.
|
|
// Items are considered in reverse insertion order if `ascending` is false, or
|
|
// in insertion order if `ascending` is true, up to a total of `limit` matches
|
|
// if `limit` > 0 (unlimited otherwise).
|
|
// `predicate` MAY be a closure that maintains its own state across invocations;
|
|
// it MUST NOT acquire any locks or otherwise do anything weird.
|
|
// Results are always returned in insertion order.
|
|
func (list *Buffer) Match(predicate Predicate, ascending bool, limit int) (results []Item) {
|
|
if !list.Enabled() {
|
|
return
|
|
}
|
|
|
|
list.RLock()
|
|
defer list.RUnlock()
|
|
|
|
return list.matchInternal(predicate, ascending, limit)
|
|
}
|
|
|
|
// you must be holding the read lock to call this
|
|
func (list *Buffer) matchInternal(predicate Predicate, ascending bool, limit int) (results []Item) {
|
|
if list.start == -1 {
|
|
return
|
|
}
|
|
|
|
var pos, stop int
|
|
if ascending {
|
|
pos = list.start
|
|
stop = list.prev(list.end)
|
|
} else {
|
|
pos = list.prev(list.end)
|
|
stop = list.start
|
|
}
|
|
|
|
for {
|
|
if predicate(list.buffer[pos]) {
|
|
results = append(results, list.buffer[pos])
|
|
}
|
|
if pos == stop || (limit != 0 && len(results) == limit) {
|
|
break
|
|
}
|
|
if ascending {
|
|
pos = list.next(pos)
|
|
} else {
|
|
pos = list.prev(pos)
|
|
}
|
|
}
|
|
|
|
// TODO sort by time instead?
|
|
if !ascending {
|
|
Reverse(results)
|
|
}
|
|
return
|
|
}
|
|
|
|
// Latest returns the items most recently added, up to `limit`. If `limit` is 0,
|
|
// it returns all items.
|
|
func (list *Buffer) Latest(limit int) (results []Item) {
|
|
matchAll := func(item Item) bool { return true }
|
|
return list.Match(matchAll, false, limit)
|
|
}
|
|
|
|
// LastDiscarded returns the latest time of any entry that was evicted
|
|
// from the ring buffer.
|
|
func (list *Buffer) LastDiscarded() time.Time {
|
|
list.RLock()
|
|
defer list.RUnlock()
|
|
|
|
return list.lastDiscarded
|
|
}
|
|
|
|
func (list *Buffer) prev(index int) int {
|
|
switch index {
|
|
case 0:
|
|
return len(list.buffer) - 1
|
|
default:
|
|
return index - 1
|
|
}
|
|
}
|
|
|
|
func (list *Buffer) next(index int) int {
|
|
switch index {
|
|
case len(list.buffer) - 1:
|
|
return 0
|
|
default:
|
|
return index + 1
|
|
}
|
|
}
|
|
|
|
// return n such that v <= n and n == 2**i for some i
|
|
func roundUpToPowerOfTwo(v int) int {
|
|
// http://graphics.stanford.edu/~seander/bithacks.html
|
|
v -= 1
|
|
v |= v >> 1
|
|
v |= v >> 2
|
|
v |= v >> 4
|
|
v |= v >> 8
|
|
v |= v >> 16
|
|
return v + 1
|
|
}
|
|
|
|
func (list *Buffer) maybeExpand() {
|
|
if list.window == 0 {
|
|
return // autoresize is disabled
|
|
}
|
|
|
|
length := list.length()
|
|
if length < len(list.buffer) {
|
|
return // we have spare capacity already
|
|
}
|
|
|
|
if len(list.buffer) == list.maximumSize {
|
|
return // cannot expand any further
|
|
}
|
|
|
|
wouldDiscard := list.buffer[list.start].Message.Time
|
|
if list.window < list.nowFunc().Sub(wouldDiscard) {
|
|
return // oldest element is old enough to overwrite
|
|
}
|
|
|
|
newSize := roundUpToPowerOfTwo(length + 1)
|
|
if list.maximumSize < newSize {
|
|
newSize = list.maximumSize
|
|
}
|
|
list.resize(newSize)
|
|
}
|
|
|
|
// Resize shrinks or expands the buffer
|
|
func (list *Buffer) Resize(maximumSize int, window time.Duration) {
|
|
list.Lock()
|
|
defer list.Unlock()
|
|
|
|
if list.maximumSize == maximumSize && list.window == window {
|
|
return // no-op
|
|
}
|
|
|
|
list.maximumSize = maximumSize
|
|
list.window = window
|
|
|
|
// three cases where we need to preemptively resize:
|
|
// (1) we are not autoresizing
|
|
// (2) the buffer is currently larger than maximumSize and needs to be shrunk
|
|
// (3) the buffer is currently smaller than the recommended initial size
|
|
// (including the case where it is currently disabled and needs to be enabled)
|
|
// TODO make it possible to shrink the buffer so that it only contains `window`
|
|
if window == 0 || maximumSize < len(list.buffer) {
|
|
list.resize(maximumSize)
|
|
} else {
|
|
initialSize := list.initialSize(maximumSize, window)
|
|
if len(list.buffer) < initialSize {
|
|
list.resize(initialSize)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (list *Buffer) resize(size int) {
|
|
newbuffer := make([]Item, size)
|
|
|
|
list.setEnabled(size)
|
|
|
|
if list.start == -1 {
|
|
// indices are already correct and nothing needs to be copied
|
|
} else if size == 0 {
|
|
// this is now the empty list
|
|
list.start = -1
|
|
list.end = -1
|
|
} else {
|
|
currentLength := list.length()
|
|
start := list.start
|
|
end := list.end
|
|
// if we're truncating, keep the latest entries, not the earliest
|
|
if size < currentLength {
|
|
start = list.end - size
|
|
if start < 0 {
|
|
start += len(list.buffer)
|
|
}
|
|
// update lastDiscarded for discarded entries
|
|
for i := list.start; i != start; i = (i + 1) % len(list.buffer) {
|
|
if list.lastDiscarded.Before(list.buffer[i].Message.Time) {
|
|
list.lastDiscarded = list.buffer[i].Message.Time
|
|
}
|
|
}
|
|
}
|
|
if start < end {
|
|
copied := copy(newbuffer, list.buffer[start:end])
|
|
list.start = 0
|
|
list.end = copied % size
|
|
} else {
|
|
lenInitial := len(list.buffer) - start
|
|
copied := copy(newbuffer, list.buffer[start:])
|
|
copied += copy(newbuffer[lenInitial:], list.buffer[:end])
|
|
list.start = 0
|
|
list.end = copied % size
|
|
}
|
|
}
|
|
|
|
list.buffer = newbuffer
|
|
}
|
|
|
|
func (hist *Buffer) length() int {
|
|
if hist.start == -1 {
|
|
return 0
|
|
} else if hist.start < hist.end {
|
|
return hist.end - hist.start
|
|
} else {
|
|
return len(hist.buffer) - (hist.start - hist.end)
|
|
}
|
|
}
|