| author | 2022-07-19 15:21:17 +0200 |
|---|---|
| committer | 2022-07-19 15:21:17 +0200 |
| commit | c84384e6608368a13a774d6d33a8cc32da7cf209 (patch) |
| tree | a18aa9c1ced1299d2682c1993e1ba38f46448dba /vendor/github.com/tdewolff/parse/v2/buffer |
| parent | [chore] use our own logging implementation (#716) (diff) |
[bugfix] html escape special characters in text instead of totally removing them (#719)
* remove minify dependency
* tidy up some tests
* remove pre + postformat funcs
* rework sanitization + formatting
* update tests
* add some more markdown tests
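
The gist of the bugfix can be illustrated with Go's standard library: rather than stripping special characters out of user text during sanitization, they are HTML-escaped so they render literally. This is a minimal sketch using `html.EscapeString`, not GoToSocial's actual formatting code, which is more involved:

```go
package main

import (
	"fmt"
	"html"
)

func main() {
	// Before the fix, characters like < > & " could be removed from text
	// entirely; escaping preserves them for the reader instead.
	text := `1 < 2 & "quotes"`
	fmt.Println(html.EscapeString(text))
	// Output: 1 &lt; 2 &amp; &#34;quotes&#34;
}
```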
Diffstat (limited to 'vendor/github.com/tdewolff/parse/v2/buffer')
-rw-r--r--  vendor/github.com/tdewolff/parse/v2/buffer/buffer.go       |  12
-rw-r--r--  vendor/github.com/tdewolff/parse/v2/buffer/lexer.go        | 164
-rw-r--r--  vendor/github.com/tdewolff/parse/v2/buffer/reader.go       |  44
-rw-r--r--  vendor/github.com/tdewolff/parse/v2/buffer/streamlexer.go  | 223
-rw-r--r--  vendor/github.com/tdewolff/parse/v2/buffer/writer.go       |  65

5 files changed, 0 insertions, 508 deletions
```diff
diff --git a/vendor/github.com/tdewolff/parse/v2/buffer/buffer.go b/vendor/github.com/tdewolff/parse/v2/buffer/buffer.go
deleted file mode 100644
index 671b380d6..000000000
--- a/vendor/github.com/tdewolff/parse/v2/buffer/buffer.go
+++ /dev/null
@@ -1,12 +0,0 @@
-// Package buffer contains buffer and wrapper types for byte slices. It is useful for writing lexers or other high-performance byte slice handling.
-// The `Reader` and `Writer` types implement the `io.Reader` and `io.Writer` respectively and provide a thinner and faster interface than `bytes.Buffer`.
-// The `Lexer` type is useful for building lexers because it keeps track of the start and end position of a byte selection, and shifts the bytes whenever a valid token is found.
-// The `StreamLexer` does the same, but keeps a buffer pool so that it reads a limited amount at a time, allowing to parse from streaming sources.
-package buffer
-
-// defaultBufSize specifies the default initial length of internal buffers.
-var defaultBufSize = 4096
-
-// MinBuf specifies the default initial length of internal buffers.
-// Solely here to support old versions of parse.
-var MinBuf = defaultBufSize
```

```diff
diff --git a/vendor/github.com/tdewolff/parse/v2/buffer/lexer.go b/vendor/github.com/tdewolff/parse/v2/buffer/lexer.go
deleted file mode 100644
index 46e6bdafd..000000000
--- a/vendor/github.com/tdewolff/parse/v2/buffer/lexer.go
+++ /dev/null
@@ -1,164 +0,0 @@
-package buffer
-
-import (
-	"io"
-	"io/ioutil"
-)
-
-var nullBuffer = []byte{0}
-
-// Lexer is a buffered reader that allows peeking forward and shifting, taking an io.Reader.
-// It keeps data in-memory until Free, taking a byte length, is called to move beyond the data.
-type Lexer struct {
-	buf   []byte
-	pos   int // index in buf
-	start int // index in buf
-	err   error
-
-	restore func()
-}
-
-// NewLexer returns a new Lexer for a given io.Reader, and uses ioutil.ReadAll to read it into a byte slice.
-// If the io.Reader implements Bytes, that is used instead.
-// It will append a NULL at the end of the buffer.
-func NewLexer(r io.Reader) *Lexer {
-	var b []byte
-	if r != nil {
-		if buffer, ok := r.(interface {
-			Bytes() []byte
-		}); ok {
-			b = buffer.Bytes()
-		} else {
-			var err error
-			b, err = ioutil.ReadAll(r)
-			if err != nil {
-				return &Lexer{
-					buf: nullBuffer,
-					err: err,
-				}
-			}
-		}
-	}
-	return NewLexerBytes(b)
-}
-
-// NewLexerBytes returns a new Lexer for a given byte slice, and appends NULL at the end.
-// To avoid reallocation, make sure the capacity has room for one more byte.
-func NewLexerBytes(b []byte) *Lexer {
-	z := &Lexer{
-		buf: b,
-	}
-
-	n := len(b)
-	if n == 0 {
-		z.buf = nullBuffer
-	} else {
-		// Append NULL to buffer, but try to avoid reallocation
-		if cap(b) > n {
-			// Overwrite next byte but restore when done
-			b = b[:n+1]
-			c := b[n]
-			b[n] = 0
-
-			z.buf = b
-			z.restore = func() {
-				b[n] = c
-			}
-		} else {
-			z.buf = append(b, 0)
-		}
-	}
-	return z
-}
-
-// Restore restores the replaced byte past the end of the buffer by NULL.
-func (z *Lexer) Restore() {
-	if z.restore != nil {
-		z.restore()
-		z.restore = nil
-	}
-}
-
-// Err returns the error returned from io.Reader or io.EOF when the end has been reached.
-func (z *Lexer) Err() error {
-	return z.PeekErr(0)
-}
-
-// PeekErr returns the error at position pos. When pos is zero, this is the same as calling Err().
-func (z *Lexer) PeekErr(pos int) error {
-	if z.err != nil {
-		return z.err
-	} else if z.pos+pos >= len(z.buf)-1 {
-		return io.EOF
-	}
-	return nil
-}
-
-// Peek returns the ith byte relative to the end position.
-// Peek returns 0 when an error has occurred, Err returns the error.
-func (z *Lexer) Peek(pos int) byte {
-	pos += z.pos
-	return z.buf[pos]
-}
-
-// PeekRune returns the rune and rune length of the ith byte relative to the end position.
-func (z *Lexer) PeekRune(pos int) (rune, int) {
-	// from unicode/utf8
-	c := z.Peek(pos)
-	if c < 0xC0 || z.Peek(pos+1) == 0 {
-		return rune(c), 1
-	} else if c < 0xE0 || z.Peek(pos+2) == 0 {
-		return rune(c&0x1F)<<6 | rune(z.Peek(pos+1)&0x3F), 2
-	} else if c < 0xF0 || z.Peek(pos+3) == 0 {
-		return rune(c&0x0F)<<12 | rune(z.Peek(pos+1)&0x3F)<<6 | rune(z.Peek(pos+2)&0x3F), 3
-	}
-	return rune(c&0x07)<<18 | rune(z.Peek(pos+1)&0x3F)<<12 | rune(z.Peek(pos+2)&0x3F)<<6 | rune(z.Peek(pos+3)&0x3F), 4
-}
-
-// Move advances the position.
-func (z *Lexer) Move(n int) {
-	z.pos += n
-}
-
-// Pos returns a mark to which can be rewinded.
-func (z *Lexer) Pos() int {
-	return z.pos - z.start
-}
-
-// Rewind rewinds the position to the given position.
-func (z *Lexer) Rewind(pos int) {
-	z.pos = z.start + pos
-}
-
-// Lexeme returns the bytes of the current selection.
-func (z *Lexer) Lexeme() []byte {
-	return z.buf[z.start:z.pos:z.pos]
-}
-
-// Skip collapses the position to the end of the selection.
-func (z *Lexer) Skip() {
-	z.start = z.pos
-}
-
-// Shift returns the bytes of the current selection and collapses the position to the end of the selection.
-func (z *Lexer) Shift() []byte {
-	b := z.buf[z.start:z.pos:z.pos]
-	z.start = z.pos
-	return b
-}
-
-// Offset returns the character position in the buffer.
-func (z *Lexer) Offset() int {
-	return z.pos
-}
-
-// Bytes returns the underlying buffer.
-func (z *Lexer) Bytes() []byte {
-	return z.buf[: len(z.buf)-1 : len(z.buf)-1]
-}
-
-// Reset resets position to the underlying buffer.
-func (z *Lexer) Reset() {
-	z.start = 0
-	z.pos = 0
-}
```
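For reference, this is a minimal sketch of how the deleted Lexer was typically driven: Peek to inspect a byte, Move to extend the current selection, Shift to take it. The word-scanning loop and its input are illustrative, not code from GoToSocial:

```go
package main

import (
	"fmt"

	"github.com/tdewolff/parse/v2/buffer"
)

func main() {
	// Scan ASCII words out of a byte slice. The lexer NUL-terminates its
	// buffer, so Peek(0) returns 0 once the end is reached.
	z := buffer.NewLexerBytes([]byte("hello world"))
	for z.Err() == nil {
		if c := z.Peek(0); 'a' <= c && c <= 'z' {
			z.Move(1) // extend the current selection
			continue
		}
		if word := z.Shift(); len(word) > 0 {
			fmt.Printf("word: %q\n", word) // "hello"
		}
		z.Move(1) // step over the separator
		z.Skip()  // and drop it from the selection
	}
	if word := z.Shift(); len(word) > 0 {
		fmt.Printf("word: %q\n", word) // "world"
	}
}
```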
```diff
diff --git a/vendor/github.com/tdewolff/parse/v2/buffer/reader.go b/vendor/github.com/tdewolff/parse/v2/buffer/reader.go
deleted file mode 100644
index 9926eef66..000000000
--- a/vendor/github.com/tdewolff/parse/v2/buffer/reader.go
+++ /dev/null
@@ -1,44 +0,0 @@
-package buffer
-
-import "io"
-
-// Reader implements an io.Reader over a byte slice.
-type Reader struct {
-	buf []byte
-	pos int
-}
-
-// NewReader returns a new Reader for a given byte slice.
-func NewReader(buf []byte) *Reader {
-	return &Reader{
-		buf: buf,
-	}
-}
-
-// Read reads bytes into the given byte slice and returns the number of bytes read and an error if occurred.
-func (r *Reader) Read(b []byte) (n int, err error) {
-	if len(b) == 0 {
-		return 0, nil
-	}
-	if r.pos >= len(r.buf) {
-		return 0, io.EOF
-	}
-	n = copy(b, r.buf[r.pos:])
-	r.pos += n
-	return
-}
-
-// Bytes returns the underlying byte slice.
-func (r *Reader) Bytes() []byte {
-	return r.buf
-}
-
-// Reset resets the position of the read pointer to the beginning of the underlying byte slice.
-func (r *Reader) Reset() {
-	r.pos = 0
-}
-
-// Len returns the length of the buffer.
-func (r *Reader) Len() int {
-	return len(r.buf)
-}
```
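A minimal usage sketch (illustrative, not from GoToSocial): Reader is a resettable io.Reader over a byte slice, handy when the same slice is read repeatedly:

```go
package main

import (
	"fmt"
	"io"

	"github.com/tdewolff/parse/v2/buffer"
)

func main() {
	r := buffer.NewReader([]byte("abc"))
	b, _ := io.ReadAll(r) // drains the reader
	fmt.Printf("%s\n", b) // abc

	r.Reset() // rewind to the start of the same slice
	b, _ = io.ReadAll(r)
	fmt.Printf("%s\n", b) // abc again
}
```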
```diff
diff --git a/vendor/github.com/tdewolff/parse/v2/buffer/streamlexer.go b/vendor/github.com/tdewolff/parse/v2/buffer/streamlexer.go
deleted file mode 100644
index 5ea2dd58d..000000000
--- a/vendor/github.com/tdewolff/parse/v2/buffer/streamlexer.go
+++ /dev/null
@@ -1,223 +0,0 @@
-package buffer
-
-import (
-	"io"
-)
-
-type block struct {
-	buf    []byte
-	next   int // index in pool plus one
-	active bool
-}
-
-type bufferPool struct {
-	pool []block
-	head int // index in pool plus one
-	tail int // index in pool plus one
-
-	pos int // byte pos in tail
-}
-
-func (z *bufferPool) swap(oldBuf []byte, size int) []byte {
-	// find new buffer that can be reused
-	swap := -1
-	for i := 0; i < len(z.pool); i++ {
-		if !z.pool[i].active && size <= cap(z.pool[i].buf) {
-			swap = i
-			break
-		}
-	}
-	if swap == -1 { // no free buffer found for reuse
-		if z.tail == 0 && z.pos >= len(oldBuf) && size <= cap(oldBuf) { // but we can reuse the current buffer!
-			z.pos -= len(oldBuf)
-			return oldBuf[:0]
-		}
-		// allocate new
-		z.pool = append(z.pool, block{make([]byte, 0, size), 0, true})
-		swap = len(z.pool) - 1
-	}
-
-	newBuf := z.pool[swap].buf
-
-	// put current buffer into pool
-	z.pool[swap] = block{oldBuf, 0, true}
-	if z.head != 0 {
-		z.pool[z.head-1].next = swap + 1
-	}
-	z.head = swap + 1
-	if z.tail == 0 {
-		z.tail = swap + 1
-	}
-
-	return newBuf[:0]
-}
-
-func (z *bufferPool) free(n int) {
-	z.pos += n
-	// move the tail over to next buffers
-	for z.tail != 0 && z.pos >= len(z.pool[z.tail-1].buf) {
-		z.pos -= len(z.pool[z.tail-1].buf)
-		newTail := z.pool[z.tail-1].next
-		z.pool[z.tail-1].active = false // after this, any thread may pick up the inactive buffer, so it can't be used anymore
-		z.tail = newTail
-	}
-	if z.tail == 0 {
-		z.head = 0
-	}
-}
-
-// StreamLexer is a buffered reader that allows peeking forward and shifting, taking an io.Reader.
-// It keeps data in-memory until Free, taking a byte length, is called to move beyond the data.
-type StreamLexer struct {
-	r   io.Reader
-	err error
-
-	pool bufferPool
-
-	buf       []byte
-	start     int // index in buf
-	pos       int // index in buf
-	prevStart int
-
-	free int
-}
-
-// NewStreamLexer returns a new StreamLexer for a given io.Reader with a 4kB estimated buffer size.
-// If the io.Reader implements Bytes, that buffer is used instead.
-func NewStreamLexer(r io.Reader) *StreamLexer {
-	return NewStreamLexerSize(r, defaultBufSize)
-}
-
-// NewStreamLexerSize returns a new StreamLexer for a given io.Reader and estimated required buffer size.
-// If the io.Reader implements Bytes, that buffer is used instead.
-func NewStreamLexerSize(r io.Reader, size int) *StreamLexer {
-	// if reader has the bytes in memory already, use that instead
-	if buffer, ok := r.(interface {
-		Bytes() []byte
-	}); ok {
-		return &StreamLexer{
-			err: io.EOF,
-			buf: buffer.Bytes(),
-		}
-	}
-	return &StreamLexer{
-		r:   r,
-		buf: make([]byte, 0, size),
-	}
-}
-
-func (z *StreamLexer) read(pos int) byte {
-	if z.err != nil {
-		return 0
-	}
-
-	// free unused bytes
-	z.pool.free(z.free)
-	z.free = 0
-
-	// get new buffer
-	c := cap(z.buf)
-	p := pos - z.start + 1
-	if 2*p > c { // if the token is larger than half the buffer, increase buffer size
-		c = 2*c + p
-	}
-	d := len(z.buf) - z.start
-	buf := z.pool.swap(z.buf[:z.start], c)
-	copy(buf[:d], z.buf[z.start:]) // copy the left-overs (unfinished token) from the old buffer
-
-	// read in new data for the rest of the buffer
-	var n int
-	for pos-z.start >= d && z.err == nil {
-		n, z.err = z.r.Read(buf[d:cap(buf)])
-		d += n
-	}
-	pos -= z.start
-	z.pos -= z.start
-	z.start, z.buf = 0, buf[:d]
-	if pos >= d {
-		return 0
-	}
-	return z.buf[pos]
-}
-
-// Err returns the error returned from io.Reader. It may still return valid bytes for a while though.
-func (z *StreamLexer) Err() error {
-	if z.err == io.EOF && z.pos < len(z.buf) {
-		return nil
-	}
-	return z.err
-}
-
-// Free frees up bytes of length n from previously shifted tokens.
-// Each call to Shift should at one point be followed by a call to Free with a length returned by ShiftLen.
-func (z *StreamLexer) Free(n int) {
-	z.free += n
-}
-
-// Peek returns the ith byte relative to the end position and possibly does an allocation.
-// Peek returns zero when an error has occurred, Err returns the error.
-// TODO: inline function
-func (z *StreamLexer) Peek(pos int) byte {
-	pos += z.pos
-	if uint(pos) < uint(len(z.buf)) { // uint for BCE
-		return z.buf[pos]
-	}
-	return z.read(pos)
-}
-
-// PeekRune returns the rune and rune length of the ith byte relative to the end position.
-func (z *StreamLexer) PeekRune(pos int) (rune, int) {
-	// from unicode/utf8
-	c := z.Peek(pos)
-	if c < 0xC0 {
-		return rune(c), 1
-	} else if c < 0xE0 {
-		return rune(c&0x1F)<<6 | rune(z.Peek(pos+1)&0x3F), 2
-	} else if c < 0xF0 {
-		return rune(c&0x0F)<<12 | rune(z.Peek(pos+1)&0x3F)<<6 | rune(z.Peek(pos+2)&0x3F), 3
-	}
-	return rune(c&0x07)<<18 | rune(z.Peek(pos+1)&0x3F)<<12 | rune(z.Peek(pos+2)&0x3F)<<6 | rune(z.Peek(pos+3)&0x3F), 4
-}
-
-// Move advances the position.
-func (z *StreamLexer) Move(n int) {
-	z.pos += n
-}
-
-// Pos returns a mark to which can be rewinded.
-func (z *StreamLexer) Pos() int {
-	return z.pos - z.start
-}
-
-// Rewind rewinds the position to the given position.
-func (z *StreamLexer) Rewind(pos int) {
-	z.pos = z.start + pos
-}
-
-// Lexeme returns the bytes of the current selection.
-func (z *StreamLexer) Lexeme() []byte {
-	return z.buf[z.start:z.pos]
-}
-
-// Skip collapses the position to the end of the selection.
-func (z *StreamLexer) Skip() {
-	z.start = z.pos
-}
-
-// Shift returns the bytes of the current selection and collapses the position to the end of the selection.
-// It also returns the number of bytes we moved since the last call to Shift. This can be used in calls to Free.
-func (z *StreamLexer) Shift() []byte {
-	if z.pos > len(z.buf) { // make sure we peeked at least as much as we shift
-		z.read(z.pos - 1)
-	}
-	b := z.buf[z.start:z.pos]
-	z.start = z.pos
-	return b
-}
-
-// ShiftLen returns the number of bytes moved since the last call to ShiftLen. This can be used in calls to Free because it takes into account multiple Shifts or Skips.
-func (z *StreamLexer) ShiftLen() int {
-	n := z.start - z.prevStart
-	z.prevStart = z.start
-	return n
-}
```
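A minimal sketch of the StreamLexer peek/shift/free cycle on a streaming source (illustrative, not from GoToSocial); tokens are shifted out and the consumed byte count from ShiftLen is handed back to the buffer pool via Free:

```go
package main

import (
	"fmt"
	"strings"

	"github.com/tdewolff/parse/v2/buffer"
)

func main() {
	// Tokenize space-separated words from a stream. Peek returns 0 here both
	// at end of input and on error; Err distinguishes the two cases.
	z := buffer.NewStreamLexer(strings.NewReader("one two three"))
	for {
		c := z.Peek(0)
		if c == ' ' || c == 0 {
			fmt.Printf("token: %q\n", z.Shift())
			if c == 0 {
				break // end of input
			}
			z.Move(1)            // step over the space
			z.Skip()             // drop it from the selection
			z.Free(z.ShiftLen()) // release consumed bytes to the pool
			continue
		}
		z.Move(1)
	}
}
```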
```diff
diff --git a/vendor/github.com/tdewolff/parse/v2/buffer/writer.go b/vendor/github.com/tdewolff/parse/v2/buffer/writer.go
deleted file mode 100644
index 6c94201ff..000000000
--- a/vendor/github.com/tdewolff/parse/v2/buffer/writer.go
+++ /dev/null
@@ -1,65 +0,0 @@
-package buffer
-
-import (
-	"io"
-)
-
-// Writer implements an io.Writer over a byte slice.
-type Writer struct {
-	buf    []byte
-	err    error
-	expand bool
-}
-
-// NewWriter returns a new Writer for a given byte slice.
-func NewWriter(buf []byte) *Writer {
-	return &Writer{
-		buf:    buf,
-		expand: true,
-	}
-}
-
-// NewStaticWriter returns a new Writer for a given byte slice. It does not reallocate and expand the byte-slice.
-func NewStaticWriter(buf []byte) *Writer {
-	return &Writer{
-		buf:    buf,
-		expand: false,
-	}
-}
-
-// Write writes bytes from the given byte slice and returns the number of bytes written and an error if occurred. When err != nil, n == 0.
-func (w *Writer) Write(b []byte) (int, error) {
-	n := len(b)
-	end := len(w.buf)
-	if end+n > cap(w.buf) {
-		if !w.expand {
-			w.err = io.EOF
-			return 0, io.EOF
-		}
-		buf := make([]byte, end, 2*cap(w.buf)+n)
-		copy(buf, w.buf)
-		w.buf = buf
-	}
-	w.buf = w.buf[:end+n]
-	return copy(w.buf[end:], b), nil
-}
-
-// Len returns the length of the underlying byte slice.
-func (w *Writer) Len() int {
-	return len(w.buf)
-}
-
-// Bytes returns the underlying byte slice.
-func (w *Writer) Bytes() []byte {
-	return w.buf
-}
-
-// Reset empties and reuses the current buffer. Subsequent writes will overwrite the buffer, so any reference to the underlying slice is invalidated after this call.
-func (w *Writer) Reset() {
-	w.buf = w.buf[:0]
-}
-
-// Close returns the last error.
-func (w *Writer) Close() error {
-	return w.err
-}
```
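A minimal usage sketch (illustrative, not from GoToSocial) contrasting the growing and static variants of Writer:

```go
package main

import (
	"fmt"

	"github.com/tdewolff/parse/v2/buffer"
)

func main() {
	// A growing writer: reallocates when the backing slice runs out of room.
	w := buffer.NewWriter(make([]byte, 0, 4))
	w.Write([]byte("hello "))
	w.Write([]byte("world"))
	fmt.Printf("%s (len=%d)\n", w.Bytes(), w.Len()) // hello world (len=11)

	// A static writer: refuses to grow and records io.EOF instead.
	sw := buffer.NewStaticWriter(make([]byte, 0, 4))
	n, err := sw.Write([]byte("hello"))
	fmt.Println(n, err)     // 0 EOF
	fmt.Println(sw.Close()) // EOF (Close reports the recorded error)
}
```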
