mirror of https://github.com/grafana/loki
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
287 lines
7.4 KiB
287 lines
7.4 KiB
package chunkenc
|
|
|
|
import (
|
|
"bufio"
|
|
"bytes"
|
|
"io"
|
|
"sync"
|
|
|
|
"github.com/golang/snappy"
|
|
"github.com/klauspost/compress/gzip"
|
|
"github.com/pierrec/lz4"
|
|
"github.com/prometheus/prometheus/pkg/pool"
|
|
)
|
|
|
|
// WriterPool hands out reusable io.WriteCloser values and takes them back.
// Chunks go through it so that they do not allocate a writer each time.
type WriterPool interface {
	// GetWriter returns a writer that writes to dst.
	GetWriter(dst io.Writer) io.WriteCloser
	// PutWriter gives a writer back to the pool.
	PutWriter(writer io.WriteCloser)
}
|
|
|
|
// ReaderPool is the read-side counterpart of WriterPool: it hands out
// io.Reader values used for reading chunks and takes them back.
type ReaderPool interface {
	// GetReader returns a reader that reads from src.
	GetReader(src io.Reader) io.Reader
	// PutReader gives a reader back to the pool.
	PutReader(reader io.Reader)
}
|
|
|
|
var (
|
|
// Gzip is the gnu zip compression pool
|
|
Gzip = GzipPool{level: gzip.DefaultCompression}
|
|
Lz4_64k = LZ4Pool{bufferSize: 1 << 16} // Lz4_64k is the l4z compression pool, with 64k buffer size
|
|
Lz4_256k = LZ4Pool{bufferSize: 1 << 18} // Lz4_256k uses 256k buffer
|
|
Lz4_1M = LZ4Pool{bufferSize: 1 << 20} // Lz4_1M uses 1M buffer
|
|
Lz4_4M = LZ4Pool{bufferSize: 1 << 22} // Lz4_4M uses 4M buffer
|
|
|
|
// Snappy is the snappy compression pool
|
|
Snappy SnappyPool
|
|
// Noop is the no compression pool
|
|
Noop NoopPool
|
|
|
|
// BufReaderPool is bufio.Reader pool
|
|
BufReaderPool = &BufioReaderPool{
|
|
pool: sync.Pool{
|
|
New: func() interface{} { return bufio.NewReader(nil) },
|
|
},
|
|
}
|
|
// BytesBufferPool is a bytes buffer used for lines decompressed.
|
|
// Buckets [0.5KB,1KB,2KB,4KB,8KB]
|
|
BytesBufferPool = pool.New(1<<9, 1<<13, 2, func(size int) interface{} { return make([]byte, 0, size) })
|
|
serializeBytesBufferPool = sync.Pool{
|
|
New: func() interface{} {
|
|
return &bytes.Buffer{}
|
|
},
|
|
}
|
|
)
|
|
|
|
func getWriterPool(enc Encoding) WriterPool {
|
|
return getReaderPool(enc).(WriterPool)
|
|
}
|
|
|
|
func getReaderPool(enc Encoding) ReaderPool {
|
|
switch enc {
|
|
case EncGZIP:
|
|
return &Gzip
|
|
case EncLZ4_64k:
|
|
return &Lz4_64k
|
|
case EncLZ4_256k:
|
|
return &Lz4_256k
|
|
case EncLZ4_1M:
|
|
return &Lz4_1M
|
|
case EncLZ4_4M:
|
|
return &Lz4_4M
|
|
case EncSnappy:
|
|
return &Snappy
|
|
case EncNone:
|
|
return &Noop
|
|
default:
|
|
panic("unknown encoding")
|
|
}
|
|
}
|
|
|
|
// GzipPool is a gnu zip compression pool. It keeps separate pools of
// readers and writers, plus the compression level used for new writers.
type GzipPool struct {
	readers, writers sync.Pool
	// level is the compression level for newly created writers; GetWriter
	// treats 0 as "use the default".
	level int
}
|
|
|
|
// GetReader gets or creates a new CompressionReader and reset it to read from src
|
|
func (pool *GzipPool) GetReader(src io.Reader) io.Reader {
|
|
if r := pool.readers.Get(); r != nil {
|
|
reader := r.(*gzip.Reader)
|
|
err := reader.Reset(src)
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
return reader
|
|
}
|
|
reader, err := gzip.NewReader(src)
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
return reader
|
|
}
|
|
|
|
// PutReader places back in the pool a CompressionReader
|
|
func (pool *GzipPool) PutReader(reader io.Reader) {
|
|
pool.readers.Put(reader)
|
|
}
|
|
|
|
// GetWriter gets or creates a new CompressionWriter and reset it to write to dst
|
|
func (pool *GzipPool) GetWriter(dst io.Writer) io.WriteCloser {
|
|
if w := pool.writers.Get(); w != nil {
|
|
writer := w.(*gzip.Writer)
|
|
writer.Reset(dst)
|
|
return writer
|
|
}
|
|
|
|
level := pool.level
|
|
if level == 0 {
|
|
level = gzip.DefaultCompression
|
|
}
|
|
w, err := gzip.NewWriterLevel(dst, level)
|
|
if err != nil {
|
|
panic(err) // never happens, error is only returned on wrong compression level.
|
|
}
|
|
return w
|
|
}
|
|
|
|
// PutWriter places back in the pool a CompressionWriter
|
|
func (pool *GzipPool) PutWriter(writer io.WriteCloser) {
|
|
pool.writers.Put(writer)
|
|
}
|
|
|
|
// LZ4Pool is an lz4 compression pool. It keeps separate pools of readers
// and writers, plus the block size applied to newly created writers.
type LZ4Pool struct {
	readers, writers sync.Pool
	// bufferSize has these available values: 1<<16 (64k), 1<<18 (256k),
	// 1<<20 (1M), 1<<22 (4M). Defaults to 4MB, if not set.
	bufferSize int
}
|
|
|
|
// lz4Reader is simple wrapper around *lz4.Reader, which remembers max used block size,
|
|
// as reported by this reader. It is used to determine whether we want to reuse it,
|
|
// or throw away and garbage-collect.
|
|
type lz4Reader struct {
|
|
r *lz4.Reader
|
|
maxBlockSize int
|
|
}
|
|
|
|
func (l *lz4Reader) Read(p []byte) (n int, err error) {
|
|
return l.r.Read(p)
|
|
}
|
|
|
|
func (l *lz4Reader) Reset(src io.Reader) {
|
|
l.r.Reset(src)
|
|
}
|
|
|
|
func (l *lz4Reader) onBlockDone(_ int) {
|
|
// remember max block size used.
|
|
if l.r.BlockMaxSize > l.maxBlockSize {
|
|
l.maxBlockSize = l.r.BlockMaxSize
|
|
}
|
|
}
|
|
|
|
func newLz4Reader(src io.Reader) *lz4Reader {
|
|
lz4r := lz4.NewReader(src)
|
|
r := &lz4Reader{r: lz4r}
|
|
lz4r.OnBlockDone = r.onBlockDone
|
|
return r
|
|
}
|
|
|
|
// GetReader gets or creates a new CompressionReader and reset it to read from src
|
|
func (pool *LZ4Pool) GetReader(src io.Reader) io.Reader {
|
|
if r := pool.readers.Get(); r != nil {
|
|
reader := r.(*lz4Reader)
|
|
reader.Reset(src)
|
|
return reader
|
|
}
|
|
// no need to set buffer size here. Reader uses buffer size based on
|
|
// LZ4 header that it is reading.
|
|
return newLz4Reader(src)
|
|
}
|
|
|
|
// PutReader places back in the pool a CompressionReader
|
|
func (pool *LZ4Pool) PutReader(reader io.Reader) {
|
|
r := reader.(*lz4Reader)
|
|
if r.maxBlockSize > pool.bufferSize {
|
|
// Readers base their buffer size based on headers from LZ4 stream.
|
|
// If this reader uses bigger buffer than what we use currently, don't pool it.
|
|
// Reading from a couple of chunks that used big buffer sizes could otherwise quickly lead
|
|
// to high pooled memory usage.
|
|
return
|
|
}
|
|
pool.readers.Put(reader)
|
|
}
|
|
|
|
// GetWriter gets or creates a new CompressionWriter and reset it to write to dst
|
|
func (pool *LZ4Pool) GetWriter(dst io.Writer) io.WriteCloser {
|
|
if w := pool.writers.Get(); w != nil {
|
|
writer := w.(*lz4.Writer)
|
|
writer.Reset(dst)
|
|
return writer
|
|
}
|
|
w := lz4.NewWriter(dst)
|
|
w.BlockMaxSize = pool.bufferSize
|
|
return w
|
|
}
|
|
|
|
// PutWriter places back in the pool a CompressionWriter
|
|
func (pool *LZ4Pool) PutWriter(writer io.WriteCloser) {
|
|
pool.writers.Put(writer)
|
|
}
|
|
|
|
// SnappyPool is a snappy compression pool. It keeps separate pools of
// readers and writers.
type SnappyPool struct {
	readers, writers sync.Pool
}
|
|
|
|
// GetReader gets or creates a new CompressionReader and reset it to read from src
|
|
func (pool *SnappyPool) GetReader(src io.Reader) io.Reader {
|
|
if r := pool.readers.Get(); r != nil {
|
|
reader := r.(*snappy.Reader)
|
|
reader.Reset(src)
|
|
return reader
|
|
}
|
|
return snappy.NewReader(src)
|
|
}
|
|
|
|
// PutReader places back in the pool a CompressionReader
|
|
func (pool *SnappyPool) PutReader(reader io.Reader) {
|
|
pool.readers.Put(reader)
|
|
}
|
|
|
|
// GetWriter gets or creates a new CompressionWriter and reset it to write to dst
|
|
func (pool *SnappyPool) GetWriter(dst io.Writer) io.WriteCloser {
|
|
if w := pool.writers.Get(); w != nil {
|
|
writer := w.(*snappy.Writer)
|
|
writer.Reset(dst)
|
|
return writer
|
|
}
|
|
return snappy.NewBufferedWriter(dst)
|
|
}
|
|
|
|
// PutWriter places back in the pool a CompressionWriter
|
|
func (pool *SnappyPool) PutWriter(writer io.WriteCloser) {
|
|
pool.writers.Put(writer)
|
|
}
|
|
|
|
// NoopPool is the pool used when no compression is applied. It carries no
// state.
type NoopPool struct{}
|
|
|
|
// GetReader gets or creates a new CompressionReader and reset it to read from src
|
|
func (pool *NoopPool) GetReader(src io.Reader) io.Reader {
|
|
return src
|
|
}
|
|
|
|
// PutReader places back in the pool a CompressionReader
|
|
func (pool *NoopPool) PutReader(reader io.Reader) {}
|
|
|
|
// noopCloser embeds an io.Writer so that the writer's methods are promoted
// onto this type.
type noopCloser struct {
	io.Writer
}
|
|
|
|
// Close does nothing and always reports success.
func (noopCloser) Close() error {
	return nil
}
|
|
|
|
// GetWriter gets or creates a new CompressionWriter and reset it to write to dst
|
|
func (pool *NoopPool) GetWriter(dst io.Writer) io.WriteCloser {
|
|
return noopCloser{dst}
|
|
}
|
|
|
|
// PutWriter places back in the pool a CompressionWriter
|
|
func (pool *NoopPool) PutWriter(writer io.WriteCloser) {}
|
|
|
|
// BufioReaderPool is a pool of reusable *bufio.Reader values backed by a
// sync.Pool. The zero value is usable: readers are then created on demand
// with bufio's default buffer size.
type BufioReaderPool struct {
	pool sync.Pool
}

// Get returns a bufio.Reader which reads from r. A pooled reader keeps the
// buffer it was created with; when the pool has nothing to offer (it is
// empty and has no New function), a new reader is created with
// bufio.NewReader instead of panicking on a nil pool entry.
func (bp *BufioReaderPool) Get(r io.Reader) *bufio.Reader {
	if buf, ok := bp.pool.Get().(*bufio.Reader); ok && buf != nil {
		buf.Reset(r)
		return buf
	}
	return bufio.NewReader(r)
}

// Put puts the bufio.Reader back into the pool. The caller must not use b
// afterwards. A nil b is ignored so that it can never be handed out by Get.
func (bp *BufioReaderPool) Put(b *bufio.Reader) {
	if b == nil {
		return
	}
	// Detach the source so a pooled reader does not keep it reachable.
	b.Reset(nil)
	bp.pool.Put(b)
}
|
|
|