/*
 * MinIO Cloud Storage, (C) 2019 MinIO, Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
|
|
|
|
|
|
package s3select
|
|
|
|
|
|
|
|
import (
|
|
|
|
"compress/bzip2"
|
2019-11-06 01:20:37 +03:00
|
|
|
"errors"
|
2019-01-09 06:23:04 +05:30
|
|
|
"fmt"
|
|
|
|
"io"
|
2019-11-06 01:20:37 +03:00
|
|
|
"sync"
|
2019-01-09 06:23:04 +05:30
|
|
|
"sync/atomic"
|
|
|
|
|
|
|
|
gzip "github.com/klauspost/pgzip"
|
|
|
|
)
|
|
|
|
|
|
|
|
// countUpReader wraps an io.Reader and keeps a running total of the bytes
// that have been read through it.
type countUpReader struct {
	// bytesRead is the running byte total; it is read and written with the
	// sync/atomic primitives. It is deliberately the first field: on 32-bit
	// platforms (386, ARM, 32-bit MIPS) only the first word of an allocated
	// struct is guaranteed to be 64-bit aligned, which 64-bit atomic
	// operations require.
	bytesRead int64

	// reader is the underlying source every Read call is forwarded to.
	reader io.Reader
}
|
|
|
|
|
|
|
|
func (r *countUpReader) Read(p []byte) (n int, err error) {
|
|
|
|
n, err = r.reader.Read(p)
|
|
|
|
atomic.AddInt64(&r.bytesRead, int64(n))
|
|
|
|
return n, err
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *countUpReader) BytesRead() int64 {
|
2020-02-13 14:03:52 -08:00
|
|
|
if r == nil {
|
|
|
|
return 0
|
|
|
|
}
|
2019-01-09 06:23:04 +05:30
|
|
|
return atomic.LoadInt64(&r.bytesRead)
|
|
|
|
}
|
|
|
|
|
|
|
|
func newCountUpReader(reader io.Reader) *countUpReader {
|
|
|
|
return &countUpReader{
|
|
|
|
reader: reader,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type progressReader struct {
|
|
|
|
rc io.ReadCloser
|
|
|
|
scannedReader *countUpReader
|
|
|
|
processedReader *countUpReader
|
2019-11-06 01:20:37 +03:00
|
|
|
|
|
|
|
closedMu sync.Mutex
|
2021-01-19 17:51:46 -08:00
|
|
|
gzr *gzip.Reader
|
2019-11-06 01:20:37 +03:00
|
|
|
closed bool
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
func (pr *progressReader) Read(p []byte) (n int, err error) {
|
2019-11-06 01:20:37 +03:00
|
|
|
// This ensures that Close will block until Read has completed.
|
|
|
|
// This allows another goroutine to close the reader.
|
|
|
|
pr.closedMu.Lock()
|
|
|
|
defer pr.closedMu.Unlock()
|
|
|
|
if pr.closed {
|
|
|
|
return 0, errors.New("progressReader: read after Close")
|
|
|
|
}
|
2019-01-09 06:23:04 +05:30
|
|
|
return pr.processedReader.Read(p)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (pr *progressReader) Close() error {
|
2019-11-06 01:20:37 +03:00
|
|
|
pr.closedMu.Lock()
|
|
|
|
defer pr.closedMu.Unlock()
|
|
|
|
if pr.closed {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
pr.closed = true
|
2021-01-19 17:51:46 -08:00
|
|
|
if pr.gzr != nil {
|
|
|
|
pr.gzr.Close()
|
|
|
|
}
|
2019-01-09 06:23:04 +05:30
|
|
|
return pr.rc.Close()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (pr *progressReader) Stats() (bytesScanned, bytesProcessed int64) {
|
2020-02-13 14:03:52 -08:00
|
|
|
if pr == nil {
|
|
|
|
return 0, 0
|
|
|
|
}
|
2019-01-09 06:23:04 +05:30
|
|
|
return pr.scannedReader.BytesRead(), pr.processedReader.BytesRead()
|
|
|
|
}
|
|
|
|
|
|
|
|
func newProgressReader(rc io.ReadCloser, compType CompressionType) (*progressReader, error) {
|
2021-01-19 17:51:46 -08:00
|
|
|
if rc == nil {
|
|
|
|
return nil, errors.New("newProgressReader: nil reader provided")
|
|
|
|
}
|
2019-01-09 06:23:04 +05:30
|
|
|
scannedReader := newCountUpReader(rc)
|
2021-01-19 17:51:46 -08:00
|
|
|
pr := progressReader{
|
|
|
|
rc: rc,
|
|
|
|
scannedReader: scannedReader,
|
|
|
|
}
|
2019-01-09 06:23:04 +05:30
|
|
|
var err error
|
2021-01-19 17:51:46 -08:00
|
|
|
var r io.Reader
|
2019-01-09 06:23:04 +05:30
|
|
|
|
|
|
|
switch compType {
|
|
|
|
case noneType:
|
|
|
|
r = scannedReader
|
|
|
|
case gzipType:
|
2021-01-19 17:51:46 -08:00
|
|
|
pr.gzr, err = gzip.NewReader(scannedReader)
|
2020-03-12 15:34:11 -07:00
|
|
|
if err != nil {
|
2020-03-05 19:34:04 -08:00
|
|
|
if errors.Is(err, gzip.ErrHeader) || errors.Is(err, gzip.ErrChecksum) {
|
|
|
|
return nil, errInvalidGZIPCompressionFormat(err)
|
|
|
|
}
|
2020-03-12 15:34:11 -07:00
|
|
|
return nil, errTruncatedInput(err)
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
2021-01-19 17:51:46 -08:00
|
|
|
r = pr.gzr
|
2019-01-09 06:23:04 +05:30
|
|
|
case bzip2Type:
|
|
|
|
r = bzip2.NewReader(scannedReader)
|
|
|
|
default:
|
|
|
|
return nil, errInvalidCompressionFormat(fmt.Errorf("unknown compression type '%v'", compType))
|
|
|
|
}
|
2021-01-19 17:51:46 -08:00
|
|
|
pr.processedReader = newCountUpReader(r)
|
2019-01-09 06:23:04 +05:30
|
|
|
|
2021-01-19 17:51:46 -08:00
|
|
|
return &pr, nil
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|