Compare commits
4 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| f61237a1f0 | |||
| 820e06e792 | |||
| 4f8f5f6928 | |||
| 1b5078c7bd |
@@ -17,6 +17,4 @@ Thanks also to [distri's squashfs library](https://github.com/distr1/distri/tree
|
||||
|
||||
## Performance
|
||||
|
||||
This library, decompressing the Firefox AppImage and using go tests, takes about twice as long as `unsquashfs` on my quad core laptop. (~1 second with the library and about half a second with `unsquashfs`).
|
||||
|
||||
**My recent tests have shown the Firefox AppImage might be an outlier and this library might be considerably slower (4x ~ 6x slower than `unsquashfs`)**
|
||||
Testing on a zstd compressed file, my library is anywhere from 5x ~ 7x slower than `unsquashfs`.
|
||||
|
||||
@@ -10,12 +10,14 @@ import (
|
||||
"github.com/CalebQ42/squashfs/internal/inode"
|
||||
)
|
||||
|
||||
// Creates a fuse mount, then mounts the archive on a separate goroutine.
|
||||
// If waiting for the mount to end, simply do <-con.Ready.
|
||||
func (r *Reader) Mount(mountpoint string) (con *fuse.Conn, err error) {
|
||||
con, err = fuse.Mount(mountpoint, fuse.ReadOnly())
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
err = fs.Serve(con, &squashFuse{r: r})
|
||||
go fs.Serve(con, &squashFuse{r: r})
|
||||
return
|
||||
}
|
||||
|
||||
|
||||
+121
-87
@@ -2,6 +2,7 @@ package data
|
||||
|
||||
import (
|
||||
"io"
|
||||
"sync"
|
||||
|
||||
"github.com/CalebQ42/squashfs/internal/decompress"
|
||||
"github.com/CalebQ42/squashfs/internal/toreader"
|
||||
@@ -26,9 +27,9 @@ func NewFullReader(r io.ReaderAt, start uint64, d decompress.Decompressor, block
|
||||
}
|
||||
}
|
||||
|
||||
func (r *FullReader) AddFragment(rdr func() (io.Reader, error)) {
|
||||
func (r *FullReader) AddFragment(rdr func() (io.Reader, error), size uint32) {
|
||||
r.fragRdr = rdr
|
||||
r.sizes = append(r.sizes, 0)
|
||||
r.sizes = append(r.sizes, size)
|
||||
}
|
||||
|
||||
type outDat struct {
|
||||
@@ -37,50 +38,50 @@ type outDat struct {
|
||||
i int
|
||||
}
|
||||
|
||||
func (r FullReader) process(index int, offset int64, out chan outDat) {
|
||||
var err error
|
||||
var dat []byte
|
||||
var rdr io.ReadCloser
|
||||
func (r FullReader) process(index int, offset int64, od *outDat, out chan *outDat) {
|
||||
defer func() {
|
||||
out <- od
|
||||
}()
|
||||
od.i = index
|
||||
size := realSize(r.sizes[index])
|
||||
if size == 0 {
|
||||
out <- outDat{
|
||||
i: index,
|
||||
err: nil,
|
||||
data: make([]byte, r.blockSize),
|
||||
}
|
||||
od.err = nil
|
||||
od.data = make([]byte, r.blockSize)
|
||||
return
|
||||
}
|
||||
// rdr := io.LimitReader(toreader.NewReader(r.r, offset), int64(size))
|
||||
if size == r.sizes[index] {
|
||||
//Special workaround for zstd for increased performance.
|
||||
if zstd, ok := r.d.(*decompress.Zstd); ok {
|
||||
dat = make([]byte, size)
|
||||
_, err = r.r.ReadAt(dat, offset)
|
||||
if err == nil {
|
||||
dat, err = zstd.Decode(dat)
|
||||
}
|
||||
} else {
|
||||
rdr, err = r.d.Reader(io.LimitReader(toreader.NewReader(r.r, offset), int64(size)))
|
||||
if err == nil {
|
||||
dat, err = io.ReadAll(rdr)
|
||||
if dec, ok := r.d.(decompress.Decoder); ok {
|
||||
dat := make([]byte, size)
|
||||
_, od.err = r.r.ReadAt(dat, offset)
|
||||
if od.err != nil {
|
||||
return
|
||||
}
|
||||
od.data, od.err = dec.Decode(dat, int(r.blockSize))
|
||||
return
|
||||
}
|
||||
var rdr io.ReadCloser
|
||||
rdr, od.err = r.d.Reader(io.LimitReader(toreader.NewReader(r.r, offset), int64(size)))
|
||||
if od.err != nil {
|
||||
return
|
||||
}
|
||||
od.data = make([]byte, r.blockSize)
|
||||
var read int
|
||||
read, od.err = rdr.Read(od.data)
|
||||
od.data = od.data[:read]
|
||||
rdr.Close()
|
||||
} else {
|
||||
dat = make([]byte, size)
|
||||
_, err = r.r.ReadAt(dat, offset)
|
||||
}
|
||||
out <- outDat{
|
||||
i: index,
|
||||
err: err,
|
||||
data: dat,
|
||||
}
|
||||
if clr, ok := rdr.(io.Closer); ok {
|
||||
clr.Close()
|
||||
od.data = make([]byte, size)
|
||||
_, od.err = r.r.ReadAt(od.data, offset)
|
||||
}
|
||||
}
|
||||
|
||||
func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
|
||||
out := make(chan outDat, len(r.sizes))
|
||||
pol := &sync.Pool{
|
||||
New: func() any {
|
||||
return new(outDat)
|
||||
},
|
||||
}
|
||||
out := make(chan *outDat, len(r.sizes))
|
||||
offset := r.start
|
||||
num := len(r.sizes)
|
||||
start := off / int64(r.blockSize)
|
||||
@@ -100,40 +101,42 @@ func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
|
||||
offset += uint64(realSize(r.sizes[i]))
|
||||
continue
|
||||
}
|
||||
od := pol.Get().(*outDat)
|
||||
if i == num-1 && r.fragRdr != nil {
|
||||
go func() {
|
||||
defer func() {
|
||||
out <- od
|
||||
}()
|
||||
rdr, e := r.fragRdr()
|
||||
if err != nil {
|
||||
out <- outDat{
|
||||
i: num - 1,
|
||||
err: e,
|
||||
}
|
||||
od.i = num - 1
|
||||
od.err = e
|
||||
return
|
||||
}
|
||||
dat, e := io.ReadAll(rdr)
|
||||
out <- outDat{
|
||||
i: num - 1,
|
||||
err: e,
|
||||
data: dat,
|
||||
}
|
||||
od.data = make([]byte, r.sizes[num-1])
|
||||
_, e = rdr.Read(od.data)
|
||||
od.i = num - 1
|
||||
od.err = e
|
||||
if clr, ok := rdr.(io.Closer); ok {
|
||||
clr.Close()
|
||||
}
|
||||
}()
|
||||
continue
|
||||
}
|
||||
go r.process(i, int64(offset), out)
|
||||
go r.process(i, int64(offset), od, out)
|
||||
offset += uint64(realSize(r.sizes[i]))
|
||||
}
|
||||
cur := start
|
||||
cache := make(map[int]outDat)
|
||||
for cur := start; cur < int64(end); {
|
||||
dat := <-out
|
||||
for dat := range out {
|
||||
if dat.err != nil {
|
||||
err = dat.err
|
||||
pol.Put(dat)
|
||||
return
|
||||
}
|
||||
if dat.i != int(cur) {
|
||||
cache[dat.i] = dat
|
||||
cache[dat.i] = *dat
|
||||
pol.Put(dat)
|
||||
continue
|
||||
}
|
||||
if cur == start {
|
||||
@@ -144,16 +147,18 @@ func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
|
||||
}
|
||||
n += len(dat.data)
|
||||
cur++
|
||||
pol.Put(dat)
|
||||
var ok bool
|
||||
var curDat outDat
|
||||
for {
|
||||
dat, ok = cache[int(cur)]
|
||||
curDat, ok = cache[int(cur)]
|
||||
if !ok {
|
||||
break
|
||||
}
|
||||
for i := range dat.data {
|
||||
p[n+i] = dat.data[i]
|
||||
for i := range curDat.data {
|
||||
p[n+i] = curDat.data[i]
|
||||
}
|
||||
n += len(dat.data)
|
||||
n += len(curDat.data)
|
||||
cur++
|
||||
delete(cache, int(cur))
|
||||
}
|
||||
@@ -165,58 +170,57 @@ func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
|
||||
}
|
||||
|
||||
func (r FullReader) WriteTo(w io.Writer) (n int64, err error) {
|
||||
out := make(chan outDat, len(r.sizes))
|
||||
pol := &sync.Pool{
|
||||
New: func() any {
|
||||
return new(outDat)
|
||||
},
|
||||
}
|
||||
out := make(chan *outDat, len(r.sizes))
|
||||
offset := r.start
|
||||
num := len(r.sizes)
|
||||
for i := 0; i < num; i++ {
|
||||
od := pol.Get().(*outDat)
|
||||
if i == num-1 && r.fragRdr != nil {
|
||||
go func() {
|
||||
defer func() {
|
||||
out <- od
|
||||
}()
|
||||
rdr, e := r.fragRdr()
|
||||
if err != nil {
|
||||
out <- outDat{
|
||||
i: num - 1,
|
||||
err: e,
|
||||
}
|
||||
od.i = num - 1
|
||||
od.err = e
|
||||
return
|
||||
}
|
||||
dat, e := io.ReadAll(rdr)
|
||||
out <- outDat{
|
||||
i: num - 1,
|
||||
err: e,
|
||||
data: dat,
|
||||
}
|
||||
buf := make([]byte, r.sizes[num-1])
|
||||
_, e = rdr.Read(buf)
|
||||
od.i = num - 1
|
||||
od.err = e
|
||||
od.data = buf
|
||||
if clr, ok := rdr.(io.Closer); ok {
|
||||
clr.Close()
|
||||
}
|
||||
}()
|
||||
continue
|
||||
}
|
||||
go r.process(i, int64(offset), out)
|
||||
go r.process(i, int64(offset), od, out)
|
||||
offset += uint64(realSize(r.sizes[i]))
|
||||
}
|
||||
cache := make(map[int]outDat)
|
||||
var tmpN int
|
||||
for cur := 0; cur < num; {
|
||||
dat := <-out
|
||||
if dat.err != nil {
|
||||
err = dat.err
|
||||
return
|
||||
}
|
||||
if dat.i != cur {
|
||||
cache[dat.i] = dat
|
||||
continue
|
||||
}
|
||||
tmpN, err = w.Write(dat.data)
|
||||
n += int64(tmpN)
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
cur++
|
||||
var ok bool
|
||||
for {
|
||||
dat, ok = cache[cur]
|
||||
if !ok {
|
||||
break
|
||||
wt, ok := w.(io.WriterAt)
|
||||
if !ok {
|
||||
var cur int
|
||||
cache := make(map[int]outDat)
|
||||
var tmpN int
|
||||
var dat *outDat
|
||||
for cur < len(r.sizes) {
|
||||
dat = <-out
|
||||
defer pol.Put(dat)
|
||||
if dat.err != nil {
|
||||
err = dat.err
|
||||
return
|
||||
}
|
||||
if dat.i != cur {
|
||||
cache[dat.i] = *dat
|
||||
continue
|
||||
}
|
||||
tmpN, err = w.Write(dat.data)
|
||||
n += int64(tmpN)
|
||||
@@ -224,6 +228,36 @@ func (r FullReader) WriteTo(w io.Writer) (n int64, err error) {
|
||||
return
|
||||
}
|
||||
cur++
|
||||
var ok bool
|
||||
var curDat outDat
|
||||
for {
|
||||
curDat, ok = cache[cur]
|
||||
if !ok {
|
||||
break
|
||||
}
|
||||
tmpN, err = w.Write(curDat.data)
|
||||
n += int64(tmpN)
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
cur++
|
||||
}
|
||||
}
|
||||
} else {
|
||||
var done int
|
||||
var dat *outDat
|
||||
for done < len(r.sizes) {
|
||||
dat = <-out
|
||||
defer pol.Put(dat)
|
||||
if dat.err != nil {
|
||||
err = dat.err
|
||||
return
|
||||
}
|
||||
_, err = wt.WriteAt(dat.data, int64(dat.i*int(r.blockSize)))
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
done++
|
||||
}
|
||||
}
|
||||
return
|
||||
|
||||
@@ -53,14 +53,14 @@ func (r *Reader) advance() (err error) {
|
||||
} else {
|
||||
r.cur = io.LimitReader(r.master, int64(size))
|
||||
if size == r.blockSizes[0] {
|
||||
if r.d.Resetable() {
|
||||
if rs, ok := r.d.(decompress.Resetable); ok {
|
||||
if r.comRdr == nil {
|
||||
r.cur, err = r.d.Reader(r.cur)
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
} else {
|
||||
err = r.d.Reset(r.comRdr, r.cur)
|
||||
err = rs.Reset(r.comRdr, r.cur)
|
||||
r.cur = r.comRdr
|
||||
}
|
||||
} else {
|
||||
|
||||
@@ -12,8 +12,6 @@ func (g GZip) Reader(src io.Reader) (io.ReadCloser, error) {
|
||||
return zlib.NewReader(src)
|
||||
}
|
||||
|
||||
func (g GZip) Resetable() bool { return true }
|
||||
|
||||
func (g GZip) Reset(old, src io.Reader) error {
|
||||
return old.(zlib.Resetter).Reset(src, nil)
|
||||
}
|
||||
|
||||
@@ -1,19 +1,22 @@
|
||||
package decompress
|
||||
|
||||
import (
|
||||
"errors"
|
||||
"io"
|
||||
)
|
||||
|
||||
var ErrNotResetable = errors.New("decompressor not resetable")
|
||||
|
||||
type Decompressor interface {
|
||||
//Creates a new decompressor reading from src.
|
||||
Reader(src io.Reader) (io.ReadCloser, error)
|
||||
//Reports whether Reset will work or not.
|
||||
Resetable() bool
|
||||
}
|
||||
|
||||
type Resetable interface {
|
||||
//Reset attempts to re-use an old decompressor with new data.
|
||||
//Will return ErrNotResetable if not Resetable().
|
||||
//Must ALWAYS be provided with a reader created with Reader.
|
||||
Reset(old, src io.Reader) error
|
||||
}
|
||||
|
||||
type Decoder interface {
|
||||
//Decodes a chunk of data all at once.
|
||||
Decode(in []byte, outSize int) ([]byte, error)
|
||||
}
|
||||
|
||||
@@ -12,9 +12,16 @@ func (l Lz4) Reader(r io.Reader) (io.ReadCloser, error) {
|
||||
return io.NopCloser(lz4.NewReader(r)), nil
|
||||
}
|
||||
|
||||
func (l Lz4) Resetable() bool { return true }
|
||||
|
||||
func (l Lz4) Reset(old, src io.Reader) error {
|
||||
old.(*lz4.Reader).Reset(src)
|
||||
return nil
|
||||
}
|
||||
|
||||
func (l Lz4) Decode(in []byte, outSize int) (out []byte, err error) {
|
||||
out = make([]byte, outSize)
|
||||
outLen, err := lz4.UncompressBlock(in, out)
|
||||
if outLen < outSize {
|
||||
out = out[:outLen]
|
||||
}
|
||||
return
|
||||
}
|
||||
|
||||
@@ -12,7 +12,3 @@ func (l Lzma) Reader(r io.Reader) (io.ReadCloser, error) {
|
||||
rdr, err := lzma.NewReader(r)
|
||||
return io.NopCloser(rdr), err
|
||||
}
|
||||
|
||||
func (l Lzma) Resetable() bool { return false }
|
||||
|
||||
func (l Lzma) Reset(old, src io.Reader) error { return ErrNotResetable }
|
||||
|
||||
@@ -16,7 +16,3 @@ func (l Lzo) Reader(r io.Reader) (io.ReadCloser, error) {
|
||||
}
|
||||
return io.NopCloser(bytes.NewReader(cache)), nil
|
||||
}
|
||||
|
||||
func (l Lzo) Resetable() bool { return false }
|
||||
|
||||
func (l Lzo) Reset(old, src io.Reader) error { return ErrNotResetable }
|
||||
|
||||
@@ -13,8 +13,6 @@ func (x Xz) Reader(r io.Reader) (io.ReadCloser, error) {
|
||||
return io.NopCloser(rdr), err
|
||||
}
|
||||
|
||||
func (x Xz) Resetable() bool { return true }
|
||||
|
||||
func (x Xz) Reset(old, src io.Reader) error {
|
||||
return old.(*xz.Reader).Reset(src)
|
||||
}
|
||||
|
||||
@@ -15,15 +15,13 @@ func (z Zstd) Reader(src io.Reader) (io.ReadCloser, error) {
|
||||
return r.IOReadCloser(), err
|
||||
}
|
||||
|
||||
func (z Zstd) Resetable() bool { return true }
|
||||
|
||||
func (z Zstd) Reset(old, src io.Reader) error {
|
||||
return old.(*zstd.Decoder).Reset(src)
|
||||
}
|
||||
|
||||
func (z *Zstd) Decode(in []byte) (out []byte, err error) {
|
||||
func (z Zstd) Decode(in []byte, outSize int) ([]byte, error) {
|
||||
if z.writeToReader == nil {
|
||||
z.writeToReader, _ = zstd.NewReader(nil)
|
||||
}
|
||||
return z.writeToReader.DecodeAll(in, nil)
|
||||
return z.writeToReader.DecodeAll(in, make([]byte, outSize))
|
||||
}
|
||||
|
||||
@@ -26,7 +26,7 @@ func realSize(siz uint16) uint16 {
|
||||
}
|
||||
|
||||
func (r *Reader) advance() (err error) {
|
||||
if !r.d.Resetable() {
|
||||
if _, ok := r.d.(decompress.Resetable); !ok {
|
||||
if clr, ok := r.cur.(io.Closer); ok {
|
||||
clr.Close()
|
||||
}
|
||||
@@ -39,14 +39,14 @@ func (r *Reader) advance() (err error) {
|
||||
size := realSize(raw)
|
||||
r.cur = io.LimitReader(r.master, int64(size))
|
||||
if size == raw {
|
||||
if r.d.Resetable() {
|
||||
if rs, ok := r.d.(decompress.Resetable); ok {
|
||||
if r.comRdr == nil {
|
||||
r.cur, err = r.d.Reader(r.cur)
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
} else {
|
||||
err = r.d.Reset(r.comRdr, r.cur)
|
||||
err = rs.Reset(r.comRdr, r.cur)
|
||||
r.cur = r.comRdr
|
||||
}
|
||||
} else {
|
||||
|
||||
@@ -0,0 +1,19 @@
|
||||
package toreader
|
||||
|
||||
import "io"
|
||||
|
||||
type OffsetReader struct {
|
||||
r io.ReaderAt
|
||||
off int64
|
||||
}
|
||||
|
||||
func NewOffsetReader(r io.ReaderAt, off int64) *OffsetReader {
|
||||
return &OffsetReader{
|
||||
r: r,
|
||||
off: off,
|
||||
}
|
||||
}
|
||||
|
||||
func (r OffsetReader) ReadAt(p []byte, off int64) (n int, e error) {
|
||||
return r.r.ReadAt(p, off+r.off)
|
||||
}
|
||||
@@ -6,7 +6,8 @@ type ReaderAt struct {
|
||||
d []byte
|
||||
}
|
||||
|
||||
func NewReaderAt(r io.Reader) (ra ReaderAt, err error) {
|
||||
func NewReaderAt(r io.Reader) (ra *ReaderAt, err error) {
|
||||
ra = new(ReaderAt)
|
||||
ra.d, err = io.ReadAll(r)
|
||||
return
|
||||
}
|
||||
|
||||
@@ -40,6 +40,10 @@ const (
|
||||
ZSTDCompression
|
||||
)
|
||||
|
||||
func NewReaderAtOffset(r io.ReaderAt, off int64) (*Reader, error) {
|
||||
return NewReader(toreader.NewOffsetReader(r, off))
|
||||
}
|
||||
|
||||
// Creates a new squashfs.Reader from the given io.Reader. NOTE: All data from the io.Reader will be read and stored in memory.
|
||||
func NewReaderFromReader(r io.Reader) (*Reader, error) {
|
||||
rdr, err := toreader.NewReaderAt(r)
|
||||
|
||||
+1
-1
@@ -70,7 +70,7 @@ func (r Reader) getReaders(i inode.Inode) (full *data.FullReader, rdr *data.Read
|
||||
}
|
||||
fragRdr = io.LimitReader(fragRdr, int64(fragSize))
|
||||
return fragRdr, nil
|
||||
})
|
||||
}, fragSize)
|
||||
var fragRdr io.Reader
|
||||
fragRdr, err = r.fragReader(fragInd)
|
||||
if err != nil {
|
||||
|
||||
@@ -73,7 +73,6 @@ func TestMisc(t *testing.T) {
|
||||
}
|
||||
|
||||
func BenchmarkRace(b *testing.B) {
|
||||
// tmpDir := b.TempDir()
|
||||
tmpDir := "testing"
|
||||
fil, err := preTest(tmpDir)
|
||||
if err != nil {
|
||||
|
||||
Reference in New Issue
Block a user