Compare commits

...

4 Commits

Author SHA1 Message Date
Caleb Gardner f61237a1f0 Added ReaderAtOffset 2022-12-22 02:00:42 -06:00
Caleb Gardner 820e06e792 fuse Serve in goroutine 2022-12-17 17:06:28 -06:00
Caleb Gardner 4f8f5f6928 Tweaks to decode interface 2022-12-17 16:47:33 -06:00
Caleb Gardner 1b5078c7bd Messing around with optimizations. 2022-12-14 13:48:22 -06:00
17 changed files with 175 additions and 122 deletions
+1 -3
View File
@@ -17,6 +17,4 @@ Thanks also to [distri's squashfs library](https://github.com/distr1/distri/tree
## Performance ## Performance
This library, decompressing the Firefox AppImage and using Go tests, takes about twice as long as `unsquashfs` on my quad core laptop. (~1 second with the library and about half a second with `unsquashfs`). Testing on a zstd compressed file, my library is anywhere from 5x ~ 7x slower than `unsquashfs`.
**My recent tests have shown the Firefox AppImage might be an outlier and this library might be considerably slower (4x ~ 6x slower than `unsquashfs`).**
+3 -1
View File
@@ -10,12 +10,14 @@ import (
"github.com/CalebQ42/squashfs/internal/inode" "github.com/CalebQ42/squashfs/internal/inode"
) )
// Creates a fuse mount, then mounts the archive on a separate goroutine.
// If waiting for the mount to end, simply do <-con.Ready.
func (r *Reader) Mount(mountpoint string) (con *fuse.Conn, err error) { func (r *Reader) Mount(mountpoint string) (con *fuse.Conn, err error) {
con, err = fuse.Mount(mountpoint, fuse.ReadOnly()) con, err = fuse.Mount(mountpoint, fuse.ReadOnly())
if err != nil { if err != nil {
return return
} }
err = fs.Serve(con, &squashFuse{r: r}) go fs.Serve(con, &squashFuse{r: r})
return return
} }
+104 -70
View File
@@ -2,6 +2,7 @@ package data
import ( import (
"io" "io"
"sync"
"github.com/CalebQ42/squashfs/internal/decompress" "github.com/CalebQ42/squashfs/internal/decompress"
"github.com/CalebQ42/squashfs/internal/toreader" "github.com/CalebQ42/squashfs/internal/toreader"
@@ -26,9 +27,9 @@ func NewFullReader(r io.ReaderAt, start uint64, d decompress.Decompressor, block
} }
} }
func (r *FullReader) AddFragment(rdr func() (io.Reader, error)) { func (r *FullReader) AddFragment(rdr func() (io.Reader, error), size uint32) {
r.fragRdr = rdr r.fragRdr = rdr
r.sizes = append(r.sizes, 0) r.sizes = append(r.sizes, size)
} }
type outDat struct { type outDat struct {
@@ -37,50 +38,50 @@ type outDat struct {
i int i int
} }
func (r FullReader) process(index int, offset int64, out chan outDat) { func (r FullReader) process(index int, offset int64, od *outDat, out chan *outDat) {
var err error defer func() {
var dat []byte out <- od
var rdr io.ReadCloser }()
od.i = index
size := realSize(r.sizes[index]) size := realSize(r.sizes[index])
if size == 0 { if size == 0 {
out <- outDat{ od.err = nil
i: index, od.data = make([]byte, r.blockSize)
err: nil,
data: make([]byte, r.blockSize),
}
return return
} }
// rdr := io.LimitReader(toreader.NewReader(r.r, offset), int64(size))
if size == r.sizes[index] { if size == r.sizes[index] {
//Special workaround for zstd for increased performancce. if dec, ok := r.d.(decompress.Decoder); ok {
if zstd, ok := r.d.(*decompress.Zstd); ok { dat := make([]byte, size)
dat = make([]byte, size) _, od.err = r.r.ReadAt(dat, offset)
_, err = r.r.ReadAt(dat, offset) if od.err != nil {
if err == nil { return
dat, err = zstd.Decode(dat)
} }
od.data, od.err = dec.Decode(dat, int(r.blockSize))
return
}
var rdr io.ReadCloser
rdr, od.err = r.d.Reader(io.LimitReader(toreader.NewReader(r.r, offset), int64(size)))
if od.err != nil {
return
}
od.data = make([]byte, r.blockSize)
var read int
read, od.err = rdr.Read(od.data)
od.data = od.data[:read]
rdr.Close()
} else { } else {
rdr, err = r.d.Reader(io.LimitReader(toreader.NewReader(r.r, offset), int64(size))) od.data = make([]byte, size)
if err == nil { _, od.err = r.r.ReadAt(od.data, offset)
dat, err = io.ReadAll(rdr)
}
}
} else {
dat = make([]byte, size)
_, err = r.r.ReadAt(dat, offset)
}
out <- outDat{
i: index,
err: err,
data: dat,
}
if clr, ok := rdr.(io.Closer); ok {
clr.Close()
} }
} }
func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) { func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
out := make(chan outDat, len(r.sizes)) pol := &sync.Pool{
New: func() any {
return new(outDat)
},
}
out := make(chan *outDat, len(r.sizes))
offset := r.start offset := r.start
num := len(r.sizes) num := len(r.sizes)
start := off / int64(r.blockSize) start := off / int64(r.blockSize)
@@ -100,40 +101,42 @@ func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
offset += uint64(realSize(r.sizes[i])) offset += uint64(realSize(r.sizes[i]))
continue continue
} }
od := pol.Get().(*outDat)
if i == num-1 && r.fragRdr != nil { if i == num-1 && r.fragRdr != nil {
go func() { go func() {
defer func() {
out <- od
}()
rdr, e := r.fragRdr() rdr, e := r.fragRdr()
if err != nil { if err != nil {
out <- outDat{ od.i = num - 1
i: num - 1, od.err = e
err: e,
}
return return
} }
dat, e := io.ReadAll(rdr) od.data = make([]byte, r.sizes[num-1])
out <- outDat{ _, e = rdr.Read(od.data)
i: num - 1, od.i = num - 1
err: e, od.err = e
data: dat,
}
if clr, ok := rdr.(io.Closer); ok { if clr, ok := rdr.(io.Closer); ok {
clr.Close() clr.Close()
} }
}() }()
continue continue
} }
go r.process(i, int64(offset), out) go r.process(i, int64(offset), od, out)
offset += uint64(realSize(r.sizes[i])) offset += uint64(realSize(r.sizes[i]))
} }
cur := start
cache := make(map[int]outDat) cache := make(map[int]outDat)
for cur := start; cur < int64(end); { for dat := range out {
dat := <-out
if dat.err != nil { if dat.err != nil {
err = dat.err err = dat.err
pol.Put(dat)
return return
} }
if dat.i != int(cur) { if dat.i != int(cur) {
cache[dat.i] = dat cache[dat.i] = *dat
pol.Put(dat)
continue continue
} }
if cur == start { if cur == start {
@@ -144,16 +147,18 @@ func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
} }
n += len(dat.data) n += len(dat.data)
cur++ cur++
pol.Put(dat)
var ok bool var ok bool
var curDat outDat
for { for {
dat, ok = cache[int(cur)] curDat, ok = cache[int(cur)]
if !ok { if !ok {
break break
} }
for i := range dat.data { for i := range curDat.data {
p[n+i] = dat.data[i] p[n+i] = curDat.data[i]
} }
n += len(dat.data) n += len(curDat.data)
cur++ cur++
delete(cache, int(cur)) delete(cache, int(cur))
} }
@@ -165,45 +170,56 @@ func (r FullReader) ReadAt(p []byte, off int64) (n int, err error) {
} }
func (r FullReader) WriteTo(w io.Writer) (n int64, err error) { func (r FullReader) WriteTo(w io.Writer) (n int64, err error) {
out := make(chan outDat, len(r.sizes)) pol := &sync.Pool{
New: func() any {
return new(outDat)
},
}
out := make(chan *outDat, len(r.sizes))
offset := r.start offset := r.start
num := len(r.sizes) num := len(r.sizes)
for i := 0; i < num; i++ { for i := 0; i < num; i++ {
od := pol.Get().(*outDat)
if i == num-1 && r.fragRdr != nil { if i == num-1 && r.fragRdr != nil {
go func() { go func() {
defer func() {
out <- od
}()
rdr, e := r.fragRdr() rdr, e := r.fragRdr()
if err != nil { if err != nil {
out <- outDat{ od.i = num - 1
i: num - 1, od.err = e
err: e,
}
return return
} }
dat, e := io.ReadAll(rdr) buf := make([]byte, r.sizes[num-1])
out <- outDat{ _, e = rdr.Read(buf)
i: num - 1, od.i = num - 1
err: e, od.err = e
data: dat, od.data = buf
}
if clr, ok := rdr.(io.Closer); ok { if clr, ok := rdr.(io.Closer); ok {
clr.Close() clr.Close()
} }
}() }()
continue continue
} }
go r.process(i, int64(offset), out) go r.process(i, int64(offset), od, out)
offset += uint64(realSize(r.sizes[i])) offset += uint64(realSize(r.sizes[i]))
} }
wt, ok := w.(io.WriterAt)
if !ok {
var cur int
cache := make(map[int]outDat) cache := make(map[int]outDat)
var tmpN int var tmpN int
for cur := 0; cur < num; { var dat *outDat
dat := <-out for cur < len(r.sizes) {
dat = <-out
defer pol.Put(dat)
if dat.err != nil { if dat.err != nil {
err = dat.err err = dat.err
return return
} }
if dat.i != cur { if dat.i != cur {
cache[dat.i] = dat cache[dat.i] = *dat
continue continue
} }
tmpN, err = w.Write(dat.data) tmpN, err = w.Write(dat.data)
@@ -213,12 +229,13 @@ func (r FullReader) WriteTo(w io.Writer) (n int64, err error) {
} }
cur++ cur++
var ok bool var ok bool
var curDat outDat
for { for {
dat, ok = cache[cur] curDat, ok = cache[cur]
if !ok { if !ok {
break break
} }
tmpN, err = w.Write(dat.data) tmpN, err = w.Write(curDat.data)
n += int64(tmpN) n += int64(tmpN)
if err != nil { if err != nil {
return return
@@ -226,5 +243,22 @@ func (r FullReader) WriteTo(w io.Writer) (n int64, err error) {
cur++ cur++
} }
} }
} else {
var done int
var dat *outDat
for done < len(r.sizes) {
dat = <-out
defer pol.Put(dat)
if dat.err != nil {
err = dat.err
return
}
_, err = wt.WriteAt(dat.data, int64(dat.i*int(r.blockSize)))
if err != nil {
return
}
done++
}
}
return return
} }
+2 -2
View File
@@ -53,14 +53,14 @@ func (r *Reader) advance() (err error) {
} else { } else {
r.cur = io.LimitReader(r.master, int64(size)) r.cur = io.LimitReader(r.master, int64(size))
if size == r.blockSizes[0] { if size == r.blockSizes[0] {
if r.d.Resetable() { if rs, ok := r.d.(decompress.Resetable); ok {
if r.comRdr == nil { if r.comRdr == nil {
r.cur, err = r.d.Reader(r.cur) r.cur, err = r.d.Reader(r.cur)
if err != nil { if err != nil {
return return
} }
} else { } else {
err = r.d.Reset(r.comRdr, r.cur) err = rs.Reset(r.comRdr, r.cur)
r.cur = r.comRdr r.cur = r.comRdr
} }
} else { } else {
-2
View File
@@ -12,8 +12,6 @@ func (g GZip) Reader(src io.Reader) (io.ReadCloser, error) {
return zlib.NewReader(src) return zlib.NewReader(src)
} }
func (g GZip) Resetable() bool { return true }
func (g GZip) Reset(old, src io.Reader) error { func (g GZip) Reset(old, src io.Reader) error {
return old.(zlib.Resetter).Reset(src, nil) return old.(zlib.Resetter).Reset(src, nil)
} }
+8 -5
View File
@@ -1,19 +1,22 @@
package decompress package decompress
import ( import (
"errors"
"io" "io"
) )
var ErrNotResetable = errors.New("decompressor not resetable")
type Decompressor interface { type Decompressor interface {
//Creates a new decompressor reading from src. //Creates a new decompressor reading from src.
Reader(src io.Reader) (io.ReadCloser, error) Reader(src io.Reader) (io.ReadCloser, error)
//Reports whether Reset will work or not. }
Resetable() bool
type Resetable interface {
//Reset attempts to re-use an old decompressor with new data. //Reset attempts to re-use an old decompressor with new data.
//Will return ErrNotResetable if not Resetable(). //Will return ErrNotResetable if not Resetable().
//Must ALWAYS be provided with a reader created with Reader. //Must ALWAYS be provided with a reader created with Reader.
Reset(old, src io.Reader) error Reset(old, src io.Reader) error
} }
// Decoder is an optional interface for decompressors that can decompress a
// whole in-memory chunk in a single call instead of streaming it through a
// Reader. Callers discover it with a type assertion on a Decompressor.
type Decoder interface {
// Decode decompresses in all at once and returns the decompressed bytes.
// outSize is a size hint for the output; FullReader passes its block size.
// NOTE(review): whether the result may be shorter or longer than outSize is
// left to each implementation — confirm against every decompressor.
Decode(in []byte, outSize int) ([]byte, error)
}
+9 -2
View File
@@ -12,9 +12,16 @@ func (l Lz4) Reader(r io.Reader) (io.ReadCloser, error) {
return io.NopCloser(lz4.NewReader(r)), nil return io.NopCloser(lz4.NewReader(r)), nil
} }
func (l Lz4) Resetable() bool { return true }
func (l Lz4) Reset(old, src io.Reader) error { func (l Lz4) Reset(old, src io.Reader) error {
old.(*lz4.Reader).Reset(src) old.(*lz4.Reader).Reset(src)
return nil return nil
} }
// Decode decompresses a single lz4 block held entirely in memory.
//
// A buffer of outSize bytes is allocated for the result. If the block
// decompresses to fewer bytes than that, the returned slice is trimmed to the
// number of bytes actually produced. Any error from lz4.UncompressBlock is
// returned unchanged alongside the (possibly trimmed) buffer.
func (l Lz4) Decode(in []byte, outSize int) (out []byte, err error) {
	out = make([]byte, outSize)
	var written int
	written, err = lz4.UncompressBlock(in, out)
	if written < outSize {
		// Shrink to what was really written so callers never see padding.
		out = out[:written]
	}
	return
}
-4
View File
@@ -12,7 +12,3 @@ func (l Lzma) Reader(r io.Reader) (io.ReadCloser, error) {
rdr, err := lzma.NewReader(r) rdr, err := lzma.NewReader(r)
return io.NopCloser(rdr), err return io.NopCloser(rdr), err
} }
func (l Lzma) Resetable() bool { return false }
func (l Lzma) Reset(old, src io.Reader) error { return ErrNotResetable }
-4
View File
@@ -16,7 +16,3 @@ func (l Lzo) Reader(r io.Reader) (io.ReadCloser, error) {
} }
return io.NopCloser(bytes.NewReader(cache)), nil return io.NopCloser(bytes.NewReader(cache)), nil
} }
func (l Lzo) Resetable() bool { return false }
func (l Lzo) Reset(old, src io.Reader) error { return ErrNotResetable }
-2
View File
@@ -13,8 +13,6 @@ func (x Xz) Reader(r io.Reader) (io.ReadCloser, error) {
return io.NopCloser(rdr), err return io.NopCloser(rdr), err
} }
func (x Xz) Resetable() bool { return true }
func (x Xz) Reset(old, src io.Reader) error { func (x Xz) Reset(old, src io.Reader) error {
return old.(*xz.Reader).Reset(src) return old.(*xz.Reader).Reset(src)
} }
+2 -4
View File
@@ -15,15 +15,13 @@ func (z Zstd) Reader(src io.Reader) (io.ReadCloser, error) {
return r.IOReadCloser(), err return r.IOReadCloser(), err
} }
func (z Zstd) Resetable() bool { return true }
func (z Zstd) Reset(old, src io.Reader) error { func (z Zstd) Reset(old, src io.Reader) error {
return old.(*zstd.Decoder).Reset(src) return old.(*zstd.Decoder).Reset(src)
} }
func (z *Zstd) Decode(in []byte) (out []byte, err error) { func (z Zstd) Decode(in []byte, outSize int) ([]byte, error) {
if z.writeToReader == nil { if z.writeToReader == nil {
z.writeToReader, _ = zstd.NewReader(nil) z.writeToReader, _ = zstd.NewReader(nil)
} }
return z.writeToReader.DecodeAll(in, nil) return z.writeToReader.DecodeAll(in, make([]byte, outSize))
} }
+3 -3
View File
@@ -26,7 +26,7 @@ func realSize(siz uint16) uint16 {
} }
func (r *Reader) advance() (err error) { func (r *Reader) advance() (err error) {
if !r.d.Resetable() { if _, ok := r.d.(decompress.Resetable); !ok {
if clr, ok := r.cur.(io.Closer); ok { if clr, ok := r.cur.(io.Closer); ok {
clr.Close() clr.Close()
} }
@@ -39,14 +39,14 @@ func (r *Reader) advance() (err error) {
size := realSize(raw) size := realSize(raw)
r.cur = io.LimitReader(r.master, int64(size)) r.cur = io.LimitReader(r.master, int64(size))
if size == raw { if size == raw {
if r.d.Resetable() { if rs, ok := r.d.(decompress.Resetable); ok {
if r.comRdr == nil { if r.comRdr == nil {
r.cur, err = r.d.Reader(r.cur) r.cur, err = r.d.Reader(r.cur)
if err != nil { if err != nil {
return return
} }
} else { } else {
err = r.d.Reset(r.comRdr, r.cur) err = rs.Reset(r.comRdr, r.cur)
r.cur = r.comRdr r.cur = r.comRdr
} }
} else { } else {
+19
View File
@@ -0,0 +1,19 @@
package toreader
import "io"
// OffsetReader wraps an io.ReaderAt and shifts every read forward by a fixed
// number of bytes.
type OffsetReader struct {
	r   io.ReaderAt // underlying source that is actually read from
	off int64       // added to the offset of every ReadAt call
}

// NewOffsetReader returns an OffsetReader that reads from r, treating byte
// off of r as position zero.
func NewOffsetReader(r io.ReaderAt, off int64) *OffsetReader {
	shifted := new(OffsetReader)
	shifted.r = r
	shifted.off = off
	return shifted
}

// ReadAt reads len(p) bytes from the underlying reader, starting at the
// requested offset plus the fixed offset given at construction. The byte
// count and error come straight from the wrapped reader.
func (r OffsetReader) ReadAt(p []byte, off int64) (n int, e error) {
	n, e = r.r.ReadAt(p, r.off+off)
	return
}
+2 -1
View File
@@ -6,7 +6,8 @@ type ReaderAt struct {
d []byte d []byte
} }
func NewReaderAt(r io.Reader) (ra ReaderAt, err error) { func NewReaderAt(r io.Reader) (ra *ReaderAt, err error) {
ra = new(ReaderAt)
ra.d, err = io.ReadAll(r) ra.d, err = io.ReadAll(r)
return return
} }
+4
View File
@@ -40,6 +40,10 @@ const (
ZSTDCompression ZSTDCompression
) )
// NewReaderAtOffset creates a new squashfs.Reader from r, reading it as though
// it started off bytes in. It wraps r in a toreader.OffsetReader and hands
// that to NewReader.
func NewReaderAtOffset(r io.ReaderAt, off int64) (*Reader, error) {
	shifted := toreader.NewOffsetReader(r, off)
	return NewReader(shifted)
}
// Creates a new squashfs.Reader from the given io.Reader. NOTE: All data from the io.Reader will be read and stored in memory. // Creates a new squashfs.Reader from the given io.Reader. NOTE: All data from the io.Reader will be read and stored in memory.
func NewReaderFromReader(r io.Reader) (*Reader, error) { func NewReaderFromReader(r io.Reader) (*Reader, error) {
rdr, err := toreader.NewReaderAt(r) rdr, err := toreader.NewReaderAt(r)
+1 -1
View File
@@ -70,7 +70,7 @@ func (r Reader) getReaders(i inode.Inode) (full *data.FullReader, rdr *data.Read
} }
fragRdr = io.LimitReader(fragRdr, int64(fragSize)) fragRdr = io.LimitReader(fragRdr, int64(fragSize))
return fragRdr, nil return fragRdr, nil
}) }, fragSize)
var fragRdr io.Reader var fragRdr io.Reader
fragRdr, err = r.fragReader(fragInd) fragRdr, err = r.fragReader(fragInd)
if err != nil { if err != nil {
-1
View File
@@ -73,7 +73,6 @@ func TestMisc(t *testing.T) {
} }
func BenchmarkRace(b *testing.B) { func BenchmarkRace(b *testing.B) {
// tmpDir := b.TempDir()
tmpDir := "testing" tmpDir := "testing"
fil, err := preTest(tmpDir) fil, err := preTest(tmpDir)
if err != nil { if err != nil {