2021-10-14 23:39:48 +00:00
|
|
|
package file
|
|
|
|
|
|
|
|
import (
|
|
|
|
"archive/zip"
|
2023-02-15 23:06:12 +00:00
|
|
|
"bytes"
|
2022-07-13 06:30:54 +00:00
|
|
|
"errors"
|
|
|
|
"fmt"
|
2021-10-14 23:39:48 +00:00
|
|
|
"io"
|
|
|
|
"io/fs"
|
2022-07-13 06:30:54 +00:00
|
|
|
"path/filepath"
|
2023-02-15 23:06:12 +00:00
|
|
|
|
|
|
|
"github.com/stashapp/stash/pkg/logger"
|
2023-09-01 00:39:29 +00:00
|
|
|
"github.com/stashapp/stash/pkg/models"
|
2023-02-15 23:06:12 +00:00
|
|
|
"github.com/xWTF/chardet"
|
|
|
|
|
|
|
|
"golang.org/x/net/html/charset"
|
|
|
|
"golang.org/x/text/transform"
|
2021-10-14 23:39:48 +00:00
|
|
|
)
|
|
|
|
|
2022-07-13 06:30:54 +00:00
|
|
|
var (
	// errNotReaderAt is returned by newZipFS when the file it opened does
	// not implement io.ReaderAt.
	errNotReaderAt = errors.New("not a ReaderAt")
	// errZipFSOpenZip is returned by zipFS.OpenZip: a zip file cannot be
	// opened from inside another zip file.
	errZipFSOpenZip = errors.New("cannot open zip file inside zip file")
)
|
2021-10-14 23:39:48 +00:00
|
|
|
|
2022-07-13 06:30:54 +00:00
|
|
|
// zipFS is a file system backed by a zip file.
type zipFS struct {
	// Reader is the embedded zip reader; Open resolves entries through it.
	*zip.Reader
	// zipFileCloser is closed by Close. newZipFS sets it to the file that
	// backs the zip reader.
	zipFileCloser io.Closer
	// zipPath is the path of the zip file itself. Names passed to the
	// methods are made relative to it before being looked up in the archive.
	zipPath string
}
|
|
|
|
|
2024-09-11 03:58:02 +00:00
|
|
|
func newZipFS(fs models.FS, path string, size int64) (*zipFS, error) {
|
2022-07-13 06:30:54 +00:00
|
|
|
reader, err := fs.Open(path)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
asReaderAt, _ := reader.(io.ReaderAt)
|
|
|
|
if asReaderAt == nil {
|
|
|
|
reader.Close()
|
|
|
|
return nil, errNotReaderAt
|
|
|
|
}
|
|
|
|
|
2024-09-11 03:58:02 +00:00
|
|
|
zipReader, err := zip.NewReader(asReaderAt, size)
|
2022-07-13 06:30:54 +00:00
|
|
|
if err != nil {
|
|
|
|
reader.Close()
|
|
|
|
return nil, err
|
|
|
|
}
|
2021-10-14 23:39:48 +00:00
|
|
|
|
2023-02-15 23:06:12 +00:00
|
|
|
// Concat all Name and Comment for better detection result
|
|
|
|
var buffer bytes.Buffer
|
|
|
|
for _, f := range zipReader.File {
|
|
|
|
buffer.WriteString(f.Name)
|
|
|
|
buffer.WriteString(f.Comment)
|
|
|
|
}
|
|
|
|
buffer.WriteString(zipReader.Comment)
|
|
|
|
|
|
|
|
// Detect encoding
|
|
|
|
d, err := chardet.NewTextDetector().DetectBest(buffer.Bytes())
|
|
|
|
if err != nil {
|
2023-03-23 22:04:48 +00:00
|
|
|
// If we can't detect the encoding, just assume it's UTF8
|
|
|
|
logger.Warnf("Unable to detect decoding for %s: %w", path, err)
|
2023-02-15 23:06:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// If the charset is not UTF8, decode'em
|
2023-03-23 22:04:48 +00:00
|
|
|
if d != nil && d.Charset != "UTF-8" {
|
2023-02-15 23:06:12 +00:00
|
|
|
logger.Debugf("Detected non-utf8 zip charset %s (%s): %s", d.Charset, d.Language, path)
|
|
|
|
|
|
|
|
e, _ := charset.Lookup(d.Charset)
|
|
|
|
if e == nil {
|
2023-03-23 22:04:48 +00:00
|
|
|
// if we can't find the encoding, just assume it's UTF8
|
|
|
|
logger.Warnf("Failed to lookup charset %s, language %s", d.Charset, d.Language)
|
|
|
|
} else {
|
|
|
|
decoder := e.NewDecoder()
|
|
|
|
for _, f := range zipReader.File {
|
|
|
|
newName, _, err := transform.String(decoder, f.Name)
|
|
|
|
if err != nil {
|
|
|
|
reader.Close()
|
|
|
|
logger.Warnf("Failed to decode %v: %v", []byte(f.Name), err)
|
|
|
|
} else {
|
|
|
|
f.Name = newName
|
|
|
|
}
|
|
|
|
// Comments are not decoded cuz stash doesn't use that
|
2023-02-15 23:06:12 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-01 00:39:29 +00:00
|
|
|
return &zipFS{
|
2022-07-13 06:30:54 +00:00
|
|
|
Reader: zipReader,
|
|
|
|
zipFileCloser: reader,
|
|
|
|
zipPath: path,
|
|
|
|
}, nil
|
2021-10-14 23:39:48 +00:00
|
|
|
}
|
|
|
|
|
2023-09-01 00:39:29 +00:00
|
|
|
func (f *zipFS) rel(name string) (string, error) {
|
2022-07-13 06:30:54 +00:00
|
|
|
if f.zipPath == name {
|
|
|
|
return ".", nil
|
|
|
|
}
|
|
|
|
|
|
|
|
relName, err := filepath.Rel(f.zipPath, name)
|
|
|
|
if err != nil {
|
|
|
|
return "", fmt.Errorf("internal error getting relative path: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// convert relName to use slash, since zip files do so regardless
|
|
|
|
// of os
|
|
|
|
relName = filepath.ToSlash(relName)
|
|
|
|
|
|
|
|
return relName, nil
|
2021-10-14 23:39:48 +00:00
|
|
|
}
|
|
|
|
|
2023-09-01 00:39:29 +00:00
|
|
|
func (f *zipFS) Stat(name string) (fs.FileInfo, error) {
|
2022-07-13 06:30:54 +00:00
|
|
|
reader, err := f.Open(name)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
2021-10-14 23:39:48 +00:00
|
|
|
}
|
2022-07-13 06:30:54 +00:00
|
|
|
defer reader.Close()
|
|
|
|
|
|
|
|
return reader.Stat()
|
|
|
|
}
|
|
|
|
|
2023-09-01 00:39:29 +00:00
|
|
|
// Lstat returns the file info for name. It simply delegates to Stat.
func (f *zipFS) Lstat(name string) (fs.FileInfo, error) {
	return f.Stat(name)
}
|
|
|
|
|
2024-09-11 03:58:02 +00:00
|
|
|
// OpenZip always fails with errZipFSOpenZip: opening a zip file located
// inside another zip file is not supported. Both arguments are ignored.
func (f *zipFS) OpenZip(name string, size int64) (models.ZipFS, error) {
	return nil, errZipFSOpenZip
}
|
|
|
|
|
2023-09-01 00:39:29 +00:00
|
|
|
// IsPathCaseSensitive always reports true with a nil error; the path
// argument is not consulted.
func (f *zipFS) IsPathCaseSensitive(path string) (bool, error) {
	return true, nil
}
|
|
|
|
|
2022-07-13 06:30:54 +00:00
|
|
|
// zipReadDirFile wraps an fs.File so that it always exposes a ReadDir
// method, whether or not the wrapped file is a directory.
type zipReadDirFile struct {
	fs.File
}

// ReadDir forwards to the wrapped file's ReadDir when the wrapped file
// implements fs.ReadDirFile, and returns an error otherwise.
func (f *zipReadDirFile) ReadDir(n int) ([]fs.DirEntry, error) {
	if dir, ok := f.File.(fs.ReadDirFile); ok {
		return dir.ReadDir(n)
	}

	return nil, fmt.Errorf("internal error: not a ReadDirFile")
}
|
|
|
|
|
2023-09-01 00:39:29 +00:00
|
|
|
func (f *zipFS) Open(name string) (fs.ReadDirFile, error) {
|
2022-07-13 06:30:54 +00:00
|
|
|
relName, err := f.rel(name)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
r, err := f.Reader.Open(relName)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return &zipReadDirFile{
|
|
|
|
File: r,
|
|
|
|
}, nil
|
2021-10-14 23:39:48 +00:00
|
|
|
}
|
|
|
|
|
2023-09-01 00:39:29 +00:00
|
|
|
// Close closes the closer stored in zipFileCloser and returns its error.
func (f *zipFS) Close() error {
	return f.zipFileCloser.Close()
}
|
|
|
|
|
2022-07-13 06:30:54 +00:00
|
|
|
// openOnly returns a ReadCloser where calling Close will close the zip fs as well.
|
2023-09-01 00:39:29 +00:00
|
|
|
func (f *zipFS) OpenOnly(name string) (io.ReadCloser, error) {
|
2022-07-13 06:30:54 +00:00
|
|
|
r, err := f.Open(name)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
2021-10-14 23:39:48 +00:00
|
|
|
}
|
2022-07-13 06:30:54 +00:00
|
|
|
|
|
|
|
return &wrappedReadCloser{
|
|
|
|
ReadCloser: r,
|
|
|
|
outer: f,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// wrappedReadCloser pairs a ReadCloser with a second closer that is closed
// together with it.
type wrappedReadCloser struct {
	io.ReadCloser
	// outer is closed after the embedded ReadCloser.
	outer io.Closer
}

// Close closes the embedded ReadCloser first, discarding its error, and
// then closes outer, returning outer's error.
func (w *wrappedReadCloser) Close() error {
	inner, outer := w.ReadCloser, w.outer

	// The inner close error is deliberately dropped; only the outer result
	// is reported.
	_ = inner.Close()

	return outer.Close()
}
|