perkeep/pkg/fs/fs.go

423 lines
10 KiB
Go

// +build linux darwin
/*
Copyright 2011 The Perkeep Authors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
// Package fs implements a FUSE filesystem for Camlistore and is
// used by the pk-mount binary.
package fs // import "perkeep.org/pkg/fs"
import (
"context"
"fmt"
"io"
"log"
"os"
"sync"
"time"
"perkeep.org/internal/lru"
"perkeep.org/pkg/blob"
"perkeep.org/pkg/client"
"perkeep.org/pkg/schema"
"bazil.org/fuse"
fusefs "bazil.org/fuse/fs"
)
var serverStart = time.Now()
type CamliFileSystem struct {
fetcher blob.Fetcher
client *client.Client // or nil, if not doing search queries
root fusefs.Node
// IgnoreOwners, if true, collapses all file ownership to the
// uid/gid running the fuse filesystem, and sets all the
// permissions to 0600/0700.
IgnoreOwners bool
blobToSchema *lru.Cache // ~map[blobstring]*schema.Blob
nameToBlob *lru.Cache // ~map[string]blob.Ref
nameToAttr *lru.Cache // ~map[string]*fuse.Attr
}
var _ fusefs.FS = (*CamliFileSystem)(nil)
func newCamliFileSystem(fetcher blob.Fetcher) *CamliFileSystem {
return &CamliFileSystem{
fetcher: fetcher,
blobToSchema: lru.New(1024), // arbitrary; TODO: tunable/smarter?
nameToBlob: lru.New(1024), // arbitrary: TODO: tunable/smarter?
nameToAttr: lru.New(1024), // arbitrary: TODO: tunable/smarter?
}
}
// NewDefaultCamliFileSystem returns a filesystem with a generic base, from which
// users can navigate by blobref, tag, date, etc.
func NewDefaultCamliFileSystem(client *client.Client, fetcher blob.Fetcher) *CamliFileSystem {
if client == nil || fetcher == nil {
panic("nil argument")
}
fs := newCamliFileSystem(fetcher)
fs.root = &root{fs: fs} // root.go
fs.client = client
return fs
}
// NewRootedCamliFileSystem returns a CamliFileSystem with a node based on a blobref
// as its base.
func NewRootedCamliFileSystem(cli *client.Client, fetcher blob.Fetcher, root blob.Ref) (*CamliFileSystem, error) {
fs := newCamliFileSystem(fetcher)
fs.client = cli
n, err := fs.newNodeFromBlobRef(root)
if err != nil {
return nil, err
}
fs.root = n
return fs, nil
}
// node implements fuse.Node with a read-only Camli "file" or
// "directory" blob.
type node struct {
fs *CamliFileSystem
blobref blob.Ref
pnodeModTime time.Time // optionally set by recent.go; modtime of permanode
dmu sync.Mutex // guards dirents. acquire before mu.
dirents []fuse.Dirent // nil until populated once
mu sync.Mutex // guards rest
attr fuse.Attr
meta *schema.Blob
lookMap map[string]blob.Ref
}
var _ fusefs.Node = (*node)(nil)
func (n *node) Attr(ctx context.Context, a *fuse.Attr) error {
if _, err := n.schema(); err != nil {
return err
}
*a = n.attr
return nil
}
func (n *node) addLookupEntry(name string, ref blob.Ref) {
n.mu.Lock()
defer n.mu.Unlock()
if n.lookMap == nil {
n.lookMap = make(map[string]blob.Ref)
}
n.lookMap[name] = ref
}
var _ fusefs.NodeStringLookuper = (*node)(nil)
func (n *node) Lookup(ctx context.Context, name string) (fusefs.Node, error) {
if name == ".quitquitquit" {
// TODO: only in dev mode
log.Fatalf("Shutting down due to .quitquitquit lookup.")
}
// If we haven't done Readdir yet (dirents isn't set), then force a Readdir
// call to populate lookMap.
n.dmu.Lock()
loaded := n.dirents != nil
n.dmu.Unlock()
if !loaded {
n.ReadDirAll(nil)
}
n.mu.Lock()
defer n.mu.Unlock()
ref, ok := n.lookMap[name]
if !ok {
return nil, fuse.ENOENT
}
return &node{fs: n.fs, blobref: ref}, nil
}
func (n *node) schema() (*schema.Blob, error) {
// TODO: use singleflight library here instead of a lock?
n.mu.Lock()
defer n.mu.Unlock()
if n.meta != nil {
return n.meta, nil
}
blob, err := n.fs.fetchSchemaMeta(n.blobref)
if err == nil {
n.meta = blob
n.populateAttr()
}
return blob, err
}
func isWriteFlags(flags fuse.OpenFlags) bool {
// TODO read/writeness are not flags, use O_ACCMODE
return flags&fuse.OpenFlags(os.O_WRONLY|os.O_RDWR|os.O_APPEND|os.O_CREATE) != 0
}
var _ fusefs.NodeOpener = (*node)(nil)
func (n *node) Open(ctx context.Context, req *fuse.OpenRequest, res *fuse.OpenResponse) (fusefs.Handle, error) {
log.Printf("CAMLI Open on %v: %#v", n.blobref, req)
if isWriteFlags(req.Flags) {
return nil, fuse.EPERM
}
ss, err := n.schema()
if err != nil {
log.Printf("open of %v: %v", n.blobref, err)
return nil, fuse.EIO
}
if ss.Type() == "directory" {
return n, nil
}
fr, err := ss.NewFileReader(n.fs.fetcher)
if err != nil {
// Will only happen if ss.Type != "file" or "bytes"
log.Printf("NewFileReader(%s) = %v", n.blobref, err)
return nil, fuse.EIO
}
return &nodeReader{n: n, fr: fr}, nil
}
type nodeReader struct {
n *node
fr *schema.FileReader
}
var _ fusefs.HandleReader = (*nodeReader)(nil)
func (nr *nodeReader) Read(ctx context.Context, req *fuse.ReadRequest, res *fuse.ReadResponse) error {
log.Printf("CAMLI nodeReader READ on %v: %#v", nr.n.blobref, req)
if req.Offset >= nr.fr.Size() {
return nil
}
size := req.Size
if int64(size)+req.Offset >= nr.fr.Size() {
size -= int((int64(size) + req.Offset) - nr.fr.Size())
}
buf := make([]byte, size)
n, err := nr.fr.ReadAt(buf, req.Offset)
if err == io.EOF {
err = nil
}
if err != nil {
log.Printf("camli read on %v at %d: %v", nr.n.blobref, req.Offset, err)
return fuse.EIO
}
res.Data = buf[:n]
return nil
}
var _ fusefs.HandleReleaser = (*nodeReader)(nil)
func (nr *nodeReader) Release(ctx context.Context, req *fuse.ReleaseRequest) error {
log.Printf("CAMLI nodeReader RELEASE on %v", nr.n.blobref)
nr.fr.Close()
return nil
}
var _ fusefs.HandleReadDirAller = (*node)(nil)
func (n *node) ReadDirAll(ctx context.Context) ([]fuse.Dirent, error) {
log.Printf("CAMLI ReadDirAll on %v", n.blobref)
n.dmu.Lock()
defer n.dmu.Unlock()
if n.dirents != nil {
return n.dirents, nil
}
ss, err := n.schema()
if err != nil {
log.Printf("camli.ReadDirAll error on %v: %v", n.blobref, err)
return nil, fuse.EIO
}
dr, err := schema.NewDirReader(n.fs.fetcher, ss.BlobRef())
if err != nil {
log.Printf("camli.ReadDirAll error on %v: %v", n.blobref, err)
return nil, fuse.EIO
}
schemaEnts, err := dr.Readdir(-1)
if err != nil {
log.Printf("camli.ReadDirAll error on %v: %v", n.blobref, err)
return nil, fuse.EIO
}
n.dirents = make([]fuse.Dirent, 0)
for _, sent := range schemaEnts {
if name := sent.FileName(); name != "" {
n.addLookupEntry(name, sent.BlobRef())
n.dirents = append(n.dirents, fuse.Dirent{Name: name})
}
}
return n.dirents, nil
}
// populateAttr should only be called once n.ss is known to be set and
// non-nil
func (n *node) populateAttr() error {
meta := n.meta
n.attr.Mode = meta.FileMode()
if n.fs.IgnoreOwners {
n.attr.Uid = uint32(os.Getuid())
n.attr.Gid = uint32(os.Getgid())
executeBit := n.attr.Mode & 0100
n.attr.Mode = (n.attr.Mode ^ n.attr.Mode.Perm()) | 0400 | executeBit
} else {
n.attr.Uid = uint32(meta.MapUid())
n.attr.Gid = uint32(meta.MapGid())
}
// TODO: inode?
if mt := meta.ModTime(); !mt.IsZero() {
n.attr.Mtime = mt
} else {
n.attr.Mtime = n.pnodeModTime
}
switch meta.Type() {
case "file":
n.attr.Size = uint64(meta.PartsSize())
n.attr.Blocks = 0 // TODO: set?
n.attr.Mode |= 0400
case "directory":
n.attr.Mode |= 0500
case "symlink":
n.attr.Mode |= 0400
default:
log.Printf("unknown attr ss.Type %q in populateAttr", meta.Type())
}
return nil
}
func (fs *CamliFileSystem) Root() (fusefs.Node, error) {
return fs.root, nil
}
var _ fusefs.FSStatfser = (*CamliFileSystem)(nil)
func (fs *CamliFileSystem) Statfs(ctx context.Context, req *fuse.StatfsRequest, res *fuse.StatfsResponse) error {
// Make some stuff up, just to see if it makes "lsof" happy.
res.Blocks = 1 << 35
res.Bfree = 1 << 34
res.Bavail = 1 << 34
res.Files = 1 << 29
res.Ffree = 1 << 28
res.Namelen = 2048
res.Bsize = 1024
return nil
}
// Errors returned are:
// os.ErrNotExist -- blob not found
// os.ErrInvalid -- not JSON or a camli schema blob
func (fs *CamliFileSystem) fetchSchemaMeta(br blob.Ref) (*schema.Blob, error) {
blobStr := br.String()
if blob, ok := fs.blobToSchema.Get(blobStr); ok {
return blob.(*schema.Blob), nil
}
rc, _, err := fs.fetcher.Fetch(br)
if err != nil {
return nil, err
}
defer rc.Close()
blob, err := schema.BlobFromReader(br, rc)
if err != nil {
log.Printf("Error parsing %s as schema blob: %v", br, err)
return nil, os.ErrInvalid
}
if blob.Type() == "" {
log.Printf("blob %s is JSON but lacks camliType", br)
return nil, os.ErrInvalid
}
fs.blobToSchema.Add(blobStr, blob)
return blob, nil
}
// consolated logic for determining a node to mount based on an arbitrary blobref
func (fs *CamliFileSystem) newNodeFromBlobRef(root blob.Ref) (fusefs.Node, error) {
blob, err := fs.fetchSchemaMeta(root)
if err != nil {
return nil, err
}
switch blob.Type() {
case "directory":
n := &node{fs: fs, blobref: root, meta: blob}
n.populateAttr()
return n, nil
case "permanode":
// other mutDirs listed in the default fileystem have names and are displayed
return &mutDir{fs: fs, permanode: root, name: "-"}, nil
}
return nil, fmt.Errorf("Blobref must be of a directory or permanode got a %v", blob.Type())
}
type notImplementDirNode struct{}
var _ fusefs.Node = (*notImplementDirNode)(nil)
func (notImplementDirNode) Attr(ctx context.Context, a *fuse.Attr) error {
a.Mode = os.ModeDir | 0000
a.Uid = uint32(os.Getuid())
a.Gid = uint32(os.Getgid())
return nil
}
type staticFileNode string
var _ fusefs.Node = (*notImplementDirNode)(nil)
func (s staticFileNode) Attr(ctx context.Context, a *fuse.Attr) error {
a.Mode = 0400
a.Uid = uint32(os.Getuid())
a.Gid = uint32(os.Getgid())
a.Size = uint64(len(s))
a.Mtime = serverStart
a.Ctime = serverStart
a.Crtime = serverStart
return nil
}
var _ fusefs.HandleReader = (*staticFileNode)(nil)
func (s staticFileNode) Read(ctx context.Context, req *fuse.ReadRequest, res *fuse.ReadResponse) error {
if req.Offset > int64(len(s)) {
return nil
}
s = s[req.Offset:]
size := req.Size
if size > len(s) {
size = len(s)
}
res.Data = make([]byte, size)
copy(res.Data, s)
return nil
}