Implements a read-only fs.FS view of a txtar.Archive.
It returns an error if the names in the archive are not valid
file system names. The archive cannot be modified while the
file system is in use.

Fixes golang/go#44158

Change-Id: If1e77833545a5b5db28006322e7f214951bc52f6
Reviewed-on: https://go-review.googlesource.com/c/tools/+/598756
Reviewed-by: Ian Lance Taylor <iant@google.com>
LUCI-TryBot-Result: Go LUCI <golang-scoped@luci-project-accounts.iam.gserviceaccount.com>
This commit is contained in:
Tim King 2024-07-16 15:53:06 -07:00
Родитель 2cb2f7d32f
Коммит 2fb3ebe9d9
2 изменённых файлов: 442 добавлений и 0 удалений

259
txtar/fs.go Normal file
Просмотреть файл

@ -0,0 +1,259 @@
// Copyright 2024 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
package txtar
import (
"errors"
"fmt"
"io"
"io/fs"
"path"
"time"
)
// FS returns the file system form of an Archive.
// It returns an error if any of the file names in the archive
// are not valid file system names, or if two entries collide
// (a duplicate path, or a file whose path is also needed as a directory).
// The returned error wraps the underlying cause, so it can be inspected
// with errors.Is, errors.As, or errors.Unwrap.
// The archive must not be modified while the FS is in use.
//
// If the file system detects that it has been modified, calls to the
// file system return an ErrModified error.
func FS(a *Archive) (fs.FS, error) {
	// Create a filesystem with a root directory.
	root := &node{fileinfo: fileinfo{path: ".", mode: readOnlyDir}}
	fsys := &filesystem{a, map[string]*node{root.path: root}}
	if err := initFiles(fsys); err != nil {
		// %w (rather than %s) keeps the cause in the error chain;
		// the message text is unchanged.
		return nil, fmt.Errorf("cannot create fs.FS from txtar.Archive: %w", err)
	}
	return fsys, nil
}
// Modes assigned to the entries of an archive file system.
const (
	// readOnly is the mode of regular files: read permission for
	// owner, group, and others, with no write or execute bits.
	readOnly = fs.FileMode(0o444)

	// readOnlyDir is the mode of directories: the readOnly
	// permission bits plus the directory bit.
	readOnlyDir = fs.ModeDir | readOnly
)
// ErrModified is the error reported when the file system returned by FS
// notices that the underlying archive has been modified since the call
// to FS. Detection is best effort: it exists to help diagnose misuse of
// the API and is not guaranteed to catch every modification.
var ErrModified = errors.New("txtar.Archive has been modified during txtar.FS")
// A filesystem is a simple in-memory file system for txtar archives,
// represented as a map from valid path names to information about the
// files or directories they represent.
//
// File system operations are read only. Modifications to the underlying
// *Archive may race. To help prevent this, the filesystem tries
// to detect modification during Open and return ErrModified if it
// is able to detect a modification.
//
// Note: FS constructs this struct with a positional composite literal,
// so the order of the fields must not change.
type filesystem struct {
	ar    *Archive         // archive backing the file system; file contents are read from ar.Files
	nodes map[string]*node // every file and directory keyed by its path; the root directory is "."
}
// A node is a file or directory in the tree of a filesystem.
// Which of idx and entries is meaningful depends on the kind of node:
// idx applies to files and entries applies to directories.
type node struct {
	fileinfo               // fs.FileInfo and fs.DirEntry implementation
	idx      int           // index into ar.Files (for files)
	entries  []fs.DirEntry // subdirectories and files (for directories), in insertion order
}

// Compile-time checks that the types implement the intended interfaces.
var _ fs.FS = (*filesystem)(nil)
var _ fs.DirEntry = (*node)(nil)
// initFiles populates fsys with one read-only file node for each entry of
// fsys.ar.Files, recording the entry's index and data length in the node.
// It stops at the first entry whose name is not a valid fs path, or whose
// insertion fails because of a collision with an existing file or
// directory, and returns an error describing the problem.
func initFiles(fsys *filesystem) error {
	files := fsys.ar.Files
	for i := range files {
		name := files[i].Name
		if !fs.ValidPath(name) {
			return fmt.Errorf("file %q is an invalid path", name)
		}
		info := fileinfo{path: name, size: len(files[i].Data), mode: readOnly}
		if err := insert(fsys, &node{fileinfo: info, idx: i}); err != nil {
			return err
		}
	}
	return nil
}
// insert registers n under its path in fsys and appends it to the entries
// of its parent directory, creating the parent directory if necessary.
// It returns an error if the path of n is already taken, or if the parent
// directory cannot be obtained.
func insert(fsys *filesystem, n *node) error {
	if fsys.nodes[n.path] != nil {
		return fmt.Errorf("duplicate path %q", n.path)
	}
	fsys.nodes[n.path] = n

	// The climb through parent directories terminates because fsys.nodes
	// contains "." (and path.Dir(".") is ".").
	dir, err := directory(fsys, path.Dir(n.path))
	if err != nil {
		return err
	}
	dir.entries = append(dir.entries, n)
	return nil
}
// directory returns the node for the directory at path dir.
// If no directory is registered under dir yet, a new read-only directory
// node is created and inserted, which in turn registers it with its own
// parent. An error from insert (for example because dir is already taken
// by a non-directory) is returned to the caller.
func directory(fsys *filesystem, dir string) (*node, error) {
	existing := fsys.nodes[dir]
	if existing != nil && existing.IsDir() {
		return existing, nil // pre-existing directory
	}

	created := &node{fileinfo: fileinfo{path: dir, mode: readOnlyDir}}
	err := insert(fsys, created)
	if err != nil {
		return nil, err
	}
	return created, nil
}
// dataOf returns the contents of the archive file that node n refers to.
// It returns ErrModified if fsys.ar no longer has an entry at n.idx, or if
// that entry's name or data length differs from what n recorded. A change
// that keeps both the name and the length is not detected.
func dataOf(fsys *filesystem, n *node) ([]byte, error) {
	files := fsys.ar.Files
	if n.idx >= len(files) {
		return nil, ErrModified
	}
	entry := &files[n.idx]
	if entry.Name == n.path && len(entry.Data) == n.size {
		return entry.Data, nil
	}
	return nil, ErrModified
}
// Open implements fs.FS.
//
// An invalid name yields an *fs.PathError wrapping fs.ErrInvalid, and an
// unknown name yields one wrapping fs.ErrNotExist. Opening a directory
// returns an *openDir over its entries. Opening a regular file first
// re-validates the node against the archive with dataOf and then returns
// an *openFile over the file's data; an error from dataOf is returned as
// is, without being wrapped in an *fs.PathError.
func (fsys *filesystem) Open(name string) (fs.File, error) {
	if !fs.ValidPath(name) {
		return nil, &fs.PathError{Op: "open", Path: name, Err: fs.ErrInvalid}
	}

	n := fsys.nodes[name]
	if n == nil {
		return nil, &fs.PathError{Op: "open", Path: name, Err: fs.ErrNotExist}
	}
	if n.IsDir() {
		return &openDir{fileinfo: n.fileinfo, entries: n.entries}, nil
	}

	data, err := dataOf(fsys, n)
	if err != nil {
		return nil, err
	}
	return &openFile{fileinfo: n.fileinfo, data: data}, nil
}
// ReadFile returns a copy of the contents of the named file, so the
// caller may modify the result without affecting the archive.
// Errors from Open are returned unchanged. If name opens successfully but
// is not a regular file (for example, a directory), ReadFile returns an
// *fs.PathError with Op "read" wrapping fs.ErrInvalid.
func (fsys *filesystem) ReadFile(name string) ([]byte, error) {
	opened, err := fsys.Open(name)
	if err != nil {
		return nil, err
	}

	regular, ok := opened.(*openFile)
	if !ok {
		return nil, &fs.PathError{Op: "read", Path: name, Err: fs.ErrInvalid}
	}

	// TODO: use slices.Clone once x/tools has 1.21 available.
	buf := make([]byte, regular.size)
	copy(buf, regular.data)
	return buf, nil
}
// A fileinfo describes a single file or directory of an archive file
// system. *fileinfo implements both fs.FileInfo and fs.DirEntry.
type fileinfo struct {
	path string      // unique path to the file or directory within a filesystem
	size int         // size in bytes, as reported by Size
	mode fs.FileMode // mode bits, as reported by Mode
}

var (
	_ fs.FileInfo = (*fileinfo)(nil)
	_ fs.DirEntry = (*fileinfo)(nil)
)

// Name returns the final element of the path.
func (fi *fileinfo) Name() string {
	return path.Base(fi.path)
}

// Size returns the recorded size in bytes.
func (fi *fileinfo) Size() int64 {
	return int64(fi.size)
}

// Mode returns the full mode bits.
func (fi *fileinfo) Mode() fs.FileMode {
	return fi.mode
}

// Type returns only the type bits of the mode.
func (fi *fileinfo) Type() fs.FileMode {
	return fi.mode.Type()
}

// ModTime always returns the zero time; no modification time is tracked.
func (fi *fileinfo) ModTime() time.Time {
	return time.Time{}
}

// IsDir reports whether the mode has the directory bit set.
func (fi *fileinfo) IsDir() bool {
	return fi.mode.IsDir()
}

// Sys always returns nil; there is no underlying data source to expose.
func (fi *fileinfo) Sys() any {
	return nil
}

// Info returns fi itself, which already is an fs.FileInfo. It never fails.
func (fi *fileinfo) Info() (fs.FileInfo, error) {
	return fi, nil
}
// An openFile is a regular (non-directory) fs.File open for reading.
type openFile struct {
	// fileinfo is the metadata reported by Stat.
	fileinfo
	// data is the complete contents of the file.
	data []byte
	// offset is the position of the next Read, in bytes from the start of data.
	offset int64
}

var _ fs.File = (*openFile)(nil)

// Stat returns the metadata of the file. It never fails.
func (f *openFile) Stat() (fs.FileInfo, error) {
	info := &f.fileinfo
	return info, nil
}

// Close does nothing and always returns nil.
func (f *openFile) Close() error {
	return nil
}
// Read copies up to len(b) bytes from the current offset into b and
// advances the offset by the number of bytes copied.
// It returns 0, io.EOF once the offset has reached the end of the data,
// and an *fs.PathError wrapping fs.ErrInvalid if the offset is negative.
func (f *openFile) Read(b []byte) (int, error) {
	size := int64(len(f.data))
	switch {
	case f.offset >= size:
		return 0, io.EOF
	case f.offset < 0:
		return 0, &fs.PathError{Op: "read", Path: f.path, Err: fs.ErrInvalid}
	}

	copied := copy(b, f.data[f.offset:])
	f.offset += int64(copied)
	return copied, nil
}
// Seek sets the offset used by the next Read and returns the new offset
// measured from the start of the file.
//
// offset is interpreted according to whence: io.SeekStart means relative
// to the start of the file, io.SeekCurrent relative to the current
// offset, and io.SeekEnd relative to the end of the data.
//
// Seek returns an *fs.PathError with Op "seek" wrapping fs.ErrInvalid,
// and leaves the current offset untouched, if whence is not one of the
// three values above or if the resulting offset would be negative or
// beyond the end of the data. Seeking to exactly the end is allowed.
func (f *openFile) Seek(offset int64, whence int) (int64, error) {
	switch whence {
	case io.SeekStart:
		// offset is already absolute.
	case io.SeekCurrent:
		offset += f.offset
	case io.SeekEnd:
		offset += int64(len(f.data))
	default:
		// An unknown whence must not silently behave like io.SeekStart.
		return 0, &fs.PathError{Op: "seek", Path: f.path, Err: fs.ErrInvalid}
	}
	if offset < 0 || offset > int64(len(f.data)) {
		return 0, &fs.PathError{Op: "seek", Path: f.path, Err: fs.ErrInvalid}
	}
	f.offset = offset
	return offset, nil
}
// ReadAt copies up to len(b) bytes starting at the given offset into b,
// without touching the offset used by Read and Seek.
// It returns io.EOF together with the number of bytes copied when fewer
// than len(b) bytes were available, and an *fs.PathError wrapping
// fs.ErrInvalid when offset is negative or beyond the end of the data.
func (f *openFile) ReadAt(b []byte, offset int64) (int, error) {
	if size := int64(len(f.data)); offset < 0 || size < offset {
		return 0, &fs.PathError{Op: "read", Path: f.path, Err: fs.ErrInvalid}
	}

	copied := copy(b, f.data[offset:])
	if copied == len(b) {
		return copied, nil
	}
	return copied, io.EOF
}
// An openDir is a directory fs.File (so also an fs.ReadDirFile) open for reading.
type openDir struct {
	// fileinfo is the metadata reported by Stat.
	fileinfo
	// entries are the directory's children, handed out by ReadDir.
	entries []fs.DirEntry
	// offset is the index into entries of the next entry ReadDir returns.
	offset int
}

var _ fs.ReadDirFile = (*openDir)(nil)

// Stat returns the metadata of the directory. It never fails.
func (d *openDir) Stat() (fs.FileInfo, error) {
	info := &d.fileinfo
	return info, nil
}

// Close does nothing and always returns nil.
func (d *openDir) Close() error {
	return nil
}

// Read always fails with an *fs.PathError wrapping fs.ErrInvalid:
// a directory has no byte contents to read.
func (d *openDir) Read(b []byte) (int, error) {
	err := &fs.PathError{Op: "read", Path: d.path, Err: fs.ErrInvalid}
	return 0, err
}
// ReadDir returns the next entries of the directory, in the order in
// which they are stored, and advances past them.
//
// If count > 0, at most count entries are returned, and once none remain
// ReadDir returns nil, io.EOF. If count <= 0, all remaining entries are
// returned in one (possibly empty, non-nil) slice with a nil error.
// The returned slice is a copy and may be modified by the caller.
func (d *openDir) ReadDir(count int) ([]fs.DirEntry, error) {
	remaining := d.entries[d.offset:]
	if count > 0 {
		if len(remaining) == 0 {
			return nil, io.EOF
		}
		if len(remaining) > count {
			remaining = remaining[:count]
		}
	}

	batch := make([]fs.DirEntry, len(remaining))
	copy(batch, remaining)
	d.offset += len(batch)
	return batch, nil
}

183
txtar/fs_test.go Normal file
Просмотреть файл

@ -0,0 +1,183 @@
// Copyright 2024 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
package txtar_test
import (
"io/fs"
"strings"
"testing"
"testing/fstest"
"golang.org/x/tools/txtar"
)
// TestFS parses each input archive, builds its file system with txtar.FS,
// runs the generic fstest.TestFS conformance checks against the expected
// file list, and then verifies that fs.ReadFile returns exactly the data
// stored for every file of the archive.
func TestFS(t *testing.T) {
	var fstestcases = []struct {
		name, input, files string
	}{
		{
			name:  "empty",
			input: ``,
			files: "",
		},
		{
			name: "one",
			input: `
-- one.txt --
one
`,
			files: "one.txt",
		},
		{
			name: "two",
			input: `
-- one.txt --
one
-- two.txt --
two
`,
			files: "one.txt two.txt",
		},
		{
			name: "subdirectories",
			input: `
-- one.txt --
one
-- 2/two.txt --
two
-- 2/3/three.txt --
three
-- 4/four.txt --
four
`,
			files: "one.txt 2/two.txt 2/3/three.txt 4/four.txt",
		},
	}

	for _, tc := range fstestcases {
		t.Run(tc.name, func(t *testing.T) {
			a := txtar.Parse([]byte(tc.input))
			fsys, err := txtar.FS(a)
			if err != nil {
				t.Fatal(err)
			}

			files := strings.Fields(tc.files)
			if err := fstest.TestFS(fsys, files...); err != nil {
				t.Fatal(err)
			}

			for _, f := range a.Files {
				b, err := fs.ReadFile(fsys, f.Name)
				if err != nil {
					t.Errorf("ReadFile(%q) failed with error: %v", f.Name, err)
					// b is meaningless after an error; skip the content
					// comparison so the failure is reported only once.
					continue
				}
				if got, want := string(b), string(f.Data); got != want {
					t.Errorf("ReadFile(%q) = %q; want %q", f.Name, got, want)
				}
			}
		})
	}
}
// TestInvalid checks that txtar.FS rejects archives it cannot represent
// as a file system, and that the error mentions the expected reason.
// Every case must name a non-empty expected substring.
func TestInvalid(t *testing.T) {
	invalidtestcases := []struct {
		name, want string
		input      string
	}{
		{
			name: "unclean file names",
			want: "invalid path",
			input: `
-- 1/../one.txt --
one
-- 2/sub/../two.txt --
two
`,
		},
		{
			name: "duplicate name",
			want: `cannot create fs.FS from txtar.Archive: duplicate path "1/2/one.txt"`,
			input: `
-- 1/2/one.txt --
one
-- 1/2/one.txt --
two
`,
		},
		{
			name: "file conflicts with directory",
			want: `duplicate path "1/2"`,
			input: `
-- 1/2 --
one
-- 1/2/one.txt --
two
`,
		},
	}

	for _, tc := range invalidtestcases {
		t.Run(tc.name, func(t *testing.T) {
			archive := txtar.Parse([]byte(tc.input))
			_, err := txtar.FS(archive)
			if err == nil {
				t.Fatal("txtar.FS(...) succeeded; expected an error")
			}
			got := err.Error()
			if tc.want == "" || !strings.Contains(got, tc.want) {
				t.Errorf("txtar.FS(...) got error %q; want %q", got, tc.want)
			}
		})
	}
}
// TestModified checks that Open reports txtar.ErrModified once the
// archive has been changed after the file system was created.
// Each mod function applies one kind of change: different data length,
// different file name, or removal of all files.
func TestModified(t *testing.T) {
	const input = `
-- one.txt --
one
`
	for _, mod := range []func(a *txtar.Archive){
		func(a *txtar.Archive) { a.Files[0].Data = []byte("other") },
		func(a *txtar.Archive) { a.Files[0].Name = "other" },
		func(a *txtar.Archive) { a.Files = nil },
	} {
		a := txtar.Parse([]byte(input))
		if n := len(a.Files); n != 1 {
			t.Fatalf("txtar.Parse(%q) got %d files; expected 1", input, n)
		}
		fsys, err := txtar.FS(a)
		if err != nil {
			t.Fatal(err)
		}

		// Confirm we can open "one.txt".
		_, err = fsys.Open("one.txt")
		if err != nil {
			t.Fatal(err)
		}

		// Modify a to get ErrModified when opening "one.txt".
		mod(a)
		_, err = fsys.Open("one.txt")
		if err != txtar.ErrModified {
			// %v rather than %s: err is nil when the modification went
			// undetected, and %s would print it as "%!s(<nil>)".
			t.Errorf("Open(%q) got error %v; want ErrModified", "one.txt", err)
		}
	}
}
// TestReadFile exercises the ReadFile method of the file system returned
// by txtar.FS directly (through fs.ReadFileFS): reading a directory must
// fail, and reading a file must return its contents.
func TestReadFile(t *testing.T) {
	const input = `
-- 1/one.txt --
one
`
	a := txtar.Parse([]byte(input))
	fsys, err := txtar.FS(a)
	if err != nil {
		t.Fatal(err)
	}

	// Use the checked form of the assertion so that a missing ReadFile
	// method is reported as a test failure instead of a panic.
	readfs, ok := fsys.(fs.ReadFileFS)
	if !ok {
		t.Fatalf("txtar.FS(...) returned %T, which does not implement fs.ReadFileFS", fsys)
	}

	_, err = readfs.ReadFile("1")
	if err == nil {
		t.Errorf("ReadFile(%q) succeeded; expected an error when reading a directory", "1")
	}

	content, err := readfs.ReadFile("1/one.txt")
	if err != nil {
		t.Fatal(err)
	}
	want := "one\n"
	if got := string(content); want != got {
		t.Errorf("ReadFile(%q) = %q; want %q", "1/one.txt", got, want)
	}
}