Skip to content

Commit

Permalink
Merge pull request #3890 from ipfs/fix/sharding-issues
Browse files Browse the repository at this point in the history
Fix sharding memory growth, and fix resolver for unixfs paths
  • Loading branch information
whyrusleeping authored May 1, 2017
2 parents 92f1177 + a22cae1 commit 119ae72
Show file tree
Hide file tree
Showing 9 changed files with 131 additions and 44 deletions.
8 changes: 7 additions & 1 deletion core/coreapi/coreapi.go
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ import (
core "github.com/ipfs/go-ipfs/core"
coreiface "github.com/ipfs/go-ipfs/core/coreapi/interface"
ipfspath "github.com/ipfs/go-ipfs/path"
uio "github.com/ipfs/go-ipfs/unixfs/io"

cid "gx/ipfs/QmYhQaCYEcaPPjxJX7YcPcVKkQfRy6sJ7B3XmGFk82XYdQ/go-cid"
)
Expand Down Expand Up @@ -42,8 +43,13 @@ func (api *CoreAPI) ResolvePath(ctx context.Context, p coreiface.Path) (coreifac
return p, nil
}

r := &ipfspath.Resolver{
DAG: api.node.DAG,
ResolveOnce: uio.ResolveUnixfsOnce,
}

p2 := ipfspath.FromString(p.String())
node, err := core.Resolve(ctx, api.node.Namesys, api.node.Resolver, p2)
node, err := core.Resolve(ctx, api.node.Namesys, r, p2)
if err == core.ErrNoNamesys {
return nil, coreiface.ErrOffline
} else if err != nil {
Expand Down
21 changes: 18 additions & 3 deletions core/coreapi/unixfs.go
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@ import (
uio "github.com/ipfs/go-ipfs/unixfs/io"

cid "gx/ipfs/QmYhQaCYEcaPPjxJX7YcPcVKkQfRy6sJ7B3XmGFk82XYdQ/go-cid"
node "gx/ipfs/Qmb3Hm9QDFmfYuET4pu7Kyg8JV78jFa1nvZx5vnCZsK4ck/go-ipld-format"
)

type UnixfsAPI CoreAPI
Expand Down Expand Up @@ -46,9 +47,23 @@ func (api *UnixfsAPI) Ls(ctx context.Context, p coreiface.Path) ([]*coreiface.Li
return nil, err
}

l := dagnode.Links()
links := make([]*coreiface.Link, len(l))
for i, l := range l {
var ndlinks []*node.Link
dir, err := uio.NewDirectoryFromNode(api.node.DAG, dagnode)
switch err {
case nil:
l, err := dir.Links(ctx)
if err != nil {
return nil, err
}
ndlinks = l
case uio.ErrNotADir:
ndlinks = dagnode.Links()
default:
return nil, err
}

links := make([]*coreiface.Link, len(ndlinks))
for i, l := range ndlinks {
links[i] = &coreiface.Link{l.Name, l.Size, l.Cid}
}
return links, nil
Expand Down
8 changes: 7 additions & 1 deletion core/coreapi/unixfs_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@ import (
config "github.com/ipfs/go-ipfs/repo/config"
testutil "github.com/ipfs/go-ipfs/thirdparty/testutil"
unixfs "github.com/ipfs/go-ipfs/unixfs"
cbor "gx/ipfs/QmNrbCt8j9DT5W9Pmjy2SdudT9k8GpaDr4sRuFix3BXhgR/go-ipld-cbor"
)

// `echo -n 'hello, world!' | ipfs add`
Expand Down Expand Up @@ -276,7 +277,12 @@ func TestLsNonUnixfs(t *testing.T) {
t.Error(err)
}

c, err := node.DAG.Add(new(mdag.ProtoNode))
nd, err := cbor.WrapObject(map[string]interface{}{"foo": "bar"})
if err != nil {
t.Fatal(err)
}

c, err := node.DAG.Add(nd)
if err != nil {
t.Error(err)
}
Expand Down
7 changes: 6 additions & 1 deletion core/coreunix/cat.go
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,12 @@ import (
)

func Cat(ctx context.Context, n *core.IpfsNode, pstr string) (uio.DagReader, error) {
dagNode, err := core.Resolve(ctx, n.Namesys, n.Resolver, path.Path(pstr))
r := &path.Resolver{
DAG: n.DAG,
ResolveOnce: uio.ResolveUnixfsOnce,
}

dagNode, err := core.Resolve(ctx, n.Namesys, r, path.Path(pstr))
if err != nil {
return nil, err
}
Expand Down
11 changes: 6 additions & 5 deletions path/resolver.go
Original file line number Diff line number Diff line change
Expand Up @@ -37,7 +37,7 @@ func (e ErrNoLink) Error() string {
type Resolver struct {
DAG dag.DAGService

ResolveOnce func(ctx context.Context, ds dag.DAGService, nd node.Node, name string) (*node.Link, error)
ResolveOnce func(ctx context.Context, ds dag.DAGService, nd node.Node, names []string) (*node.Link, []string, error)
}

func NewBasicResolver(ds dag.DAGService) *Resolver {
Expand Down Expand Up @@ -121,9 +121,10 @@ func (s *Resolver) ResolvePath(ctx context.Context, fpath Path) (node.Node, erro
return nodes[len(nodes)-1], err
}

func ResolveSingle(ctx context.Context, ds dag.DAGService, nd node.Node, name string) (*node.Link, error) {
lnk, _, err := nd.ResolveLink([]string{name})
return lnk, err
// ResolveSingle simply resolves one hop of a path through a graph with no
// extra context (does not opaquely resolve through sharded nodes)
func ResolveSingle(ctx context.Context, ds dag.DAGService, nd node.Node, names []string) (*node.Link, []string, error) {
return nd.ResolveLink(names)
}

// ResolvePathComponents fetches the nodes for each segment of the given path.
Expand Down Expand Up @@ -163,7 +164,7 @@ func (s *Resolver) ResolveLinks(ctx context.Context, ndd node.Node, names []stri
ctx, cancel = context.WithTimeout(ctx, time.Minute)
defer cancel()

lnk, rest, err := nd.ResolveLink(names)
lnk, rest, err := s.ResolveOnce(ctx, s.DAG, nd, names)
if err == dag.ErrLinkNotFound {
return result, ErrNoLink{Name: names[0], Node: nd.Cid()}
} else if err != nil {
Expand Down
5 changes: 5 additions & 0 deletions test/sharness/t0260-sharding-flag.sh
Original file line number Diff line number Diff line change
Expand Up @@ -68,6 +68,11 @@ test_add_large_dir_v1() {
echo "$exphash" > sharddir_exp &&
test_cmp sharddir_exp sharddir_out
'

test_expect_success "can access a path under the dir" '
ipfs cat "$exphash/file20" > file20_out &&
test_cmp testdata/file20 file20_out
'
}

# this hash implies both the directory and the leaf entries are CIDv1
Expand Down
68 changes: 49 additions & 19 deletions unixfs/hamt/hamt.go
Original file line number Diff line number Diff line change
Expand Up @@ -62,7 +62,7 @@ type HamtShard struct {

// child can either be another shard, or a leaf node value
type child interface {
Node() (node.Node, error)
Link() (*node.Link, error)
Label() string
}

Expand Down Expand Up @@ -144,12 +144,12 @@ func (ds *HamtShard) Node() (node.Node, error) {
cindex := ds.indexForBitPos(i)
ch := ds.children[cindex]
if ch != nil {
cnd, err := ch.Node()
clnk, err := ch.Link()
if err != nil {
return nil, err
}

err = out.AddNodeLinkClean(ds.linkNamePrefix(i)+ch.Label(), cnd)
err = out.AddRawLink(ds.linkNamePrefix(i)+ch.Label(), clnk)
if err != nil {
return nil, err
}
Expand Down Expand Up @@ -188,10 +188,11 @@ func (ds *HamtShard) Node() (node.Node, error) {

type shardValue struct {
key string
val node.Node
val *node.Link
}

func (sv *shardValue) Node() (node.Node, error) {
// Link returns a link to this node
func (sv *shardValue) Link() (*node.Link, error) {
return sv.val, nil
}

Expand All @@ -214,7 +215,18 @@ func (ds *HamtShard) Label() string {
// Set sets 'name' = nd in the HAMT
func (ds *HamtShard) Set(ctx context.Context, name string, nd node.Node) error {
hv := &hashBits{b: hash([]byte(name))}
return ds.modifyValue(ctx, hv, name, nd)
_, err := ds.dserv.Add(nd)
if err != nil {
return err
}

lnk, err := node.MakeLink(nd)
if err != nil {
return err
}
lnk.Name = ds.linkNamePrefix(0) + name

return ds.modifyValue(ctx, hv, name, lnk)
}

// Remove deletes the named entry if it exists, this operation is idempotent.
Expand All @@ -223,16 +235,20 @@ func (ds *HamtShard) Remove(ctx context.Context, name string) error {
return ds.modifyValue(ctx, hv, name, nil)
}

func (ds *HamtShard) Find(ctx context.Context, name string) (node.Node, error) {
// Find searches for a child node by 'name' within this hamt
func (ds *HamtShard) Find(ctx context.Context, name string) (*node.Link, error) {
hv := &hashBits{b: hash([]byte(name))}

var out node.Node
var out *node.Link
err := ds.getValue(ctx, hv, name, func(sv *shardValue) error {
out = sv.val
return nil
})
if err != nil {
return nil, err
}

return out, err
return out, nil
}

// getChild returns the i'th child of this shard. If it is cached in the
Expand Down Expand Up @@ -291,9 +307,10 @@ func (ds *HamtShard) loadChild(ctx context.Context, i int) (child, error) {

c = cds
} else {
lnk2 := *lnk
c = &shardValue{
key: lnk.Name[ds.maxpadlen:],
val: nd,
val: &lnk2,
}
}

Expand All @@ -305,16 +322,33 @@ func (ds *HamtShard) setChild(i int, c child) {
ds.children[i] = c
}

func (ds *HamtShard) insertChild(idx int, key string, val node.Node) error {
if val == nil {
// Link returns a merklelink to this shard node
func (ds *HamtShard) Link() (*node.Link, error) {
nd, err := ds.Node()
if err != nil {
return nil, err
}

_, err = ds.dserv.Add(nd)
if err != nil {
return nil, err
}

return node.MakeLink(nd)
}

func (ds *HamtShard) insertChild(idx int, key string, lnk *node.Link) error {
if lnk == nil {
return os.ErrNotExist
}

i := ds.indexForBitPos(idx)
ds.bitfield.SetBit(ds.bitfield, idx, 1)

lnk.Name = ds.linkNamePrefix(idx) + key
sv := &shardValue{
key: key,
val: val,
val: lnk,
}

ds.children = append(ds.children[:i], append([]child{sv}, ds.children[i:]...)...)
Expand Down Expand Up @@ -370,11 +404,7 @@ func (ds *HamtShard) EnumLinks(ctx context.Context) ([]*node.Link, error) {

func (ds *HamtShard) ForEachLink(ctx context.Context, f func(*node.Link) error) error {
return ds.walkTrie(ctx, func(sv *shardValue) error {
lnk, err := node.MakeLink(sv.val)
if err != nil {
return err
}

lnk := sv.val
lnk.Name = sv.key

return f(lnk)
Expand Down Expand Up @@ -414,7 +444,7 @@ func (ds *HamtShard) walkTrie(ctx context.Context, cb func(*shardValue) error) e
return nil
}

func (ds *HamtShard) modifyValue(ctx context.Context, hv *hashBits, key string, val node.Node) error {
func (ds *HamtShard) modifyValue(ctx context.Context, hv *hashBits, key string, val *node.Link) error {
idx := hv.Next(ds.tableSizeLg2)

if ds.bitfield.Bit(idx) != 1 {
Expand Down
14 changes: 11 additions & 3 deletions unixfs/io/dirbuilder.go
Original file line number Diff line number Diff line change
Expand Up @@ -48,10 +48,13 @@ func NewDirectory(dserv mdag.DAGService) *Directory {
return db
}

// ErrNotADir implies that the given node was not a unixfs directory
var ErrNotADir = fmt.Errorf("merkledag node was not a directory or shard")

func NewDirectoryFromNode(dserv mdag.DAGService, nd node.Node) (*Directory, error) {
pbnd, ok := nd.(*mdag.ProtoNode)
if !ok {
return nil, mdag.ErrNotProtobuf
return nil, ErrNotADir
}

pbd, err := format.FromBytes(pbnd.Data())
Expand All @@ -76,7 +79,7 @@ func NewDirectoryFromNode(dserv mdag.DAGService, nd node.Node) (*Directory, erro
shard: shard,
}, nil
default:
return nil, fmt.Errorf("merkledag node was not a directory or shard")
return nil, ErrNotADir
}
}

Expand Down Expand Up @@ -165,7 +168,12 @@ func (d *Directory) Find(ctx context.Context, name string) (node.Node, error) {
return d.dserv.Get(ctx, lnk.Cid)
}

return d.shard.Find(ctx, name)
lnk, err := d.shard.Find(ctx, name)
if err != nil {
return nil, err
}

return lnk.GetNode(ctx, d.dserv)
}

func (d *Directory) RemoveChild(ctx context.Context, name string) error {
Expand Down
33 changes: 22 additions & 11 deletions unixfs/io/resolve.go
Original file line number Diff line number Diff line change
Expand Up @@ -10,37 +10,48 @@ import (
node "gx/ipfs/Qmb3Hm9QDFmfYuET4pu7Kyg8JV78jFa1nvZx5vnCZsK4ck/go-ipld-format"
)

func ResolveUnixfsOnce(ctx context.Context, ds dag.DAGService, nd node.Node, name string) (*node.Link, error) {
// ResolveUnixfsOnce resolves a single hop of a path through a graph in a
// unixfs context. This includes handling traversing sharded directories.
func ResolveUnixfsOnce(ctx context.Context, ds dag.DAGService, nd node.Node, names []string) (*node.Link, []string, error) {
switch nd := nd.(type) {
case *dag.ProtoNode:
upb, err := ft.FromBytes(nd.Data())
if err != nil {
// Not a unixfs node, use standard object traversal code
return nd.GetNodeLink(name)
lnk, err := nd.GetNodeLink(names[0])
if err != nil {
return nil, nil, err
}

return lnk, names[1:], nil
}

switch upb.GetType() {
case ft.THAMTShard:
s, err := hamt.NewHamtFromDag(ds, nd)
if err != nil {
return nil, err
return nil, nil, err
}

// TODO: optimized routine on HAMT for returning a dag.Link to avoid extra disk hits
out, err := s.Find(ctx, name)
out, err := s.Find(ctx, names[0])
if err != nil {
return nil, err
return nil, nil, err
}

return node.MakeLink(out)
return out, names[1:], nil
default:
return nd.GetNodeLink(name)
lnk, err := nd.GetNodeLink(names[0])
if err != nil {
return nil, nil, err
}

return lnk, names[1:], nil
}
default:
lnk, _, err := nd.ResolveLink([]string{name})
lnk, rest, err := nd.ResolveLink(names)
if err != nil {
return nil, err
return nil, nil, err
}
return lnk, nil
return lnk, rest, nil
}
}

0 comments on commit 119ae72

Please sign in to comment.