Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

double hashing implementation #1

Open
wants to merge 23 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
14 changes: 12 additions & 2 deletions dht.go
Original file line number Diff line number Diff line change
Expand Up @@ -34,6 +34,7 @@ import (
goprocessctx "github.com/jbenet/goprocess/context"
"github.com/multiformats/go-base32"
ma "github.com/multiformats/go-multiaddr"
"github.com/multiformats/go-multihash"
"go.opencensus.io/tag"
"go.uber.org/zap"
)
Expand Down Expand Up @@ -683,9 +684,18 @@ func (dht *IpfsDHT) FindLocal(id peer.ID) peer.AddrInfo {
}
}

// nearestPeersToQuery returns the routing tables closest peers.
// nearestPeersToQuery returns the routing tables closest peers.Digest
func (dht *IpfsDHT) nearestPeersToQuery(pmes *pb.Message, count int) []peer.ID {
closer := dht.routingTable.NearestPeers(kb.ConvertKey(string(pmes.GetKey())), count)
key := pmes.GetKey()
// for GET_PROVIDERS messages, or sometimes FIND_NODE messages,
// the message key is the hashed multihash, so don't hash it again
decodedMH, err := multihash.Decode(key)
if err == nil && decodedMH.Code == multihash.DBL_SHA2_256 {
closer := dht.routingTable.NearestPeers(kb.ID(string(decodedMH.Digest)), count)
return closer
}

closer := dht.routingTable.NearestPeers(kb.ConvertKey(string(key)), count)
return closer
}

Expand Down
7 changes: 6 additions & 1 deletion dht_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,7 @@ import (
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"

"github.com/libp2p/go-libp2p-kad-dht/internal"
test "github.com/libp2p/go-libp2p-kad-dht/internal/testing"
pb "github.com/libp2p/go-libp2p-kad-dht/pb"

Expand Down Expand Up @@ -1298,7 +1299,11 @@ func TestClientModeConnect(t *testing.T) {

c := testCaseCids[0]
p := peer.ID("TestPeer")
a.ProviderStore().AddProvider(ctx, c.Hash(), peer.AddrInfo{ID: p})
mhHash := internal.Sha256Multihash(c.Hash())
err := a.ProviderStore().AddProvider(ctx, mhHash[:], peer.AddrInfo{ID: p})
if err != nil {
t.Fatal(err)
}
time.Sleep(time.Millisecond * 5) // just in case...

provs, err := b.FindProviders(ctx, c)
Expand Down
2 changes: 1 addition & 1 deletion dual/dual_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ import (
u "github.com/ipfs/go-ipfs-util"
dht "github.com/libp2p/go-libp2p-kad-dht"
test "github.com/libp2p/go-libp2p-kad-dht/internal/testing"
record "github.com/libp2p/go-libp2p-record"
record "github.com/libp2p/go-libp2p-record" //nolint:typecheck
"github.com/libp2p/go-libp2p/core/host"
"github.com/libp2p/go-libp2p/core/peer"
peerstore "github.com/libp2p/go-libp2p/core/peerstore"
Expand Down
8 changes: 6 additions & 2 deletions fullrt/dht.go
Original file line number Diff line number Diff line change
Expand Up @@ -777,10 +777,14 @@ func (dht *FullRT) Provide(ctx context.Context, key cid.Cid, brdcst bool) (err e
return fmt.Errorf("invalid cid: undefined")
}
keyMH := key.Hash()
logger.Debugw("providing", "cid", key, "mh", internal.LoggableProviderRecordBytes(keyMH))
mhHash := internal.Sha256Multihash(keyMH)

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

do you think it might be a good idea to add a salt for this hash? this way there's another layer of protection that could be used from the provider?
but i can see the other side where if we want to make this easily reproducible, it would be better to leave out the additional step (-:

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

If required, we could add a constant salt (e.g to specify the purpose of the hash).

However, the secret to access the content is already the CID, adding a random salt means that knowledge of both the CID and the salt is required to find the content. If we add a random salt here, it would have to be shared along with the CID, thus it wouldn't add much security. (in other words, it would only make the secret longer)

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

We should consider adding a constant salt (or prefix) to the spec and here - so that the derived hashes are in a known specific domain that doesn't easily have collisions with other things.

logger.Debugw("providing", "cid", key, "mh", internal.LoggableProviderRecordBytes(keyMH), "mhHash", mhHash)

// add self locally
dht.ProviderManager.AddProvider(ctx, keyMH, peer.AddrInfo{ID: dht.h.ID()})
err = dht.ProviderManager.AddProvider(ctx, mhHash, peer.AddrInfo{ID: dht.h.ID()})
if err != nil {
return err
}
if !brdcst {
return nil
}
Expand Down
2 changes: 1 addition & 1 deletion go.mod
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@ module github.com/libp2p/go-libp2p-kad-dht
go 1.18

require (
github.com/ChainSafe/go-keyspace v0.0.0-20220830203127-eae3b7c602f0
github.com/gogo/protobuf v1.3.2
github.com/google/gopacket v1.1.19
github.com/google/uuid v1.3.0
Expand All @@ -29,7 +30,6 @@ require (
github.com/multiformats/go-multihash v0.2.1
github.com/multiformats/go-multistream v0.3.3
github.com/stretchr/testify v1.8.0
github.com/whyrusleeping/go-keyspace v0.0.0-20160322163242-5b898ac5add1
go.opencensus.io v0.23.0
go.opentelemetry.io/otel v1.7.0
go.opentelemetry.io/otel/trace v1.7.0
Expand Down
3 changes: 2 additions & 1 deletion go.sum
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,8 @@ git.apache.org/thrift.git v0.0.0-20180902110319-2566ecd5d999/go.mod h1:fPE2ZNJGy
github.com/AndreasBriese/bbloom v0.0.0-20190306092124-e2d15f34fcf9/go.mod h1:bOvUY6CB00SOBii9/FifXqc0awNKxLFCL/+pkDPuyl8=
github.com/BurntSushi/toml v0.3.1/go.mod h1:xHWCNGjB5oqiDr8zfno3MHue2Ht5sIBksp03qcyfWMU=
github.com/BurntSushi/xgb v0.0.0-20160522181843-27f122750802/go.mod h1:IVnqGOEym/WlBOVXweHU+Q+/VP0lqqI8lqeDx9IjBqo=
github.com/ChainSafe/go-keyspace v0.0.0-20220830203127-eae3b7c602f0 h1:iTTaKZ4D0mS4VWOPJNzQXMhDVNtTAjK8GGCVIz46XtA=
github.com/ChainSafe/go-keyspace v0.0.0-20220830203127-eae3b7c602f0/go.mod h1:NE6Gpl6geZ3MkYhDdbEVhbuNAtISJJx6MRv5l23E22Y=
github.com/OneOfOne/xxhash v1.2.2/go.mod h1:HSdplMjZKSmBqAxg5vPj2TmRDmfkzw+cTzAElWljhcU=
github.com/aead/siphash v1.0.1/go.mod h1:Nywa3cDsYNNK3gaciGTWPwHt0wlpNV15vwmswBAUSII=
github.com/alecthomas/template v0.0.0-20160405071501-a0175ee3bccc/go.mod h1:LOuyumcjzFXgccqObfd/Ljyb9UuFJ6TxHnclSeseNhc=
Expand Down Expand Up @@ -643,7 +645,6 @@ github.com/viant/toolbox v0.24.0/go.mod h1:OxMCG57V0PXuIP2HNQrtJf2CjqdmbrOx5EkMI
github.com/wangjia184/sortedset v0.0.0-20160527075905-f5d03557ba30/go.mod h1:YkocrP2K2tcw938x9gCOmT5G5eCD6jsTz0SZuyAqwIE=
github.com/warpfork/go-wish v0.0.0-20200122115046-b9ea61034e4a h1:G++j5e0OC488te356JvdhaM8YS6nMsjLAYF7JxCv07w=
github.com/warpfork/go-wish v0.0.0-20200122115046-b9ea61034e4a/go.mod h1:x6AKhvSSexNrVSrViXSHUEbICjmGXhtgABaHIySUSGw=
github.com/whyrusleeping/go-keyspace v0.0.0-20160322163242-5b898ac5add1 h1:EKhdznlJHPMoKr0XTrX+IlJs1LH3lyx2nfr1dOlZ79k=
github.com/whyrusleeping/go-keyspace v0.0.0-20160322163242-5b898ac5add1/go.mod h1:8UvriyWtv5Q5EOgjHaSseUEdkQfvwFv1I/In/O2M9gc=
github.com/whyrusleeping/go-logging v0.0.0-20170515211332-0457bb6b88fc/go.mod h1:bopw91TMyo8J3tvftk8xmU2kPmlrt4nScJQZU2hE5EM=
github.com/x-cray/logrus-prefixed-formatter v0.5.2/go.mod h1:2duySbKsL6M18s5GU7VPsoEPHyzalCE06qoARUCeBBE=
Expand Down
5 changes: 4 additions & 1 deletion handlers.go
Original file line number Diff line number Diff line change
Expand Up @@ -359,7 +359,10 @@ func (dht *IpfsDHT) handleAddProvider(ctx context.Context, p peer.ID, pmes *pb.M
continue
}

dht.providerStore.AddProvider(ctx, key, peer.AddrInfo{ID: p})
err := dht.providerStore.AddProvider(ctx, key, peer.AddrInfo{ID: p})
if err != nil {
return nil, err
}
}

return nil, nil
Expand Down
17 changes: 17 additions & 0 deletions internal/utils.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
package internal

import (
"github.com/multiformats/go-multihash"
)

const keysize = 32

func Sha256Multihash(mh multihash.Multihash) multihash.Multihash {
prefix := []byte("CR_DOUBLEHASH")
mh, err := multihash.Sum(append(prefix, mh...), multihash.DBL_SHA2_256, keysize)
if err != nil {
// this shouldn't ever happen
panic(err)
}
return mh
}
5 changes: 3 additions & 2 deletions lookup.go
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ import (
kb "github.com/libp2p/go-libp2p-kbucket"
)

// GetClosestPeers is a Kademlia 'node lookup' operation. Returns a channel of
// GetClosestPeers is a Kademlia 'node lookup' operation. Returns a list of
// the K closest peers to the given key.
//
// If the context is canceled, this function will return the context error along
Expand All @@ -20,7 +20,8 @@ func (dht *IpfsDHT) GetClosestPeers(ctx context.Context, key string) ([]peer.ID,
if key == "" {
return nil, fmt.Errorf("can't lookup empty key")
}
// TODO: I can break the interface! return []peer.ID

//TODO: I can break the interface! return []peer.ID
lookupRes, err := dht.runLookupWithFollowup(ctx, key,
func(ctx context.Context, p peer.ID) ([]*peer.AddrInfo, error) {
// For DHT query command
Expand Down
76 changes: 61 additions & 15 deletions providers/providers_manager_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,10 @@ func TestProviderManager(t *testing.T) {
t.Fatal(err)
}
a := u.Hash([]byte("test"))
p.AddProvider(ctx, a, peer.AddrInfo{ID: peer.ID("testingprovider")})
err = p.AddProvider(ctx, a, peer.AddrInfo{ID: peer.ID("testingprovider")})
if err != nil {
t.Fatal(err)
}

// Not cached
// TODO verify that cache is empty
Expand All @@ -52,8 +55,15 @@ func TestProviderManager(t *testing.T) {
t.Fatal("Could not retrieve provider.")
}

p.AddProvider(ctx, a, peer.AddrInfo{ID: peer.ID("testingprovider2")})
p.AddProvider(ctx, a, peer.AddrInfo{ID: peer.ID("testingprovider3")})
err = p.AddProvider(ctx, a, peer.AddrInfo{ID: peer.ID("testingprovider2")})
if err != nil {
t.Fatal(err)
}
err = p.AddProvider(ctx, a, peer.AddrInfo{ID: peer.ID("testingprovider3")})
if err != nil {
t.Fatal(err)
}

// TODO verify that cache is already up to date
resp, _ = p.GetProviders(ctx, a)
if len(resp) != 3 {
Expand Down Expand Up @@ -88,7 +98,10 @@ func TestProvidersDatastore(t *testing.T) {
for i := 0; i < 100; i++ {
h := u.Hash([]byte(fmt.Sprint(i)))
mhs = append(mhs, h)
p.AddProvider(ctx, h, peer.AddrInfo{ID: friend})
err = p.AddProvider(ctx, h, peer.AddrInfo{ID: friend})
if err != nil {
t.Fatal(err)
}
}

for _, c := range mhs {
Expand Down Expand Up @@ -179,15 +192,27 @@ func TestProvidesExpire(t *testing.T) {
}

for _, h := range mhs[:5] {
p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[0]})
p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[1]})
err = p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[0]})
if err != nil {
t.Fatal(err)
}
err = p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[1]})
if err != nil {
t.Fatal(err)
}
}

time.Sleep(time.Second / 4)

for _, h := range mhs[5:] {
p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[0]})
p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[1]})
err = p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[0]})
if err != nil {
t.Fatal(err)
}
err = p.AddProvider(ctx, h, peer.AddrInfo{ID: peers[1]})
if err != nil {
t.Fatal(err)
}
}

for _, h := range mhs {
Expand Down Expand Up @@ -289,7 +314,10 @@ func TestLargeProvidersSet(t *testing.T) {
h := u.Hash([]byte(fmt.Sprint(i)))
mhs = append(mhs, h)
for _, pid := range peers {
p.AddProvider(ctx, h, peer.AddrInfo{ID: pid})
err = p.AddProvider(ctx, h, peer.AddrInfo{ID: pid})
if err != nil {
t.Fatal(err)
}
}
}

Expand Down Expand Up @@ -324,11 +352,20 @@ func TestUponCacheMissProvidersAreReadFromDatastore(t *testing.T) {
}

// add provider
pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p1})
err = pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p1})
if err != nil {
t.Fatal(err)
}
// make the cached provider for h1 go to datastore
pm.AddProvider(ctx, h2, peer.AddrInfo{ID: p1})
err = pm.AddProvider(ctx, h2, peer.AddrInfo{ID: p1})
if err != nil {
t.Fatal(err)
}
// now just offloaded record should be brought back and joined with p2
pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p2})
err = pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p2})
if err != nil {
t.Fatal(err)
}

h1Provs, _ := pm.GetProviders(ctx, h1)
if len(h1Provs) != 2 {
Expand All @@ -353,11 +390,20 @@ func TestWriteUpdatesCache(t *testing.T) {
}

// add provider
pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p1})
err = pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p1})
if err != nil {
t.Fatal(err)
}
// force into the cache
pm.GetProviders(ctx, h1)
_, err = pm.GetProviders(ctx, h1)
if err != nil {
t.Fatal(err)
}
// add a second provider
pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p2})
err = pm.AddProvider(ctx, h1, peer.AddrInfo{ID: p2})
if err != nil {
t.Fatal(err)
}

c1Provs, _ := pm.GetProviders(ctx, h1)
if len(c1Provs) != 2 {
Expand Down
10 changes: 9 additions & 1 deletion qpeerset/qpeerset.go
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,8 @@ import (
"math/big"
"sort"

ks "github.com/ChainSafe/go-keyspace"
"github.com/libp2p/go-libp2p/core/peer"
ks "github.com/whyrusleeping/go-keyspace"
)

// PeerState describes the state of a peer ID during the lifecycle of an individual lookup.
Expand Down Expand Up @@ -67,6 +67,14 @@ func NewQueryPeerset(key string) *QueryPeerset {
}
}

func NewQueryPeersetFromHash(hash [32]byte) *QueryPeerset {
return &QueryPeerset{
key: ks.XORKeySpace.KeyFromHash(hash),
all: []queryPeerState{},
sorted: false,
}
}

func (qp *QueryPeerset) find(p peer.ID) int {
for i := range qp.all {
if qp.all[i].id == p {
Expand Down
28 changes: 26 additions & 2 deletions query.go
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,7 @@ import (
"github.com/libp2p/go-libp2p/core/peer"
pstore "github.com/libp2p/go-libp2p/core/peerstore"
"github.com/libp2p/go-libp2p/core/routing"
"github.com/multiformats/go-multihash"

"github.com/google/uuid"
"github.com/libp2p/go-libp2p-kad-dht/qpeerset"
Expand Down Expand Up @@ -147,7 +148,21 @@ processFollowUp:

func (dht *IpfsDHT) runQuery(ctx context.Context, target string, queryFn queryFn, stopFn stopFn) (*lookupWithFollowupResult, error) {
// pick the K closest peers to the key in our Routing table.
targetKadID := kb.ConvertKey(target)
var (
targetKadID []byte
isHashed bool
)

decodedMH, err := multihash.Decode([]byte(target))
if err != nil || decodedMH.Code != multihash.DBL_SHA2_256 {
// the target isn't a double hash, so hash it again
targetKadID = kb.ConvertKey(target)
} else if decodedMH.Code == multihash.DBL_SHA2_256 {
// the target is a double hash, so use the 32-byte digest
targetKadID = kb.ID(decodedMH.Digest)
isHashed = true
}

seedPeers := dht.routingTable.NearestPeers(targetKadID, dht.bucketSize)
if len(seedPeers) == 0 {
routing.PublishQueryEvent(ctx, &routing.QueryEvent{
Expand All @@ -157,12 +172,21 @@ func (dht *IpfsDHT) runQuery(ctx context.Context, target string, queryFn queryFn
return nil, kb.ErrLookupFailure
}

var qpset *qpeerset.QueryPeerset
if isHashed {
var hash [32]byte
copy(hash[:], targetKadID)
qpset = qpeerset.NewQueryPeersetFromHash(hash)
} else {
qpset = qpeerset.NewQueryPeerset(target)
}

q := &query{
id: uuid.New(),
key: target,
ctx: ctx,
dht: dht,
queryPeers: qpeerset.NewQueryPeerset(target),
queryPeers: qpset,
seedPeers: seedPeers,
peerTimes: make(map[peer.ID]time.Duration),
terminated: false,
Expand Down
Loading