Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[Merged by Bors] - Support poet certificates #5221

Closed
wants to merge 71 commits into from
Closed
Show file tree
Hide file tree
Changes from 68 commits
Commits
Show all changes
71 commits
Select commit Hold shift + click to select a range
d16cbe7
Support for poet certificates WIP
poszu Nov 1, 2023
08677b3
Support for poet certificates cont
poszu Nov 3, 2023
d68a562
Initial certification using existing ATX or initial POST
poszu Nov 6, 2023
535dfcf
Improve poet HTTP client coverage
poszu Nov 6, 2023
513c29a
Bump certifier
poszu Nov 6, 2023
2bf4807
Use the right post challenge to certify
poszu Nov 8, 2023
54f915b
Fixed POST metadata sent to certifier
poszu Nov 9, 2023
6cc3971
Bump certifier image
poszu Nov 9, 2023
f79232c
Migrate certifier store to localdb
poszu Nov 9, 2023
a2893dc
Remove CertifierInfo struct
poszu Nov 9, 2023
ffd77d0
Add systest for poet registrations with PoW and cert
poszu Nov 10, 2023
326bde0
Configurable certifier retry options
poszu Nov 13, 2023
f2ec6f7
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Nov 13, 2023
e0a6f89
Increase systest CI job timeout
poszu Nov 13, 2023
0054df7
Keep POST proof in localDB for certification
poszu Nov 14, 2023
50fa30f
Take optional poet certificates in config
poszu Nov 14, 2023
2a9210e
Bump poet to v0.10.0
poszu Nov 15, 2023
111576b
Apply suggestions from code review
poszu Nov 20, 2023
678e2c6
update nipost_test.go
poszu Nov 20, 2023
29118cd
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Nov 20, 2023
ca0fcf0
fixup ProofToCertifyMetadata struct name
poszu Nov 20, 2023
f80eb4a
Run poet systests in parallel
poszu Nov 20, 2023
4302d65
Add NodeID to certs passed in config
poszu Nov 20, 2023
cb33ecf
Fix certifier config in systests
poszu Nov 20, 2023
604bd51
Rename NewCertifierOption
poszu Nov 21, 2023
0a86126
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Nov 21, 2023
ce012ca
Apply localdb code migrations on checkpoint recovery
poszu Nov 21, 2023
97df610
Remove importing certificates
poszu Nov 22, 2023
18e8f23
Build initial post if post cannot be found
poszu Nov 23, 2023
98defe3
Remove sourcegraph/conc dep
poszu Nov 23, 2023
4eaa867
Bump certifier-service in systests to v0.6.0
poszu Nov 23, 2023
4270563
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Nov 24, 2023
c1ccfa8
Don't update post in localdb
poszu Nov 24, 2023
b37a705
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Nov 27, 2023
8439433
Fix UT
poszu Nov 27, 2023
5cca828
Autoscale post verifying workers (#5354)
poszu Dec 27, 2023
00edbc3
Fix default value of challenge in initial_post table
poszu Dec 28, 2023
c61e32d
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Jan 5, 2024
9b9f881
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Jan 9, 2024
e81a4c1
Fix flaky TestNIPostBuilder_Close
poszu Jan 9, 2024
7e3961b
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Feb 2, 2024
210c3e1
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Feb 12, 2024
c053552
Fixes
poszu Feb 12, 2024
7319d84
Bump post and certifier services in systests
poszu Feb 12, 2024
314e921
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Mar 21, 2024
97f0ff1
Support for poet certs with expiration
poszu Mar 21, 2024
7e35d3f
Use cert verification shared from poet
poszu Mar 25, 2024
59f45a0
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Mar 25, 2024
bd3130d
Fix linting issues
poszu Mar 25, 2024
87c9284
Bump certifier service in systests
poszu Mar 25, 2024
f347e3d
Rename local sql migration
poszu Mar 25, 2024
377a5d5
Fix staticcheck
poszu Mar 25, 2024
342eee9
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Apr 18, 2024
459f453
Use nipost.Post
poszu Apr 18, 2024
601df9d
More review fixes
poszu Apr 18, 2024
af1e89a
Update poet and post-rs
poszu Apr 18, 2024
b7426fa
update test
poszu Apr 19, 2024
d72d416
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Apr 23, 2024
af29624
Fix UTs
poszu Apr 23, 2024
0ec2d97
Refactor certifier to lookup PoST on its own
poszu Apr 23, 2024
845c12d
Fix systest
poszu Apr 23, 2024
30e322f
Merge remote-tracking branch 'origin/develop' into support-poet-certi…
poszu Apr 26, 2024
c0b306c
Review feedback
poszu Apr 26, 2024
84c1800
Optimize searching for positioning ATX (#5952)
poszu May 22, 2024
f4c358d
Move certification to the poet client
poszu May 22, 2024
d1d597a
Extend E2E activation test to use poet certificates with expiration
poszu May 22, 2024
377c62d
Parallelize certifying initial post
poszu May 22, 2024
62ea324
Avoid redundant certifications for (nodeID, pubkey) pairs
poszu May 22, 2024
879db03
Review feedback
poszu May 23, 2024
c9f3f96
Fix remaining UTs
poszu May 23, 2024
7f83cab
Fix remaining UTs
poszu May 23, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
37 changes: 29 additions & 8 deletions activation/activation.go
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,8 @@
"github.com/spacemeshos/go-spacemesh/sql/localsql/nipost"
)

var ErrNotFound = errors.New("not found")

// PoetConfig is the configuration to interact with the poet server.
type PoetConfig struct {
PhaseShift time.Duration `mapstructure:"phase-shift"`
Expand Down Expand Up @@ -82,6 +84,7 @@
syncer syncer
log *zap.Logger
parentCtx context.Context
poets []PoetClient
poetCfg PoetConfig
poetRetryInterval time.Duration
// delay before PoST in ATX is considered valid (counting from the time it was received)
Expand Down Expand Up @@ -138,6 +141,12 @@
}
}

func WithPoets(poets ...PoetClient) BuilderOption {
return func(b *Builder) {
b.poets = poets
}
}

func WithValidator(v nipostValidator) BuilderOption {
return func(b *Builder) {
b.validator = v
Expand Down Expand Up @@ -323,7 +332,7 @@
return nil
}
// ...and if we haven't stored an initial post yet.
_, err := nipost.InitialPost(b.localDB, nodeID)
_, err := nipost.GetPost(b.localDB, nodeID)
switch {
case err == nil:
b.log.Info("load initial post from db")
Expand All @@ -347,9 +356,10 @@
return errors.New("nil VRF nonce")
}
initialPost := nipost.Post{
Nonce: post.Nonce,
Indices: post.Indices,
Pow: post.Pow,
Nonce: post.Nonce,
Indices: post.Indices,
Pow: post.Pow,
Challenge: shared.ZeroChallenge,

NumUnits: postInfo.NumUnits,
CommitmentATX: postInfo.CommitmentATX,
Expand All @@ -361,7 +371,7 @@
}, postInfo.NumUnits)
if err != nil {
b.log.Error("initial POST is invalid", log.ZShortStringer("smesherID", nodeID), zap.Error(err))
if err := nipost.RemoveInitialPost(b.localDB, nodeID); err != nil {
if err := nipost.RemovePost(b.localDB, nodeID); err != nil {

Check warning on line 374 in activation/activation.go

View check run for this annotation

Codecov / codecov/patch

activation/activation.go#L374

Added line #L374 was not covered by tests
b.log.Fatal("failed to remove initial post", log.ZShortStringer("smesherID", nodeID), zap.Error(err))
}
return fmt.Errorf("initial POST is invalid: %w", err)
Expand All @@ -371,7 +381,7 @@
public.PostSeconds.Set(float64(time.Since(startTime)))
b.log.Info("created the initial post")

return nipost.AddInitialPost(b.localDB, nodeID, initialPost)
return nipost.AddPost(b.localDB, nodeID, initialPost)
}

func (b *Builder) run(ctx context.Context, sig *signing.EdSigner) {
Expand All @@ -390,6 +400,17 @@
case <-b.layerClock.AwaitLayer(currentLayer.Add(1)):
}
}
var eg errgroup.Group
for _, poet := range b.poets {
eg.Go(func() error {
_, err := poet.Certify(ctx, sig.NodeID())
if err != nil {
b.log.Warn("failed to certify poet", zap.Error(err), log.ZShortStringer("smesherID", sig.NodeID()))
}
return nil
})
}
eg.Wait()

for {
err := b.PublishActivationTx(ctx, sig)
Expand Down Expand Up @@ -515,7 +536,7 @@
switch {
case errors.Is(err, sql.ErrNotFound):
logger.Info("no previous ATX found, creating an initial nipost challenge")
post, err := nipost.InitialPost(b.localDB, nodeID)
post, err := nipost.GetPost(b.localDB, nodeID)
if err != nil {
return nil, fmt.Errorf("get initial post: %w", err)
}
Expand All @@ -531,7 +552,7 @@
}, post.NumUnits)
if err != nil {
logger.Error("initial POST is invalid", zap.Error(err))
if err := nipost.RemoveInitialPost(b.localDB, nodeID); err != nil {
if err := nipost.RemovePost(b.localDB, nodeID); err != nil {

Check warning on line 555 in activation/activation.go

View check run for this annotation

Codecov / codecov/patch

activation/activation.go#L555

Added line #L555 was not covered by tests
logger.Fatal("failed to remove initial post", zap.Error(err))
}
return nil, fmt.Errorf("initial POST is invalid: %w", err)
Expand Down
10 changes: 7 additions & 3 deletions activation/activation_multi_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -252,10 +252,12 @@ func Test_Builder_Multi_InitialPost(t *testing.T) {
},
nil,
)
require.NoError(t, tab.buildInitialPost(context.Background(), sig.NodeID()))
err := tab.buildInitialPost(context.Background(), sig.NodeID())
require.NoError(t, err)

// postClient.Proof() should not be called again
require.NoError(t, tab.buildInitialPost(context.Background(), sig.NodeID()))
err = tab.buildInitialPost(context.Background(), sig.NodeID())
require.NoError(t, err)
return nil
})
}
Expand Down Expand Up @@ -397,7 +399,9 @@ func Test_Builder_Multi_HappyPath(t *testing.T) {
VRFNonce: types.VRFPostIndex(rand.Uint64()),
}
nipostState[sig.NodeID()] = state
tab.mnipost.EXPECT().BuildNIPost(gomock.Any(), sig, ref.PublishEpoch, ref.Hash()).Return(state, nil)
tab.mnipost.EXPECT().
BuildNIPost(gomock.Any(), sig, ref.PublishEpoch, ref.Hash()).
Return(state, nil)

// awaiting atx publication epoch log
tab.mclock.EXPECT().CurrentLayer().DoAndReturn(
Expand Down
56 changes: 32 additions & 24 deletions activation/activation_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -666,8 +666,9 @@ func TestBuilder_PublishActivationTx_NoPrevATX(t *testing.T) {
NumUnits: uint32(12),
CommitmentATX: types.RandomATXID(),
VRFNonce: types.VRFPostIndex(rand.Uint64()),
Challenge: shared.ZeroChallenge,
}
require.NoError(t, nipost.AddInitialPost(tab.localDb, sig.NodeID(), post))
require.NoError(t, nipost.AddPost(tab.localDb, sig.NodeID(), post))
initialPost := &types.Post{
Nonce: post.Nonce,
Indices: post.Indices,
Expand Down Expand Up @@ -706,8 +707,9 @@ func TestBuilder_PublishActivationTx_NoPrevATX_PublishFails_InitialPost_preserve
NumUnits: uint32(12),
CommitmentATX: types.RandomATXID(),
VRFNonce: types.VRFPostIndex(rand.Uint64()),
Challenge: shared.ZeroChallenge,
}
require.NoError(t, nipost.AddInitialPost(tab.localDb, sig.NodeID(), refPost))
require.NoError(t, nipost.AddPost(tab.localDb, sig.NodeID(), refPost))
initialPost := &types.Post{
Nonce: refPost.Nonce,
Indices: refPost.Indices,
Expand All @@ -728,12 +730,10 @@ func TestBuilder_PublishActivationTx_NoPrevATX_PublishFails_InitialPost_preserve
genesis := time.Now().Add(-time.Duration(currLayer) * layerDuration)
return genesis.Add(layerDuration * time.Duration(got))
}).AnyTimes()

tab.mnipost.EXPECT().
BuildNIPost(gomock.Any(), gomock.Any(), gomock.Any(), gomock.Any()).
Return(nil, ErrATXChallengeExpired)
tab.mnipost.EXPECT().ResetState(sig.NodeID()).Return(nil)

ch := make(chan struct{})
tab.mclock.EXPECT().AwaitLayer(currLayer.Add(1)).Do(func(got types.LayerID) <-chan struct{} {
close(ch)
Expand All @@ -758,7 +758,7 @@ func TestBuilder_PublishActivationTx_NoPrevATX_PublishFails_InitialPost_preserve
}

// initial post is preserved
post, err := nipost.InitialPost(tab.localDB, sig.NodeID())
post, err := nipost.GetPost(tab.localDB, sig.NodeID())
require.NoError(t, err)
require.NotNil(t, post)
require.Equal(t, refPost, *post)
Expand Down Expand Up @@ -824,11 +824,13 @@ func TestBuilder_PublishActivationTx_PrevATXWithoutPrevATX(t *testing.T) {
LabelsPerUnit: DefaultPostConfig().LabelsPerUnit,
}, nil).AnyTimes()

tab.mnipost.EXPECT().BuildNIPost(gomock.Any(), gomock.Any(), gomock.Any(), gomock.Any()).DoAndReturn(
func(_ context.Context, _ *signing.EdSigner, _ types.EpochID, _ types.Hash32) (*nipost.NIPostState, error) {
currentLayer = currentLayer.Add(5)
return newNIPostWithPoet(t, poetBytes), nil
})
tab.mnipost.EXPECT().
BuildNIPost(gomock.Any(), gomock.Any(), gomock.Any(), gomock.Any()).
DoAndReturn(
func(_ context.Context, _ *signing.EdSigner, _ types.EpochID, _ types.Hash32) (*nipost.NIPostState, error) {
currentLayer = currentLayer.Add(5)
return newNIPostWithPoet(t, poetBytes), nil
})

tab.mValidator.EXPECT().VerifyChain(gomock.Any(), gomock.Any(), gomock.Any(), gomock.Any())

Expand Down Expand Up @@ -938,8 +940,9 @@ func TestBuilder_PublishActivationTx_TargetsEpochBasedOnPosAtx(t *testing.T) {
NumUnits: uint32(12),
CommitmentATX: types.RandomATXID(),
VRFNonce: types.VRFPostIndex(rand.Uint64()),
Challenge: shared.ZeroChallenge,
}
require.NoError(t, nipost.AddInitialPost(tab.localDb, sig.NodeID(), post))
require.NoError(t, nipost.AddPost(tab.localDb, sig.NodeID(), post))
initialPost := &types.Post{
Nonce: post.Nonce,
Indices: post.Indices,
Expand Down Expand Up @@ -979,7 +982,9 @@ func TestBuilder_PublishActivationTx_FailsWhenNIPostBuilderFails(t *testing.T) {
return genesis.Add(layerDuration * time.Duration(got))
}).AnyTimes()
nipostErr := errors.New("NIPost builder error")
tab.mnipost.EXPECT().BuildNIPost(gomock.Any(), sig, gomock.Any(), gomock.Any()).Return(nil, nipostErr)
tab.mnipost.EXPECT().
BuildNIPost(gomock.Any(), sig, gomock.Any(), gomock.Any()).
Return(nil, nipostErr)
tab.mValidator.EXPECT().VerifyChain(gomock.Any(), gomock.Any(), gomock.Any(), gomock.Any())
require.ErrorIs(t, tab.PublishActivationTx(context.Background(), sig), nipostErr)

Expand Down Expand Up @@ -1027,7 +1032,6 @@ func TestBuilder_RetryPublishActivationTx(t *testing.T) {
require.NoError(t, atxs.Add(tab.db, toAtx(t, prevAtx)))
tab.atxsdata.AddFromAtx(toAtx(t, prevAtx), false)

publishEpoch := prevAtx.PublishEpoch + 1
currLayer := prevAtx.PublishEpoch.FirstLayer()
tab.mclock.EXPECT().CurrentLayer().DoAndReturn(func() types.LayerID { return currLayer }).AnyTimes()
tab.mclock.EXPECT().LayerToTime(gomock.Any()).DoAndReturn(
Expand All @@ -1038,7 +1042,7 @@ func TestBuilder_RetryPublishActivationTx(t *testing.T) {
}).AnyTimes()
done := make(chan struct{})
close(done)
tab.mclock.EXPECT().AwaitLayer(publishEpoch.FirstLayer()).DoAndReturn(
tab.mclock.EXPECT().AwaitLayer(prevAtx.PublishEpoch.Add(1).FirstLayer()).DoAndReturn(
func(got types.LayerID) <-chan struct{} {
// advance to publish layer
if currLayer.Before(got) {
Expand Down Expand Up @@ -1125,9 +1129,6 @@ func TestBuilder_RetryPublishActivationTx(t *testing.T) {
}

// state is cleaned up
_, err = nipost.InitialPost(tab.localDB, sig.NodeID())
require.ErrorIs(t, err, sql.ErrNotFound)

_, err = nipost.Challenge(tab.localDB, sig.NodeID())
require.ErrorIs(t, err, sql.ErrNotFound)
}
Expand Down Expand Up @@ -1169,7 +1170,8 @@ func TestBuilder_InitialProofGeneratedOnce(t *testing.T) {
tab.mValidator.EXPECT().Post(gomock.Any(), sig.NodeID(), post.CommitmentATX, initialPost, metadata, post.NumUnits)
require.NoError(t, tab.buildInitialPost(context.Background(), sig.NodeID()))
// postClient.Proof() should not be called again
require.NoError(t, tab.buildInitialPost(context.Background(), sig.NodeID()))
err := tab.buildInitialPost(context.Background(), sig.NodeID())
require.NoError(t, err)
}

func TestBuilder_InitialPostIsPersisted(t *testing.T) {
Expand Down Expand Up @@ -1201,10 +1203,12 @@ func TestBuilder_InitialPostIsPersisted(t *testing.T) {
LabelsPerUnit: tab.conf.LabelsPerUnit,
}
tab.mValidator.EXPECT().Post(gomock.Any(), sig.NodeID(), commitmentATX, initialPost, metadata, numUnits)
require.NoError(t, tab.buildInitialPost(context.Background(), sig.NodeID()))
err := tab.buildInitialPost(context.Background(), sig.NodeID())
require.NoError(t, err)

// postClient.Proof() should not be called again
require.NoError(t, tab.buildInitialPost(context.Background(), sig.NodeID()))
err = tab.buildInitialPost(context.Background(), sig.NodeID())
require.NoError(t, err)
}

func TestBuilder_InitialPostLogErrorMissingVRFNonce(t *testing.T) {
Expand Down Expand Up @@ -1234,7 +1238,8 @@ func TestBuilder_InitialPostLogErrorMissingVRFNonce(t *testing.T) {
LabelsPerUnit: tab.conf.LabelsPerUnit,
}
tab.mValidator.EXPECT().Post(gomock.Any(), sig.NodeID(), commitmentATX, initialPost, metadata, numUnits)
require.ErrorContains(t, tab.buildInitialPost(context.Background(), sig.NodeID()), "nil VRF nonce")
err := tab.buildInitialPost(context.Background(), sig.NodeID())
require.ErrorContains(t, err, "nil VRF nonce")

observedLogs := tab.observedLogs.FilterLevelExact(zapcore.ErrorLevel)
require.Equal(t, 1, observedLogs.Len(), "expected 1 log message")
Expand All @@ -1256,7 +1261,8 @@ func TestBuilder_InitialPostLogErrorMissingVRFNonce(t *testing.T) {
},
nil,
)
require.NoError(t, tab.buildInitialPost(context.Background(), sig.NodeID()))
err = tab.buildInitialPost(context.Background(), sig.NodeID())
require.NoError(t, err)
}

func TestWaitPositioningAtx(t *testing.T) {
Expand Down Expand Up @@ -1287,7 +1293,8 @@ func TestWaitPositioningAtx(t *testing.T) {
// everything else are stubs that are irrelevant for the test
tab.mpostClient.EXPECT().Info(gomock.Any()).Return(&types.PostInfo{}, nil).AnyTimes()
tab.mnipost.EXPECT().ResetState(sig.NodeID()).Return(nil)
tab.mnipost.EXPECT().BuildNIPost(gomock.Any(), gomock.Any(), gomock.Any(), gomock.Any()).
tab.mnipost.EXPECT().
BuildNIPost(gomock.Any(), gomock.Any(), gomock.Any(), gomock.Any()).
Return(&nipost.NIPostState{}, nil)
closed := make(chan struct{})
close(closed)
Expand All @@ -1309,8 +1316,9 @@ func TestWaitPositioningAtx(t *testing.T) {
NumUnits: uint32(12),
CommitmentATX: types.RandomATXID(),
VRFNonce: types.VRFPostIndex(rand.Uint64()),
Challenge: shared.ZeroChallenge,
}
require.NoError(t, nipost.AddInitialPost(tab.localDb, sig.NodeID(), post))
require.NoError(t, nipost.AddPost(tab.localDb, sig.NodeID(), post))
initialPost := &types.Post{
Nonce: post.Nonce,
Indices: post.Indices,
Expand Down
Loading
Loading