Compare commits

..

12 Commits

Author SHA1 Message Date
HAOYUatHZ
0bdcce79ba chore: bump version number (#226) 2023-01-13 08:33:53 +08:00
Péter Garamvölgyi
fcd29c305d fix(coordinator): use uint32 for timestamp to enable RLP encoding (#225) 2023-01-12 18:24:59 +01:00
Lawliet-Chan
54a6ab472a feat(message): replace json.Marshal with rlp.Encode for Signing (#219) 2023-01-12 22:21:59 +08:00
HAOYUatHZ
b2a5baa2ad feat(bridge): upgrade TraceGasCost estimation (#222) 2023-01-12 16:45:11 +08:00
Lawliet-Chan
dc6b71ca23 chore: improve golang lint rules (#172)
Co-authored-by: HAOYUatHZ <37070449+HAOYUatHZ@users.noreply.github.com>
2023-01-12 12:55:00 +08:00
Nazarii Denha
e1247a7eb2 refactor(coordinator): remove debug api namespace from manager (#221)
Co-authored-by: colin <102356659+colinlyguo@users.noreply.github.com>
2023-01-12 10:16:48 +08:00
colin
65699b89bb feat(coordinator): support rollers-per-session (#215)
Co-authored-by: colinlyguo <colinlyguo@gmail.com>
Co-authored-by: maskpp <maskpp266@gmail.com>
Co-authored-by: HAOYUatHZ <37070449+HAOYUatHZ@users.noreply.github.com>
2023-01-11 21:49:37 +08:00
maskpp
a44956a05f fix(bug): fix data race in common/cmd module. (#220) 2023-01-11 21:05:46 +08:00
maskpp
b85b4bafc2 refactor(coordinator): refactor CollectProofs func (#211)
Co-authored-by: HAOYUatHZ <37070449+HAOYUatHZ@users.noreply.github.com>
2023-01-11 13:31:42 +08:00
colin
2e3c80c580 feat(roller): add submit proof retry (#217)
Co-authored-by: colinlyguo <colinlyguo@gmail.com>
Co-authored-by: Lawliet-Chan <1576710154@qq.com>
2023-01-11 12:30:33 +08:00
Péter Garamvölgyi
d24392feac feat(bridge): Propose batches, fetch blocks and events in parallel (#216) 2023-01-10 23:13:06 +08:00
ChuhanJin
5c6e20a774 build(Jenkins): add docker push job for tag (#214)
Co-authored-by: vincent <419436363@qq.com>
2023-01-10 14:43:20 +08:00
23 changed files with 318 additions and 407 deletions

View File

@@ -15,5 +15,5 @@ func TestRunBridge(t *testing.T) {
// wait result
bridge.ExpectWithTimeout(true, time.Second*3, fmt.Sprintf("bridge version %s", version.Version))
- bridge.RunApp(false)
+ bridge.RunApp(nil)
}

View File

@@ -5,6 +5,7 @@ import (
"fmt"
"math/big"
"reflect"
"sync"
"time"
geth "github.com/scroll-tech/go-ethereum"
@@ -103,18 +104,32 @@ func (w *WatcherClient) Start() {
number = 0
}
- if err := w.tryFetchRunningMissingBlocks(w.ctx, number); err != nil {
- log.Error("failed to fetchRunningMissingBlocks", "err", err)
- }
+ var wg sync.WaitGroup
+ wg.Add(3)
- // @todo handle error
- if err := w.fetchContractEvent(number); err != nil {
- log.Error("failed to fetchContractEvent", "err", err)
- }
+ go func() {
+ defer wg.Done()
+ if err := w.tryFetchRunningMissingBlocks(w.ctx, number); err != nil {
+ log.Error("failed to fetchRunningMissingBlocks", "err", err)
+ }
+ }()
- if err := w.batchProposer.tryProposeBatch(); err != nil {
- log.Error("failed to tryProposeBatch", "err", err)
- }
+ go func() {
+ defer wg.Done()
+ // @todo handle error
+ if err := w.fetchContractEvent(number); err != nil {
+ log.Error("failed to fetchContractEvent", "err", err)
+ }
+ }()
+ go func() {
+ defer wg.Done()
+ if err := w.batchProposer.tryProposeBatch(); err != nil {
+ log.Error("failed to tryProposeBatch", "err", err)
+ }
+ }()
+ wg.Wait()
}
}
}()
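Commit d24392feac turns the watcher's three sequential polling steps into a fan-out: each tick now runs the missing-block fetch, the contract-event fetch, and the batch proposal concurrently, and wg.Wait() ensures a tick only ends once all three have finished. A minimal self-contained sketch of the same sync.WaitGroup pattern (fanOut is a hypothetical helper, not part of the bridge code):

package main

import (
	"fmt"
	"sync"
	"time"
)

// fanOut runs the given tasks concurrently and blocks until all of them
// return, mirroring the wg.Add(3) / go func() / wg.Wait() shape above.
func fanOut(tasks ...func() error) {
	var wg sync.WaitGroup
	wg.Add(len(tasks))
	for _, task := range tasks {
		task := task // capture the loop variable for the goroutine
		go func() {
			defer wg.Done()
			if err := task(); err != nil {
				fmt.Println("task failed:", err)
			}
		}()
	}
	wg.Wait() // the tick ends only after every task has finished
}

func main() {
	fanOut(
		func() error { time.Sleep(10 * time.Millisecond); return nil },
		func() error { return nil },
		func() error { return nil },
	)
}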

View File

@@ -179,6 +179,13 @@ linters:
- depguard
- gocyclo
- unparam
- exportloopref
- sqlclosecheck
- rowserrcheck
- durationcheck
- bidichk
- typecheck
- unused
enable-all: false
disable:
@@ -200,16 +207,7 @@ issues:
# Exclude some linters from running on tests files.
- path: _test\.go
linters:
- gocyclo
- errcheck
- dupl
- gosec
# Exclude known linters from partially hard-vendored code,
# which is impossible to exclude via "nolint" comments.
- path: internal/hmac/
text: "weak cryptographic primitive"
linters:
- gosec
# Exclude some staticcheck messages
@@ -217,18 +215,6 @@ issues:
- staticcheck
text: "SA9003:"
- linters:
- golint
text: "package comment should be of the form"
- linters:
- golint
text: "don't use ALL_CAPS in Go names;"
- linters:
- golint
text: "don't use underscores in Go names;"
# Exclude lll issues for long lines with go:generate
- linters:
- lll

View File

@@ -1,17 +1,13 @@
package cmd
import (
"fmt"
"os"
"os/exec"
"strings"
"sync"
"testing"
"time"
"github.com/docker/docker/pkg/reexec"
cmap "github.com/orcaman/concurrent-map"
"github.com/stretchr/testify/assert"
)
var verbose bool
@@ -51,48 +47,6 @@ func NewCmd(t *testing.T, name string, args ...string) *Cmd {
}
}
- // RunApp exec's the current binary using name as argv[0] which will trigger the
- // reexec init function for that name (e.g. "geth-test" in cmd/geth/run_test.go)
- func (t *Cmd) RunApp(parallel bool) {
- t.Log("cmd: ", append([]string{t.name}, t.args...))
- cmd := &exec.Cmd{
- Path: reexec.Self(),
- Args: append([]string{t.name}, t.args...),
- Stderr: t,
- Stdout: t,
- }
- if parallel {
- go func() {
- _ = cmd.Run()
- }()
- } else {
- _ = cmd.Run()
- }
- t.mu.Lock()
- t.cmd = cmd
- t.mu.Unlock()
- }
- // WaitExit wait util process exit.
- func (t *Cmd) WaitExit() {
- // Wait all the check funcs are finished or test status is failed.
- for !(t.Failed() || t.checkFuncs.IsEmpty()) {
- <-time.After(time.Millisecond * 500)
- }
- // Send interrupt signal.
- t.mu.Lock()
- _ = t.cmd.Process.Signal(os.Interrupt)
- t.mu.Unlock()
- }
- // Interrupt send interrupt signal.
- func (t *Cmd) Interrupt() {
- t.mu.Lock()
- t.Err = t.cmd.Process.Signal(os.Interrupt)
- t.mu.Unlock()
- }
// RegistFunc register check func
func (t *Cmd) RegistFunc(key string, check checkFunc) {
t.checkFuncs.Set(key, check)
@@ -103,39 +57,6 @@ func (t *Cmd) UnRegistFunc(key string) {
t.checkFuncs.Pop(key)
}
- // ExpectWithTimeout wait result during timeout time.
- func (t *Cmd) ExpectWithTimeout(parallel bool, timeout time.Duration, keyword string) {
- if keyword == "" {
- return
- }
- okCh := make(chan struct{}, 1)
- t.RegistFunc(keyword, func(buf string) {
- if strings.Contains(buf, keyword) {
- select {
- case okCh <- struct{}{}:
- default:
- return
- }
- }
- })
- waitResult := func() {
- defer t.UnRegistFunc(keyword)
- select {
- case <-okCh:
- return
- case <-time.After(timeout):
- assert.Fail(t, fmt.Sprintf("didn't get the desired result before timeout, keyword: %s", keyword))
- }
- }
- if parallel {
- go waitResult()
- } else {
- waitResult()
- }
- }
func (t *Cmd) runCmd() {
cmd := exec.Command(t.args[0], t.args[1:]...) //nolint:gosec
cmd.Stdout = t

common/cmd/cmd_app.go (new file, +114 lines)
View File

@@ -0,0 +1,114 @@
package cmd
import (
"fmt"
"os"
"os/exec"
"strings"
"time"
"github.com/docker/docker/pkg/reexec"
"github.com/stretchr/testify/assert"
)
// RunApp exec's the current binary using name as argv[0] which will trigger the
// reexec init function for that name (e.g. "geth-test" in cmd/geth/run_test.go)
func (t *Cmd) RunApp(waitResult func() bool) {
t.Log("cmd: ", append([]string{t.name}, t.args...))
cmd := &exec.Cmd{
Path: reexec.Self(),
Args: append([]string{t.name}, t.args...),
Stderr: t,
Stdout: t,
}
if waitResult != nil {
go func() {
_ = cmd.Run()
}()
waitResult()
} else {
_ = cmd.Run()
}
t.mu.Lock()
t.cmd = cmd
t.mu.Unlock()
}
// WaitExit waits until the process exits.
func (t *Cmd) WaitExit() {
// Wait until all the check funcs have finished or the test has failed.
for !(t.Failed() || t.checkFuncs.IsEmpty()) {
<-time.After(time.Millisecond * 500)
}
// Send interrupt signal.
t.mu.Lock()
_ = t.cmd.Process.Signal(os.Interrupt)
t.mu.Unlock()
}
// Interrupt sends an interrupt signal.
func (t *Cmd) Interrupt() {
t.mu.Lock()
t.Err = t.cmd.Process.Signal(os.Interrupt)
t.mu.Unlock()
}
// WaitResult returns true if the keyword shows up before the timeout expires.
func (t *Cmd) WaitResult(timeout time.Duration, keyword string) bool {
if keyword == "" {
return false
}
okCh := make(chan struct{}, 1)
t.RegistFunc(keyword, func(buf string) {
if strings.Contains(buf, keyword) {
select {
case okCh <- struct{}{}:
default:
return
}
}
})
defer t.UnRegistFunc(keyword)
select {
case <-okCh:
return true
case <-time.After(timeout):
assert.Fail(t, fmt.Sprintf("didn't get the desired result before timeout, keyword: %s", keyword))
}
return false
}
// ExpectWithTimeout waits for the expected result within the given timeout.
func (t *Cmd) ExpectWithTimeout(parallel bool, timeout time.Duration, keyword string) {
if keyword == "" {
return
}
okCh := make(chan struct{}, 1)
t.RegistFunc(keyword, func(buf string) {
if strings.Contains(buf, keyword) {
select {
case okCh <- struct{}{}:
default:
return
}
}
})
waitResult := func() {
defer t.UnRegistFunc(keyword)
select {
case <-okCh:
return
case <-time.After(timeout):
assert.Fail(t, fmt.Sprintf("didn't get the desired result before timeout, keyword: %s", keyword))
}
}
if parallel {
go waitResult()
} else {
waitResult()
}
}
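The new RunApp signature replaces the old parallel flag: nil runs the process synchronously, while a non-nil closure starts the process in a goroutine and blocks on the closure, typically one wrapping WaitResult. A usage sketch based on the updated tests further down (app stands for any *Cmd):

// Synchronous run, as in the updated cmd tests:
app.RunApp(nil)

// Parallel run that returns once the expected log line shows up
// (or the timeout fails the test), as in the integration test:
app.RunApp(func() bool {
	return app.WaitResult(time.Second*20, "Start bridge successfully")
})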

View File

@@ -12,7 +12,6 @@ require (
github.com/scroll-tech/go-ethereum v1.10.14-0.20221221073256-5ca70bf3a257
github.com/stretchr/testify v1.8.0
github.com/urfave/cli/v2 v2.10.2
- golang.org/x/sync v0.1.0
)
require (
@@ -81,6 +80,7 @@ require (
golang.org/x/crypto v0.4.0 // indirect
golang.org/x/mod v0.7.0 // indirect
golang.org/x/net v0.3.0 // indirect
+ golang.org/x/sync v0.1.0 // indirect
golang.org/x/sys v0.3.0 // indirect
golang.org/x/text v0.5.0 // indirect
golang.org/x/time v0.0.0-20210220033141-f8bda1e9f3ba // indirect

View File

@@ -4,12 +4,12 @@ import (
"crypto/ecdsa"
"crypto/rand"
"encoding/hex"
"encoding/json"
"github.com/scroll-tech/go-ethereum/common"
"github.com/scroll-tech/go-ethereum/common/hexutil"
"github.com/scroll-tech/go-ethereum/core/types"
"github.com/scroll-tech/go-ethereum/crypto"
"github.com/scroll-tech/go-ethereum/rlp"
)
// RespStatus represents status code from roller to scroll
@@ -36,11 +36,11 @@ type AuthMsg struct {
type Identity struct {
// Roller name
Name string `json:"name"`
- // Time of message creation
- Timestamp int64 `json:"timestamp"`
+ // Unverified Unix timestamp of message creation
+ Timestamp uint32 `json:"timestamp"`
// Roller public key
PublicKey string `json:"publicKey"`
- // Version is common.Version+ZK_VERSION. Use the following to check the latest ZK_VERSION version.
+ // Version is common.Version+ZkVersion. Use the following to check the latest ZkVersion version.
// curl -sL https://api.github.com/repos/scroll-tech/scroll-zkevm/commits | jq -r ".[0].sha"
Version string `json:"version"`
// Random unique token generated by manager
@@ -115,12 +115,11 @@ func (a *AuthMsg) PublicKey() (string, error) {
// Hash returns the hash of the auth message, which should be the message used
// to construct the Signature.
func (i *Identity) Hash() ([]byte, error) {
- bs, err := json.Marshal(i)
+ byt, err := rlp.EncodeToBytes(i)
if err != nil {
return nil, err
}
- hash := crypto.Keccak256Hash(bs)
+ hash := crypto.Keccak256Hash(byt)
return hash[:], nil
}
@@ -204,12 +203,12 @@ type ProofDetail struct {
// Hash return proofMsg content hash.
func (z *ProofDetail) Hash() ([]byte, error) {
- bs, err := json.Marshal(z)
+ byt, err := rlp.EncodeToBytes(z)
if err != nil {
return nil, err
}
- hash := crypto.Keccak256Hash(bs)
+ hash := crypto.Keccak256Hash(byt)
return hash[:], nil
}
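Commits #219 and #225 work together here: rlp.Encode replaces json.Marshal for the signed payload, and since RLP has no encoding for signed integers, the int64 timestamp becomes a uint32 (valid until 2106). A minimal sketch of the resulting hash-then-sign input (the identity struct only approximates message.Identity's fields):

package main

import (
	"fmt"

	"github.com/scroll-tech/go-ethereum/crypto"
	"github.com/scroll-tech/go-ethereum/rlp"
)

// identity approximates message.Identity: RLP encodes exported fields in
// declaration order, and supports only unsigned integers, hence uint32.
type identity struct {
	Name      string
	Timestamp uint32
	PublicKey string
	Version   string
}

func main() {
	byt, err := rlp.EncodeToBytes(&identity{Name: "testRoller", Timestamp: 1673500000})
	if err != nil {
		panic(err)
	}
	// The Keccak256 hash of the RLP bytes is what gets signed.
	fmt.Println(crypto.Keccak256Hash(byt).Hex())
}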

View File

@@ -16,7 +16,7 @@ func TestAuthMessageSignAndVerify(t *testing.T) {
authMsg := &AuthMsg{
Identity: &Identity{
Name: "testRoller",
- Timestamp: time.Now().UnixNano(),
+ Timestamp: uint32(time.Now().Unix()),
},
}
assert.NoError(t, authMsg.Sign(privkey))

View File

@@ -1,30 +1,10 @@
package utils
import (
"sync/atomic"
"github.com/scroll-tech/go-ethereum/core/types"
"golang.org/x/sync/errgroup"
)
// ComputeTraceGasCost computes gascost based on ExecutionResults.StructLogs.GasCost
func ComputeTraceGasCost(trace *types.BlockTrace) uint64 {
- var (
- gasCost uint64
- eg errgroup.Group
- )
- for idx := range trace.ExecutionResults {
- i := idx
- eg.Go(func() error {
- var sum uint64
- for _, log := range trace.ExecutionResults[i].StructLogs {
- sum += log.GasCost
- }
- atomic.AddUint64(&gasCost, sum)
- return nil
- })
- }
- _ = eg.Wait()
- return gasCost
+ return trace.Header.GasUsed
}
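The block header's GasUsed field already records the total gas consumed by the block, so the per-opcode summation (and its errgroup/atomic machinery) is dropped, along with the direct golang.org/x/sync dependency seen in the go.mod diff above. The two figures also differ in general: StructLogs only cover EVM execution steps, while Header.GasUsed additionally reflects intrinsic transaction costs (such as the 21000 base gas) and refunds, so the old estimate could diverge from the gas the block actually consumed. For comparison, a sketch of the retired computation without the concurrency (sumStructLogGas is a hypothetical name; types come from the scroll-tech/go-ethereum fork already imported here):

// sumStructLogGas reproduces the old estimate: summing per-opcode GasCost
// over every transaction's execution trace in the block.
func sumStructLogGas(trace *types.BlockTrace) uint64 {
	var sum uint64
	for _, result := range trace.ExecutionResults {
		for _, structLog := range result.StructLogs {
			sum += structLog.GasCost
		}
	}
	return sum
}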

View File

@@ -19,13 +19,7 @@ func TestComputeTraceCost(t *testing.T) {
blockTrace := &types.BlockTrace{}
err = json.Unmarshal(templateBlockTrace, blockTrace)
assert.NoError(t, err)
- var sum uint64
- for _, v := range blockTrace.ExecutionResults {
- for _, sv := range v.StructLogs {
- sum += sv.GasCost
- }
- }
- res := utils.ComputeTraceGasCost(blockTrace)
- assert.Equal(t, sum, res)
+ var expected = blockTrace.Header.GasUsed
+ got := utils.ComputeTraceGasCost(blockTrace)
+ assert.Equal(t, expected, got)
}

View File

@@ -5,7 +5,7 @@ import (
"runtime/debug"
)
var tag = "prealpha-v9.2"
var tag = "prealpha-v10.1"
var commit = func() string {
if info, ok := debug.ReadBuildInfo(); ok {
@@ -22,8 +22,8 @@ var commit = func() string {
return ""
}()
- // ZK_VERSION is commit-id of common/libzkp/impl/cargo.lock/scroll-zkevm
- var ZK_VERSION string
+ // ZkVersion is commit-id of common/libzkp/impl/cargo.lock/scroll-zkevm
+ var ZkVersion string
// Version denote the version of scroll protocol, including the l2geth, relayer, coordinator, roller, contracts and etc.
- var Version = fmt.Sprintf("%s-%s-%s", tag, commit, ZK_VERSION)
+ var Version = fmt.Sprintf("%s-%s-%s", tag, commit, ZkVersion)
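The ZK_VERSION to ZkVersion rename follows Go naming conventions (no underscores or ALL_CAPS, matching the golint exclusions deleted from the lint config above), but it must also be mirrored in every -X linker flag: -X matches the fully qualified variable name exactly, and a stale name is ignored without any error. A sketch of the mechanism, assuming the build command shown in the Makefile diffs below:

// common/version/version.go (excerpt): ZkVersion has no initializer in
// source; the linker injects its value at build time via
//
//   go build -ldflags "-X scroll-tech/common/version.ZkVersion=${ZK_VERSION}"
//
// If the -X name does not exactly match the package path and variable
// name, the assignment is silently dropped and ZkVersion stays empty.
var ZkVersion string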

View File

@@ -18,7 +18,7 @@ libzkp:
cp -r ../common/libzkp/interface ./verifier/lib
coordinator: libzkp ## Builds the Coordinator instance.
go build -ldflags "-X scroll-tech/common/version.ZK_VERSION=${ZK_VERSION}" -o $(PWD)/build/bin/coordinator ./cmd
go build -ldflags "-X scroll-tech/common/version.ZkVersion=${ZK_VERSION}" -o $(PWD)/build/bin/coordinator ./cmd
test-verifier: libzkp
go test -tags ffi -timeout 0 -v ./verifier

View File

@@ -1,96 +0,0 @@
package coordinator
import (
"fmt"
"time"
"scroll-tech/database/orm"
)
// RollerDebugAPI roller api interface in order go get debug message.
type RollerDebugAPI interface {
// ListRollers returns all live rollers
ListRollers() ([]*RollerInfo, error)
// GetSessionInfo returns the session information given the session id.
GetSessionInfo(sessionID string) (*SessionInfo, error)
}
// RollerInfo records the roller name, pub key and active session info (id, start time).
type RollerInfo struct {
Name string `json:"name"`
Version string `json:"version"`
PublicKey string `json:"public_key"`
ActiveSession string `json:"active_session,omitempty"`
ActiveSessionStartTime time.Time `json:"active_session_start_time"` // latest proof start time.
}
// SessionInfo records proof create or proof verify failed session.
type SessionInfo struct {
ID string `json:"id"`
Status string `json:"status"`
StartTime time.Time `json:"start_time"`
FinishTime time.Time `json:"finish_time,omitempty"` // set to 0 if not finished
AssignedRollers []string `json:"assigned_rollers,omitempty"` // roller name list
Error string `json:"error,omitempty"` // empty string if no error encountered
}
// ListRollers returns all live rollers.
func (m *Manager) ListRollers() ([]*RollerInfo, error) {
m.mu.RLock()
defer m.mu.RUnlock()
var res []*RollerInfo
for _, pk := range m.rollerPool.Keys() {
node, exist := m.rollerPool.Get(pk)
if !exist {
continue
}
roller := node.(*rollerNode)
info := &RollerInfo{
Name: roller.Name,
Version: roller.Version,
PublicKey: pk,
}
for id, sess := range m.sessions {
if _, ok := sess.info.Rollers[pk]; ok {
info.ActiveSessionStartTime = time.Unix(sess.info.StartTimestamp, 0)
info.ActiveSession = id
break
}
}
res = append(res, info)
}
return res, nil
}
func newSessionInfo(sess *session, status orm.ProvingStatus, errMsg string, finished bool) *SessionInfo {
now := time.Now()
var nameList []string
for pk := range sess.info.Rollers {
nameList = append(nameList, sess.info.Rollers[pk].Name)
}
info := SessionInfo{
ID: sess.info.ID,
Status: status.String(),
AssignedRollers: nameList,
StartTime: time.Unix(sess.info.StartTimestamp, 0),
Error: errMsg,
}
if finished {
info.FinishTime = now
}
return &info
}
// GetSessionInfo returns the session information given the session id.
func (m *Manager) GetSessionInfo(sessionID string) (*SessionInfo, error) {
m.mu.RLock()
defer m.mu.RUnlock()
if info, ok := m.failedSessionInfos[sessionID]; ok {
return info, nil
}
if s, ok := m.sessions[sessionID]; ok {
return newSessionInfo(s, orm.ProvingTaskAssigned, "", false), nil
}
return nil, fmt.Errorf("no such session, sessionID: %s", sessionID)
}

View File

@@ -15,5 +15,5 @@ func TestRunCoordinator(t *testing.T) {
// wait result
coordinator.ExpectWithTimeout(true, time.Second*3, fmt.Sprintf("coordinator version %s", version.Version))
- coordinator.RunApp(false)
+ coordinator.RunApp(nil)
}

View File

@@ -65,9 +65,6 @@ type Manager struct {
// A map containing proof failed or verify failed proof.
rollerPool cmap.ConcurrentMap
- // TODO: once put into use, should add to graceful restart.
- failedSessionInfos map[string]*SessionInfo
// A direct connection to the Halo2 verifier, used to verify
// incoming proofs.
verifier *verifier.Verifier
@@ -94,15 +91,14 @@ func New(ctx context.Context, cfg *config.RollerManagerConfig, orm database.OrmF
log.Info("Start coordinator successfully.")
return &Manager{
- ctx: ctx,
- cfg: cfg,
- rollerPool: cmap.New(),
- sessions: make(map[string]*session),
- failedSessionInfos: make(map[string]*SessionInfo),
- verifier: v,
- orm: orm,
- Client: client,
- tokenCache: cache.New(time.Duration(cfg.TokenTimeToLive)*time.Second, 1*time.Hour),
+ ctx: ctx,
+ cfg: cfg,
+ rollerPool: cmap.New(),
+ sessions: make(map[string]*session),
+ verifier: v,
+ orm: orm,
+ Client: client,
+ tokenCache: cache.New(time.Duration(cfg.TokenTimeToLive)*time.Second, 1*time.Hour),
}, nil
}
@@ -198,7 +194,12 @@ func (m *Manager) restorePrevSessions() {
log.Info("Coordinator restart reload sessions", "session start time", time.Unix(sess.info.StartTimestamp, 0))
for _, roller := range sess.info.Rollers {
log.Info("restore roller info for session", "session id", sess.info.ID, "roller name", roller.Name, "public key", roller.PublicKey, "proof status", roller.Status)
log.Info(
"restore roller info for session",
"session id", sess.info.ID,
"roller name", roller.Name,
"public key", roller.PublicKey,
"proof status", roller.Status)
}
go m.CollectProofs(sess)
@@ -277,8 +278,6 @@ func (m *Manager) handleZkProof(pk string, msg *message.ProofDetail) error {
if dbErr = m.orm.UpdateProvingStatus(msg.ID, orm.ProvingTaskFailed); dbErr != nil {
log.Error("failed to update task status as failed", "error", dbErr)
}
- // record the failed session.
- m.addFailedSession(sess, msg.Error)
return nil
}
@@ -303,8 +302,6 @@ func (m *Manager) handleZkProof(pk string, msg *message.ProofDetail) error {
success, err = m.verifier.VerifyProof(msg.Proof)
if err != nil {
- // record failed session.
- m.addFailedSession(sess, err.Error())
// TODO: this is only a temp workaround for testnet, we should return err in real cases
success = false
log.Error("Failed to verify zk proof", "proof id", msg.ID, "error", err)
@@ -313,75 +310,65 @@ func (m *Manager) handleZkProof(pk string, msg *message.ProofDetail) error {
log.Info("Verify zk proof successfully", "verification result", success, "proof id", msg.ID)
}
- var status orm.ProvingStatus
if success {
- status = orm.ProvingTaskVerified
- } else {
- // Set status as skipped if verification fails.
- // Note that this is only a workaround for testnet here.
- // TODO: In real cases we should reset to orm.ProvingTaskUnassigned
- // so as to re-distribute the task in the future
- status = orm.ProvingTaskFailed
+ if dbErr = m.orm.UpdateProvingStatus(msg.ID, orm.ProvingTaskVerified); dbErr != nil {
+ log.Error(
+ "failed to update proving_status",
+ "msg.ID", msg.ID,
+ "status", orm.ProvingTaskVerified,
+ "error", dbErr)
+ }
+ return dbErr
}
- if dbErr = m.orm.UpdateProvingStatus(msg.ID, status); dbErr != nil {
- log.Error("failed to update proving_status", "msg.ID", msg.ID, "status", status, "error", dbErr)
- }
- return dbErr
+ return nil
}
// CollectProofs collects proofs corresponding to a proof generation session.
func (m *Manager) CollectProofs(sess *session) {
- timer := time.NewTimer(time.Duration(m.cfg.CollectionTime) * time.Minute)
for {
select {
- case <-timer.C:
+ case <-time.After(time.Duration(m.cfg.CollectionTime) * time.Minute):
m.mu.Lock()
- // Ensure proper clean-up of resources.
defer func() {
delete(m.sessions, sess.info.ID)
m.mu.Unlock()
}()
// Pick a random winner.
// First, round up the keys that actually sent in a valid proof.
var participatingRollers []string
for pk, roller := range sess.info.Rollers {
if roller.Status == orm.RollerProofValid {
participatingRollers = append(participatingRollers, pk)
}
}
// Ensure we got at least one proof before selecting a winner.
if len(participatingRollers) == 0 {
// record failed session.
errMsg := "proof generation session ended without receiving any valid proofs"
- m.addFailedSession(sess, errMsg)
log.Warn(errMsg, "session id", sess.info.ID)
// Set status as skipped.
// Note that this is only a workaround for testnet here.
// TODO: In real cases we should reset to orm.ProvingTaskUnassigned
// so as to re-distribute the task in the future
if err := m.orm.UpdateProvingStatus(sess.info.ID, orm.ProvingTaskFailed); err != nil {
log.Error("fail to reset task_status as Unassigned", "id", sess.info.ID, "err", err)
}
return
}
// Now, select a random index for this slice.
randIndex := mathrand.Intn(len(participatingRollers))
_ = participatingRollers[randIndex]
// TODO: reward winner
return
case ret := <-sess.finishChan:
m.mu.Lock()
sess.info.Rollers[ret.pk].Status = ret.status
+ m.mu.Unlock()
if err := m.orm.SetSessionInfo(sess.info); err != nil {
log.Error("db set session info fail", "pk", ret.pk, "error", err)
}
- m.mu.Unlock()
}
}
}
@@ -393,22 +380,17 @@ func (m *Manager) APIs() []rpc.API {
Service: RollerAPI(m),
Public: true,
},
- {
- Namespace: "debug",
- Public: true,
- Service: RollerDebugAPI(m),
- },
}
}
// StartProofGenerationSession starts a proof generation session
func (m *Manager) StartProofGenerationSession(task *orm.BlockBatch) (success bool) {
- roller := m.selectRoller()
- if roller == nil {
+ if m.GetNumberOfIdleRollers() == 0 {
log.Warn("no idle roller when starting proof generation session", "id", task.ID)
return false
}
log.Info("start proof generation session", "id", task.ID)
defer func() {
if !success {
if err := m.orm.UpdateProvingStatus(task.ID, orm.ProvingTaskUnassigned); err != nil {
@@ -416,11 +398,8 @@ func (m *Manager) StartProofGenerationSession(task *orm.BlockBatch) (success boo
}
}
}()
- if err := m.orm.UpdateProvingStatus(task.ID, orm.ProvingTaskAssigned); err != nil {
- log.Error("failed to update task status", "id", task.ID, "err", err)
- return false
- }
// Get block traces.
blockInfos, err := m.orm.GetBlockInfos(map[string]interface{}{"batch_id": task.ID})
if err != nil {
log.Error(
@@ -430,7 +409,6 @@ func (m *Manager) StartProofGenerationSession(task *orm.BlockBatch) (success boo
)
return false
}
traces := make([]*types.BlockTrace, len(blockInfos))
for i, blockInfo := range blockInfos {
traces[i], err = m.Client.GetBlockTraceByHash(m.ctx, common.HexToHash(blockInfo.Hash))
@@ -445,41 +423,61 @@ func (m *Manager) StartProofGenerationSession(task *orm.BlockBatch) (success boo
}
}
log.Info("roller is picked", "session id", task.ID, "name", roller.Name, "public_key", roller.PublicKey)
// send trace to roller
if !roller.sendTask(task.ID, traces) {
log.Error("send task failed", "roller name", roller.Name, "public_key", roller.PublicKey, "id", task.ID)
// Dispatch task to rollers.
rollers := make(map[string]*orm.RollerStatus)
for i := 0; i < int(m.cfg.RollersPerSession); i++ {
roller := m.selectRoller()
if roller == nil {
break
}
log.Info("roller is picked", "session id", task.ID, "name", roller.Name, "public key", roller.PublicKey)
// send trace to roller
if !roller.sendTask(task.ID, traces) {
log.Error("send task failed", "roller name", roller.Name, "public key", roller.PublicKey, "id", task.ID)
continue
}
rollers[roller.PublicKey] = &orm.RollerStatus{PublicKey: roller.PublicKey, Name: roller.Name, Status: orm.RollerAssigned}
}
// No roller assigned.
if len(rollers) == 0 {
log.Error("no roller assigned", "id", task.ID, "number of idle rollers", m.GetNumberOfIdleRollers())
return false
}
// Update session proving status as assigned.
if err := m.orm.UpdateProvingStatus(task.ID, orm.ProvingTaskAssigned); err != nil {
log.Error("failed to update task status", "id", task.ID, "err", err)
return false
}
- pk := roller.PublicKey
// Create a proof generation session.
- s := &session{
+ sess := &session{
info: &orm.SessionInfo{
- ID: task.ID,
- Rollers: map[string]*orm.RollerStatus{
- pk: {
- PublicKey: pk,
- Name: roller.Name,
- Status: orm.RollerAssigned,
- },
- },
+ ID: task.ID,
+ Rollers: rollers,
StartTimestamp: time.Now().Unix(),
},
finishChan: make(chan rollerProofStatus, proofAndPkBufferSize),
}
// Store session info.
- if err = m.orm.SetSessionInfo(s.info); err != nil {
- log.Error("db set session info fail", "roller name", roller.Name, "public_key", pk, "error", err)
+ if err = m.orm.SetSessionInfo(sess.info); err != nil {
+ log.Error("db set session info fail", "error", err)
+ for _, roller := range sess.info.Rollers {
+ log.Error(
+ "restore roller info for session",
+ "session id", sess.info.ID,
+ "roller name", roller.Name,
+ "public key", roller.PublicKey,
+ "proof status", roller.Status)
+ }
return false
}
m.mu.Lock()
- m.sessions[task.ID] = s
+ m.sessions[task.ID] = sess
m.mu.Unlock()
- go m.CollectProofs(s)
+ go m.CollectProofs(sess)
return true
}
@@ -501,10 +499,6 @@ func (m *Manager) IsRollerIdle(hexPk string) bool {
return true
}
- func (m *Manager) addFailedSession(sess *session, errMsg string) {
- m.failedSessionInfos[sess.info.ID] = newSessionInfo(sess, orm.ProvingTaskFailed, errMsg, true)
- }
// VerifyToken verifies pubkey for token and expiration time
func (m *Manager) VerifyToken(authMsg *message.AuthMsg) (bool, error) {
pubkey, _ := authMsg.PublicKey()
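With rollers-per-session (#215), a proof generation session now fans a task out to up to cfg.RollersPerSession rollers instead of exactly one, tolerating individual send failures as long as at least one roller accepts. A condensed sketch of the dispatch loop above (assignRollers is a hypothetical extraction; in the real code this logic is inline in StartProofGenerationSession):

// assignRollers picks up to n idle rollers, sends each the same traces,
// and returns the set that accepted the task. An empty result means the
// task should stay unassigned.
func assignRollers(m *Manager, taskID string, traces []*types.BlockTrace, n int) map[string]*orm.RollerStatus {
	rollers := make(map[string]*orm.RollerStatus)
	for i := 0; i < n; i++ {
		roller := m.selectRoller()
		if roller == nil {
			break // no idle roller left
		}
		if !roller.sendTask(taskID, traces) {
			continue // this roller's channel is full; try the next one
		}
		rollers[roller.PublicKey] = &orm.RollerStatus{
			PublicKey: roller.PublicKey,
			Name:      roller.Name,
			Status:    orm.RollerAssigned,
		}
	}
	return rollers
}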

View File

@@ -127,7 +127,7 @@ func testFailedHandshake(t *testing.T) {
authMsg := &message.AuthMsg{
Identity: &message.Identity{
Name: name,
- Timestamp: time.Now().UnixNano(),
+ Timestamp: uint32(time.Now().Unix()),
},
}
assert.NoError(t, authMsg.Sign(privkey))
@@ -145,7 +145,7 @@ func testFailedHandshake(t *testing.T) {
authMsg = &message.AuthMsg{
Identity: &message.Identity{
Name: name,
- Timestamp: time.Now().UnixNano(),
+ Timestamp: uint32(time.Now().Unix()),
},
}
assert.NoError(t, authMsg.Sign(privkey))
@@ -318,10 +318,6 @@ func testGracefulRestart(t *testing.T) {
}()
for i := range ids {
- info, err := newRollerManager.GetSessionInfo(ids[i])
- assert.Equal(t, orm.ProvingTaskAssigned.String(), info.Status)
- assert.NoError(t, err)
// at this point, roller haven't submitted
status, err := l2db.GetProvingStatusByID(ids[i])
assert.NoError(t, err)
@@ -419,7 +415,7 @@ func (r *mockRoller) connectToCoordinator() (*client2.Client, ethereum.Subscript
authMsg := &message.AuthMsg{
Identity: &message.Identity{
Name: r.rollerName,
- Timestamp: time.Now().UnixNano(),
+ Timestamp: uint32(time.Now().Unix()),
},
}
_ = authMsg.Sign(r.privKey)

View File

@@ -41,7 +41,7 @@ func (r *rollerNode) sendTask(id string, traces []*types.BlockTrace) bool {
}:
r.TaskIDs.Set(id, struct{}{})
default:
log.Warn("roller channel is full", "roller name", r.Name, "public_key", r.PublicKey)
log.Warn("roller channel is full", "roller name", r.Name, "public key", r.PublicKey)
return false
}
return true
@@ -77,7 +77,7 @@ func (m *Manager) register(pubkey string, identity *message.Identity) (<-chan *m
roller := node.(*rollerNode)
// avoid reconnection too frequently.
if time.Since(roller.registerTime) < 60 {
log.Warn("roller reconnect too frequently", "roller_name", identity.Name, "public_key", pubkey)
log.Warn("roller reconnect too frequently", "roller_name", identity.Name, "public key", pubkey)
return nil, fmt.Errorf("roller reconnect too frequently")
}
// update register time and status

View File

@@ -15,5 +15,5 @@ func TestRunDatabase(t *testing.T) {
// wait result
bridge.ExpectWithTimeout(true, time.Second*3, fmt.Sprintf("db_cli version %s", version.Version))
- bridge.RunApp(false)
+ bridge.RunApp(nil)
}

View File

@@ -14,10 +14,10 @@ libzkp:
cp -r ../common/libzkp/interface ./prover/lib
roller: libzkp ## Build the Roller instance.
- GOBIN=$(PWD)/build/bin go build -ldflags "-X scroll-tech/common/version.ZK_VERSION=${ZK_VERSION}" -o $(PWD)/build/bin/roller ./cmd
+ GOBIN=$(PWD)/build/bin go build -ldflags "-X scroll-tech/common/version.ZkVersion=${ZK_VERSION}" -o $(PWD)/build/bin/roller ./cmd
gpu-roller: libzkp ## Build the GPU Roller instance.
- GOBIN=$(PWD)/build/bin go build -ldflags "-X scroll-tech/common/version.ZK_VERSION=${ZK_VERSION}" -tags gpu -o $(PWD)/build/bin/roller ./cmd
+ GOBIN=$(PWD)/build/bin go build -ldflags "-X scroll-tech/common/version.ZkVersion=${ZK_VERSION}" -tags gpu -o $(PWD)/build/bin/roller ./cmd
mock_roller:
GOBIN=$(PWD)/build/bin go build -tags mock_prover -o $(PWD)/build/bin/roller $(PWD)/cmd

View File

@@ -15,5 +15,5 @@ func TestRunRoller(t *testing.T) {
// wait result
roller.ExpectWithTimeout(true, time.Second*3, fmt.Sprintf("roller version %s", version.Version))
- roller.RunApp(false)
+ roller.RunApp(nil)
}

View File

@@ -5,8 +5,8 @@ import (
"crypto/ecdsa"
"errors"
"fmt"
"math"
"sort"
"strings"
"sync/atomic"
"time"
@@ -29,8 +29,6 @@ import (
var (
// retry connecting to coordinator
retryWait = time.Second * 10
- // net normal close
- errNormalClose = errors.New("use of closed network connection")
)
// Roller contains websocket conn to coordinator, Stack, unix-socket to ipc-prover.
@@ -107,10 +105,16 @@ func (r *Roller) Start() {
// Register registers Roller to the coordinator through Websocket.
func (r *Roller) Register() error {
+ timestamp := time.Now().Unix()
+ if timestamp < 0 || timestamp > math.MaxUint32 {
+ panic("Expected current time to be between the years 1970 and 2106")
+ }
authMsg := &message.AuthMsg{
Identity: &message.Identity{
Name: r.cfg.RollerName,
- Timestamp: time.Now().UnixMilli(),
+ Timestamp: uint32(timestamp),
PublicKey: r.PublicKey(),
Version: version.Version,
},
@@ -188,9 +192,6 @@ func (r *Roller) ProveLoop() {
time.Sleep(time.Second * 3)
continue
}
- if strings.Contains(err.Error(), errNormalClose.Error()) {
- return
- }
log.Error("prove failed", "error", err)
}
}
@@ -256,25 +257,34 @@ func (r *Roller) prove() error {
}
}()
- ok, serr := r.signAndSubmitProof(proofMsg)
- if !ok {
- log.Error("submit proof to coordinator failed", "task ID", proofMsg.ID)
- }
- return serr
+ r.signAndSubmitProof(proofMsg)
+ return nil
}
- func (r *Roller) signAndSubmitProof(msg *message.ProofDetail) (bool, error) {
+ func (r *Roller) signAndSubmitProof(msg *message.ProofDetail) {
authZkProof := &message.ProofMsg{ProofDetail: msg}
if err := authZkProof.Sign(r.priv); err != nil {
- return false, err
+ log.Error("sign proof error", "err", err)
+ return
}
- // When the roller is disconnected from the coordinator,
- // wait until the roller reconnects to the coordinator.
- for atomic.LoadInt64(&r.isDisconnected) == 1 {
- time.Sleep(retryWait)
- }
+ // Retry SubmitProof several times.
+ for i := 0; i < 3; i++ {
+ // When the roller is disconnected from the coordinator,
+ // wait until the roller reconnects to the coordinator.
+ for atomic.LoadInt64(&r.isDisconnected) == 1 {
+ time.Sleep(retryWait)
+ }
+ ok, serr := r.client.SubmitProof(context.Background(), authZkProof)
+ if !ok {
+ log.Error("submit proof to coordinator failed", "task ID", msg.ID)
+ return
+ }
+ if serr == nil {
+ return
+ }
+ log.Error("submit proof to coordinator error", "task ID", msg.ID, "error", serr)
+ }
- return r.client.SubmitProof(context.Background(), authZkProof)
}
// Stop closes the websocket connection.
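Commit 2e3c80c580 changes proof submission from a single attempt into a bounded retry: up to three attempts, each preceded by waiting out any coordinator disconnection, stopping early on success or on an explicit rejection that a retry cannot fix. The same shape as a generic sketch (submitWithRetry is a hypothetical helper; it assumes the file's existing imports and the retryWait constant):

func submitWithRetry(r *Roller, authZkProof *message.ProofMsg, taskID string, maxRetries int) {
	for i := 0; i < maxRetries; i++ {
		// Wait out any disconnection before attempting to submit.
		for atomic.LoadInt64(&r.isDisconnected) == 1 {
			time.Sleep(retryWait)
		}
		ok, serr := r.client.SubmitProof(context.Background(), authZkProof)
		if !ok {
			// Explicit rejection: retrying will not help.
			log.Error("submit proof to coordinator failed", "task ID", taskID)
			return
		}
		if serr == nil {
			return // submitted successfully
		}
		// Transient error: log and try again, up to maxRetries times.
		log.Error("submit proof to coordinator error", "task ID", taskID, "error", serr)
	}
}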

View File

@@ -80,7 +80,8 @@ func free(t *testing.T) {
}
type appAPI interface {
- RunApp(parallel bool)
+ WaitResult(timeout time.Duration, keyword string) bool
+ RunApp(waitResult func() bool)
WaitExit()
ExpectWithTimeout(parallel bool, timeout time.Duration, keyword string)
}
@@ -103,7 +104,7 @@ func runDBCliApp(t *testing.T, option, keyword string) {
// Wait expect result.
app.ExpectWithTimeout(true, time.Second*3, keyword)
- app.RunApp(false)
+ app.RunApp(nil)
}
func runRollerApp(t *testing.T, args ...string) appAPI {

View File

@@ -28,19 +28,16 @@ func testStartProcess(t *testing.T) {
// Start bridge process.
bridgeCmd := runBridgeApp(t)
- bridgeCmd.ExpectWithTimeout(true, time.Second*20, "Start bridge successfully")
- bridgeCmd.RunApp(true)
+ bridgeCmd.RunApp(func() bool { return bridgeCmd.WaitResult(time.Second*20, "Start bridge successfully") })
// Start coordinator process.
coordinatorCmd := runCoordinatorApp(t, "--ws", "--ws.port", "8391")
- coordinatorCmd.ExpectWithTimeout(true, time.Second*20, "Start coordinator successfully")
- coordinatorCmd.RunApp(true)
+ coordinatorCmd.RunApp(func() bool { return coordinatorCmd.WaitResult(time.Second*20, "Start coordinator successfully") })
// Start roller process.
rollerCmd := runRollerApp(t)
- rollerCmd.ExpectWithTimeout(true, time.Second*40, "roller start successfully")
- rollerCmd.ExpectWithTimeout(true, time.Second*60, "register to coordinator successfully!")
- rollerCmd.RunApp(true)
+ rollerCmd.RunApp(func() bool { return rollerCmd.WaitResult(time.Second*40, "roller start successfully") })
rollerCmd.WaitExit()
bridgeCmd.WaitExit()