node.go 13.3 KB
Newer Older
1 2 3 4
package node

import (
	"context"
5
	"errors"
6 7 8
	"fmt"
	"time"

9
	"github.com/hashicorp/go-multierror"
10
	"github.com/libp2p/go-libp2p/core/peer"
11

12 13 14 15
	"github.com/ethereum/go-ethereum"
	"github.com/ethereum/go-ethereum/event"
	"github.com/ethereum/go-ethereum/log"

16
	"github.com/ethereum-optimism/optimism/op-node/client"
17
	"github.com/ethereum-optimism/optimism/op-node/eth"
18 19
	"github.com/ethereum-optimism/optimism/op-node/metrics"
	"github.com/ethereum-optimism/optimism/op-node/p2p"
20
	"github.com/ethereum-optimism/optimism/op-node/rollup/driver"
21
	"github.com/ethereum-optimism/optimism/op-node/sources"
22 23 24 25 26
)

type OpNode struct {
	log        log.Logger
	appVersion string
27
	metrics    *metrics.Metrics
28 29 30 31 32 33 34 35 36 37 38 39

	l1HeadsSub     ethereum.Subscription // Subscription to get L1 heads (automatically re-subscribes on error)
	l1SafeSub      ethereum.Subscription // Subscription to get L1 safe blocks, a.k.a. justified data (polling)
	l1FinalizedSub ethereum.Subscription // Subscription to get L1 safe blocks, a.k.a. justified data (polling)

	l1Source  *sources.L1Client     // L1 Client to fetch data from
	l2Driver  *driver.Driver        // L2 Engine to Sync
	l2Source  *sources.EngineClient // L2 Execution Engine RPC bindings
	server    *rpcServer            // RPC server hosting the rollup-node API
	p2pNode   *p2p.NodeP2P          // P2P node functionality
	p2pSigner p2p.Signer            // p2p gogssip application messages will be signed with this signer
	tracer    Tracer                // tracer to get events for testing/debugging
40
	runCfg    *RuntimeConfig        // runtime configurables
41 42 43 44 45 46 47 48 49 50

	// some resources cannot be stopped directly, like the p2p gossipsub router (not our design),
	// and depend on this ctx to be closed.
	resourcesCtx   context.Context
	resourcesClose context.CancelFunc
}

// The OpNode handles incoming gossip: this is a compile-time assertion that
// *OpNode can be used as a p2p.GossipIn.
var _ p2p.GossipIn = (*OpNode)(nil)

51
func New(ctx context.Context, cfg *Config, log log.Logger, snapshotLog log.Logger, appVersion string, m *metrics.Metrics) (*OpNode, error) {
52 53 54 55 56 57 58
	if err := cfg.Check(); err != nil {
		return nil, err
	}

	n := &OpNode{
		log:        log,
		appVersion: appVersion,
59
		metrics:    m,
60 61 62 63 64 65
	}
	// not a context leak, gossipsub is closed with a context.
	n.resourcesCtx, n.resourcesClose = context.WithCancel(context.Background())

	err := n.init(ctx, cfg, snapshotLog)
	if err != nil {
66
		log.Error("Error initializing the rollup node", "err", err)
67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82
		// ensure we always close the node resources if we fail to initialize the node.
		if closeErr := n.Close(); closeErr != nil {
			return nil, multierror.Append(err, closeErr)
		}
		return nil, err
	}
	return n, nil
}

func (n *OpNode) init(ctx context.Context, cfg *Config, snapshotLog log.Logger) error {
	if err := n.initTracer(ctx, cfg); err != nil {
		return err
	}
	if err := n.initL1(ctx, cfg); err != nil {
		return err
	}
83 84 85
	if err := n.initRuntimeConfig(ctx, cfg); err != nil {
		return err
	}
86
	if err := n.initL2(ctx, cfg, snapshotLog); err != nil {
87 88 89 90 91 92 93 94 95 96 97 98
		return err
	}
	if err := n.initP2PSigner(ctx, cfg); err != nil {
		return err
	}
	if err := n.initP2P(ctx, cfg); err != nil {
		return err
	}
	// Only expose the server at the end, ensuring all RPC backend components are initialized.
	if err := n.initRPCServer(ctx, cfg); err != nil {
		return err
	}
99 100 101
	if err := n.initMetricsServer(ctx, cfg); err != nil {
		return err
	}
102 103 104 105 106 107 108 109 110 111 112 113 114
	return nil
}

// initTracer installs the tracer supplied in cfg, or a no-op tracer when the
// config does not provide one. It always returns nil.
func (n *OpNode) initTracer(ctx context.Context, cfg *Config) error {
	if cfg.Tracer == nil {
		n.tracer = new(noOpTracer)
		return nil
	}
	n.tracer = cfg.Tracer
	return nil
}

func (n *OpNode) initL1(ctx context.Context, cfg *Config) error {
115
	l1Node, trustRPC, rpcProvKind, err := cfg.L1.Setup(ctx, n.log)
116
	if err != nil {
117
		return fmt.Errorf("failed to get L1 RPC client: %w", err)
118 119
	}

120 121
	n.l1Source, err = sources.NewL1Client(
		client.NewInstrumentedRPC(l1Node, n.metrics), n.log, n.metrics.L1SourceCache,
122
		sources.L1ClientDefaultConfig(&cfg.Rollup, trustRPC, rpcProvKind))
123
	if err != nil {
124
		return fmt.Errorf("failed to create L1 source: %w", err)
125 126
	}

Andreas Bigger's avatar
Andreas Bigger committed
127
	if err := cfg.Rollup.ValidateL1Config(ctx, n.l1Source); err != nil {
128
		return err
129 130
	}

131 132 133 134 135 136 137 138 139 140 141 142 143 144
	// Keep subscribed to the L1 heads, which keeps the L1 maintainer pointing to the best headers to sync
	n.l1HeadsSub = event.ResubscribeErr(time.Second*10, func(ctx context.Context, err error) (event.Subscription, error) {
		if err != nil {
			n.log.Warn("resubscribing after failed L1 subscription", "err", err)
		}
		return eth.WatchHeadChanges(n.resourcesCtx, n.l1Source, n.OnNewL1Head)
	})
	go func() {
		err, ok := <-n.l1HeadsSub.Err()
		if !ok {
			return
		}
		n.log.Error("l1 heads subscription error", "err", err)
	}()
145 146 147 148 149 150 151

	// Poll for the safe L1 block and finalized block,
	// which only change once per epoch at most and may be delayed.
	n.l1SafeSub = eth.PollBlockChanges(n.resourcesCtx, n.log, n.l1Source, n.OnNewL1Safe, eth.Safe,
		cfg.L1EpochPollInterval, time.Second*10)
	n.l1FinalizedSub = eth.PollBlockChanges(n.resourcesCtx, n.log, n.l1Source, n.OnNewL1Finalized, eth.Finalized,
		cfg.L1EpochPollInterval, time.Second*10)
152 153 154
	return nil
}

155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181
// initRuntimeConfig creates the runtime config and tries to load it at the
// current L1 head. Each attempt fetches the L1 head and then loads the config,
// both with their own timeout; a failed attempt is logged and retried. An
// error is returned only after all attempts have failed.
func (n *OpNode) initRuntimeConfig(ctx context.Context, cfg *Config) error {
	const (
		maxAttempts = 5
		callTimeout = time.Second * 10
	)

	n.runCfg = NewRuntimeConfig(n.log, n.l1Source, &cfg.Rollup)

	// tryLoad performs a single attempt and reports whether it succeeded.
	tryLoad := func() bool {
		headCtx, headCancel := context.WithTimeout(ctx, callTimeout)
		l1Head, err := n.l1Source.L1BlockRefByLabel(headCtx, eth.Unsafe)
		headCancel()
		if err != nil {
			n.log.Error("failed to fetch L1 head for runtime config initialization", "err", err)
			return false
		}

		loadCtx, loadCancel := context.WithTimeout(ctx, callTimeout)
		err = n.runCfg.Load(loadCtx, l1Head)
		loadCancel()
		if err != nil {
			n.log.Error("failed to fetch runtime config data", "err", err)
			return false
		}
		return true
	}

	for attempt := 0; attempt < maxAttempts; attempt++ {
		if tryLoad() {
			return nil
		}
	}
	return errors.New("failed to load runtime configuration repeatedly")
}

182 183 184 185 186
func (n *OpNode) initL2(ctx context.Context, cfg *Config, snapshotLog log.Logger) error {
	rpcClient, err := cfg.L2.Setup(ctx, n.log)
	if err != nil {
		return fmt.Errorf("failed to setup L2 execution-engine RPC client: %w", err)
	}
187 188 189 190 191

	n.l2Source, err = sources.NewEngineClient(
		client.NewInstrumentedRPC(rpcClient, n.metrics), n.log, n.metrics.L2SourceCache,
		sources.EngineClientDefaultConfig(&cfg.Rollup),
	)
192
	if err != nil {
193
		return fmt.Errorf("failed to create Engine client: %w", err)
194 195
	}

Andreas Bigger's avatar
Andreas Bigger committed
196
	if err := cfg.Rollup.ValidateL2Config(ctx, n.l2Source); err != nil {
197
		return err
198 199
	}

clabby's avatar
clabby committed
200
	var syncClient *sources.SyncClient
clabby's avatar
clabby committed
201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217
	// If the L2 sync config is present, use it to create a sync client
	if cfg.L2Sync != nil {
		if err := cfg.L2Sync.Check(); err != nil {
			log.Info("L2 sync config is not present, skipping L2 sync client setup", "err", err)
		} else {
			rpcSyncClient, err := cfg.L2Sync.Setup(ctx, n.log)
			if err != nil {
				return fmt.Errorf("failed to setup L2 execution-engine RPC client for backup sync: %w", err)
			}

			// The sync client's RPC is always trusted
			config := sources.SyncClientDefaultConfig(&cfg.Rollup, true)

			syncClient, err = sources.NewSyncClient(n.OnUnsafeL2Payload, rpcSyncClient, n.log, n.metrics.L2SourceCache, config)
			if err != nil {
				return fmt.Errorf("failed to create sync client: %w", err)
			}
clabby's avatar
clabby committed
218 219 220 221
		}
	}

	n.l2Driver = driver.NewDriver(&cfg.Driver, &cfg.Rollup, n.l2Source, n.l1Source, syncClient, n, n.log, snapshotLog, n.metrics)
222 223 224 225 226

	return nil
}

func (n *OpNode) initRPCServer(ctx context.Context, cfg *Config) error {
227
	server, err := newRPCServer(ctx, &cfg.RPC, &cfg.Rollup, n.l2Source.L2Client, n.l2Driver, n.log, n.appVersion, n.metrics)
228 229 230 231
	if err != nil {
		return err
	}
	if n.p2pNode != nil {
232
		server.EnableP2P(p2p.NewP2PAPIBackend(n.p2pNode, n.log, n.metrics))
233
	}
234
	if cfg.RPC.EnableAdmin {
235
		server.EnableAdminAPI(NewAdminAPI(n.l2Driver, n.metrics))
Michael de Hoog's avatar
Michael de Hoog committed
236
		n.log.Info("Admin RPC enabled")
237
	}
238
	n.log.Info("Starting JSON-RPC server")
239
	if err := server.Start(); err != nil {
240 241
		return fmt.Errorf("unable to start RPC server: %w", err)
	}
242
	n.server = server
243 244 245
	return nil
}

246 247 248 249 250 251 252 253 254 255 256 257 258 259
// initMetricsServer starts the metrics server in a background goroutine when
// metrics are enabled in cfg; otherwise it only logs that metrics are disabled.
// It always returns nil: an error returned by the metrics server is reported
// from the goroutine at critical level through the node's logger.
func (n *OpNode) initMetricsServer(ctx context.Context, cfg *Config) error {
	if !cfg.Metrics.Enabled {
		n.log.Info("metrics disabled")
		return nil
	}
	n.log.Info("starting metrics server", "addr", cfg.Metrics.ListenAddr, "port", cfg.Metrics.ListenPort)
	go func() {
		if err := n.metrics.Serve(ctx, cfg.Metrics.ListenAddr, cfg.Metrics.ListenPort); err != nil {
			// Use the node's logger rather than the package-level one, consistent with the rest of the node.
			n.log.Crit("error starting metrics server", "err", err)
		}
	}()
	return nil
}

260 261
func (n *OpNode) initP2P(ctx context.Context, cfg *Config) error {
	if cfg.P2P != nil {
262
		p2pNode, err := p2p.NewNodeP2P(n.resourcesCtx, &cfg.Rollup, n.log, cfg.P2P, n, n.runCfg, n.metrics)
263
		if err != nil || p2pNode == nil {
264 265 266
			return err
		}
		n.p2pNode = p2pNode
267 268 269
		if n.p2pNode.Dv5Udp() != nil {
			go n.p2pNode.DiscoveryProcess(n.resourcesCtx, n.log, &cfg.Rollup, cfg.P2P.TargetPeers())
		}
270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285
	}
	return nil
}

// initP2PSigner sets up the optional P2P signer. Without a signer config it
// does nothing. Otherwise the result of the signer setup is stored on the
// node and the setup error, if any, is returned.
func (n *OpNode) initP2PSigner(ctx context.Context, cfg *Config) error {
	// the p2p signer setup is optional
	if cfg.P2PSigner == nil {
		return nil
	}
	// the signer may still be nil, the signer setup may not create any signer, the signer is optional
	signer, err := cfg.P2PSigner.SetupSigner(ctx)
	n.p2pSigner = signer
	return err
}

func (n *OpNode) Start(ctx context.Context) error {
286
	n.log.Info("Starting execution engine driver")
clabby's avatar
clabby committed
287

288
	// start driving engine: sync blocks by deriving them from L1 and driving them into the engine
clabby's avatar
clabby committed
289
	if err := n.l2Driver.Start(); err != nil {
290 291
		n.log.Error("Could not start a rollup node", "err", err)
		return err
292 293
	}

clabby's avatar
clabby committed
294 295
	// If the backup unsafe sync client is enabled, start its event loop
	if n.l2Driver.L2SyncCl != nil {
clabby's avatar
clabby committed
296
		if err := n.l2Driver.L2SyncCl.Start(); err != nil {
clabby's avatar
clabby committed
297 298 299 300 301
			n.log.Error("Could not start the backup sync client", "err", err)
			return err
		}
	}

302 303 304 305 306 307
	return nil
}

func (n *OpNode) OnNewL1Head(ctx context.Context, sig eth.L1BlockRef) {
	n.tracer.OnNewL1Head(ctx, sig)

308 309 310
	if n.l2Driver == nil {
		return
	}
311 312 313
	// Pass on the event to the L2 Engine
	ctx, cancel := context.WithTimeout(ctx, time.Second*10)
	defer cancel()
314
	if err := n.l2Driver.OnL1Head(ctx, sig); err != nil {
315
		n.log.Warn("failed to notify engine driver of L1 head change", "err", err)
316
	}
317 318 319
}

func (n *OpNode) OnNewL1Safe(ctx context.Context, sig eth.L1BlockRef) {
320 321 322
	if n.l2Driver == nil {
		return
	}
323 324 325 326 327 328 329
	// Pass on the event to the L2 Engine
	ctx, cancel := context.WithTimeout(ctx, time.Second*10)
	defer cancel()
	if err := n.l2Driver.OnL1Safe(ctx, sig); err != nil {
		n.log.Warn("failed to notify engine driver of L1 safe block change", "err", err)
	}
}
330

331
func (n *OpNode) OnNewL1Finalized(ctx context.Context, sig eth.L1BlockRef) {
332 333 334
	if n.l2Driver == nil {
		return
	}
335 336 337 338 339 340
	// Pass on the event to the L2 Engine
	ctx, cancel := context.WithTimeout(ctx, time.Second*10)
	defer cancel()
	if err := n.l2Driver.OnL1Finalized(ctx, sig); err != nil {
		n.log.Warn("failed to notify engine driver of L1 finalized block change", "err", err)
	}
341 342
}

343
func (n *OpNode) PublishL2Payload(ctx context.Context, payload *eth.ExecutionPayload) error {
344 345 346 347 348 349 350 351 352 353 354 355 356 357
	n.tracer.OnPublishL2Payload(ctx, payload)

	// publish to p2p, if we are running p2p at all
	if n.p2pNode != nil {
		if n.p2pSigner == nil {
			return fmt.Errorf("node has no p2p signer, payload %s cannot be published", payload.ID())
		}
		n.log.Info("Publishing signed execution payload on p2p", "id", payload.ID())
		return n.p2pNode.GossipOut().PublishL2Payload(ctx, payload, n.p2pSigner)
	}
	// if p2p is not enabled then we just don't publish the payload
	return nil
}

358
func (n *OpNode) OnUnsafeL2Payload(ctx context.Context, from peer.ID, payload *eth.ExecutionPayload) error {
359 360 361 362 363 364 365 366 367
	// ignore if it's from ourselves
	if n.p2pNode != nil && from == n.p2pNode.Host().ID() {
		return nil
	}

	n.tracer.OnUnsafeL2Payload(ctx, from, payload)

	n.log.Info("Received signed execution payload from p2p", "id", payload.ID(), "peer", from)

368 369 370
	// Pass on the event to the L2 Engine
	ctx, cancel := context.WithTimeout(ctx, time.Second*30)
	defer cancel()
371
	if err := n.l2Driver.OnUnsafeL2Payload(ctx, payload); err != nil {
372
		n.log.Warn("failed to notify engine driver of new L2 payload", "err", err, "id", payload.ID())
373
	}
374

375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390
	return nil
}

// P2P returns the node's P2P functionality, or nil when the node runs without P2P.
func (n *OpNode) P2P() p2p.Node {
	// Return a literal nil: wrapping the nil *p2p.NodeP2P in the p2p.Node
	// interface would give callers a non-nil value that fails a `!= nil` check.
	if n.p2pNode == nil {
		return nil
	}
	return n.p2pNode
}

// Close closes all resources.
func (n *OpNode) Close() error {
	var result *multierror.Error

	if n.server != nil {
		n.server.Stop()
	}
	if n.p2pNode != nil {
		if err := n.p2pNode.Close(); err != nil {
391
			result = multierror.Append(result, fmt.Errorf("failed to close p2p node: %w", err))
392 393 394 395
		}
	}
	if n.p2pSigner != nil {
		if err := n.p2pSigner.Close(); err != nil {
396
			result = multierror.Append(result, fmt.Errorf("failed to close p2p signer: %w", err))
397 398 399 400 401 402 403 404 405 406 407 408
		}
	}

	if n.resourcesClose != nil {
		n.resourcesClose()
	}

	// stop L1 heads feed
	if n.l1HeadsSub != nil {
		n.l1HeadsSub.Unsubscribe()
	}

409 410 411
	// close L2 driver
	if n.l2Driver != nil {
		if err := n.l2Driver.Close(); err != nil {
412
			result = multierror.Append(result, fmt.Errorf("failed to close L2 engine driver cleanly: %w", err))
413
		}
clabby's avatar
clabby committed
414 415 416 417 418 419 420

		// If the L2 sync client is present & running, close it.
		if n.l2Driver.L2SyncCl != nil {
			if err := n.l2Driver.L2SyncCl.Close(); err != nil {
				result = multierror.Append(result, fmt.Errorf("failed to close L2 engine backup sync client cleanly: %w", err))
			}
		}
421
	}
422

423 424 425
	// close L2 engine RPC client
	if n.l2Source != nil {
		n.l2Source.Close()
426
	}
427

428 429 430 431 432 433
	// close L1 data source
	if n.l1Source != nil {
		n.l1Source.Close()
	}
	return result.ErrorOrNil()
}
434 435 436 437 438 439 440 441

// ListenAddr returns the listen address of the RPC server in string form.
// It reads n.server, so the RPC server must have been initialized.
func (n *OpNode) ListenAddr() string {
	addr := n.server.listenAddr
	return addr.String()
}

// HTTPEndpoint returns the RPC server's listen address prefixed with "http://".
func (n *OpNode) HTTPEndpoint() string {
	return "http://" + n.ListenAddr()
}