Skip to content
This repository has been archived by the owner on Nov 15, 2023. It is now read-only.

98.6% OF DEVELOPERS CANNOT REVIEW THIS PR! [read more...] #7337

Merged
merged 61 commits into from
Jul 31, 2023
Merged
Show file tree
Hide file tree
Changes from 57 commits
Commits
Show all changes
61 commits
Select commit Hold shift + click to select a range
d2e068d
[WIP] PVF: Split out worker binaries
mrcnski Jun 6, 2023
4ff0a66
Merge branch 'master' into mrcnski/pvf-split-out-worker-binaries
s0me0ne-unkn0wn Jun 8, 2023
5bed726
Address compilation problems and re-design a bit
s0me0ne-unkn0wn Jun 10, 2023
d7a389c
Reorganize once more, fix tests
s0me0ne-unkn0wn Jun 11, 2023
818778c
Reformat with new nightly to make `cargo fmt` test happy
s0me0ne-unkn0wn Jun 11, 2023
f9a9280
Address `clippy` warnings
s0me0ne-unkn0wn Jun 11, 2023
165f116
Merge remote-tracking branch 'origin/master' into mrcnski/pvf-split-o…
s0me0ne-unkn0wn Jun 13, 2023
2f192ea
Merge remote-tracking branch 'origin/master' into mrcnski/pvf-split-o…
s0me0ne-unkn0wn Jun 14, 2023
01b97f8
Merge remote-tracking branch 'origin/master' into mrcnski/pvf-split-o…
s0me0ne-unkn0wn Jun 14, 2023
b5733fa
Add temporary trace to debug zombienet tests
s0me0ne-unkn0wn Jun 14, 2023
235766e
Merge remote-tracking branch 'origin/master' into mrcnski/pvf-split-o…
s0me0ne-unkn0wn Jun 16, 2023
f5ba965
Fix zombienet node upgrade test
s0me0ne-unkn0wn Jun 16, 2023
7079e2f
Fix malus and its CI
s0me0ne-unkn0wn Jun 16, 2023
95e643f
Fix building worker binaries with malus
s0me0ne-unkn0wn Jun 16, 2023
a1c093e
More fixes for malus
s0me0ne-unkn0wn Jun 16, 2023
5382cc7
Merge remote-tracking branch 'origin/master' into mrcnski/pvf-split-o…
s0me0ne-unkn0wn Jun 17, 2023
06de32d
Remove unneeded cli subcommands
s0me0ne-unkn0wn Jun 18, 2023
d7b5a5a
Support placing auxiliary binaries to `/usr/libexec`
s0me0ne-unkn0wn Jun 18, 2023
49475c2
Fix spelling
s0me0ne-unkn0wn Jun 18, 2023
4c72864
Spelling
s0me0ne-unkn0wn Jul 7, 2023
07d876e
Implement review comments (mostly nits)
mrcnski Jul 9, 2023
0da74cd
Merge branch 'master' into mrcnski/pvf-split-out-worker-binaries
mrcnski Jul 9, 2023
126213e
Fix worker node version flag
mrcnski Jul 10, 2023
6640b29
Rework getting the worker paths
mrcnski Jul 10, 2023
633edbc
Address a couple of review comments
mrcnski Jul 11, 2023
41b0a49
Minor restructuring
mrcnski Jul 11, 2023
49d8696
Fix CI error
mrcnski Jul 11, 2023
dc5d6a0
Add tests for worker binaries detection
mrcnski Jul 14, 2023
6ef14fe
Improve tests; try to fix CI
mrcnski Jul 14, 2023
d2bef1f
Move workers module into separate file
mrcnski Jul 16, 2023
3e09438
Try to fix failing test and workers not printing latest version
mrcnski Jul 16, 2023
55365d8
Make a bunch of fixes
mrcnski Jul 17, 2023
751dd04
Rebuild nodes on version change
mrcnski Jul 17, 2023
76c16f3
Fix more issues
mrcnski Jul 18, 2023
a1e21dc
Fix tests
mrcnski Jul 19, 2023
7366c99
Merge remote-tracking branch 'origin/master' into mrcnski/pvf-split-o…
Jul 19, 2023
11bbf59
Pass node version from node into dependencies to avoid recompiles
mrcnski Jul 20, 2023
6244e3f
Some more improvements for smoother tests
mrcnski Jul 20, 2023
6f44e63
Merge remote-tracking branch 'origin/mrcnski/pvf-split-out-worker-bin…
mrcnski Jul 20, 2023
019bd97
Add back rerun to PVF workers
mrcnski Jul 20, 2023
df1117a
Move worker binaries into files in cli crate
mrcnski Jul 21, 2023
cde8dc6
Fix bug (was passing worker version for node version)
mrcnski Jul 23, 2023
98323d2
Move workers out of cli into root src/bin/ dir
mrcnski Jul 24, 2023
ecf0af8
Add some sanity checks for workers to dockerfiles
mrcnski Jul 24, 2023
3f929bb
Update malus
mrcnski Jul 24, 2023
508669c
Try to fix clippy errors
mrcnski Jul 24, 2023
e072517
Merge branch 'master' into mrcnski/pvf-split-out-worker-binaries
mrcnski Jul 24, 2023
432dcf3
Address `cargo run` issue
mrcnski Jul 25, 2023
7407507
Update readme (installation instructions)
mrcnski Jul 25, 2023
0651bf6
Merge branch 'master' into mrcnski/pvf-split-out-worker-binaries
mrcnski Jul 25, 2023
5d9c711
Allow disabling external workers for local/testing setups
mrcnski Jul 25, 2023
1ce0c3e
Revert unnecessary Cargo.lock changes
mrcnski Jul 27, 2023
09f4840
Remove unnecessary build scripts from collators
mrcnski Jul 27, 2023
700ee0d
Merge branch 'master' into mrcnski/pvf-split-out-worker-binaries
mrcnski Jul 27, 2023
8851c20
Add back missing malus commands (should fix failing ZN job)
mrcnski Jul 27, 2023
fd0f018
Some minor fixes
mrcnski Jul 27, 2023
e5771a0
Update Cargo.lock
mrcnski Jul 27, 2023
0a04dd4
Fix some build errors
mrcnski Jul 27, 2023
9f05299
Undo self-contained binaries; cli flag to disable version check
mrcnski Jul 28, 2023
0477550
Try to fix failing job and add some docs for local tests
mrcnski Jul 28, 2023
70cd333
Merge branch 'master' into mrcnski/pvf-split-out-worker-binaries
mrcnski Jul 28, 2023
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
54 changes: 53 additions & 1 deletion Cargo.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

18 changes: 18 additions & 0 deletions Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -2,12 +2,21 @@
name = "polkadot"
path = "src/main.rs"

[[bin]]
name = "polkadot-execute-worker"
path = "src/bin/execute-worker.rs"

[[bin]]
name = "polkadot-prepare-worker"
path = "src/bin/prepare-worker.rs"

[package]
name = "polkadot"
description = "Implementation of a `https://polkadot.network` node in Rust based on the Substrate framework."
license = "GPL-3.0-only"
rust-version = "1.64.0" # workspace properties
readme = "README.md"
default-run = "polkadot"
authors.workspace = true
edition.workspace = true
version.workspace = true
Expand All @@ -28,6 +37,10 @@ polkadot-node-core-pvf = { path = "node/core/pvf" }
polkadot-node-core-pvf-prepare-worker = { path = "node/core/pvf/prepare-worker" }
polkadot-overseer = { path = "node/overseer" }

# Needed for worker binaries.
polkadot-node-core-pvf-common = { path = "node/core/pvf/common" }
polkadot-node-core-pvf-execute-worker = { path = "node/core/pvf/execute-worker" }

[dev-dependencies]
assert_cmd = "2.0.4"
nix = { version = "0.26.1", features = ["signal"] }
Expand All @@ -36,6 +49,9 @@ tokio = "1.24.2"
substrate-rpc-client = { git = "https://github.com/paritytech/substrate", branch = "master" }
polkadot-core-primitives = { path = "core-primitives" }

[build-dependencies]
substrate-build-script-utils = { git = "https://github.com/paritytech/substrate", branch = "master" }

[workspace]
members = [
"cli",
Expand Down Expand Up @@ -226,6 +242,8 @@ license-file = ["LICENSE", "0"]
maintainer-scripts = "scripts/packaging/deb-maintainer-scripts"
assets = [
["target/release/polkadot", "/usr/bin/", "755"],
["target/release/polkadot-prepare-worker", "/usr/lib/polkadot/", "755"],
["target/release/polkadot-execute-worker", "/usr/lib/polkadot/", "755"],
["scripts/packaging/polkadot.service", "/lib/systemd/system/", "644"]
]
conf-files = [
Expand Down
4 changes: 3 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -91,7 +91,9 @@ git checkout <latest tagged release>
cargo build --release
```

Note that compilation is a memory intensive process. We recommend having 4 GiB of physical RAM or swap available (keep in mind that if a build hits swap it tends to be very slow).
**Note:** compilation is a memory intensive process. We recommend having 4 GiB of physical RAM or swap available (keep in mind that if a build hits swap it tends to be very slow).

**Note:** if you want to move the built `polkadot` binary somewhere (e.g. into $PATH) you will also need to move `polkadot-execute-worker` and `polkadot-prepare-worker`. You can let cargo do all this for you by running `cargo install --path .`.

#### Build from Source with Docker

Expand Down
3 changes: 3 additions & 0 deletions node/core/pvf/build.rs → build.rs
Original file line number Diff line number Diff line change
Expand Up @@ -16,4 +16,7 @@

fn main() {
substrate_build_script_utils::generate_cargo_keys();
// For the node/worker version check, make sure we always rebuild the node and binary workers
// when the version changes.
substrate_build_script_utils::rerun_if_git_head_changed();
}
3 changes: 3 additions & 0 deletions cli/build.rs
Original file line number Diff line number Diff line change
Expand Up @@ -19,4 +19,7 @@ fn main() {
println!("cargo:rustc-cfg=build_type=\"{}\"", profile);
}
substrate_build_script_utils::generate_cargo_keys();
// For the node/worker version check, make sure we always rebuild the node when the version
// changes.
substrate_build_script_utils::rerun_if_git_head_changed();
}
15 changes: 15 additions & 0 deletions cli/src/cli.rs
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,10 @@
//! Polkadot CLI library.

use clap::Parser;
use std::path::PathBuf;

/// The version of the node. The passed-in version of the workers should match this.
pub const NODE_VERSION: &'static str = env!("SUBSTRATE_CLI_IMPL_VERSION");

#[allow(missing_docs)]
#[derive(Debug, Parser)]
Expand Down Expand Up @@ -148,6 +152,17 @@ pub struct RunCmd {
/// **Dangerous!** Do not touch unless explicitly adviced to.
#[arg(long)]
pub overseer_channel_capacity_override: Option<usize>,

/// Path to the directory where auxiliary worker binaries reside. If not specified, the main
/// binary's directory is searched first, then `/usr/lib/polkadot` is searched. TESTING ONLY: if
/// the path points to an executable rather then directory, that executable is used both as
/// preparation and execution worker.
#[arg(long, value_name = "PATH")]
pub workers_path: Option<PathBuf>,

/// TESTING ONLY: don't use secure external PVF worker binaries.
#[arg(long, hide = true)]
pub dont_use_external_workers: bool,
}

#[allow(missing_docs)]
Expand Down
60 changes: 41 additions & 19 deletions cli/src/command.rs
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@
// You should have received a copy of the GNU General Public License
// along with Polkadot. If not, see <http://www.gnu.org/licenses/>.

use crate::cli::{Cli, Subcommand};
use crate::cli::{Cli, Subcommand, NODE_VERSION};
use frame_benchmarking_cli::{BenchmarkCmd, ExtrinsicFactory, SUBSTRATE_REFERENCE_HARDWARE};
use futures::future::TryFutureExt;
use log::info;
Expand Down Expand Up @@ -55,7 +55,7 @@ impl SubstrateCli for Cli {
}

fn impl_version() -> String {
env!("SUBSTRATE_CLI_IMPL_VERSION").into()
NODE_VERSION.into()
}

fn description() -> String {
Expand Down Expand Up @@ -222,15 +222,23 @@ pub fn run_node(
run: Cli,
overseer_gen: impl service::OverseerGen,
malus_finality_delay: Option<u32>,
dont_use_external_workers: bool,
) -> Result<()> {
run_node_inner(run, overseer_gen, malus_finality_delay, |_logger_builder, _config| {})
run_node_inner(
run,
overseer_gen,
malus_finality_delay,
|_logger_builder, _config| {},
dont_use_external_workers,
)
}

fn run_node_inner<F>(
cli: Cli,
overseer_gen: impl service::OverseerGen,
maybe_malus_finality_delay: Option<u32>,
logger_hook: F,
dont_use_external_workers: bool,
) -> Result<()>
where
F: FnOnce(&mut sc_cli::LoggerBuilder, &sc_service::Configuration),
Expand Down Expand Up @@ -283,16 +291,24 @@ where
let database_source = config.database.clone();
let task_manager = service::build_full(
config,
service::IsCollator::No,
grandpa_pause,
enable_beefy,
jaeger_agent,
None,
false,
overseer_gen,
cli.run.overseer_channel_capacity_override,
maybe_malus_finality_delay,
hwbench,
service::NewFullParams {
is_collator: service::IsCollator::No,
grandpa_pause,
enable_beefy,
jaeger_agent,
telemetry_worker_handle: None,
node_version: Some(NODE_VERSION.to_string()),
workers_path: cli.run.workers_path,
workers_names: None,
dont_use_external_workers,
overseer_enable_anyways: false,
overseer_gen,
overseer_message_channel_capacity_override: cli
.run
.overseer_channel_capacity_override,
malus_finality_delay: maybe_malus_finality_delay,
hwbench,
},
)
.map(|full| full.task_manager)?;

Expand Down Expand Up @@ -335,12 +351,16 @@ pub fn run() -> Result<()> {
}

match &cli.subcommand {
None => run_node_inner(
cli,
service::RealOverseerGen,
None,
polkadot_node_metrics::logger_hook(),
),
None => {
let dont_use_external_workers = cli.run.dont_use_external_workers;
run_node_inner(
cli,
service::RealOverseerGen,
None,
polkadot_node_metrics::logger_hook(),
dont_use_external_workers,
)
},
Some(Subcommand::BuildSpec(cmd)) => {
let runner = cli.create_runner(cmd)?;
Ok(runner.sync_run(|config| cmd.run(config.chain_spec, config.network))?)
Expand Down Expand Up @@ -436,6 +456,7 @@ pub fn run() -> Result<()> {
{
polkadot_node_core_pvf_prepare_worker::worker_entrypoint(
&cmd.socket_path,
Some(NODE_VERSION),
Some(&cmd.node_impl_version),
);
Ok(())
Expand All @@ -458,6 +479,7 @@ pub fn run() -> Result<()> {
{
polkadot_node_core_pvf_execute_worker::worker_entrypoint(
&cmd.socket_path,
Some(NODE_VERSION),
Some(&cmd.node_impl_version),
);
Ok(())
Expand Down
31 changes: 16 additions & 15 deletions node/core/candidate-validation/src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -93,9 +93,12 @@ const DEFAULT_APPROVAL_EXECUTION_TIMEOUT: Duration = Duration::from_secs(12);
pub struct Config {
/// The path where candidate validation can store compiled artifacts for PVFs.
pub artifacts_cache_path: PathBuf,
/// The path to the executable which can be used for spawning PVF compilation & validation
/// workers.
pub program_path: PathBuf,
/// The version of the node. `None` can be passed to skip the version check (only for tests).
pub node_version: Option<String>,
/// Path to the preparation worker binary
pub prep_worker_path: PathBuf,
/// Path to the execution worker binary
pub exec_worker_path: PathBuf,
}

/// The candidate validation subsystem.
Expand Down Expand Up @@ -124,15 +127,9 @@ impl CandidateValidationSubsystem {
#[overseer::subsystem(CandidateValidation, error=SubsystemError, prefix=self::overseer)]
impl<Context> CandidateValidationSubsystem {
fn start(self, ctx: Context) -> SpawnedSubsystem {
let future = run(
ctx,
self.metrics,
self.pvf_metrics,
self.config.artifacts_cache_path,
self.config.program_path,
)
.map_err(|e| SubsystemError::with_origin("candidate-validation", e))
.boxed();
let future = run(ctx, self.metrics, self.pvf_metrics, self.config)
.map_err(|e| SubsystemError::with_origin("candidate-validation", e))
.boxed();
SpawnedSubsystem { name: "candidate-validation-subsystem", future }
}
}
Expand All @@ -142,11 +139,15 @@ async fn run<Context>(
mut ctx: Context,
metrics: Metrics,
pvf_metrics: polkadot_node_core_pvf::Metrics,
cache_path: PathBuf,
program_path: PathBuf,
Config { artifacts_cache_path, node_version, prep_worker_path, exec_worker_path }: Config,
) -> SubsystemResult<()> {
let (validation_host, task) = polkadot_node_core_pvf::start(
polkadot_node_core_pvf::Config::new(cache_path, program_path),
polkadot_node_core_pvf::Config::new(
artifacts_cache_path,
node_version,
prep_worker_path,
exec_worker_path,
),
pvf_metrics,
);
ctx.spawn_blocking("pvf-validation-host", task.boxed())?;
Expand Down
3 changes: 0 additions & 3 deletions node/core/pvf/common/Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,3 @@ landlock = "0.2.0"
[dev-dependencies]
assert_matches = "1.4.0"
tempfile = "3.3.0"

[build-dependencies]
substrate-build-script-utils = { git = "https://github.com/paritytech/substrate", branch = "master" }
Loading