Skip to content
This repository has been archived by the owner on Nov 15, 2023. It is now read-only.

Use CPU clock timeout for PVF jobs #6282

Merged
merged 23 commits into from
Nov 30, 2022
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
23 commits
Select commit Hold shift + click to select a range
aad7de7
Put in skeleton logic for CPU-time-preparation
mrcnski Nov 10, 2022
c62a8e1
Continue filling in logic for prepare worker CPU time changes
mrcnski Nov 13, 2022
9c68422
Fix compiler errors
mrcnski Nov 13, 2022
9fac3a4
Update lenience factor
mrcnski Nov 14, 2022
9f67150
Fix some clippy lints for PVF module
mrcnski Nov 14, 2022
e34825a
Fix compilation errors
mrcnski Nov 15, 2022
fe139e1
Address some review comments
mrcnski Nov 16, 2022
7b7886c
Add logging
mrcnski Nov 16, 2022
6006fe0
Add another log
mrcnski Nov 16, 2022
ebc9825
Merge branch 'master' into m-cat/pvf-preparation-cpu-time
mrcnski Nov 20, 2022
80d2cf6
Address some review comments; change Mutex to AtomicBool
mrcnski Nov 20, 2022
8e5139f
Refactor handling response bytes
mrcnski Nov 20, 2022
d8add29
Add CPU clock timeout logic for execute jobs
mrcnski Nov 20, 2022
c50a08f
Properly handle AtomicBool flag
mrcnski Nov 20, 2022
bc6172e
Use `Ordering::Relaxed`
mrcnski Nov 20, 2022
eb9372c
Refactor thread coordination logic
mrcnski Nov 21, 2022
6576ea1
Fix bug
mrcnski Nov 22, 2022
ec60713
Add some timing information to execute tests
mrcnski Nov 22, 2022
efd50fe
Merge branch 'master' into m-cat/pvf-preparation-cpu-time
mrcnski Nov 23, 2022
09560ee
Add section about the mitigation to the IG
mrcnski Nov 23, 2022
7c859d6
minor: Change more `Ordering`s to `Relaxed`
mrcnski Nov 25, 2022
fb6c5e9
candidate-validation: Fix build errors
mrcnski Nov 28, 2022
3e98ee6
Merge branch 'master' into m-cat/pvf-preparation-cpu-time
mrcnski Nov 30, 2022
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
Fix bug
  • Loading branch information
mrcnski committed Nov 22, 2022
commit 6576ea12e687dbbe12e5660e22a435df0cf3c777
21 changes: 11 additions & 10 deletions node/core/pvf/src/execute/worker.rs
Original file line number Diff line number Diff line change
Expand Up @@ -90,7 +90,9 @@ pub async fn start_work(
artifact.path.display(),
);

if let Err(error) = send_request(&mut stream, &artifact.path, &validation_params).await {
if let Err(error) =
send_request(&mut stream, &artifact.path, &validation_params, execution_timeout).await
{
gum::warn!(
target: LOG_TARGET,
worker_pid = %pid,
Expand Down Expand Up @@ -170,9 +172,11 @@ async fn send_request(
stream: &mut UnixStream,
artifact_path: &Path,
validation_params: &[u8],
execution_timeout: Duration,
) -> io::Result<()> {
framed_send(stream, path_to_bytes(artifact_path)).await?;
framed_send(stream, validation_params).await
framed_send(stream, validation_params).await?;
framed_send(stream, &execution_timeout.encode()).await
}

async fn recv_request(stream: &mut UnixStream) -> io::Result<(PathBuf, Vec<u8>, Duration)> {
Expand Down Expand Up @@ -266,15 +270,12 @@ pub fn worker_entrypoint(socket_path: &str) {
})
})?;

let response = validate_using_artifact(
&artifact_path,
&params,
&executor,
cpu_time_start,
)
.await;

let lock_result = lock.compare_exchange(false, true, Ordering::Relaxed, Ordering::Relaxed);
let response =
validate_using_artifact(&artifact_path, &params, &executor, cpu_time_start).await;

let lock_result =
lock.compare_exchange(false, true, Ordering::Relaxed, Ordering::Relaxed);
if lock_result.is_err() {
// The other thread is still sending an error response over the socket. Wait on it
// and return.
Expand Down
3 changes: 1 addition & 2 deletions node/core/pvf/src/prepare/worker.rs
Original file line number Diff line number Diff line change
Expand Up @@ -375,8 +375,7 @@ pub fn worker_entrypoint(socket_path: &str) {
"worker: writing artifact to {}",
dest.display(),
);
async_std::fs::write(&dest, &compiled_artifact)
.await?;
async_std::fs::write(&dest, &compiled_artifact).await?;

Ok(cpu_time_elapsed)
},
Expand Down
11 changes: 7 additions & 4 deletions node/core/pvf/tests/it/main.rs
Original file line number Diff line number Diff line change
Expand Up @@ -124,11 +124,14 @@ async fn parallel_execution() {
let start = std::time::Instant::now();
let (_, _) = futures::join!(execute_pvf_future_1, execute_pvf_future_2);

// total time should be < 2 x EXECUTION_TIMEOUT_SEC
const EXECUTION_TIMEOUT_SEC: u64 = 3;
// total time should be < 2 x TEST_EXECUTION_TIMEOUT
let duration = std::time::Instant::now().duration_since(start);
let expected_duration = TEST_EXECUTION_TIMEOUT * 2;
assert!(
std::time::Instant::now().duration_since(start) <
std::time::Duration::from_secs(EXECUTION_TIMEOUT_SEC * 2)
duration < expected_duration,
"Expected duration {}s to be less than {}s",
duration.as_secs(),
expected_duration.as_secs()
);
}

Expand Down