From 89c1269fd163f4aa38b1ae475ce2b780bd229d43 Mon Sep 17 00:00:00 2001 From: Ted Kaminski Date: Thu, 14 Jul 2022 17:07:55 -0500 Subject: [PATCH] Revise first steps tutorial (#1330) --- docs/src/tutorial-first-steps.md | 96 ++++++++++++------- docs/src/tutorial-kinds-of-failure.md | 4 +- ....expected => check_estimate_size.expected} | 0 .../first-steps-v1/src/{main.rs => lib.rs} | 2 +- .../first-steps-v2/src/{main.rs => lib.rs} | 2 +- .../{main.expected => will_fail.expected} | 0 6 files changed, 66 insertions(+), 38 deletions(-) rename docs/src/tutorial/first-steps-v1/{main.expected => check_estimate_size.expected} (100%) rename docs/src/tutorial/first-steps-v1/src/{main.rs => lib.rs} (97%) rename docs/src/tutorial/first-steps-v2/src/{main.rs => lib.rs} (98%) rename docs/src/tutorial/first-steps-v2/{main.expected => will_fail.expected} (100%) diff --git a/docs/src/tutorial-first-steps.md b/docs/src/tutorial-first-steps.md index b2efa9c5b8b0c..42520b33d2a28 100644 --- a/docs/src/tutorial-first-steps.md +++ b/docs/src/tutorial-first-steps.md @@ -2,12 +2,12 @@ Kani is unlike the testing tools you may already be familiar with. Much of testing is concerned with thinking of new corner cases that need to be covered. -With Kani, all the corner cases are covered from the start, and the new concern is narrowing down the scope to something manageable for the checker. +With Kani, all the corner cases are covered from the start, and the new concern is narrowing down the scope to something manageable for the verifier. Consider this first program (which can be found under [`first-steps-v1`](https://github.com/model-checking/kani/tree/main/docs/src/tutorial/first-steps-v1/)): ```rust -{{#include tutorial/first-steps-v1/src/main.rs:code}} +{{#include tutorial/first-steps-v1/src/lib.rs:code}} ``` Think about the test harness you would need to write to test this function. @@ -18,7 +18,7 @@ And if this function was more complicated—for example, if some of the branches We can try to property test a function like this, but if we're naive about it (and consider all possible `u32` inputs), then it's unlikely we'll ever find the bug. ```rust -{{#include tutorial/first-steps-v1/src/main.rs:proptest}} +{{#include tutorial/first-steps-v1/src/lib.rs:proptest}} ``` ``` @@ -29,10 +29,11 @@ test tests::doesnt_crash ... ok There's only 1 in 4 billion inputs that fail, so it's vanishingly unlikely the property test will find it, even with a million samples. -With Kani, however, we can use `kani::any()` to represent all possible `u32` values: +Let's write a Kani _proof harness_ for `estimate_size`. +This is a lot like a test harness, but now we can use `kani::any()` to represent all possible `u32` values: ```rust -{{#include tutorial/first-steps-v1/src/main.rs:kani}} +{{#include tutorial/first-steps-v1/src/lib.rs:kani}} ``` ``` @@ -50,22 +51,33 @@ VERIFICATION:- FAILED Kani has immediately found a failure. Notably, we haven't had to write explicit assertions in our proof harness: by default, Kani will find a host of erroneous conditions which include a reachable call to `panic` or a failing `assert`. +If Kani had run successfully on this harness, this amounts to a mathematical proof that there is no input that could cause a panic in `estimate_size`. ### Getting a trace By default, Kani only reports failures, not how the failure happened. -This is because, in its full generality, understanding how a failure happened requires exploring a full (potentially large) execution trace. -Here, we've just got some nondeterministic inputs up front, but that's something of a special case that has a "simpler" explanation (just the choice of nondeterministic input). +In this running example, it seems obvious what we're interested in (the value of `x` that caused the failure) because we just have one unknown input at the start (similar to the property test), but that's kind of a special case. +In general, understanding how a failure happened requires exploring a full (potentially large) _execution trace_. -To see traces, run: +An execution trace is a record of exactly how a failure can occur. +Nondeterminism (like a call to `kani::any()`, which could return any value) can appear in the middle of its execution. +A trace is a record of exactly how execution proceeded, including concrete choices (like `1023`) for all of these nondeterministic values. + +To get a trace for a failing check in Kani, run: ``` -kani --visualize src/main.rs +cargo kani --visualize ``` -This command runs Kani and generates the HTML report in `report-main/html/index.html`. +This command runs Kani and generates an HTML report that includes a trace. Open the report with your preferred browser. -From this report, we can find the trace of the failure and filter through it to find the relevant line (at present time, an unfortunate amount of generated code is present in the trace): +Under the "Errors" heading, click on the "trace" link to find the trace for this failure. + +From this trace report, we can filter through it to find relevant lines. +A good rule of thumb is to search for either `kani::any()` or assignments to variables you're interested in. +At present time, an unfortunate amount of generated code is present in the trace. +This code isn't a part of the Rust code you wrote, but is an internal implementation detail of how Kani runs proof harnesses. +Still, searching for `kani::any()` quickly finds us these lines: ``` let x: u32 = kani::any(); @@ -73,8 +85,8 @@ x = 1023u ``` Here we're seeing the line of code and the value assigned in this particular trace. -Like property testing, this is just one example of a failure. -To find more, we'd presumably fix this issue and then re-run Kani. +Like property testing, this is just one **example** of a failure. +To proceed, we recommend fixing the code to avoid this particular issue and then re-running Kani to see if you find more issues. ### Exercise: Try other failures @@ -106,14 +118,14 @@ But Kani still catches the issue: [...] RESULTS: [...] -Check 2: foo.pointer_dereference.1 +Check 2: estimate_size.pointer_dereference.1 - Status: FAILURE - Description: "dereference failure: pointer NULL" [...] VERIFICATION:- FAILED ``` -**Can you find an example where the Rust compiler will not complain, and Kani will?** +**Exercise: Can you find an example where the Rust compiler will not complain, and Kani will?**
Click to show one possible answer @@ -127,11 +139,11 @@ Overflow (in addition, multiplication or, in this case, [bit-shifting by too muc ``` RESULTS: [...] -Check 3: foo.assertion.1 +Check 1: estimate_size.assertion.1 - Status: FAILURE - Description: "attempt to shift left with overflow" -Check 4: foo.undefined-shift.1 +Check 3: estimate_size.undefined-shift.1 - Status: FAILURE - Description: "shift distance too large" [...] @@ -142,38 +154,43 @@ VERIFICATION:- FAILED ## Assertions, Assumptions, and Harnesses -It seems a bit odd that we can take billions of inputs when our function only handles up to a few thousand. -Let's encode this fact about our function by asserting some reasonable bound on our input, after we've fixed our bug (code available under -[`first-steps-v2`](https://github.com/model-checking/kani/tree/main/docs/src/tutorial/first-steps-v2/)): +It seems a bit odd that our example function is tested against billions of possible inputs, when it really only seems to be designed to handle a few thousand. +Let's encode this fact about our function by asserting some reasonable upper bound on our input, after we've fixed our bug. +(New code available under [`first-steps-v2`](https://github.com/model-checking/kani/tree/main/docs/src/tutorial/first-steps-v2/)): ```rust -{{#include tutorial/first-steps-v2/src/main.rs:code}} +{{#include tutorial/first-steps-v2/src/lib.rs:code}} ``` -Now we've stated our previously implicit expectation: this function should never be called with inputs that are too big. -But if we attempt to verify this, we get a problem: +Now we've explicitly stated our previously implicit expectation: this function should never be called with inputs that are too big. +But if we attempt to verify this modified function, we run into a problem: ``` [...] RESULTS: [...] -Check 3: final_form::estimate_size.assertion.1 +Check 3: estimate_size.assertion.1 - Status: FAILURE - Description: "assertion failed: x < 4096" [...] VERIFICATION:- FAILED ``` -We intended this to be a precondition of calling the function, but Kani is treating it like a failure. -If we call this function with too large of a value, it will crash with an assertion failure. -But we know that, that was our intention. +What we want is a _precondition_ for `estimate_size`. +That is, something that should always be true every time we call the function. +By putting the assertion at the beginning, we ensure the function immediately fails if that expectation is not met. + +But our proof harness will still call this function with any integer, even ones that just don't meet the function's preconditions. +That's... not a useful or interesting result. +We know that won't work already. +How do we go back to successfully verifying this function? -This is the purpose of _proof harnesses_. +This is the purpose of writing a proof harness. Much like property testing (which would also fail in this assertion), we need to set up our preconditions, call the function in question, then assert our postconditions. Here's a revised example of the proof harness, one that now succeeds: ```rust -{{#include tutorial/first-steps-v2/src/main.rs:kani}} +{{#include tutorial/first-steps-v2/src/lib.rs:kani}} ``` But now we must wonder if we've really fully tested our function. @@ -183,14 +200,25 @@ Fortunately, Kani is able to report a coverage metric for each proof harness. Try running: ``` -kani --visualize src/main.rs --harness verify_success -open report-verify_success/html/index.html +cargo kani --visualize --harness verify_success ``` The beginning of the report includes coverage information. Clicking through to the file will show fully-covered lines in green. Lines not covered by our proof harness will show in red. -1. Try changing the assumption in the proof harness to `x < 2048`. Now the harness won't be testing all possible cases. -2. Rerun `kani --visualize` on the file -3. Look at the report: you'll see we no longer have 100% coverage of the function. +Try changing the assumption in the proof harness to `x < 2048`. +Now the harness won't be testing all possible cases. +Rerun `cargo kani --visualize`. +Look at the report: you'll see we no longer have 100% coverage of the function. + +## Summary + +In this section: + +1. We saw Kani find panics, assertion failures, and even some other failures like unsafe dereferencing of null pointers. +2. We saw Kani find failures that testing could not easily find. +3. We saw how to write a proof harness and use `kani::any()`. +4. We saw how to get a failing **trace** using `kani --visualize` +5. We saw how proof harnesses are used to set up preconditions with `kani::assume()`. +6. We saw how to obtain **coverage** metrics and use them to ensure our proofs are covering as much as they should be. diff --git a/docs/src/tutorial-kinds-of-failure.md b/docs/src/tutorial-kinds-of-failure.md index 5af5c39101f5a..29236b95db0ca 100644 --- a/docs/src/tutorial-kinds-of-failure.md +++ b/docs/src/tutorial-kinds-of-failure.md @@ -126,11 +126,11 @@ In this case, where we just have a couple of `kani::any` values in our proof har In this trace we find (and the values you get may be different): ``` -Step 36: Function bound_check, File src/bounds_check.rs, Line 43 +Step 36: Function bound_check, File src/bounds_check.rs, Line 37 let size: usize = kani::any(); size = 2464ul -Step 39: Function main, File src/bounds_check.rs, Line 45 +Step 39: Function bound_check, File src/bounds_check.rs, Line 39 let index: usize = kani::any(); index = 2463ul ``` diff --git a/docs/src/tutorial/first-steps-v1/main.expected b/docs/src/tutorial/first-steps-v1/check_estimate_size.expected similarity index 100% rename from docs/src/tutorial/first-steps-v1/main.expected rename to docs/src/tutorial/first-steps-v1/check_estimate_size.expected diff --git a/docs/src/tutorial/first-steps-v1/src/main.rs b/docs/src/tutorial/first-steps-v1/src/lib.rs similarity index 97% rename from docs/src/tutorial/first-steps-v1/src/main.rs rename to docs/src/tutorial/first-steps-v1/src/lib.rs index 19004231eeeb4..d4b64df8f3e38 100644 --- a/docs/src/tutorial/first-steps-v1/src/main.rs +++ b/docs/src/tutorial/first-steps-v1/src/lib.rs @@ -49,7 +49,7 @@ mod tests { // ANCHOR: kani #[cfg(kani)] #[kani::proof] -fn main() { +fn check_estimate_size() { let x: u32 = kani::any(); estimate_size(x); } diff --git a/docs/src/tutorial/first-steps-v2/src/main.rs b/docs/src/tutorial/first-steps-v2/src/lib.rs similarity index 98% rename from docs/src/tutorial/first-steps-v2/src/main.rs rename to docs/src/tutorial/first-steps-v2/src/lib.rs index a1cdf31aa0918..0a29eb7933571 100644 --- a/docs/src/tutorial/first-steps-v2/src/main.rs +++ b/docs/src/tutorial/first-steps-v2/src/lib.rs @@ -61,7 +61,7 @@ fn verify_success() { #[cfg(kani)] #[kani::proof] -fn main() { +fn will_fail() { let x: u32 = kani::any(); let y = estimate_size(x); } diff --git a/docs/src/tutorial/first-steps-v2/main.expected b/docs/src/tutorial/first-steps-v2/will_fail.expected similarity index 100% rename from docs/src/tutorial/first-steps-v2/main.expected rename to docs/src/tutorial/first-steps-v2/will_fail.expected