From aa9a282cd0615aa2937fc3d897758c8e9e1539d3 Mon Sep 17 00:00:00 2001 From: Kyle J Strand Date: Tue, 1 Oct 2024 22:54:54 -0600 Subject: [PATCH] panic runtime and C-unwind documentation --- src/SUMMARY.md | 2 + src/behavior-considered-undefined.md | 15 +++- src/crates-and-source-files.md | 12 ++++ src/destructors.md | 23 +++++- src/expressions/array-expr.md | 3 +- src/items/external-blocks.md | 32 ++++++--- src/items/functions.md | 56 +++++++++++++-- src/linkage.md | 18 +++++ src/panic.md | 101 +++++++++++++++++++++++++++ src/runtime.md | 7 +- 10 files changed, 249 insertions(+), 20 deletions(-) create mode 100644 src/panic.md diff --git a/src/SUMMARY.md b/src/SUMMARY.md index 2b17bf45d..2df5bc711 100644 --- a/src/SUMMARY.md +++ b/src/SUMMARY.md @@ -114,6 +114,8 @@ - [Memory allocation and lifetime](memory-allocation-and-lifetime.md) - [Variables](variables.md) +- [Panic](panic.md) + - [Linkage](linkage.md) - [Inline assembly](inline-assembly.md) diff --git a/src/behavior-considered-undefined.md b/src/behavior-considered-undefined.md index 63fa28f63..7a7a6e95f 100644 --- a/src/behavior-considered-undefined.md +++ b/src/behavior-considered-undefined.md @@ -49,7 +49,9 @@ undefined behavior, it is *unsound*. * Invoking undefined behavior via compiler intrinsics. * Executing code compiled with platform features that the current platform does not support (see [`target_feature`]), *except* if the platform explicitly documents this to be safe. -* Calling a function with the wrong call ABI or unwinding from a function with the wrong unwind ABI. +* Calling a function with the wrong [call ABI][abi], or unwinding past a stack + frame that does not allow unwinding (e.g. by calling a `"C-unwind"` function + imported or transmuted as a `"C"` function or function pointer). * Producing an [invalid value][invalid-values]. "Producing" a value happens any time a value is assigned to or read from a place, passed to a function/primitive operation or returned from a function/primitive @@ -61,6 +63,14 @@ undefined behavior, it is *unsound*. some allocated object as a non-pointer type (such as integers). 'Reinterpreting' refers to loading the pointer value at integer type without a cast, e.g. by doing raw pointer casts or using a union. +* Violating assumptions of the Rust runtime. This is only possible using + mechanisms outside Rust. Most assumptions of the Rust runtime are currently + not explicitly documented. + * For assumptions specifically related to unwinding, see the [panic + documentation][unwinding-ffi]. + * The runtime assumes that a Rust stack frame is not deallocated without + executing destructors for local variables owned by the stack frame. This assumption + can be violated by C functions like `longjmp`. > **Note**: Undefined behavior affects the entire program. For example, calling > a function in C that exhibits undefined behavior of C means your entire @@ -160,11 +170,11 @@ a restricted set of valid values. In other words, the only cases in which reading uninitialized memory is permitted are inside `union`s and in "padding" (the gaps between the fields of a type). - [`bool`]: types/boolean.md [`const`]: items/constant-items.md [noalias]: http://llvm.org/docs/LangRef.html#noalias [pointer aliasing rules]: http://llvm.org/docs/LangRef.html#pointer-aliasing-rules +[abi]: abi.md [undef]: http://llvm.org/docs/LangRef.html#undefined-values [`target_feature`]: attributes/codegen.md#the-target_feature-attribute [`UnsafeCell`]: std::cell::UnsafeCell @@ -178,4 +188,5 @@ reading uninitialized memory is permitted are inside `union`s and in "padding" [project-field]: expressions/field-expr.md [project-tuple]: expressions/tuple-expr.md#tuple-indexing-expressions [project-slice]: expressions/array-expr.md#array-and-slice-indexing-expressions +[unwinding-ffi]: panic.md#unwinding-across-ffi-boundaries [const-promoted]: destructors.md#constant-promotion diff --git a/src/crates-and-source-files.md b/src/crates-and-source-files.md index 426ee26f1..5afbaaaf3 100644 --- a/src/crates-and-source-files.md +++ b/src/crates-and-source-files.md @@ -103,6 +103,17 @@ use foo::bar as main; +### Uncaught foreign unwinding + +When a "foreign" unwind (e.g. an exception thrown from C++ code, or a `panic!` +in Rust code compiled or linked with a different runtime) is not caught before +reaching the `main` function, the process will be safely terminated. This may +take the form of an abort, in which case it is not guaranteed that any `Drop` +calls will be executed, and the error output may be less informative than if the +runtime had been terminated by a "native" Rust `panic`. + +For more information, see the [panic documentation][panic-docs]. + ### The `no_main` attribute The *`no_main` [attribute]* may be applied at the crate level to disable @@ -142,6 +153,7 @@ or `_` (U+005F) characters. [function]: items/functions.md [module]: items/modules.md [module path]: paths.md +[panic-docs]: panic.md#unwinding-across-ffi-boundaries [shebang]: input-format.md#shebang-removal [trait or lifetime bounds]: trait-bounds.md [where clauses]: items/generics.md#where-clauses diff --git a/src/destructors.md b/src/destructors.md index a536221f4..03f337df8 100644 --- a/src/destructors.md +++ b/src/destructors.md @@ -268,7 +268,8 @@ Temporaries are also created to hold the result of operands to an expression while the other operands are evaluated. The temporaries are associated to the scope of the expression with that operand. Since the temporaries are moved from once the expression is evaluated, dropping them has no effect unless one of the -operands to an expression breaks out of the expression, returns, or panics. +operands to an expression breaks out of the expression, returns, or +[panics][panic]. ```rust # struct PrintOnDrop(&'static str); @@ -407,6 +408,8 @@ let x = (&temp()).use_temp(); // ERROR ## Not running destructors +### `forget` + r[destructors.forget] [`std::mem::forget`] can be used to prevent the destructor of a variable from being run, @@ -416,6 +419,20 @@ variable or field from being dropped automatically. > Note: Preventing a destructor from being run via [`std::mem::forget`] or other means is safe even if it has a type that isn't `'static`. > Besides the places where destructors are guaranteed to run as defined by this document, types may *not* safely rely on a destructor being run for soundness. +### Process termination without unwinding + +There are some ways to terminate the process without [unwinding], in which case +destructors will not be run. + +The standard library provides [`std::process::exit`] and +[`std::process::abort`] to do this explicitly. Additionally, if the +[panic-mode] is set to `abort`, panicking will always terminate the process +without destructors being run. + +There is one additional case to be aware of: when a panic reaches a +[non-unwinding ABI boundary], either no destructors will run, or all +destructors up until the ABI boundary will run. + [Assignment]: expressions/operator-expr.md#assignment-expressions [binding modes]: patterns.md#binding-modes [closure]: types/closure.md @@ -425,11 +442,15 @@ variable or field from being dropped automatically. [initialized]: glossary.md#initialized [interior mutability]: interior-mutability.md [lazy boolean expression]: expressions/operator-expr.md#lazy-boolean-operators +[non-unwinding ABI boundary]: items/functions.md#unwinding +[panic]: panic.md +[panic-mode]: panic.md#panic-runtimes [place context]: expressions.md#place-expressions-and-value-expressions [promoted]: destructors.md#constant-promotion [scrutinee]: glossary.md#scrutinee [statement]: statements.md [temporary]: expressions.md#temporaries +[unwinding]: panic.md#unwinding [variable]: variables.md [array]: types/array.md diff --git a/src/expressions/array-expr.md b/src/expressions/array-expr.md index 52d31940d..66f69c93f 100644 --- a/src/expressions/array-expr.md +++ b/src/expressions/array-expr.md @@ -53,7 +53,7 @@ Just as with methods, Rust will also insert dereference operations on `a` repeat Indices are zero-based for arrays and slices. Array access is a [constant expression], so bounds can be checked at compile-time with a constant index value. -Otherwise a check will be performed at run-time that will put the thread in a _panicked state_ if it fails. +Otherwise a check will be performed at run-time that will put the thread in a [_panicked state_][panic] if it fails. ```rust,should_panic // lint is deny by default. @@ -84,5 +84,6 @@ The array index expression can be implemented for types other than arrays and sl [constant item]: ../items/constant-items.md [literal]: ../tokens.md#literals [memory location]: ../expressions.md#place-expressions-and-value-expressions +[panic]: ../panic.md [path]: path-expr.md [slice]: ../types/slice.md diff --git a/src/items/external-blocks.md b/src/items/external-blocks.md index dbd55fb33..cf6507143 100644 --- a/src/items/external-blocks.md +++ b/src/items/external-blocks.md @@ -70,7 +70,7 @@ standard C ABI on the specific platform. Other ABIs may be specified using an unsafe extern "stdcall" { } ``` -There are three ABI strings which are cross-platform, and which all compilers +There are five ABI strings which are cross-platform, and which all compilers are guaranteed to support: * `unsafe extern "Rust"` -- The default ABI when you write a normal `fn foo()` in any @@ -80,6 +80,9 @@ are guaranteed to support: * `unsafe extern "system"` -- Usually the same as `extern "C"`, except on Win32, in which case it's `"stdcall"`, or what you should use to link to the Windows API itself +* `extern "C-unwind"` and `extern "system-unwind"` -- identical to `"C"` and + `"system"`, respectively, but with [different behavior][unwind-behavior] when + the callee unwinds (by panicking or throwing a C++ style exception). There are also some platform-specific ABI strings: @@ -96,6 +99,18 @@ There are also some platform-specific ABI strings: `__thiscall` and GCC and clang's `__attribute__((thiscall))` * `unsafe extern "efiapi"` -- The ABI used for [UEFI] functions. +Like `"C"` and `"system"`, most platform-specific ABI strings also have a +[corresponding `-unwind` variant][unwind-behavior]; specifically, these are: + +* `"cdecl-unwind"` +* `"stdcall-unwind"` +* `"fastcall-unwind"` +* `"vectorcall-unwind"` +* `"thiscall-unwind"` +* `"aapcs-unwind"` +* `"win64-unwind"` +* `"sysv64-unwind"` + ## Variadic functions Functions within external blocks may be variadic by specifying `...` as the @@ -316,10 +331,9 @@ Attributes on extern function parameters follow the same rules and restrictions as [regular function parameters]. [IDENTIFIER]: ../identifiers.md +[PE Format]: https://learn.microsoft.com/windows/win32/debug/pe-format#import-name-type [UEFI]: https://uefi.org/specifications [WebAssembly module]: https://webassembly.github.io/spec/core/syntax/modules.html -[functions]: functions.md -[statics]: static-items.md [_Abi_]: functions.md [_Function_]: functions.md [_InnerAttribute_]: ../attributes.md @@ -329,11 +343,13 @@ restrictions as [regular function parameters]. [_OuterAttribute_]: ../attributes.md [_StaticItem_]: static-items.md [_Visibility_]: ../visibility-and-privacy.md -[attributes]: ../attributes.md -[regular function parameters]: functions.md#attributes-on-function-parameters [`bundle` documentation for rustc]: ../../rustc/command-line-arguments.html#linking-modifiers-bundle -[`whole-archive` documentation for rustc]: ../../rustc/command-line-arguments.html#linking-modifiers-whole-archive -[`verbatim` documentation for rustc]: ../../rustc/command-line-arguments.html#linking-modifiers-verbatim [`dylib` versus `raw-dylib`]: #dylib-versus-raw-dylib -[PE Format]: https://learn.microsoft.com/windows/win32/debug/pe-format#import-name-type +[`verbatim` documentation for rustc]: ../../rustc/command-line-arguments.html#linking-modifiers-verbatim +[`whole-archive` documentation for rustc]: ../../rustc/command-line-arguments.html#linking-modifiers-whole-archive +[attributes]: ../attributes.md +[functions]: functions.md +[regular function parameters]: functions.md#attributes-on-function-parameters +[statics]: static-items.md +[unwind-behavior]: functions.md#unwinding [value namespace]: ../names/namespaces.md diff --git a/src/items/functions.md b/src/items/functions.md index d3f2c4548..f9d1fb595 100644 --- a/src/items/functions.md +++ b/src/items/functions.md @@ -214,12 +214,56 @@ extern "C" fn new_i32() -> i32 { 0 } let fptr: extern "C" fn() -> i32 = new_i32; ``` -Functions with an ABI that differs from `"Rust"` do not support unwinding in the -exact same way that Rust does. Therefore, unwinding past the end of functions -with such ABIs causes the process to abort. - -> **Note**: The LLVM backend of the `rustc` implementation -aborts the process by executing an illegal instruction. +### Unwinding + +Most ABI strings come in two variants, one with an `-unwind` suffix and one without. +The `Rust` ABI always permits unwinding, so there is no `Rust-unwind` ABI. + +The choice of ABI, together with the runtime [panic mode][panic-modes], +determines the behavior when unwinding out of a function. + +The table below indicates the behavior of an unwinding operation reaching each +type of ABI boundary (function declaration or definition using the +corresponding ABI string). Note that the Rust runtime is not affected by, and +cannot have an effect on, any unwinding that occurs entirely within another +language's runtime, that is, unwinds that are thrown and caught without +reaching a Rust ABI boundary. + +The `panic`-unwind column refers to [panicking] via the `panic!` macro and +similar standard library mechanisms, as well as to any other Rust operations +that cause a panic, such as out-of-bounds array indexing or integer overflow. + +The "unwinding" ABI category refers to `"Rust"` (the implicit ABI of Rust +functions not marked `extern`), `"C-unwind"`, and any other ABI with `-unwind` +in its name. The "non-unwinding" ABI category refers to all other ABI strings, +including `"C"` and `"stdcall"`. + +Native unwinding is defined per-target. On targets that support throwing and +catching C++ exceptions, it refers to the mechanism used to implement this +feature. Some platforms implement a form of unwinding referred to as ["forced +unwinding"][forced-unwinding]; `longjmp` on Windows and `pthread_exit` in +`glibc` are implemented this way. Forced unwinding is explicitly excluded +from the "Native unwind" column in the table. + +| panic runtime | ABI | `panic`-unwind | Native unwind (unforced) | +| -------------- | ------------ | ------------------------------------- | ----------------------- | +| `panic=unwind` | unwinding | unwind | unwind | +| `panic=unwind` | non-unwinding | abort (see note below) | [undefined behavior] | +| `panic=abort` | unwinding | `panic` aborts without unwinding | abort | +| `panic=abort` | non-unwinding | `panic` aborts without unwinding | [undefined behavior] | + +> Note: With `panic=unwind`, when a `panic` is turned into an abort by a +> non-unwinding ABI boundary, either no destructors (`Drop` calls) will run, or +> all destructors up until the ABI boundary will run. + +For other considerations and limitations regarding unwinding across FFI +boundaries, see the [relevant section in the Panic documentation][panic-ffi]. + +[forced-unwinding]: https://rust-lang.github.io/rfcs/2945-c-unwind-abi.html#forced-unwinding +[panic-modes]: ../panic.md#panic-runtimes +[panic-ffi]: ../panic.md#unwinding-across-ffi-boundaries +[panicking]: ../panic.md +[undefined behavior]: ../behavior-considered-undefined.md ## Const functions diff --git a/src/linkage.md b/src/linkage.md index 48a1c8e58..8abc388ff 100644 --- a/src/linkage.md +++ b/src/linkage.md @@ -226,6 +226,24 @@ a statically linked binary on MSVC you would execute: RUSTFLAGS='-C target-feature=+crt-static' cargo build --target x86_64-pc-windows-msvc ``` +## Prohibited linkage scenarios + +No crate may be linked with [the `panic=abort` runtime][panic-runtime] if it has +both of the following characteristics: + +* It contains a call to an `-unwind` foreign function or function pointer +* It was compiled with `panic=unwind` + +`rustc` enforces this restriction at link-time. To guarantee that +a library will be linkable regardless of the panic mode used at +link-time, the [`ffi_unwind_calls` lint] may be used. The lint flags any +calls to `-unwind` foreign functions or function pointers. + +Note: Cargo will automatically unify all crates to use the same `panic` +runtime, so this prohibition does not apply to projects compiled with Cargo. + [`cfg` attribute `target_feature` option]: conditional-compilation.md#target_feature +[`ffi_unwind_calls` lint]: ../rustc/lints/listing/allowed-by-default.html#ffi-unwind-calls [configuration option]: conditional-compilation.md +[panic-runtime]: panic.md#panic-runtimes [procedural macros]: procedural-macros.md diff --git a/src/panic.md b/src/panic.md new file mode 100644 index 000000000..b0462dbd1 --- /dev/null +++ b/src/panic.md @@ -0,0 +1,101 @@ +# Panic + +Rust provides a mechanism to prevent a function from returning normally, and +instead "panic," which is a response to an error condition that is typically +not expected to be recoverable within the context in which the error is +encountered. + +Some language constructs, such as out-of-bounds [array indexing], panic +automatically. There are also language features that provide a level of control +over panic behavior: +* A [_panic runtime_](#panic-runtimes) defined how a panic is handled during + runtime. +* [FFI ABIs](items/functions.md#unwinding) may alter how panics behave. + +> **Note**: The standard library provides the capability to explicitly panic +> via the [`panic!` macro][macro-panic]. + +## Unwinding + +Panicking may either be recoverable or non-recoverable, though it can be +configured (via `panic=abort`) to always be non-recoverable. (The converse is +not true: `panic=unwind` does not guarantee that all panics are recoverable, +only that panicking via the `panic!` macro and similar standard library +mechanisms is recoverable.) When panic recovery occurs, the runtime "unwinds" +Rust frames, just as C++'s `throw` unwinds C++ frames, until the panic reaches +the point of recovery (for instance at a thread boundary). This means that as +the panic traverses Rust frames, live objects in those frames that [implement +`Drop`][destructors] will have their `drop` methods called. Thus, when normal +execution resumes, no-longer-accessible objects will have been "cleaned up" +just as if they had gone out of scope normally. + +> **Note**: As long as this guarantee of resource-cleanup is preserved, +> "unwinding" may be implemented without actually using the mechanism used by +> C++ for the target platform. + +> **Note**: The standard library provides two mechanisms for recovering from a panic, +> [`catch_unwind`][fn-catch-unwind] (which enables recovery within the +> panicking thread) and [`thread::spawn`][thread-spawn] (which automatically +> sets up panic recovery for the spawned thread so that other threads may +> continue running). + +### Unwinding across FFI boundaries + +It is possible to unwind across FFI boundaries using an [appropriate ABI +declaration][unwind-abi]. While useful in certain cases, this creates unique +opportunities for undefined behavior, especially when multiple language runtimes +are involved. + +Unwinding with the wrong ABI is undefined behavior: + +* Causing an unwind into Rust code from a foreign function that was called via a + function declaration or pointer declared with a non-unwinding ABI, such as `"C"`, + `"system"`, etc. (For example, this case occurs when such a function written in + C++ throws an exception that is uncaught and propagates to Rust.) +* Calling a Rust `extern` function that unwinds (with `extern "C-unwind"` or + another ABI that permits unwinding) from a runtime that does not support. + unwinding, such as code compiled with GCC or Clang using `-fno-exceptions` + +Catching a foreign unwinding operation (such as a C++ exception) using +`catch_unwind`, `JoinHandle::join`, or by letting it propagate all the way to a +Rust `main()` function will have one of two behaviors, and it is unspecified +which will occur: +* The process aborts. +* The function returns a `Result::Err` containing an opaque type. + +Note that Rust code compiled or linked with a different runtime counts as a +"foreign exception" for the purpose of this guarantee. Thus, a library that +uses `panic!` and is linked against one version of the Rust standard library, +invoked from an application that uses a different version of the standard +library, may cause the entire application to crash even if the library is only +used within a child thread. + +There are currently no guarantees about the behavior that occurs when a foreign +runtime attempts to dispose of, or rethrow, a Rust `panic` payload. In other +words, an unwind originated from a Rust runtime must either lead to termination +of the process or be caught by the same runtime. + +## Panic runtimes + +The actual behavior and implementation of `panic!` is controlled by the _panic +runtime_. + +> **Note**: The Rust standard library provides two panic runtimes: +> `panic_unwind` (which unwinds the stack and is potentially recoverable) and +> `panic_abort` (which aborts the process and is non-recoverable). The default +> runtime depends on the target platform, but is generally `panic_unwind` on +> platforms with native support for C++ exceptions. + +When compiling code that is guaranteed to be linked to a non-recoverable panic +runtime, the optimizer may assume that unwinding across Rust frames is +impossible, which can result in both code-size and runtime speed improvements. + +See also the [`panic_handler` attribute](runtime.md#the-panic_handler-attribute) which can be used to change the behavior of panics. + +[array indexing]: expressions/array-expr.md#array-and-slice-indexing-expressions +[destructors]: destructors.md +[fn-catch-unwind]: ../std/panic/fn.catch_unwind.html +[macro-panic]: ../std/macro.panic.html +[runtime]: runtime.md +[thread-spawn]: ../std/thread/fn.spawn.html +[unwind-abi]: items/functions.md#unwinding diff --git a/src/runtime.md b/src/runtime.md index a673834f8..6b3f4a23a 100644 --- a/src/runtime.md +++ b/src/runtime.md @@ -47,8 +47,10 @@ fn panic(info: &PanicInfo) -> ! { The standard library provides an implementation of `panic_handler` that defaults to unwinding the stack but that can be [changed to abort the -process][abort]. The standard library's panic behavior can be modified at -runtime with the [set_hook] function. +process][abort]. See [panic runtimes] for more details. + +The standard library's panic behavior can be modified at runtime with the +[`set_hook` function][set_hook]. ## The `global_allocator` attribute @@ -80,6 +82,7 @@ display a console window on startup. It will run detached from any existing cons [abort]: ../book/ch09-01-unrecoverable-errors-with-panic.html [attribute]: attributes.md [crate types]: linkage.md +[panic runtimes]: panic.md#panic-runtimes [set_hook]: std::panic::set_hook [static item]: items/static-items.md [subsystem]: https://msdn.microsoft.com/en-us/library/fcc1zstk.aspx