Skip to content

Commit 012ae13

Browse files
committed
Auto merge of rust-lang#132549 - Zalathar:rust-string, r=cuviper
Make `RustString` an extern type to avoid `improper_ctypes` warnings Currently, any FFI function that uses `&RustString` needs to also add `#[ignore(improper_ctypes)]` to silence a warning. The warning is not _completely_ bogus, because `RustString` contains `Vec<u8>` and therefore does not have a guaranteed layout. But we have no way of telling the lint that this doesn't matter, because the C++ code only uses that pointer opaquely and never relies on its underlying layout. Ideally there would be some way to silence `improper_ctypes` at the type-definition site. But because there isn't, casting to and from a separate extern type is better than having to annotate every single use site.
2 parents 328b759 + 89d7efa commit 012ae13

File tree

6 files changed

+60
-47
lines changed

6 files changed

+60
-47
lines changed

compiler/rustc_codegen_llvm/src/llvm/ffi.rs

-17
Original file line numberDiff line numberDiff line change
@@ -1766,11 +1766,9 @@ unsafe extern "C" {
17661766
pub fn LLVMRustGetLastError() -> *const c_char;
17671767

17681768
/// Prints the timing information collected by `-Ztime-llvm-passes`.
1769-
#[expect(improper_ctypes)]
17701769
pub(crate) fn LLVMRustPrintPassTimings(OutStr: &RustString);
17711770

17721771
/// Prints the statistics collected by `-Zprint-codegen-stats`.
1773-
#[expect(improper_ctypes)]
17741772
pub(crate) fn LLVMRustPrintStatistics(OutStr: &RustString);
17751773

17761774
/// Prepares inline assembly.
@@ -1791,7 +1789,6 @@ unsafe extern "C" {
17911789
ConstraintsLen: size_t,
17921790
) -> bool;
17931791

1794-
#[allow(improper_ctypes)]
17951792
pub(crate) fn LLVMRustCoverageWriteFilenamesToBuffer(
17961793
Filenames: *const *const c_char,
17971794
FilenamesLen: size_t,
@@ -1800,7 +1797,6 @@ unsafe extern "C" {
18001797
BufferOut: &RustString,
18011798
);
18021799

1803-
#[allow(improper_ctypes)]
18041800
pub(crate) fn LLVMRustCoverageWriteFunctionMappingsToBuffer(
18051801
VirtualFileMappingIDs: *const c_uint,
18061802
NumVirtualFileMappingIDs: size_t,
@@ -1824,13 +1820,10 @@ unsafe extern "C" {
18241820
) -> &Value;
18251821
pub(crate) fn LLVMRustCoverageHashBytes(Bytes: *const c_char, NumBytes: size_t) -> u64;
18261822

1827-
#[allow(improper_ctypes)]
18281823
pub(crate) fn LLVMRustCoverageWriteCovmapSectionNameToString(M: &Module, OutStr: &RustString);
18291824

1830-
#[allow(improper_ctypes)]
18311825
pub(crate) fn LLVMRustCoverageWriteCovfunSectionNameToString(M: &Module, OutStr: &RustString);
18321826

1833-
#[allow(improper_ctypes)]
18341827
pub(crate) fn LLVMRustCoverageWriteCovmapVarNameToString(OutStr: &RustString);
18351828

18361829
pub(crate) fn LLVMRustCoverageMappingVersion() -> u32;
@@ -2185,14 +2178,11 @@ unsafe extern "C" {
21852178
pub fn LLVMRustDIBuilderCreateOpPlusUconst() -> u64;
21862179
pub fn LLVMRustDIBuilderCreateOpLLVMFragment() -> u64;
21872180

2188-
#[allow(improper_ctypes)]
21892181
pub fn LLVMRustWriteTypeToString(Type: &Type, s: &RustString);
2190-
#[allow(improper_ctypes)]
21912182
pub fn LLVMRustWriteValueToString(value_ref: &Value, s: &RustString);
21922183

21932184
pub fn LLVMRustHasFeature(T: &TargetMachine, s: *const c_char) -> bool;
21942185

2195-
#[allow(improper_ctypes)]
21962186
pub(crate) fn LLVMRustPrintTargetCPUs(TM: &TargetMachine, OutStr: &RustString);
21972187
pub fn LLVMRustGetTargetFeaturesCount(T: &TargetMachine) -> size_t;
21982188
pub fn LLVMRustGetTargetFeature(
@@ -2297,10 +2287,8 @@ unsafe extern "C" {
22972287
pub fn LLVMRustArchiveIteratorFree<'a>(AIR: &'a mut ArchiveIterator<'a>);
22982288
pub fn LLVMRustDestroyArchive(AR: &'static mut Archive);
22992289

2300-
#[allow(improper_ctypes)]
23012290
pub fn LLVMRustWriteTwineToString(T: &Twine, s: &RustString);
23022291

2303-
#[allow(improper_ctypes)]
23042292
pub fn LLVMRustUnpackOptimizationDiagnostic<'a>(
23052293
DI: &'a DiagnosticInfo,
23062294
pass_name_out: &RustString,
@@ -2318,7 +2306,6 @@ unsafe extern "C" {
23182306
message_out: &mut Option<&'a Twine>,
23192307
);
23202308

2321-
#[allow(improper_ctypes)]
23222309
pub fn LLVMRustWriteDiagnosticInfoToString(DI: &DiagnosticInfo, s: &RustString);
23232310
pub fn LLVMRustGetDiagInfoKind(DI: &DiagnosticInfo) -> DiagnosticKind;
23242311

@@ -2327,7 +2314,6 @@ unsafe extern "C" {
23272314
cookie_out: &mut c_uint,
23282315
) -> &'a SMDiagnostic;
23292316

2330-
#[allow(improper_ctypes)]
23312317
pub fn LLVMRustUnpackSMDiagnostic(
23322318
d: &SMDiagnostic,
23332319
message_out: &RustString,
@@ -2374,7 +2360,6 @@ unsafe extern "C" {
23742360
pub fn LLVMRustModuleBufferLen(p: &ModuleBuffer) -> usize;
23752361
pub fn LLVMRustModuleBufferFree(p: &'static mut ModuleBuffer);
23762362
pub fn LLVMRustModuleCost(M: &Module) -> u64;
2377-
#[allow(improper_ctypes)]
23782363
pub fn LLVMRustModuleInstructionStats(M: &Module, Str: &RustString);
23792364

23802365
pub fn LLVMRustThinLTOBufferCreate(
@@ -2427,7 +2412,6 @@ unsafe extern "C" {
24272412
bytecode_len: usize,
24282413
) -> bool;
24292414
pub fn LLVMRustLinkerFree<'a>(linker: &'a mut Linker<'a>);
2430-
#[allow(improper_ctypes)]
24312415
pub fn LLVMRustComputeLTOCacheKey(
24322416
key_out: &RustString,
24332417
mod_id: *const c_char,
@@ -2450,7 +2434,6 @@ unsafe extern "C" {
24502434
pgo_available: bool,
24512435
);
24522436

2453-
#[allow(improper_ctypes)]
24542437
pub fn LLVMRustGetMangledName(V: &Value, out: &RustString);
24552438

24562439
pub fn LLVMRustGetElementTypeArgIndex(CallSite: &Value) -> i32;

compiler/rustc_codegen_llvm/src/llvm/mod.rs

+2-7
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,5 @@
11
#![allow(non_snake_case)]
22

3-
use std::cell::RefCell;
43
use std::ffi::{CStr, CString};
54
use std::ops::Deref;
65
use std::ptr;
@@ -301,15 +300,11 @@ pub fn set_value_name(value: &Value, name: &[u8]) {
301300
}
302301

303302
pub fn build_string(f: impl FnOnce(&RustString)) -> Result<String, FromUtf8Error> {
304-
let sr = RustString { bytes: RefCell::new(Vec::new()) };
305-
f(&sr);
306-
String::from_utf8(sr.bytes.into_inner())
303+
String::from_utf8(RustString::build_byte_buffer(f))
307304
}
308305

309306
pub fn build_byte_buffer(f: impl FnOnce(&RustString)) -> Vec<u8> {
310-
let sr = RustString { bytes: RefCell::new(Vec::new()) };
311-
f(&sr);
312-
sr.bytes.into_inner()
307+
RustString::build_byte_buffer(f)
313308
}
314309

315310
pub fn twine_to_string(tr: &Twine) -> String {

compiler/rustc_llvm/llvm-wrapper/LLVMWrapper.h

+3-2
Original file line numberDiff line numberDiff line change
@@ -104,8 +104,9 @@ typedef struct OpaqueRustString *RustStringRef;
104104
typedef struct LLVMOpaqueTwine *LLVMTwineRef;
105105
typedef struct LLVMOpaqueSMDiagnostic *LLVMSMDiagnosticRef;
106106

107-
extern "C" void LLVMRustStringWriteImpl(RustStringRef Str, const char *Ptr,
108-
size_t Size);
107+
extern "C" void LLVMRustStringWriteImpl(RustStringRef buf,
108+
const char *slice_ptr,
109+
size_t slice_len);
109110

110111
class RawRustStringOstream : public llvm::raw_ostream {
111112
RustStringRef Str;

compiler/rustc_llvm/llvm-wrapper/PassWrapper.cpp

+2-1
Original file line numberDiff line numberDiff line change
@@ -1624,5 +1624,6 @@ extern "C" void LLVMRustComputeLTOCacheKey(RustStringRef KeyOut,
16241624
CfiFunctionDefs, CfiFunctionDecls);
16251625
#endif
16261626

1627-
LLVMRustStringWriteImpl(KeyOut, Key.c_str(), Key.size());
1627+
auto OS = RawRustStringOstream(KeyOut);
1628+
OS << Key.str();
16281629
}

compiler/rustc_llvm/llvm-wrapper/RustWrapper.cpp

+2-2
Original file line numberDiff line numberDiff line change
@@ -1510,8 +1510,8 @@ LLVMRustUnpackSMDiagnostic(LLVMSMDiagnosticRef DRef, RustStringRef MessageOut,
15101510
const SourceMgr &LSM = *D.getSourceMgr();
15111511
const MemoryBuffer *LBuf =
15121512
LSM.getMemoryBuffer(LSM.FindBufferContainingLoc(D.getLoc()));
1513-
LLVMRustStringWriteImpl(BufferOut, LBuf->getBufferStart(),
1514-
LBuf->getBufferSize());
1513+
auto BufferOS = RawRustStringOstream(BufferOut);
1514+
BufferOS << LBuf->getBuffer();
15151515

15161516
*LocOut = D.getLoc().getPointer() - LBuf->getBufferStart();
15171517

compiler/rustc_llvm/src/lib.rs

+51-18
Original file line numberDiff line numberDiff line change
@@ -2,42 +2,75 @@
22
#![allow(internal_features)]
33
#![doc(html_root_url = "https://doc.rust-lang.org/nightly/nightly-rustc/")]
44
#![doc(rust_logo)]
5+
#![feature(extern_types)]
56
#![feature(rustdoc_internals)]
67
#![warn(unreachable_pub)]
78
// tidy-alphabetical-end
89

9-
// NOTE: This crate only exists to allow linking on mingw targets.
10-
1110
use std::cell::RefCell;
12-
use std::slice;
11+
use std::{ptr, slice};
1312

14-
use libc::{c_char, size_t};
13+
use libc::size_t;
1514

16-
#[repr(C)]
17-
pub struct RustString {
18-
pub bytes: RefCell<Vec<u8>>,
15+
unsafe extern "C" {
16+
/// Opaque type that allows C++ code to write bytes to a Rust-side buffer,
17+
/// in conjunction with `RawRustStringOstream`. Use this as `&RustString`
18+
/// (Rust) and `RustStringRef` (C++) in FFI signatures.
19+
pub type RustString;
1920
}
2021

2122
impl RustString {
22-
pub fn len(&self) -> usize {
23-
self.bytes.borrow().len()
23+
pub fn build_byte_buffer(closure: impl FnOnce(&Self)) -> Vec<u8> {
24+
let buf = RustStringInner::default();
25+
closure(buf.as_opaque());
26+
buf.into_inner()
2427
}
28+
}
2529

26-
pub fn is_empty(&self) -> bool {
27-
self.bytes.borrow().is_empty()
30+
/// Underlying implementation of [`RustString`].
31+
///
32+
/// Having two separate types makes it possible to use the opaque [`RustString`]
33+
/// in FFI signatures without `improper_ctypes` warnings. This is a workaround
34+
/// for the fact that there is no way to opt out of `improper_ctypes` when
35+
/// _declaring_ a type (as opposed to using that type).
36+
#[derive(Default)]
37+
struct RustStringInner {
38+
bytes: RefCell<Vec<u8>>,
39+
}
40+
41+
impl RustStringInner {
42+
fn as_opaque(&self) -> &RustString {
43+
let ptr: *const RustStringInner = ptr::from_ref(self);
44+
// We can't use `ptr::cast` here because extern types are `!Sized`.
45+
let ptr = ptr as *const RustString;
46+
unsafe { &*ptr }
47+
}
48+
49+
fn from_opaque(opaque: &RustString) -> &Self {
50+
// SAFETY: A valid `&RustString` must have been created via `as_opaque`.
51+
let ptr: *const RustString = ptr::from_ref(opaque);
52+
let ptr: *const RustStringInner = ptr.cast();
53+
unsafe { &*ptr }
54+
}
55+
56+
fn into_inner(self) -> Vec<u8> {
57+
self.bytes.into_inner()
2858
}
2959
}
3060

31-
/// Appending to a Rust string -- used by RawRustStringOstream.
61+
/// Appends the contents of a byte slice to a [`RustString`].
62+
///
63+
/// This function is implemented in `rustc_llvm` so that the C++ code in this
64+
/// crate can link to it directly, without an implied link-time dependency on
65+
/// `rustc_codegen_llvm`.
3266
#[unsafe(no_mangle)]
3367
pub unsafe extern "C" fn LLVMRustStringWriteImpl(
34-
sr: &RustString,
35-
ptr: *const c_char,
36-
size: size_t,
68+
buf: &RustString,
69+
slice_ptr: *const u8, // Same ABI as `*const c_char`
70+
slice_len: size_t,
3771
) {
38-
let slice = unsafe { slice::from_raw_parts(ptr as *const u8, size) };
39-
40-
sr.bytes.borrow_mut().extend_from_slice(slice);
72+
let slice = unsafe { slice::from_raw_parts(slice_ptr, slice_len) };
73+
RustStringInner::from_opaque(buf).bytes.borrow_mut().extend_from_slice(slice);
4174
}
4275

4376
/// Initialize targets enabled by the build script via `cfg(llvm_component = "...")`.

0 commit comments

Comments
 (0)