Make protobuf_upb::Arena into a proper Rust RAII type.

PiperOrigin-RevId: 525775419
pull/12507/head
Miguel Young de la Sota 2 years ago committed by Copybara-Service
parent 44ac124713
commit 8e53046d94
  1. 73
      rust/cpp_kernel/cpp.rs
  2. 5
      rust/protobuf.rs
  3. 1
      rust/shared.rs
  4. 122
      rust/upb_kernel/upb.rs
  5. 1
      src/google/protobuf/compiler/rust/generator.cc
  6. 37
      src/google/protobuf/compiler/rust/message.cc

@ -30,27 +30,73 @@
// Rust Protobuf runtime using the C++ kernel. // Rust Protobuf runtime using the C++ kernel.
use std::alloc::{dealloc, Layout}; use std::alloc;
use std::alloc::Layout;
use std::boxed::Box; use std::boxed::Box;
use std::cell::UnsafeCell;
use std::fmt;
use std::marker::PhantomData;
use std::mem::MaybeUninit;
use std::ops::Deref; use std::ops::Deref;
use std::ptr::NonNull; use std::ptr::NonNull;
use std::slice; use std::slice;
/// A wrapper over a `proto2::Arena`.
///
/// This is not a safe wrapper per se, because the allocation functions still
/// have sharp edges (see their safety docs for more info).
///
/// This is an owning type and will automatically free the arena when
/// dropped.
///
/// Note that this type is neither `Sync` nor `Send`.
///
/// TODO(b/272728844): Replace this placeholder code with a real implementation. /// TODO(b/272728844): Replace this placeholder code with a real implementation.
#[repr(C)]
pub struct Arena { pub struct Arena {
_data: [u8; 0], ptr: NonNull<u8>,
_not_sync: PhantomData<UnsafeCell<()>>,
} }
impl Arena { impl Arena {
pub unsafe fn new() -> *mut Self { /// Allocates a fresh arena.
let arena = Box::new(Arena { _data: [] }); #[inline]
Box::leak(arena) as *mut _ pub fn new() -> Self {
Self { ptr: NonNull::dangling(), _not_sync: PhantomData }
}
/// Returns the raw, C++-managed pointer to the arena.
#[inline]
pub fn raw(&self) -> ! {
unimplemented!()
}
/// Allocates some memory on the arena.
///
/// # Safety
///
/// `layout`'s alignment must be less than `UPB_MALLOC_ALIGN`.
#[inline]
pub unsafe fn alloc(&self, layout: Layout) -> &mut [MaybeUninit<u8>] {
unimplemented!()
}
/// Resizes some memory on the arena.
///
/// # Safety
///
/// After calling this function, `ptr` is essentially zapped. `old` must
/// be the layout `ptr` was allocated with via [`Arena::alloc()`]. `new`'s
/// alignment must be less than `UPB_MALLOC_ALIGN`.
#[inline]
pub unsafe fn resize(&self, ptr: *mut u8, old: Layout, new: Layout) -> &[MaybeUninit<u8>] {
unimplemented!()
} }
}
pub unsafe fn free(arena: *mut Self) { impl Drop for Arena {
let arena = Box::from_raw(arena); #[inline]
std::mem::drop(arena); fn drop(&mut self) {
// unimplemented
} }
} }
@ -63,7 +109,6 @@ impl Arena {
// LINT.IfChange // LINT.IfChange
// copybara:strip_end // copybara:strip_end
#[repr(C)] #[repr(C)]
#[derive(Debug)]
pub struct SerializedData { pub struct SerializedData {
/// Owns the memory. /// Owns the memory.
data: NonNull<u8>, data: NonNull<u8>,
@ -89,11 +134,17 @@ impl Deref for SerializedData {
impl Drop for SerializedData { impl Drop for SerializedData {
fn drop(&mut self) { fn drop(&mut self) {
unsafe { unsafe {
dealloc(self.data.as_ptr(), Layout::array::<u8>(self.len).unwrap()); alloc::dealloc(self.data.as_ptr(), Layout::array::<u8>(self.len).unwrap());
}; };
} }
} }
impl fmt::Debug for SerializedData {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
fmt::Debug::fmt(self.deref(), f)
}
}
#[cfg(test)] #[cfg(test)]
mod tests { mod tests {
use super::*; use super::*;

@ -35,12 +35,7 @@
//! this crate exists is to be able to use `protobuf` as a crate name for both //! this crate exists is to be able to use `protobuf` as a crate name for both
//! cpp and upb kernels from user code. //! cpp and upb kernels from user code.
#[cfg(cpp_kernel)]
pub use protobuf_cpp::__runtime;
#[cfg(cpp_kernel)] #[cfg(cpp_kernel)]
pub use protobuf_cpp::*; pub use protobuf_cpp::*;
#[cfg(upb_kernel)]
pub use protobuf_upb::__runtime;
#[cfg(upb_kernel)] #[cfg(upb_kernel)]
pub use protobuf_upb::*; pub use protobuf_upb::*;

@ -38,7 +38,6 @@ pub extern crate cpp as __runtime;
#[cfg(upb_kernel)] #[cfg(upb_kernel)]
pub extern crate upb as __runtime; pub extern crate upb as __runtime;
pub use __runtime::Arena;
pub use __runtime::SerializedData; pub use __runtime::SerializedData;
use std::fmt; use std::fmt;

@ -28,46 +28,122 @@
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
// Rust Protobuf runtime using the UPB kernel. //! UPB FFI wrapper code for use by Rust Protobuf.
/// Represents UPB's upb_Arena. use std::alloc;
use std::alloc::Layout;
use std::cell::UnsafeCell;
use std::fmt;
use std::marker::PhantomData;
use std::mem::MaybeUninit;
use std::ops::Deref; use std::ops::Deref;
use std::ptr::NonNull; use std::ptr::NonNull;
use std::slice; use std::slice;
/// See `upb/port/def.inc`.
const UPB_MALLOC_ALIGN: usize = 8;
/// A UPB-managed pointer to a raw arena.
pub type RawArena = NonNull<RawArenaData>;
/// The data behind a [`RawArena`]. Do not use this type.
#[repr(C)] #[repr(C)]
pub struct Arena { pub struct RawArenaData {
_data: [u8; 0], _data: [u8; 0],
_marker: core::marker::PhantomData<(*mut u8, core::marker::PhantomPinned)>, }
/// A wrapper over a `upb_Arena`.
///
/// This is not a safe wrapper per se, because the allocation functions still
/// have sharp edges (see their safety docs for more info).
///
/// This is an owning type and will automatically free the arena when
/// dropped.
///
/// Note that this type is neither `Sync` nor `Send`.
pub struct Arena {
raw: RawArena,
_not_sync: PhantomData<UnsafeCell<()>>,
}
extern "C" {
fn upb_Arena_New() -> RawArena;
fn upb_Arena_Free(arena: RawArena);
fn upb_Arena_Malloc(arena: RawArena, size: usize) -> *mut u8;
fn upb_Arena_Realloc(arena: RawArena, ptr: *mut u8, old: usize, new: usize) -> *mut u8;
} }
impl Arena { impl Arena {
pub unsafe fn new() -> *mut Self { /// Allocates a fresh arena.
upb_Arena_New() #[inline]
pub fn new() -> Self {
Self { raw: unsafe { upb_Arena_New() }, _not_sync: PhantomData }
}
/// Returns the raw, UPB-managed pointer to the arena.
#[inline]
pub fn raw(&self) -> RawArena {
self.raw
} }
pub unsafe fn free(arena: *mut Self) { /// Allocates some memory on the arena.
upb_Arena_Free(arena) ///
/// # Safety
///
/// `layout`'s alignment must be less than `UPB_MALLOC_ALIGN`.
#[inline]
pub unsafe fn alloc(&self, layout: Layout) -> &mut [MaybeUninit<u8>] {
debug_assert!(layout.align() <= UPB_MALLOC_ALIGN);
let ptr = upb_Arena_Malloc(self.raw, layout.size());
if ptr.is_null() {
alloc::handle_alloc_error(layout);
}
slice::from_raw_parts_mut(ptr.cast(), layout.size())
}
/// Resizes some memory on the arena.
///
/// # Safety
///
/// After calling this function, `ptr` is essentially zapped. `old` must
/// be the layout `ptr` was allocated with via [`Arena::alloc()`]. `new`'s
/// alignment must be less than `UPB_MALLOC_ALIGN`.
#[inline]
pub unsafe fn resize(&self, ptr: *mut u8, old: Layout, new: Layout) -> &[MaybeUninit<u8>] {
debug_assert!(new.align() <= UPB_MALLOC_ALIGN);
let ptr = upb_Arena_Realloc(self.raw, ptr, old.size(), new.size());
if ptr.is_null() {
alloc::handle_alloc_error(new);
}
slice::from_raw_parts_mut(ptr.cast(), new.size())
} }
} }
extern "C" { impl Drop for Arena {
pub fn upb_Arena_New() -> *mut Arena; #[inline]
pub fn upb_Arena_Free(arena: *mut Arena); fn drop(&mut self) {
unsafe {
upb_Arena_Free(self.raw);
}
}
} }
/// Represents serialized Protobuf wire format data. It's typically produced by /// Represents serialized Protobuf wire format data.
/// `<Message>.serialize()`. ///
#[derive(Debug)] /// It's typically produced by `<Message>::serialize()`.
pub struct SerializedData { pub struct SerializedData {
data: NonNull<u8>, data: NonNull<u8>,
len: usize, len: usize,
arena: *mut Arena,
// The arena that owns `data`.
_arena: Arena,
} }
impl SerializedData { impl SerializedData {
pub unsafe fn from_raw_parts(arena: *mut Arena, data: NonNull<u8>, len: usize) -> Self { pub unsafe fn from_raw_parts(arena: Arena, data: NonNull<u8>, len: usize) -> Self {
SerializedData { arena, data, len } SerializedData { _arena: arena, data, len }
} }
} }
@ -78,9 +154,9 @@ impl Deref for SerializedData {
} }
} }
impl Drop for SerializedData { impl fmt::Debug for SerializedData {
fn drop(&mut self) { fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
unsafe { Arena::free(self.arena) }; fmt::Debug::fmt(self.deref(), f)
} }
} }
@ -90,13 +166,13 @@ mod tests {
#[test] #[test]
fn test_arena_new_and_free() { fn test_arena_new_and_free() {
let arena = unsafe { Arena::new() }; let arena = Arena::new();
unsafe { Arena::free(arena) }; drop(arena);
} }
#[test] #[test]
fn test_serialized_data_roundtrip() { fn test_serialized_data_roundtrip() {
let arena = unsafe { Arena::new() }; let arena = Arena::new();
let original_data = b"Hello world"; let original_data = b"Hello world";
let len = original_data.len(); let len = original_data.len();

@ -97,6 +97,7 @@ bool RustGenerator::Generate(const FileDescriptor* file_desc,
auto v = file.printer().WithVars({ auto v = file.printer().WithVars({
{"std", "::__std"}, {"std", "::__std"},
{"pb", "::__pb"}, {"pb", "::__pb"},
{"pbi", "::__pb::__runtime"},
{"NonNull", "::__std::ptr::NonNull"}, {"NonNull", "::__std::ptr::NonNull"},
}); });

@ -56,7 +56,10 @@ void MessageStructFields(Context<Descriptor> msg) {
case Kernel::kUpb: case Kernel::kUpb:
msg.Emit(R"rs( msg.Emit(R"rs(
msg: $NonNull$<u8>, msg: $NonNull$<u8>,
arena: *mut $pb$::Arena, //~ rustc incorrectly thinks this field is never read, even though
//~ it has a destructor!
#[allow(dead_code)]
arena: $pbi$::Arena,
)rs"); )rs");
return; return;
} }
@ -74,9 +77,11 @@ void MessageNew(Context<Descriptor> msg) {
case Kernel::kUpb: case Kernel::kUpb:
msg.Emit({{"new_thunk", Thunk(msg, "new")}}, R"rs( msg.Emit({{"new_thunk", Thunk(msg, "new")}}, R"rs(
let arena = unsafe { $pb$::Arena::new() }; let arena = unsafe { $pbi$::Arena::new() };
let msg = unsafe { $new_thunk$(arena) }; Self {
$Msg$ { msg, arena } msg: unsafe { $new_thunk$(arena.raw()) },
arena,
}
)rs"); )rs");
return; return;
} }
@ -94,10 +99,10 @@ void MessageSerialize(Context<Descriptor> msg) {
case Kernel::kUpb: case Kernel::kUpb:
msg.Emit({{"serialize_thunk", Thunk(msg, "serialize")}}, R"rs( msg.Emit({{"serialize_thunk", Thunk(msg, "serialize")}}, R"rs(
let arena = unsafe { $pb$::__runtime::upb_Arena_New() }; let arena = $pbi$::Arena::new();
let mut len = 0; let mut len = 0;
unsafe { unsafe {
let data = $serialize_thunk$(self.msg, arena, &mut len); let data = $serialize_thunk$(self.msg, arena.raw(), &mut len);
$pb$::SerializedData::from_raw_parts(arena, data, len) $pb$::SerializedData::from_raw_parts(arena, data, len)
} }
)rs"); )rs");
@ -152,7 +157,7 @@ void MessageExterns(Context<Descriptor> msg) {
fn $new_thunk$() -> $NonNull$<u8>; fn $new_thunk$() -> $NonNull$<u8>;
fn $delete_thunk$(raw_msg: $NonNull$<u8>); fn $delete_thunk$(raw_msg: $NonNull$<u8>);
fn $serialize_thunk$(raw_msg: $NonNull$<u8>) -> $pb$::SerializedData; fn $serialize_thunk$(raw_msg: $NonNull$<u8>) -> $pb$::SerializedData;
fn $deserialize_thunk$( raw_msg: $NonNull$<u8>, data: $pb$::SerializedData) -> bool; fn $deserialize_thunk$(raw_msg: $NonNull$<u8>, data: $pb$::SerializedData) -> bool;
)rs"); )rs");
return; return;
@ -163,13 +168,9 @@ void MessageExterns(Context<Descriptor> msg) {
{"serialize_thunk", Thunk(msg, "serialize")}, {"serialize_thunk", Thunk(msg, "serialize")},
}, },
R"rs( R"rs(
fn $new_thunk$(arena: *mut $pb$::Arena) -> $NonNull$<u8>; fn $new_thunk$(arena: $pbi$::RawArena) -> $NonNull$<u8>;
fn $serialize_thunk$( fn $serialize_thunk$(msg: $NonNull$<u8>, arena: $pbi$::RawArena, len: &mut usize) -> $NonNull$<u8>;
msg: $NonNull$<u8>, )rs");
arena: *mut $pb$::Arena,
len: &mut usize,
) -> $NonNull$<u8>;
)rs");
return; return;
} }
@ -347,12 +348,12 @@ void MessageGenerator::GenerateThunksCc(Context<Descriptor> msg) {
}}, }},
}, },
R"cc( R"cc(
// $abi$ is a workaround for a syntax highlight bug in VSCode. However, //~ $abi$ is a workaround for a syntax highlight bug in VSCode. However,
// that confuses clang-format (it refuses to keep the newline after //~ that confuses clang-format (it refuses to keep the newline after
// `$abi${`). Disabling clang-format for the block. //~ `$abi${`). Disabling clang-format for the block.
// clang-format off // clang-format off
extern $abi$ { extern $abi$ {
void * $new_thunk$(){return new $QualifiedMsg$(); } void* $new_thunk$(){return new $QualifiedMsg$(); }
void $delete_thunk$(void* ptr) { delete static_cast<$QualifiedMsg$*>(ptr); } void $delete_thunk$(void* ptr) { delete static_cast<$QualifiedMsg$*>(ptr); }
google::protobuf::rust_internal::SerializedData $serialize_thunk$($QualifiedMsg$* msg) { google::protobuf::rust_internal::SerializedData $serialize_thunk$($QualifiedMsg$* msg) {
return google::protobuf::rust_internal::SerializeMsg(msg); return google::protobuf::rust_internal::SerializeMsg(msg);

Loading…
Cancel
Save