// Protocol Buffers - Google's data interchange format // Copyright 2023 Google Inc. All rights reserved. // https://developers.google.com/protocol-buffers/ // // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following disclaimer // in the documentation and/or other materials provided with the // distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived from // this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. //! Operating on borrowed data owned by a message is a central concept in //! Protobuf (and Rust in general). The way this is normally accomplished in //! Rust is to pass around references and operate on those. Unfortunately, //! references come with two major drawbacks: //! //! * We must store the value somewhere in the memory to create a reference to //! it. The value must be readable by a single load. However for Protobuf //! fields it happens that the actual memory representation of a value differs //! from what users expect and it is an implementation detail that can change //! as more optimizations are implemented. For example, rarely accessed //! `int64` fields can be represented in a packed format with 32 bits for the //! value in the common case. Or, a single logical value can be spread across //! multiple memory locations. For example, presence information for all the //! fields in a protobuf message is centralized in a bitset. //! * We cannot store extra data on the reference that might be necessary for //! correctly manipulating it (and custom-metadata DSTs do not exist yet in //! Rust). Concretely, messages, string, bytes, and repeated fields in UPB //! need to carry around an arena parameter separate from the data pointer to //! enable mutation (for example adding an element to a repeated field) or //! potentially to enable optimizations (for example referencing a string //! value using a Cord-like type instead of copying it if the source and //! target messages are on the same arena already). Mutable references to //! messages have one additional drawback: Rust allows users to //! indiscriminately run a bytewise swap() on mutable references, which could //! result in pointers to the wrong arena winding up on a message. For //! example, imagine swapping a submessage across two root messages allocated //! on distinct arenas A and B; after the swap, the message allocated in A may //! contain pointers from B by way of the submessage, because the swap does //! not know to fix up those pointers as needed. The C++ API uses //! message-owned arenas, and this ends up resembling self-referential types, //! which need `Pin` in order to be sound. However, `Pin` has much stronger //! guarantees than we need to uphold. //! //! These drawbacks put the "idiomatic Rust" goal in conflict with the //! "performance", "evolvability", and "safety" goals. Given the project design //! priorities we decided to not use plain Rust references. Instead, we //! implemented the concept of "proxy" types. Proxy types are a reference-like //! indirection between the user and the internal memory representation. use std::fmt::Debug; use std::marker::{Send, Sync}; /// A type that can be accessed through a reference-like proxy. /// /// An instance of a `Proxied` can be accessed /// immutably via `Proxied::View` and mutably via `Proxied::Mut`. /// /// All Protobuf field types implement `Proxied`. pub trait Proxied { /// The proxy type that provides shared access to a `T`, like a `&'a T`. /// /// Most code should use the type alias [`View`]. type View<'a>: ViewProxy<'a, Proxied = Self> + Copy + Send where Self: 'a; /// The proxy type that provides exclusive mutable access to a `T`, like a /// `&'a mut T`. /// /// Most code should use the type alias [`Mut`]. type Mut<'a>: MutProxy<'a, Proxied = Self> where Self: 'a; } /// A proxy type that provides shared access to a `T`, like a `&'a T`. /// /// This is more concise than fully spelling the associated type. #[allow(dead_code)] pub type View<'a, T> = ::View<'a>; /// A proxy type that provides exclusive mutable access to a `T`, like a /// `&'a mut T`. /// /// This is more concise than fully spelling the associated type. #[allow(dead_code)] pub type Mut<'a, T> = ::Mut<'a>; /// Declares conversion operations common to all views. /// /// This trait is intentionally made non-object-safe to prevent a potential /// future incompatible change. pub trait ViewProxy<'a>: 'a + Sized + Sync + Unpin + Sized + Debug { type Proxied: 'a + Proxied + ?Sized; /// Converts a borrow into a `View` with the lifetime of that borrow. /// /// In non-generic code we don't need to use `as_view` because the proxy /// types are covariant over `'a`. However, generic code conservatively /// treats `'a` as [invariant], therefore we need to call /// `as_view` to explicitly perform the operation that in concrete code /// coercion would perform implicitly. /// /// For example, the call to `.as_view()` in the following snippet /// wouldn't be necessary in concrete code: /// ``` /// fn reborrow<'a, 'b, T>(x: &'b View<'a, T>) -> View<'b, T> /// where 'a: 'b, T: Proxied /// { /// x.as_view() /// } /// ``` /// /// [invariant]: https://doc.rust-lang.org/nomicon/subtyping.html#variance fn as_view(&self) -> View<'_, Self::Proxied>; /// Converts into a `View` with a potentially shorter lifetime. /// /// In non-generic code we don't need to use `into_view` because the proxy /// types are covariant over `'a`. However, generic code conservatively /// treats `'a` as [invariant], therefore we need to call /// `into_view` to explicitly perform the operation that in concrete /// code coercion would perform implicitly. /// /// ``` /// fn reborrow_generic_view_into_view<'a, 'b, T>( /// x: View<'a, T>, /// y: View<'b, T>, /// ) -> [View<'b, T>; 2] /// where /// T: Proxied, /// 'a: 'b, /// { /// // `[x, y]` fails to compile because `'a` is not the same as `'b` and the `View` /// // lifetime parameter is (conservatively) invariant. /// // `[x.as_view(), y]` fails because that borrow cannot outlive `'b`. /// [x.into_view(), y] /// } /// ``` /// /// [invariant]: https://doc.rust-lang.org/nomicon/subtyping.html#variance fn into_view<'shorter>(self) -> View<'shorter, Self::Proxied> where 'a: 'shorter; } /// Declares operations common to all mutators. /// /// This trait is intentionally made non-object-safe to prevent a potential /// future incompatible change. pub trait MutProxy<'a>: ViewProxy<'a> { /// Converts a borrow into a `Mut` with the lifetime of that borrow. /// /// This function enables calling multiple methods consuming `self`, for /// example: /// /// ```ignore /// let mut sub: Mut = msg.submsg_mut().or_default(); /// sub.as_mut().field_x_mut().set(10); // field_x_mut is fn(self) /// sub.field_y_mut().set(20); // `sub` is now consumed /// ``` /// /// `as_mut` is also useful in generic code to explicitly perform the /// operation that in concrete code coercion would perform implicitly. fn as_mut(&mut self) -> Mut<'_, Self::Proxied>; /// Converts into a `Mut` with a potentially shorter lifetime. /// /// In non-generic code we don't need to use `into_mut` because the proxy /// types are covariant over `'a`. However, generic code conservatively /// treats `'a` as [invariant], therefore we need to call /// `into_mut` to explicitly perform the operation that in concrete code /// coercion would perform implicitly. /// /// ``` /// fn reborrow_generic_mut_into_mut<'a, 'b, T>(x: Mut<'a, T>, y: Mut<'b, T>) -> [Mut<'b, T>; 2] /// where /// T: Proxied, /// 'a: 'b, /// { /// // `[x, y]` fails to compile because `'a` is not the same as `'b` and the `Mut` /// // lifetime parameter is (conservatively) invariant. /// // `[x.as_mut(), y]` fails because that borrow cannot outlive `'b`. /// [x.into_mut(), y] /// } /// ``` /// /// [invariant]: https://doc.rust-lang.org/nomicon/subtyping.html#variance fn into_mut<'shorter>(self) -> Mut<'shorter, Self::Proxied> where 'a: 'shorter; } #[cfg(test)] mod tests { use super::*; #[derive(Debug, PartialEq)] struct MyProxied { val: String, } impl MyProxied { fn as_view(&self) -> View<'_, Self> { MyProxiedView { my_proxied_ref: self } } fn as_mut(&mut self) -> Mut<'_, Self> { MyProxiedMut { my_proxied_ref: self } } } impl Proxied for MyProxied { type View<'a> = MyProxiedView<'a>; type Mut<'a> = MyProxiedMut<'a>; } #[derive(Debug, Clone, Copy)] struct MyProxiedView<'a> { my_proxied_ref: &'a MyProxied, } impl MyProxiedView<'_> { fn val(&self) -> &str { &self.my_proxied_ref.val } } impl<'a> ViewProxy<'a> for MyProxiedView<'a> { type Proxied = MyProxied; fn as_view(&self) -> View<'a, MyProxied> { *self } fn into_view<'shorter>(self) -> View<'shorter, MyProxied> where 'a: 'shorter, { self } } #[derive(Debug)] struct MyProxiedMut<'a> { my_proxied_ref: &'a mut MyProxied, } impl MyProxiedMut<'_> { fn set_val(&mut self, new_val: String) { self.my_proxied_ref.val = new_val; } } impl<'a> ViewProxy<'a> for MyProxiedMut<'a> { type Proxied = MyProxied; fn as_view(&self) -> View<'_, MyProxied> { MyProxiedView { my_proxied_ref: self.my_proxied_ref } } fn into_view<'shorter>(self) -> View<'shorter, MyProxied> where 'a: 'shorter, { MyProxiedView { my_proxied_ref: self.my_proxied_ref } } } impl<'a> MutProxy<'a> for MyProxiedMut<'a> { fn as_mut(&mut self) -> Mut<'_, MyProxied> { MyProxiedMut { my_proxied_ref: self.my_proxied_ref } } fn into_mut<'shorter>(self) -> Mut<'shorter, MyProxied> where 'a: 'shorter, { self } } #[test] fn test_as_view() { let my_proxied = MyProxied { val: "Hello World".to_string() }; let my_view = my_proxied.as_view(); assert_eq!(my_view.val(), my_proxied.val); } #[test] fn test_as_mut() { let mut my_proxied = MyProxied { val: "Hello World".to_string() }; let mut my_mut = my_proxied.as_mut(); my_mut.set_val("Hello indeed".to_string()); let val_after_set = my_mut.as_view().val().to_string(); assert_eq!(my_proxied.val, val_after_set); assert_eq!(my_proxied.val, "Hello indeed"); } fn reborrow_mut_into_view<'a>(x: Mut<'a, MyProxied>) -> View<'a, MyProxied> { // x.as_view() fails to compile with: // `ERROR: attempt to return function-local borrowed content` x.into_view() // OK: we return the same lifetime as we got in. } #[test] fn test_mut_into_view() { let mut my_proxied = MyProxied { val: "Hello World".to_string() }; reborrow_mut_into_view(my_proxied.as_mut()); } fn require_unified_lifetimes<'a>(_x: Mut<'a, MyProxied>, _y: View<'a, MyProxied>) {} #[test] fn test_require_unified_lifetimes() { let mut my_proxied = MyProxied { val: "Hello1".to_string() }; let my_mut = my_proxied.as_mut(); { let other_proxied = MyProxied { val: "Hello2".to_string() }; let other_view = other_proxied.as_view(); require_unified_lifetimes(my_mut, other_view); } } fn reborrow_generic_as_view<'a, 'b, T>( x: &'b mut Mut<'a, T>, y: &'b View<'a, T>, ) -> [View<'b, T>; 2] where T: Proxied, 'a: 'b, { // `[x, y]` fails to compile because `'a` is not the same as `'b` and the `View` // lifetime parameter is (conservatively) invariant. [x.as_view(), y.as_view()] } #[test] fn test_reborrow_generic_as_view() { let mut my_proxied = MyProxied { val: "Hello1".to_string() }; let mut my_mut = my_proxied.as_mut(); let my_ref = &mut my_mut; { let other_proxied = MyProxied { val: "Hello2".to_string() }; let other_view = other_proxied.as_view(); reborrow_generic_as_view::(my_ref, &other_view); } } fn reborrow_generic_view_into_view<'a, 'b, T>( x: View<'a, T>, y: View<'b, T>, ) -> [View<'b, T>; 2] where T: Proxied, 'a: 'b, { // `[x, y]` fails to compile because `'a` is not the same as `'b` and the `View` // lifetime parameter is (conservatively) invariant. // `[x.as_view(), y]` fails because that borrow cannot outlive `'b`. [x.into_view(), y] } #[test] fn test_reborrow_generic_into_view() { let my_proxied = MyProxied { val: "Hello1".to_string() }; let my_view = my_proxied.as_view(); { let other_proxied = MyProxied { val: "Hello2".to_string() }; let other_view = other_proxied.as_view(); reborrow_generic_view_into_view::(my_view, other_view); } } fn reborrow_generic_mut_into_view<'a, 'b, T>(x: Mut<'a, T>, y: View<'b, T>) -> [View<'b, T>; 2] where T: Proxied, 'a: 'b, { [x.into_view(), y] } #[test] fn test_reborrow_generic_mut_into_view() { let mut my_proxied = MyProxied { val: "Hello1".to_string() }; let my_mut = my_proxied.as_mut(); { let other_proxied = MyProxied { val: "Hello2".to_string() }; let other_view = other_proxied.as_view(); reborrow_generic_mut_into_view::(my_mut, other_view); } } fn reborrow_generic_mut_into_mut<'a, 'b, T>(x: Mut<'a, T>, y: Mut<'b, T>) -> [Mut<'b, T>; 2] where T: Proxied, 'a: 'b, { // `[x, y]` fails to compile because `'a` is not the same as `'b` and the `Mut` // lifetime parameter is (conservatively) invariant. // `[x.as_mut(), y]` fails because that borrow cannot outlive `'b`. [x.into_mut(), y] } #[test] fn test_reborrow_generic_mut_into_mut() { let mut my_proxied = MyProxied { val: "Hello1".to_string() }; let my_mut = my_proxied.as_mut(); { let mut other_proxied = MyProxied { val: "Hello2".to_string() }; let other_mut = other_proxied.as_mut(); // No need to reborrow, even though lifetime of &other_view is different // than the lifetiem of my_ref. Rust references are covariant over their // lifetime. reborrow_generic_mut_into_mut::(my_mut, other_mut); } } }