/* * Copyright 2018 Google Inc. All rights reserved. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ use core::cmp::Ordering; use core::fmt::{Debug, Formatter, Result}; use core::iter::{DoubleEndedIterator, ExactSizeIterator, FusedIterator}; #[cfg(nightly)] use core::iter::TrustedLen; use core::marker::PhantomData; use core::mem::{align_of, size_of}; use core::str::from_utf8_unchecked; use crate::endian_scalar::read_scalar_at; use crate::follow::Follow; use crate::primitives::*; pub struct Vector<'a, T: 'a>(&'a [u8], usize, PhantomData); impl<'a, T: 'a> Default for Vector<'a, T> { fn default() -> Self { // Static, length 0 vector. // Note that derived default causes UB due to issues in read_scalar_at /facepalm. Self(&[0; core::mem::size_of::()], 0, Default::default()) } } impl<'a, T> Debug for Vector<'a, T> where T: 'a + Follow<'a>, >::Inner: Debug, { fn fmt(&self, f: &mut Formatter) -> Result { f.debug_list().entries(self.iter()).finish() } } // We cannot use derive for these two impls, as it would only implement Copy // and Clone for `T: Copy` and `T: Clone` respectively. However `Vector<'a, T>` // can always be copied, no matter that `T` you have. impl<'a, T> Copy for Vector<'a, T> {} impl<'a, T> Clone for Vector<'a, T> { fn clone(&self) -> Self { *self } } impl<'a, T: 'a> Vector<'a, T> { /// # Safety /// /// `buf` contains a valid vector at `loc` consisting of /// /// - UOffsetT element count /// - Consecutive list of `T` elements #[inline(always)] pub unsafe fn new(buf: &'a [u8], loc: usize) -> Self { Vector(buf, loc, PhantomData) } #[inline(always)] pub fn len(&self) -> usize { // Safety: // Valid vector at time of construction starting with UOffsetT element count unsafe { read_scalar_at::(self.0, self.1) as usize } } #[inline(always)] pub fn is_empty(&self) -> bool { self.len() == 0 } #[inline(always)] pub fn bytes(&self) -> &'a [u8] { let sz = size_of::(); let len = self.len(); &self.0[self.1 + SIZE_UOFFSET..self.1 + SIZE_UOFFSET + sz * len] } } impl<'a, T: Follow<'a> + 'a> Vector<'a, T> { #[inline(always)] pub fn get(&self, idx: usize) -> T::Inner { assert!(idx < self.len()); let sz = size_of::(); debug_assert!(sz > 0); // Safety: // Valid vector at time of construction, verified that idx < element count unsafe { T::follow(self.0, self.1 as usize + SIZE_UOFFSET + sz * idx) } } #[inline(always)] pub fn lookup_by_key( &self, key: K, f: fn(&>::Inner, &K) -> Ordering, ) -> Option { if self.is_empty() { return None; } let mut left: usize = 0; let mut right = self.len() - 1; while left <= right { let mid = (left + right) / 2; let value = self.get(mid); match f(&value, &key) { Ordering::Equal => return Some(value), Ordering::Less => left = mid + 1, Ordering::Greater => { if mid == 0 { return None; } right = mid - 1; } } } None } #[inline(always)] pub fn iter(&self) -> VectorIter<'a, T> { VectorIter::from_vector(*self) } } /// # Safety /// /// `buf` must contain a value of T at `loc` and have alignment of 1 pub unsafe fn follow_cast_ref<'a, T: Sized + 'a>(buf: &'a [u8], loc: usize) -> &'a T { assert_eq!(align_of::(), 1); let sz = size_of::(); let buf = &buf[loc..loc + sz]; let ptr = buf.as_ptr() as *const T; // SAFETY // buf contains a value at loc of type T and T has no alignment requirements &*ptr } impl<'a> Follow<'a> for &'a str { type Inner = &'a str; unsafe fn follow(buf: &'a [u8], loc: usize) -> Self::Inner { let len = read_scalar_at::(buf, loc) as usize; let slice = &buf[loc + SIZE_UOFFSET..loc + SIZE_UOFFSET + len]; from_utf8_unchecked(slice) } } impl<'a> Follow<'a> for &'a [u8] { type Inner = &'a [u8]; unsafe fn follow(buf: &'a [u8], loc: usize) -> Self::Inner { let len = read_scalar_at::(buf, loc) as usize; &buf[loc + SIZE_UOFFSET..loc + SIZE_UOFFSET + len] } } /// Implement Follow for all possible Vectors that have Follow-able elements. impl<'a, T: Follow<'a> + 'a> Follow<'a> for Vector<'a, T> { type Inner = Vector<'a, T>; unsafe fn follow(buf: &'a [u8], loc: usize) -> Self::Inner { Vector::new(buf, loc) } } /// An iterator over a `Vector`. #[derive(Debug)] pub struct VectorIter<'a, T: 'a> { buf: &'a [u8], loc: usize, remaining: usize, phantom: PhantomData, } impl<'a, T: 'a> VectorIter<'a, T> { #[inline] pub fn from_vector(inner: Vector<'a, T>) -> Self { VectorIter { buf: inner.0, // inner.1 is the location of the data for the vector. // The first SIZE_UOFFSET bytes is the length. We skip // that to get to the actual vector content. loc: inner.1 + SIZE_UOFFSET, remaining: inner.len(), phantom: PhantomData, } } /// Creates a new `VectorIter` from the provided slice /// /// # Safety /// /// buf must contain a contiguous sequence of `items_num` values of `T` /// #[inline] pub unsafe fn from_slice(buf: &'a [u8], items_num: usize) -> Self { VectorIter { buf, loc: 0, remaining: items_num, phantom: PhantomData } } } impl<'a, T: Follow<'a> + 'a> Clone for VectorIter<'a, T> { #[inline] fn clone(&self) -> Self { VectorIter { buf: self.buf, loc: self.loc, remaining: self.remaining, phantom: self.phantom, } } } impl<'a, T: Follow<'a> + 'a> Iterator for VectorIter<'a, T> { type Item = T::Inner; #[inline] fn next(&mut self) -> Option { let sz = size_of::(); debug_assert!(sz > 0); if self.remaining == 0 { None } else { // Safety: // VectorIter can only be created from a contiguous sequence of `items_num` // And remaining is initialized to `items_num` let result = unsafe { T::follow(self.buf, self.loc) }; self.loc += sz; self.remaining -= 1; Some(result) } } #[inline] fn nth(&mut self, n: usize) -> Option { let sz = size_of::(); debug_assert!(sz > 0); self.remaining = self.remaining.saturating_sub(n); // Note that this might overflow, but that is okay because // in that case self.remaining will have been set to zero. self.loc = self.loc.wrapping_add(sz * n); self.next() } #[inline] fn size_hint(&self) -> (usize, Option) { (self.remaining, Some(self.remaining)) } } impl<'a, T: Follow<'a> + 'a> DoubleEndedIterator for VectorIter<'a, T> { #[inline] fn next_back(&mut self) -> Option { let sz = size_of::(); debug_assert!(sz > 0); if self.remaining == 0 { None } else { self.remaining -= 1; // Safety: // VectorIter can only be created from a contiguous sequence of `items_num` // And remaining is initialized to `items_num` Some(unsafe { T::follow(self.buf, self.loc + sz * self.remaining) }) } } #[inline] fn nth_back(&mut self, n: usize) -> Option { self.remaining = self.remaining.saturating_sub(n); self.next_back() } } impl<'a, T: 'a + Follow<'a>> ExactSizeIterator for VectorIter<'a, T> { #[inline] fn len(&self) -> usize { self.remaining } } #[cfg(nightly)] unsafe impl<'a, T: Follow<'a> + 'a> TrustedLen for VectorIter<'a, T> {} impl<'a, T: 'a + Follow<'a>> FusedIterator for VectorIter<'a, T> {} impl<'a, T: Follow<'a> + 'a> IntoIterator for Vector<'a, T> { type Item = T::Inner; type IntoIter = VectorIter<'a, T>; #[inline] fn into_iter(self) -> Self::IntoIter { self.iter() } } impl<'a, 'b, T: Follow<'a> + 'a> IntoIterator for &'b Vector<'a, T> { type Item = T::Inner; type IntoIter = VectorIter<'a, T>; fn into_iter(self) -> Self::IntoIter { self.iter() } } #[cfg(feature = "serialize")] impl<'a, T> serde::ser::Serialize for Vector<'a, T> where T: 'a + Follow<'a>, >::Inner: serde::ser::Serialize, { fn serialize(&self, serializer: S) -> std::result::Result where S: serde::ser::Serializer, { use serde::ser::SerializeSeq; let mut seq = serializer.serialize_seq(Some(self.len()))?; for element in self { seq.serialize_element(&element)?; } seq.end() } }