forked from BigfootDev/flatbuffers
* feat: add lookup_index_by_key to Rust Vector for index-based binary search * fix: remove duplicated code
352 lines
10 KiB
Rust
352 lines
10 KiB
Rust
/*
|
|
* Copyright 2018 Google Inc. All rights reserved.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
use core::cmp::Ordering;
|
|
use core::fmt::{Debug, Formatter, Result};
|
|
use core::iter::{DoubleEndedIterator, ExactSizeIterator, FusedIterator};
|
|
#[cfg(nightly)]
|
|
use core::iter::TrustedLen;
|
|
use core::marker::PhantomData;
|
|
use core::mem::{align_of, size_of};
|
|
use core::str::from_utf8_unchecked;
|
|
|
|
use crate::endian_scalar::read_scalar_at;
|
|
use crate::follow::Follow;
|
|
use crate::primitives::*;
|
|
|
|
pub struct Vector<'a, T: 'a>(&'a [u8], usize, PhantomData<T>);
|
|
|
|
impl<'a, T: 'a> Default for Vector<'a, T> {
|
|
fn default() -> Self {
|
|
// Static, length 0 vector.
|
|
// Note that derived default causes UB due to issues in read_scalar_at /facepalm.
|
|
Self(&[0; core::mem::size_of::<UOffsetT>()], 0, Default::default())
|
|
}
|
|
}
|
|
|
|
impl<'a, T> Debug for Vector<'a, T>
|
|
where
|
|
T: 'a + Follow<'a>,
|
|
<T as Follow<'a>>::Inner: Debug,
|
|
{
|
|
fn fmt(&self, f: &mut Formatter) -> Result {
|
|
f.debug_list().entries(self.iter()).finish()
|
|
}
|
|
}
|
|
|
|
// We cannot use derive for these two impls, as it would only implement Copy
|
|
// and Clone for `T: Copy` and `T: Clone` respectively. However `Vector<'a, T>`
|
|
// can always be copied, no matter that `T` you have.
|
|
impl<'a, T> Copy for Vector<'a, T> {}
|
|
|
|
impl<'a, T> Clone for Vector<'a, T> {
|
|
fn clone(&self) -> Self {
|
|
*self
|
|
}
|
|
}
|
|
|
|
impl<'a, T: 'a> Vector<'a, T> {
|
|
/// # Safety
|
|
///
|
|
/// `buf` contains a valid vector at `loc` consisting of
|
|
///
|
|
/// - UOffsetT element count
|
|
/// - Consecutive list of `T` elements
|
|
#[inline(always)]
|
|
pub unsafe fn new(buf: &'a [u8], loc: usize) -> Self {
|
|
Vector(buf, loc, PhantomData)
|
|
}
|
|
|
|
#[inline(always)]
|
|
pub fn len(&self) -> usize {
|
|
// Safety:
|
|
// Valid vector at time of construction starting with UOffsetT element count
|
|
unsafe { read_scalar_at::<UOffsetT>(self.0, self.1) as usize }
|
|
}
|
|
|
|
#[inline(always)]
|
|
pub fn is_empty(&self) -> bool {
|
|
self.len() == 0
|
|
}
|
|
|
|
#[inline(always)]
|
|
pub fn bytes(&self) -> &'a [u8] {
|
|
let sz = size_of::<T>();
|
|
let len = self.len();
|
|
&self.0[self.1 + SIZE_UOFFSET..self.1 + SIZE_UOFFSET + sz * len]
|
|
}
|
|
}
|
|
|
|
impl<'a, T: Follow<'a> + 'a> Vector<'a, T> {
|
|
#[inline(always)]
|
|
pub fn get(&self, idx: usize) -> T::Inner {
|
|
assert!(idx < self.len());
|
|
let sz = size_of::<T>();
|
|
debug_assert!(sz > 0);
|
|
// Safety:
|
|
// Valid vector at time of construction, verified that idx < element count
|
|
unsafe { T::follow(self.0, self.1 as usize + SIZE_UOFFSET + sz * idx) }
|
|
}
|
|
|
|
#[inline(always)]
|
|
pub fn lookup_by_key<K: Ord>(
|
|
&self,
|
|
key: K,
|
|
f: fn(&<T as Follow<'a>>::Inner, &K) -> Ordering,
|
|
) -> Option<T::Inner> {
|
|
self.lookup_index_by_key(key, f).map(|idx| self.get(idx))
|
|
}
|
|
|
|
/// Binary search by key, returning the index of the matching element.
|
|
///
|
|
/// This is similar to `lookup_by_key`, but returns the index of the found
|
|
/// element rather than the element itself. This is useful when you need
|
|
/// to reference elements by their position in the vector.
|
|
#[inline(always)]
|
|
pub fn lookup_index_by_key<K: Ord>(
|
|
&self,
|
|
key: K,
|
|
f: fn(&<T as Follow<'a>>::Inner, &K) -> Ordering,
|
|
) -> Option<usize> {
|
|
if self.is_empty() {
|
|
return None;
|
|
}
|
|
|
|
let mut left: usize = 0;
|
|
let mut right = self.len() - 1;
|
|
|
|
while left <= right {
|
|
let mid = (left + right) / 2;
|
|
let value = self.get(mid);
|
|
match f(&value, &key) {
|
|
Ordering::Equal => return Some(mid),
|
|
Ordering::Less => left = mid + 1,
|
|
Ordering::Greater => {
|
|
if mid == 0 {
|
|
return None;
|
|
}
|
|
right = mid - 1;
|
|
}
|
|
}
|
|
}
|
|
|
|
None
|
|
}
|
|
|
|
#[inline(always)]
|
|
pub fn iter(&self) -> VectorIter<'a, T> {
|
|
VectorIter::from_vector(*self)
|
|
}
|
|
}
|
|
|
|
/// # Safety
|
|
///
|
|
/// `buf` must contain a value of T at `loc` and have alignment of 1
|
|
pub unsafe fn follow_cast_ref<'a, T: Sized + 'a>(buf: &'a [u8], loc: usize) -> &'a T {
|
|
assert_eq!(align_of::<T>(), 1);
|
|
let sz = size_of::<T>();
|
|
let buf = &buf[loc..loc + sz];
|
|
let ptr = buf.as_ptr() as *const T;
|
|
// SAFETY
|
|
// buf contains a value at loc of type T and T has no alignment requirements
|
|
&*ptr
|
|
}
|
|
|
|
impl<'a> Follow<'a> for &'a str {
|
|
type Inner = &'a str;
|
|
unsafe fn follow(buf: &'a [u8], loc: usize) -> Self::Inner {
|
|
let len = read_scalar_at::<UOffsetT>(buf, loc) as usize;
|
|
let slice = &buf[loc + SIZE_UOFFSET..loc + SIZE_UOFFSET + len];
|
|
from_utf8_unchecked(slice)
|
|
}
|
|
}
|
|
|
|
impl<'a> Follow<'a> for &'a [u8] {
|
|
type Inner = &'a [u8];
|
|
unsafe fn follow(buf: &'a [u8], loc: usize) -> Self::Inner {
|
|
let len = read_scalar_at::<UOffsetT>(buf, loc) as usize;
|
|
&buf[loc + SIZE_UOFFSET..loc + SIZE_UOFFSET + len]
|
|
}
|
|
}
|
|
|
|
/// Implement Follow for all possible Vectors that have Follow-able elements.
|
|
impl<'a, T: Follow<'a> + 'a> Follow<'a> for Vector<'a, T> {
|
|
type Inner = Vector<'a, T>;
|
|
unsafe fn follow(buf: &'a [u8], loc: usize) -> Self::Inner {
|
|
Vector::new(buf, loc)
|
|
}
|
|
}
|
|
|
|
/// An iterator over a `Vector`.
|
|
#[derive(Debug)]
|
|
pub struct VectorIter<'a, T: 'a> {
|
|
buf: &'a [u8],
|
|
loc: usize,
|
|
remaining: usize,
|
|
phantom: PhantomData<T>,
|
|
}
|
|
|
|
impl<'a, T: 'a> VectorIter<'a, T> {
|
|
#[inline]
|
|
pub fn from_vector(inner: Vector<'a, T>) -> Self {
|
|
VectorIter {
|
|
buf: inner.0,
|
|
// inner.1 is the location of the data for the vector.
|
|
// The first SIZE_UOFFSET bytes is the length. We skip
|
|
// that to get to the actual vector content.
|
|
loc: inner.1 + SIZE_UOFFSET,
|
|
remaining: inner.len(),
|
|
phantom: PhantomData,
|
|
}
|
|
}
|
|
|
|
/// Creates a new `VectorIter` from the provided slice
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// buf must contain a contiguous sequence of `items_num` values of `T`
|
|
///
|
|
#[inline]
|
|
pub unsafe fn from_slice(buf: &'a [u8], items_num: usize) -> Self {
|
|
VectorIter { buf, loc: 0, remaining: items_num, phantom: PhantomData }
|
|
}
|
|
}
|
|
|
|
impl<'a, T: Follow<'a> + 'a> Clone for VectorIter<'a, T> {
|
|
#[inline]
|
|
fn clone(&self) -> Self {
|
|
VectorIter {
|
|
buf: self.buf,
|
|
loc: self.loc,
|
|
remaining: self.remaining,
|
|
phantom: self.phantom,
|
|
}
|
|
}
|
|
}
|
|
|
|
impl<'a, T: Follow<'a> + 'a> Iterator for VectorIter<'a, T> {
|
|
type Item = T::Inner;
|
|
|
|
#[inline]
|
|
fn next(&mut self) -> Option<T::Inner> {
|
|
let sz = size_of::<T>();
|
|
debug_assert!(sz > 0);
|
|
|
|
if self.remaining == 0 {
|
|
None
|
|
} else {
|
|
// Safety:
|
|
// VectorIter can only be created from a contiguous sequence of `items_num`
|
|
// And remaining is initialized to `items_num`
|
|
let result = unsafe { T::follow(self.buf, self.loc) };
|
|
self.loc += sz;
|
|
self.remaining -= 1;
|
|
Some(result)
|
|
}
|
|
}
|
|
|
|
#[inline]
|
|
fn nth(&mut self, n: usize) -> Option<T::Inner> {
|
|
let sz = size_of::<T>();
|
|
debug_assert!(sz > 0);
|
|
|
|
self.remaining = self.remaining.saturating_sub(n);
|
|
|
|
// Note that this might overflow, but that is okay because
|
|
// in that case self.remaining will have been set to zero.
|
|
self.loc = self.loc.wrapping_add(sz * n);
|
|
|
|
self.next()
|
|
}
|
|
|
|
#[inline]
|
|
fn size_hint(&self) -> (usize, Option<usize>) {
|
|
(self.remaining, Some(self.remaining))
|
|
}
|
|
}
|
|
|
|
impl<'a, T: Follow<'a> + 'a> DoubleEndedIterator for VectorIter<'a, T> {
|
|
#[inline]
|
|
fn next_back(&mut self) -> Option<T::Inner> {
|
|
let sz = size_of::<T>();
|
|
debug_assert!(sz > 0);
|
|
|
|
if self.remaining == 0 {
|
|
None
|
|
} else {
|
|
self.remaining -= 1;
|
|
// Safety:
|
|
// VectorIter can only be created from a contiguous sequence of `items_num`
|
|
// And remaining is initialized to `items_num`
|
|
Some(unsafe { T::follow(self.buf, self.loc + sz * self.remaining) })
|
|
}
|
|
}
|
|
|
|
#[inline]
|
|
fn nth_back(&mut self, n: usize) -> Option<T::Inner> {
|
|
self.remaining = self.remaining.saturating_sub(n);
|
|
self.next_back()
|
|
}
|
|
}
|
|
|
|
impl<'a, T: 'a + Follow<'a>> ExactSizeIterator for VectorIter<'a, T> {
|
|
#[inline]
|
|
fn len(&self) -> usize {
|
|
self.remaining
|
|
}
|
|
}
|
|
|
|
#[cfg(nightly)]
|
|
unsafe impl<'a, T: Follow<'a> + 'a> TrustedLen for VectorIter<'a, T> {}
|
|
|
|
impl<'a, T: 'a + Follow<'a>> FusedIterator for VectorIter<'a, T> {}
|
|
|
|
impl<'a, T: Follow<'a> + 'a> IntoIterator for Vector<'a, T> {
|
|
type Item = T::Inner;
|
|
type IntoIter = VectorIter<'a, T>;
|
|
#[inline]
|
|
fn into_iter(self) -> Self::IntoIter {
|
|
self.iter()
|
|
}
|
|
}
|
|
|
|
impl<'a, 'b, T: Follow<'a> + 'a> IntoIterator for &'b Vector<'a, T> {
|
|
type Item = T::Inner;
|
|
type IntoIter = VectorIter<'a, T>;
|
|
fn into_iter(self) -> Self::IntoIter {
|
|
self.iter()
|
|
}
|
|
}
|
|
|
|
#[cfg(feature = "serialize")]
|
|
impl<'a, T> serde::ser::Serialize for Vector<'a, T>
|
|
where
|
|
T: 'a + Follow<'a>,
|
|
<T as Follow<'a>>::Inner: serde::ser::Serialize,
|
|
{
|
|
fn serialize<S>(&self, serializer: S) -> std::result::Result<S::Ok, S::Error>
|
|
where
|
|
S: serde::ser::Serializer,
|
|
{
|
|
use serde::ser::SerializeSeq;
|
|
let mut seq = serializer.serialize_seq(Some(self.len()))?;
|
|
for element in self {
|
|
seq.serialize_element(&element)?;
|
|
}
|
|
seq.end()
|
|
}
|
|
}
|