2023-03-14 16:37:47 +01:00
|
|
|
use std::fmt;
|
2023-03-06 19:21:55 +01:00
|
|
|
use std::hash::Hash;
|
|
|
|
use std::marker::PhantomData;
|
|
|
|
|
2023-03-08 09:55:53 +01:00
|
|
|
use fxhash::FxHashMap;
|
|
|
|
|
2023-03-30 09:56:18 +02:00
|
|
|
use super::small_bitmap::SmallBitmap;
|
|
|
|
|
2023-03-16 09:58:59 +01:00
|
|
|
/// A typed handle designating one slot of an interner ([`FixedSizeInterner`],
/// [`DedupInterner`], or [`MappedInterner`]).
///
/// Only the raw `u16` position is stored; the value type `T` is carried purely
/// at the type level through [`PhantomData`].
pub struct Interned<T> {
    /// Raw position of the designated value in the interner's backing storage.
    idx: u16,
    /// Zero-sized marker tying the handle to the value type `T`.
    _phantom: PhantomData<T>,
}
|
|
|
|
impl<T> Interned<T> {
|
2023-03-16 09:58:59 +01:00
|
|
|
/// Create an interned value manually from its raw index within the interner.
|
|
|
|
pub fn from_raw(idx: u16) -> Self {
|
2023-03-06 19:21:55 +01:00
|
|
|
Self { idx, _phantom: PhantomData }
|
|
|
|
}
|
2023-03-16 09:58:59 +01:00
|
|
|
/// Get the raw index from the interned value
|
|
|
|
pub fn into_raw(self) -> u16 {
|
2023-03-14 16:37:47 +01:00
|
|
|
self.idx
|
|
|
|
}
|
2023-03-06 19:21:55 +01:00
|
|
|
}
|
2023-03-13 12:46:32 +01:00
|
|
|
|
2023-03-16 09:58:59 +01:00
|
|
|
/// A [`DedupInterner`] is used to store a unique copy of a value of type `T`. This value
|
2023-03-08 13:26:29 +01:00
|
|
|
/// is then identified by a lightweight index of type [`Interned<T>`], which can
|
|
|
|
/// be copied, compared, and hashed efficiently. An immutable reference to the original value
|
2023-03-16 09:58:59 +01:00
|
|
|
/// can be retrieved using `self.get(interned)`. A set of values within the interner can be
|
|
|
|
/// efficiently managed using [`SmallBitmap<T>`](super::small_bitmap::SmallBitmap).
|
2023-03-16 11:52:51 +01:00
|
|
|
///
|
|
|
|
/// A dedup-interner can contain a maximum of `u16::MAX` values.
|
2023-03-13 14:03:48 +01:00
|
|
|
#[derive(Clone)]
|
2023-03-14 16:37:47 +01:00
|
|
|
pub struct DedupInterner<T> {
|
2023-03-06 19:21:55 +01:00
|
|
|
stable_store: Vec<T>,
|
2023-03-21 10:44:40 +01:00
|
|
|
lookup: FxHashMap<T, Interned<T>>, // TODO: Arc
|
2023-03-06 19:21:55 +01:00
|
|
|
}
|
2023-03-14 16:37:47 +01:00
|
|
|
impl<T> Default for DedupInterner<T> {
|
2023-03-06 19:21:55 +01:00
|
|
|
fn default() -> Self {
|
|
|
|
Self { stable_store: Default::default(), lookup: Default::default() }
|
|
|
|
}
|
|
|
|
}
|
2023-03-14 16:37:47 +01:00
|
|
|
impl<T> DedupInterner<T> {
|
2023-03-16 11:52:51 +01:00
|
|
|
/// Convert the dedup-interner into a fixed-size interner, such that new
|
|
|
|
/// elements cannot be added to it anymore.
|
2023-03-14 16:37:47 +01:00
|
|
|
pub fn freeze(self) -> FixedSizeInterner<T> {
|
|
|
|
FixedSizeInterner { stable_store: self.stable_store }
|
|
|
|
}
|
|
|
|
}
|
2023-03-06 19:21:55 +01:00
|
|
|
|
2023-03-14 16:37:47 +01:00
|
|
|
impl<T> DedupInterner<T>
|
2023-03-06 19:21:55 +01:00
|
|
|
where
|
|
|
|
T: Clone + Eq + Hash,
|
|
|
|
{
|
2023-03-16 11:52:51 +01:00
|
|
|
/// Insert the given value into the dedup-interner, and return
|
|
|
|
/// its index.
|
2023-03-06 19:21:55 +01:00
|
|
|
pub fn insert(&mut self, s: T) -> Interned<T> {
|
|
|
|
if let Some(interned) = self.lookup.get(&s) {
|
|
|
|
*interned
|
|
|
|
} else {
|
2023-03-14 16:37:47 +01:00
|
|
|
assert!(self.stable_store.len() < u16::MAX as usize);
|
2023-03-06 19:21:55 +01:00
|
|
|
self.stable_store.push(s.clone());
|
2023-03-16 09:58:59 +01:00
|
|
|
let interned = Interned::from_raw(self.stable_store.len() as u16 - 1);
|
2023-03-06 19:21:55 +01:00
|
|
|
self.lookup.insert(s, interned);
|
|
|
|
interned
|
|
|
|
}
|
|
|
|
}
|
2023-03-16 11:52:51 +01:00
|
|
|
/// Get a reference to the interned value.
|
2023-03-06 19:21:55 +01:00
|
|
|
pub fn get(&self, interned: Interned<T>) -> &T {
|
|
|
|
&self.stable_store[interned.idx as usize]
|
|
|
|
}
|
|
|
|
}
|
2023-03-14 16:37:47 +01:00
|
|
|
|
2023-03-16 11:52:51 +01:00
|
|
|
/// A store of values of type `T` whose length is fixed, each value being
/// designated by an [`Interned<T>`] handle.
#[derive(Clone)]
pub struct FixedSizeInterner<T> {
    /// Backing storage; a handle's raw index is a position in this vector.
    stable_store: Vec<T>,
}
|
|
|
|
impl<T: Clone> FixedSizeInterner<T> {
|
2023-03-16 11:52:51 +01:00
|
|
|
/// Create a fixed-size interner of the given length containing
|
|
|
|
/// clones of the given value.
|
2023-03-14 16:37:47 +01:00
|
|
|
pub fn new(length: u16, value: T) -> Self {
|
|
|
|
Self { stable_store: vec![value; length as usize] }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<T> FixedSizeInterner<T> {
|
|
|
|
pub fn from_vec(store: Vec<T>) -> Self {
|
|
|
|
Self { stable_store: store }
|
|
|
|
}
|
2023-03-30 09:56:18 +02:00
|
|
|
pub fn all_interned_values(&self) -> SmallBitmap<T> {
|
|
|
|
let mut b = SmallBitmap::for_interned_values_in(self);
|
|
|
|
for i in self.indexes() {
|
|
|
|
b.insert(i);
|
|
|
|
}
|
|
|
|
b
|
|
|
|
}
|
2023-03-14 16:37:47 +01:00
|
|
|
pub fn get(&self, interned: Interned<T>) -> &T {
|
|
|
|
&self.stable_store[interned.idx as usize]
|
|
|
|
}
|
|
|
|
pub fn get_mut(&mut self, interned: Interned<T>) -> &mut T {
|
|
|
|
&mut self.stable_store[interned.idx as usize]
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn len(&self) -> u16 {
|
|
|
|
self.stable_store.len() as u16
|
|
|
|
}
|
2023-03-30 09:56:18 +02:00
|
|
|
pub fn map_move<U>(self, map_f: impl Fn(T) -> U) -> FixedSizeInterner<U> {
|
|
|
|
FixedSizeInterner { stable_store: self.stable_store.into_iter().map(map_f).collect() }
|
|
|
|
}
|
2023-03-20 09:37:11 +01:00
|
|
|
pub fn map<U>(&self, map_f: impl Fn(&T) -> U) -> MappedInterner<T, U> {
|
2023-03-14 16:37:47 +01:00
|
|
|
MappedInterner {
|
|
|
|
stable_store: self.stable_store.iter().map(map_f).collect(),
|
|
|
|
_phantom: PhantomData,
|
|
|
|
}
|
|
|
|
}
|
2023-03-30 09:56:18 +02:00
|
|
|
pub fn map_indexes<U>(&self, map_f: impl Fn(Interned<T>) -> U) -> MappedInterner<T, U> {
|
|
|
|
MappedInterner { stable_store: self.indexes().map(map_f).collect(), _phantom: PhantomData }
|
|
|
|
}
|
|
|
|
pub fn indexes(&self) -> impl Iterator<Item = Interned<T>> {
|
|
|
|
(0..self.stable_store.len()).map(|i| Interned::from_raw(i as u16))
|
|
|
|
}
|
|
|
|
pub fn iter(&self) -> impl Iterator<Item = (Interned<T>, &T)> {
|
|
|
|
self.stable_store.iter().enumerate().map(|(i, x)| (Interned::from_raw(i as u16), x))
|
|
|
|
}
|
|
|
|
pub fn iter_mut(&mut self) -> impl Iterator<Item = (Interned<T>, &mut T)> {
|
|
|
|
self.stable_store.iter_mut().enumerate().map(|(i, x)| (Interned::from_raw(i as u16), x))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// A growable store for values of type `T`, where each value is identified
/// by an index of type [`Interned<T>`].
///
/// New values are appended with `push`, which returns the handle of the new
/// value. No deduplication is performed by this type.
#[derive(Clone)]
pub struct Interner<T> {
    /// Backing storage; a handle's raw index is a position in this vector.
    stable_store: Vec<T>,
}
|
|
|
|
impl<T> Default for Interner<T> {
|
|
|
|
fn default() -> Self {
|
|
|
|
Self { stable_store: vec![] }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<T> Interner<T> {
|
|
|
|
pub fn from_vec(v: Vec<T>) -> Self {
|
|
|
|
Self { stable_store: v }
|
|
|
|
}
|
|
|
|
pub fn get(&self, interned: Interned<T>) -> &T {
|
|
|
|
&self.stable_store[interned.idx as usize]
|
|
|
|
}
|
|
|
|
pub fn get_mut(&mut self, interned: Interned<T>) -> &mut T {
|
|
|
|
&mut self.stable_store[interned.idx as usize]
|
|
|
|
}
|
|
|
|
pub fn push(&mut self, value: T) -> Interned<T> {
|
|
|
|
assert!(self.stable_store.len() < u16::MAX as usize);
|
|
|
|
self.stable_store.push(value);
|
|
|
|
Interned::from_raw(self.stable_store.len() as u16 - 1)
|
|
|
|
}
|
|
|
|
pub fn len(&self) -> u16 {
|
|
|
|
self.stable_store.len() as u16
|
|
|
|
}
|
|
|
|
pub fn map<U>(&self, map_f: impl Fn(&T) -> U) -> MappedInterner<T, U> {
|
|
|
|
MappedInterner {
|
|
|
|
stable_store: self.stable_store.iter().map(map_f).collect(),
|
|
|
|
_phantom: PhantomData,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
pub fn map_indexes<U>(&self, map_f: impl Fn(Interned<T>) -> U) -> MappedInterner<T, U> {
|
|
|
|
MappedInterner { stable_store: self.indexes().map(map_f).collect(), _phantom: PhantomData }
|
|
|
|
}
|
2023-03-14 16:37:47 +01:00
|
|
|
pub fn indexes(&self) -> impl Iterator<Item = Interned<T>> {
|
2023-03-16 09:58:59 +01:00
|
|
|
(0..self.stable_store.len()).map(|i| Interned::from_raw(i as u16))
|
2023-03-14 16:37:47 +01:00
|
|
|
}
|
|
|
|
pub fn iter(&self) -> impl Iterator<Item = (Interned<T>, &T)> {
|
2023-03-16 09:58:59 +01:00
|
|
|
self.stable_store.iter().enumerate().map(|(i, x)| (Interned::from_raw(i as u16), x))
|
2023-03-14 16:37:47 +01:00
|
|
|
}
|
|
|
|
pub fn iter_mut(&mut self) -> impl Iterator<Item = (Interned<T>, &mut T)> {
|
2023-03-16 09:58:59 +01:00
|
|
|
self.stable_store.iter_mut().enumerate().map(|(i, x)| (Interned::from_raw(i as u16), x))
|
2023-03-14 16:37:47 +01:00
|
|
|
}
|
|
|
|
}
|
2023-03-16 11:52:51 +01:00
|
|
|
|
|
|
|
/// A store of values of type `T` in which every value is associated with a
/// value of type `From` living in another interner.
///
/// A mapped interner is obtained from the `map` method of
/// [`FixedSizeInterner`] or [`MappedInterner`].
///
/// Values in this interner are indexed with [`Interned<From>`].
#[derive(Clone)]
pub struct MappedInterner<From, T> {
    /// Mapped values, stored at the same positions as their source values.
    stable_store: Vec<T>,
    /// Zero-sized marker recording the value type of the source interner.
    _phantom: PhantomData<From>,
}
|
2023-03-06 19:21:55 +01:00
|
|
|
|
2023-03-20 09:37:11 +01:00
|
|
|
impl<From, T> MappedInterner<From, T> {
|
2023-03-14 16:37:47 +01:00
|
|
|
pub fn get(&self, interned: Interned<From>) -> &T {
|
|
|
|
&self.stable_store[interned.idx as usize]
|
|
|
|
}
|
|
|
|
pub fn get_mut(&mut self, interned: Interned<From>) -> &mut T {
|
|
|
|
&mut self.stable_store[interned.idx as usize]
|
|
|
|
}
|
2023-03-20 09:37:11 +01:00
|
|
|
pub fn map<U>(&self, map_f: impl Fn(&T) -> U) -> MappedInterner<From, U> {
|
2023-03-14 16:37:47 +01:00
|
|
|
MappedInterner {
|
|
|
|
stable_store: self.stable_store.iter().map(map_f).collect(),
|
|
|
|
_phantom: PhantomData,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
pub fn iter(&self) -> impl Iterator<Item = (Interned<From>, &T)> {
|
2023-03-16 09:58:59 +01:00
|
|
|
self.stable_store.iter().enumerate().map(|(i, x)| (Interned::from_raw(i as u16), x))
|
2023-03-14 16:37:47 +01:00
|
|
|
}
|
|
|
|
pub fn iter_mut(&mut self) -> impl Iterator<Item = (Interned<From>, &mut T)> {
|
2023-03-16 09:58:59 +01:00
|
|
|
self.stable_store.iter_mut().enumerate().map(|(i, x)| (Interned::from_raw(i as u16), x))
|
2023-03-14 16:37:47 +01:00
|
|
|
}
|
|
|
|
}
|
2023-03-06 19:21:55 +01:00
|
|
|
// Interned<T> boilerplate implementations
|
|
|
|
|
|
|
|
impl<T> Hash for Interned<T> {
|
|
|
|
fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
|
|
|
|
self.idx.hash(state);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-03-18 15:04:34 +01:00
|
|
|
impl<T> Ord for Interned<T> {
|
2023-03-06 19:21:55 +01:00
|
|
|
fn cmp(&self, other: &Self) -> std::cmp::Ordering {
|
|
|
|
self.idx.cmp(&other.idx)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<T> PartialOrd for Interned<T> {
|
|
|
|
fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
|
|
|
|
self.idx.partial_cmp(&other.idx)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Marker impl written by hand so that it carries no bound on `T`; equality
// itself is defined by the `PartialEq` impl for `Interned<T>`.
impl<T> Eq for Interned<T> {}
|
|
|
|
|
|
|
|
impl<T> PartialEq for Interned<T> {
|
|
|
|
fn eq(&self, other: &Self) -> bool {
|
|
|
|
self.idx == other.idx
|
|
|
|
}
|
|
|
|
}
|
|
|
|
impl<T> Clone for Interned<T> {
|
|
|
|
fn clone(&self) -> Self {
|
|
|
|
Self { idx: self.idx, _phantom: PhantomData }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Marker impl written by hand so that handles are `Copy` for every `T`,
// with no bound on `T` itself.
impl<T> Copy for Interned<T> {}
|
2023-03-14 16:37:47 +01:00
|
|
|
|
|
|
|
impl<T> fmt::Display for Interned<T> {
|
|
|
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
|
|
|
fmt::Display::fmt(&self.idx, f)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
impl<T> fmt::Debug for Interned<T> {
|
|
|
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
|
|
|
fmt::Debug::fmt(&self.idx, f)
|
|
|
|
}
|
|
|
|
}
|