Unnamed repository; edit this file 'description' to name the repository.
-rw-r--r-- lib/text-size/src/lib.rs 3
-rw-r--r-- lib/text-size/src/range.rs 64
-rw-r--r-- lib/text-size/src/size.rs 30
3 files changed, 66 insertions, 31 deletions
diff --git a/lib/text-size/src/lib.rs b/lib/text-size/src/lib.rs
index 32262de12c..e194e2317b 100644
--- a/lib/text-size/src/lib.rs
+++ b/lib/text-size/src/lib.rs
@@ -13,3 +13,6 @@ mod traits;
mod serde_impls;
pub use crate::{range::TextRange, size::TextSize, traits::TextSized};
+
+#[cfg(target_pointer_width = "16")]
+compile_error!("text-size assumes usize >= u32 and does not work on 16-bit targets");
diff --git a/lib/text-size/src/range.rs b/lib/text-size/src/range.rs
index df5296af14..35c487afed 100644
--- a/lib/text-size/src/range.rs
+++ b/lib/text-size/src/range.rs
@@ -2,30 +2,25 @@ use {
crate::TextSize,
std::{
cmp, fmt,
- ops::{Bound, Index, IndexMut, Range, RangeBounds},
+ ops::{Bound, Index, IndexMut, Range, RangeBounds, RangeFrom},
},
};
/// A range in text, represented as a pair of [`TextSize`][struct@TextSize].
///
-/// It is a logical error to have `end() < start()`, but
-/// code must not assume this is true for `unsafe` guarantees.
-///
/// # Translation from `text_unit`
///
-/// - `TextRange::from_to(from, to)` ⟹ `TextRange::from(from..to)`
-/// - `TextRange::offset_len(offset, size)` ⟹ `TextRange::from(offset..offset + size)`
+/// - `TextRange::from_to(from, to)` ⟹ `TextRange(from, to)`
+/// - `TextRange::offset_len(offset, size)` ⟹ `TextRange::before(size).offset(offset)`
/// - `range.start()` ⟹ `range.start()`
/// - `range.end()` ⟹ `range.end()`
-/// - `range.len()` ⟹ `range.len()`<sup>†</sup>
+/// - `range.len()` ⟹ `range.len()`
/// - `range.is_empty()` ⟹ `range.is_empty()`
-/// - `a.is_subrange(b)` ⟹ `b.contains(a)`
+/// - `a.is_subrange(b)` ⟹ `b.contains_range(a)`
/// - `a.intersection(b)` ⟹ `TextRange::intersection(a, b)`
/// - `a.extend_to(b)` ⟹ `TextRange::covering(a, b)`
-/// - `range.contains(offset)` ⟹ `range.contains_exclusive(point)`
+/// - `range.contains(offset)` ⟹ `range.contains(point)`
/// - `range.contains_inclusive(offset)` ⟹ `range.contains_inclusive(point)`
-///
-/// † See the note on [`TextRange::len`] for differing behavior for incorrect reverse ranges.
#[derive(Copy, Clone, Eq, PartialEq, Hash)]
pub struct TextRange {
// Invariant: start <= end
@@ -39,7 +34,7 @@ impl fmt::Debug for TextRange {
}
}
-/// Creates a new `TextRange` with given `start` and `end.
+/// Creates a new `TextRange` with the given `start` and `end` (`start..end`).
///
/// # Panics
///
@@ -50,16 +45,47 @@ pub fn TextRange(start: TextSize, end: TextSize) -> TextRange {
TextRange { start, end }
}
-/// Identity methods.
impl TextRange {
- /// Creates a zero-length range at the specified offset.
- pub const fn empty(self, offset: TextSize) -> TextRange {
+ /// Create a zero-length range at the specified offset (`offset..offset`).
+ pub const fn empty(offset: TextSize) -> TextRange {
TextRange {
start: offset,
end: offset,
}
}
+ /// Create a range up to the given end (`..end`).
+ pub const fn before(end: TextSize) -> TextRange {
+ TextRange {
+ start: TextSize::zero(),
+ end,
+ }
+ }
+
+ /// Create a range after the given start (`start..`).
+ ///
+ /// This returns a std [`RangeFrom`] rather than `TextRange` because
+ /// `TextRange` does not support right-unbounded ranges. As such, this
+ /// should only be used for direct indexing, and bounded ranges should be
+ /// used for persistent ranges (`TextRange(start, TextSize::of(text))`).
+ pub const fn after(start: TextSize) -> RangeFrom<usize> {
+ start.raw as usize..
+ }
+
+ /// Offset this range by some amount.
+ ///
+ /// This is typically used to convert a range from one coordinate space to
+ /// another, such as from within a substring to within an entire document.
+ pub fn offset(self, offset: TextSize) -> TextRange {
+ TextRange(
+ self.start().checked_add(offset).unwrap(),
+ self.end().checked_add(offset).unwrap(),
+ )
+ }
+}
+
+/// Identity methods.
+impl TextRange {
/// The start point of this range.
pub const fn start(self) -> TextSize {
self.start
@@ -76,10 +102,7 @@ impl TextRange {
TextSize(self.end().raw - self.start().raw)
}
- /// Check if this range empty or reversed.
- ///
- /// When `end() < start()`, this returns false.
- /// Code should prefer `is_empty()` to `len() == 0`.
+ /// Check if this range is empty.
pub const fn is_empty(self) -> bool {
// HACK for const fn: math on primitives only
self.start().raw == self.end().raw
@@ -99,8 +122,7 @@ impl TextRange {
///
/// The end index is considered included.
pub fn contains_inclusive(self, offset: TextSize) -> bool {
- let point = offset.into();
- self.start() <= point && point <= self.end()
+ self.start() <= offset && offset <= self.end()
}
/// Check if this range completely contains another range.
diff --git a/lib/text-size/src/size.rs b/lib/text-size/src/size.rs
index 454327a015..5b435e896c 100644
--- a/lib/text-size/src/size.rs
+++ b/lib/text-size/src/size.rs
@@ -11,15 +11,23 @@ use {
/// A measure of text length. Also, equivalently, an index into text.
///
-/// This is a utf8-bytes-offset stored as `u32`, but
+/// This is a UTF-8 bytes offset stored as `u32`, but
/// most clients should treat it as an opaque measure.
///
+/// For cases that need to escape `TextSize` and return to working directly
+/// with primitive integers, `TextSize` can be converted losslessly to/from
+/// `u32` via [`From`] conversions, and can also be converted losslessly
+/// [`Into`] `usize`. The fallible `usize -> TextSize` direction uses [`TryFrom`].
+///
+/// These escape hatches are primarily required for unit testing and when
+/// converting from UTF-8 size to another coordinate space, such as UTF-16.
+///
/// # Translation from `text_unit`
///
/// - `TextUnit::of_char(c)` ⟹ `TextSize::of(c)`
-/// - `TextUnit::of_str(s)` ⟹ `TextSize:of(s)`
+/// - `TextUnit::of_str(s)` ⟹ `TextSize::of(s)`
/// - `TextUnit::from_usize(size)` ⟹ `TextSize::try_from(size).unwrap_or_else(|_| panic!(_))`
-/// - `unit.to_usize()` ⟹ `usize::try_from(size).unwrap_or_else(|| panic!(_))`
+/// - `unit.to_usize()` ⟹ `usize::from(size)`
#[derive(Clone, Copy, Default, PartialEq, Eq, PartialOrd, Ord, Hash)]
pub struct TextSize {
pub(crate) raw: u32,
@@ -49,6 +57,11 @@ impl TextSize {
pub const fn zero() -> TextSize {
TextSize(0)
}
+
+ /// A size of one.
+ pub const fn one() -> TextSize {
+ TextSize(1)
+ }
}
/// Methods to act like a primitive integer type, where reasonably applicable.
@@ -58,6 +71,8 @@ impl TextSize {
pub const MIN: TextSize = TextSize(u32::MIN);
/// The largest representable text size. (`u32::MAX`)
pub const MAX: TextSize = TextSize(u32::MAX);
+ /// The text size of a single ASCII character.
+ pub const ONE: TextSize = TextSize(1);
#[allow(missing_docs)]
pub fn checked_add(self, rhs: TextSize) -> Option<TextSize> {
@@ -72,7 +87,7 @@ impl TextSize {
impl From<u32> for TextSize {
fn from(raw: u32) -> Self {
- TextSize { raw }
+ TextSize(raw)
}
}
@@ -91,12 +106,7 @@ impl TryFrom<usize> for TextSize {
impl From<TextSize> for usize {
fn from(value: TextSize) -> Self {
- assert_lossless_conversion();
- return value.raw as usize;
-
- const fn assert_lossless_conversion() {
- [()][(std::mem::size_of::<usize>() < std::mem::size_of::<u32>()) as usize]
- }
+ value.raw as usize
}
}