//! Selections are the primary editing construct. Even cursors are
//! defined as a selection range.
//!
//! All positioning is done via `char` offsets into the buffer.
use crate::{
    graphemes::{
        ensure_grapheme_boundary_next, ensure_grapheme_boundary_prev, next_grapheme_boundary,
        prev_grapheme_boundary,
    },
    movement::Direction,
    Assoc, ChangeSet, RopeGraphemes, RopeSlice,
};
use smallvec::{smallvec, SmallVec};
use std::borrow::Cow;

/// A single selection range.
///
/// A range consists of an "anchor" and "head" position in
/// the text. The head is the part that the user moves when
/// directly extending a selection. The head and anchor
/// can be in any order, or even share the same position.
///
/// The anchor and head positions use gap indexing, meaning
/// that their indices represent the gaps *between* `char`s
/// rather than the `char`s themselves. For example, 1
/// represents the position between the first and second `char`.
///
/// Below are some example `Range` configurations to better
/// illustrate. The anchor and head indices are shown as
/// "(anchor, head)", followed by example text with "[" and "]"
/// inserted to represent the anchor and head positions:
///
/// - (0, 3): `[Som]e text`.
/// - (3, 0): `]Som[e text`.
/// - (2, 7): `So[me te]xt`.
/// - (1, 1): `S[]ome text`.
///
/// Ranges are considered to be inclusive on the left and
/// exclusive on the right, regardless of anchor-head ordering.
/// This means, for example, that non-zero-width ranges that
/// are directly adjacent, sharing an edge, do not overlap.
/// However, a zero-width range will overlap with the shared
/// left-edge of another range.
///
/// By convention, user-facing ranges are considered to have
/// a block cursor on the head-side of the range that spans a
/// single grapheme inward from the range's edge. There are a
/// variety of helper methods on `Range` for working in terms of
/// that block cursor, all of which have `cursor` in their name.
#[derive(Debug, Clone, Copy, PartialEq, Eq)] pub struct Range { /// The anchor of the range: the side that doesn't move when extending. pub anchor: usize, /// The head of the range, moved when extending. pub head: usize, pub horiz: Option<u32>, } impl Range { pub fn new(anchor: usize, head: usize) -> Self { Self { anchor, head, horiz: None, } } pub fn point(head: usize) -> Self { Self::new(head, head) } /// Start of the range. #[inline] #[must_use] pub fn from(&self) -> usize { std::cmp::min(self.anchor, self.head) } /// End of the range. #[inline] #[must_use] pub fn to(&self) -> usize { std::cmp::max(self.anchor, self.head) } /// Total length of the range. #[inline] #[must_use] pub fn len(&self) -> usize { self.to() - self.from() } /// The (inclusive) range of lines that the range overlaps. #[inline] #[must_use] pub fn line_range(&self, text: RopeSlice) -> (usize, usize) { let from = self.from(); let to = if self.is_empty() { self.to() } else { prev_grapheme_boundary(text, self.to()).max(from) }; (text.char_to_line(from), text.char_to_line(to)) } /// `true` when head and anchor are at the same position. #[inline] pub fn is_empty(&self) -> bool { self.anchor == self.head } /// `Direction::Backward` when head < anchor. /// `Direction::Backward` otherwise. #[inline] #[must_use] pub fn direction(&self) -> Direction { if self.head < self.anchor { Direction::Backward } else { Direction::Forward } } /// Flips the direction of the selection pub fn flip(&self) -> Self { Self { anchor: self.head, head: self.anchor, horiz: self.horiz, } } /// Returns the selection if it goes in the direction of `direction`, /// flipping the selection otherwise. pub fn with_direction(self, direction: Direction) -> Self { if self.direction() == direction { self } else { self.flip() } } /// Check two ranges for overlap. 
#[must_use] pub fn overlaps(&self, other: &Self) -> bool { // To my eye, it's non-obvious why this works, but I arrived // at it after transforming the slower version that explicitly // enumerated more cases. The unit tests are thorough. self.from() == other.from() || (self.to() > other.from() && other.to() > self.from()) } #[inline] pub fn contains_range(&self, other: &Self) -> bool { self.from() <= other.from() && self.to() >= other.to() } pub fn contains(&self, pos: usize) -> bool { self.from() <= pos && pos < self.to() } /// Map a range through a set of changes. Returns a new range representing the same position /// after the changes are applied. pub fn map(self, changes: &ChangeSet) -> Self { use std::cmp::Ordering; let (anchor, head) = match self.anchor.cmp(&self.head) { Ordering::Equal => ( changes.map_pos(self.anchor, Assoc::After), changes.map_pos(self.head, Assoc::After), ), Ordering::Less => ( changes.map_pos(self.anchor, Assoc::After), changes.map_pos(self.head, Assoc::Before), ), Ordering::Greater => ( changes.map_pos(self.anchor, Assoc::Before), changes.map_pos(self.head, Assoc::After), ), }; // We want to return a new `Range` with `horiz == None` every time, // even if the anchor and head haven't changed, because we don't // know if the *visual* position hasn't changed due to // character-width or grapheme changes earlier in the text. Self { anchor, head, horiz: None, } } /// Extend the range to cover at least `from` `to`. #[must_use] pub fn extend(&self, from: usize, to: usize) -> Self { debug_assert!(from <= to); if self.anchor <= self.head { Self { anchor: self.anchor.min(from), head: self.head.max(to), horiz: None, } } else { Self { anchor: self.anchor.max(to), head: self.head.min(from), horiz: None, } } } /// Returns a range that encompasses both input ranges. /// /// This is like `extend()`, but tries to negotiate the /// anchor/head ordering between the two input ranges. 
#[must_use] pub fn merge(&self, other: Self) -> Self { if self.anchor > self.head && other.anchor > other.head { Range { anchor: self.anchor.max(other.anchor), head: self.head.min(other.head), horiz: None, } } else { Range { anchor: self.from().min(other.from()), head: self.to().max(other.to()), horiz: None, } } } // groupAt /// Returns the text inside this range given the text of the whole buffer. /// /// The returned `Cow` is a reference if the range of text is inside a single /// chunk of the rope. Otherwise a copy of the text is returned. Consider /// using `slice` instead if you do not need a `Cow` or `String` to avoid copying. #[inline] pub fn fragment<'a, 'b: 'a>(&'a self, text: RopeSlice<'b>) -> Cow<'b, str> { self.slice(text).into() } /// Returns the text inside this range given the text of the whole buffer. /// /// The returned value is a reference to the passed slice. This method never /// copies any contents. #[inline] pub fn slice<'a, 'b: 'a>(&'a self, text: RopeSlice<'b>) -> RopeSlice<'b> { text.slice(self.from()..self.to()) } //-------------------------------- // Alignment methods. /// Compute a possibly new range from this range, with its ends /// shifted as needed to align with grapheme boundaries. /// /// Zero-width ranges will always stay zero-width, and non-zero-width /// ranges will never collapse to zero-width. 
#[must_use] pub fn grapheme_aligned(&self, slice: RopeSlice) -> Self { use std::cmp::Ordering; let (new_anchor, new_head) = match self.anchor.cmp(&self.head) { Ordering::Equal => { let pos = ensure_grapheme_boundary_prev(slice, self.anchor); (pos, pos) } Ordering::Less => ( ensure_grapheme_boundary_prev(slice, self.anchor), ensure_grapheme_boundary_next(slice, self.head), ), Ordering::Greater => ( ensure_grapheme_boundary_next(slice, self.anchor), ensure_grapheme_boundary_prev(slice, self.head), ), }; Range { anchor: new_anchor, head: new_head, horiz: if new_anchor == self.anchor { self.horiz } else { None }, } } /// Compute a possibly new range from this range, attempting to ensure /// a minimum range width of 1 char by shifting the head in the forward /// direction as needed. /// /// This method will never shift the anchor, and will only shift the /// head in the forward direction. Therefore, this method can fail /// at ensuring the minimum width if and only if the passed range is /// both zero-width and at the end of the `RopeSlice`. /// /// If the input range is grapheme-boundary aligned, the returned range /// will also be. Specifically, if the head needs to shift to achieve /// the minimum width, it will shift to the next grapheme boundary. #[must_use] #[inline] pub fn min_width_1(&self, slice: RopeSlice) -> Self { if self.anchor == self.head { Range { anchor: self.anchor, head: next_grapheme_boundary(slice, self.head), horiz: self.horiz, } } else { *self } } //-------------------------------- // Block-cursor methods. /// Gets the left-side position of the block cursor. #[must_use] #[inline] pub fn cursor(self, text: RopeSlice) -> usize { if self.head > self.anchor { prev_grapheme_boundary(text, self.head) } else { self.head } } /// Puts the left side of the block cursor at `char_idx`, optionally extending. 
/// /// This follows "1-width" semantics, and therefore does a combination of anchor /// and head moves to behave as if both the front and back of the range are 1-width /// blocks /// /// This method assumes that the range and `char_idx` are already properly /// grapheme-aligned. #[must_use] #[inline] pub fn put_cursor(self, text: RopeSlice, char_idx: usize, extend: bool) -> Range { if extend { let anchor = if self.head >= self.anchor && char_idx < self.anchor { next_grapheme_boundary(text, self.anchor) } else if self.head < self.anchor && char_idx >= self.anchor { prev_grapheme_boundary(text, self.anchor) } else { self.anchor }; if anchor <= char_idx { Range::new(anchor, next_grapheme_boundary(text, char_idx)) } else { Range::new(anchor, char_idx) } } else { Range::point(char_idx) } } /// The line number that the block-cursor is on. #[inline] #[must_use] pub fn cursor_line(&self, text: RopeSlice) -> usize { text.char_to_line(self.cursor(text)) } /// Returns true if this Range covers a single grapheme in the given text pub fn is_single_grapheme(&self, doc: RopeSlice) -> bool { let mut graphemes = RopeGraphemes::new(doc.slice(self.from()..self.to())); let first = graphemes.next(); let second = graphemes.next(); first.is_some() && second.is_none() } } impl From<(usize, usize)> for Range { fn from((anchor, head): (usize, usize)) -> Self { Self { anchor, head, horiz: None, } } } /// A selection consists of one or more selection ranges. /// invariant: A selection can never be empty (always contains at least primary range). 
#[derive(Debug, Clone, PartialEq, Eq)] pub struct Selection { ranges: SmallVec<[Range; 1]>, primary_index: usize, } #[allow(clippy::len_without_is_empty)] // a Selection is never empty impl Selection { // eq #[inline] #[must_use] pub fn primary(&self) -> Range { self.ranges[self.primary_index] } #[inline] #[must_use] pub fn primary_mut(&mut self) -> &mut Range { &mut self.ranges[self.primary_index] } /// Ensure selection containing only the primary selection. pub fn into_single(self) -> Self { if self.ranges.len() == 1 { self } else { Self { ranges: smallvec![self.ranges[self.primary_index]], primary_index: 0, } } } /// Adds a new range to the selection and makes it the primary range. pub fn push(mut self, range: Range) -> Self { self.ranges.push(range); self.set_primary_index(self.ranges().len() - 1); self.normalize() } /// Removes a range from the selection. pub fn remove(mut self, index: usize) -> Self { assert!( self.ranges.len() > 1, "can't remove the last range from a selection!" ); self.ranges.remove(index); if index < self.primary_index || self.primary_index == self.ranges.len() { self.primary_index -= 1; } self } /// Replace a range in the selection with a new range. pub fn replace(mut self, index: usize, range: Range) -> Self { self.ranges[index] = range; self.normalize() } /// Map selections over a set of changes. Useful for adjusting the selection position after /// applying changes to a document. pub fn map(self, changes: &ChangeSet) -> Self { if changes.is_empty() { return self; } Self::new( self.ranges .into_iter() .map(|range| range.map(changes)) .collect(), self.primary_index, ) } pub fn ranges(&self) -> &[Range] { &self.ranges } pub fn primary_index(&self) -> usize { self.primary_index } pub fn set_primary_index(&mut self, idx: usize) { assert!(idx < self.ranges.len()); self.primary_index = idx; } #[must_use] /// Constructs a selection holding a single range. 
pub fn single(anchor: usize, head: usize) -> Self { Self { ranges: smallvec![Range { anchor, head, horiz: None }], primary_index: 0, } } /// Constructs a selection holding a single cursor. pub fn point(pos: usize) -> Self { Self::single(pos, pos) } /// Normalizes a `Selection`. fn normalize(mut self) -> Self { let primary = self.ranges[self.primary_index]; self.ranges.sort_unstable_by_key(Range::from); self.primary_index = self .ranges .iter() .position(|&range| range == primary) .unwrap(); let mut prev_i = 0; for i in 1..self.ranges.len() { if self.ranges[prev_i].overlaps(&self.ranges[i]) { self.ranges[prev_i] = self.ranges[prev_i].merge(self.ranges[i]); } else { prev_i += 1; self.ranges[prev_i] = self.ranges[i]; } if i == self.primary_index { self.primary_index = prev_i; } } self.ranges.truncate(prev_i + 1); self } // TODO: consume an iterator or a vec to reduce allocations? #[must_use] pub fn new(ranges: SmallVec<[Range; 1]>, primary_index: usize) -> Self { assert!(!ranges.is_empty()); debug_assert!(primary_index < ranges.len()); let mut selection = Self { ranges, primary_index, }; if selection.ranges.len() > 1 { // TODO: only normalize if needed (any ranges out of order) selection = selection.normalize(); } selection } /// Takes a closure and maps each `Range` over the closure. pub fn transform<F>(mut self, f: F) -> Self where F: Fn(Range) -> Range, { for range in self.ranges.iter_mut() { *range = f(*range) } self.normalize() } // Ensures the selection adheres to the following invariants: // 1. All ranges are grapheme aligned. // 2. All ranges are at least 1 character wide, unless at the // very end of the document. // 3. Ranges are non-overlapping. // 4. Ranges are sorted by their position in the text. pub fn ensure_invariants(self, text: RopeSlice) -> Self { self.transform(|r| r.min_width_1(text).grapheme_aligned(text)) .normalize() } /// Transforms the selection into all of the left-side head positions, /// using block-cursor semantics. 
pub fn cursors(self, text: RopeSlice) -> Self { self.transform(|range| Range::point(range.cursor(text))) } pub fn fragments<'a>(&'a self, text: RopeSlice<'a>) -> impl Iterator<Item = Cow<str>> + 'a { self.ranges.iter().map(move |range| range.fragment(text)) } pub fn slices<'a>(&'a self, text: RopeSlice<'a>) -> impl Iterator<Item = RopeSlice> + 'a { self.ranges.iter().map(move |range| range.slice(text)) } #[inline(always)] pub fn iter(&self) -> std::slice::Iter<'_, Range> { self.ranges.iter() } #[inline(always)] pub fn len(&self) -> usize { self.ranges.len() } // returns true if self ⊇ other pub fn contains(&self, other: &Selection) -> bool { // can't contain other if it is larger if other.len() > self.len() { return false; } let (mut iter_self, mut iter_other) = (self.iter(), other.iter()); let (mut ele_self, mut ele_other) = (iter_self.next(), iter_other.next()); loop { match (ele_self, ele_other) { (Some(ra), Some(rb)) => { if !ra.contains_range(rb) { // `self` doesn't contain next element from `other`, advance `self`, we need to match all from `other` ele_self = iter_self.next(); } else { // matched element from `other`, advance `other` ele_other = iter_other.next(); }; } (None, Some(_)) => { // exhausted `self`, we can't match the reminder of `other` return false; } (_, None) => { // no elements from `other` left to match, `self` contains `other` return true; } } } } } impl<'a> IntoIterator for &'a Selection { type Item = &'a Range; type IntoIter = std::slice::Iter<'a, Range>; fn into_iter(self) -> std::slice::Iter<'a, Range> { self.ranges().iter() } } // TODO: checkSelection -> check if valid for doc length && sorted pub fn keep_or_remove_matches( text: RopeSlice, selection: &Selection, regex: &crate::regex::Regex, remove: bool, ) -> Option<Selection> { let result: SmallVec<_> = selection .iter() .filter(|range| regex.is_match(&range.fragment(text)) ^ remove) .copied() .collect(); // TODO: figure out a new primary index if !result.is_empty() { return 
Some(Selection::new(result, 0)); } None } pub fn select_on_matches( text: RopeSlice, selection: &Selection, regex: &crate::regex::Regex, ) -> Option<Selection> { let mut result = SmallVec::with_capacity(selection.len()); for sel in selection { // TODO: can't avoid occasional allocations since Regex can't operate on chunks yet let fragment = sel.fragment(text); let sel_start = sel.from(); let start_byte = text.char_to_byte(sel_start); for mat in regex.find_iter(&fragment) { // TODO: retain range direction let start = text.byte_to_char(start_byte + mat.start()); let end = text.byte_to_char(start_byte + mat.end()); let range = Range::new(start, end); // Make sure the match is not right outside of the selection. // These invalid matches can come from using RegEx anchors like `^`, `$` if range != Range::point(sel.to()) { result.push(range); } } } // TODO: figure out a new primary index if !result.is_empty() { return Some(Selection::new(result, 0)); } None } // TODO: support to split on capture #N instead of whole match pub fn split_on_matches( text: RopeSlice, selection: &Selection, regex: &crate::regex::Regex, ) -> Selection { let mut result = SmallVec::with_capacity(selection.len()); for sel in selection { // Special case: zero-width selection. 
if sel.from() == sel.to() { result.push(*sel); continue; } // TODO: can't avoid occasional allocations since Regex can't operate on chunks yet let fragment = sel.fragment(text); let sel_start = sel.from(); let sel_end = sel.to(); let start_byte = text.char_to_byte(sel_start); let mut start = sel_start; for mat in regex.find_iter(&fragment) { // TODO: retain range direction let end = text.byte_to_char(start_byte + mat.start()); result.push(Range::new(start, end)); start = text.byte_to_char(start_byte + mat.end()); } if start < sel_end { result.push(Range::new(start, sel_end)); } } // TODO: figure out a new primary index Selection::new(result, 0) } #[cfg(test)] mod test { use super::*; use crate::Rope; #[test] #[should_panic] fn test_new_empty() { let _ = Selection::new(smallvec![], 0); } #[test] fn test_create_normalizes_and_merges() { let sel = Selection::new( smallvec![ Range::new(10, 12), Range::new(6, 7), Range::new(4, 5), Range::new(3, 4), Range::new(0, 6), Range::new(7, 8), Range::new(9, 13), Range::new(13, 14), ], 0, ); let res = sel .ranges .into_iter() .map(|range| format!("{}/{}", range.anchor, range.head)) .collect::<Vec<String>>() .join(","); assert_eq!(res, "0/6,6/7,7/8,9/13,13/14"); // it correctly calculates a new primary index let sel = Selection::new( smallvec![Range::new(0, 2), Range::new(1, 5), Range::new(4, 7)], 2, ); let res = sel .ranges .into_iter() .map(|range| format!("{}/{}", range.anchor, range.head)) .collect::<Vec<String>>() .join(","); assert_eq!(res, "0/7"); assert_eq!(sel.primary_index, 0); } #[test] fn test_create_merges_adjacent_points() { let sel = Selection::new( smallvec![ Range::new(10, 12), Range::new(12, 12), Range::new(12, 12), Range::new(10, 10), Range::new(8, 10), ], 0, ); let res = sel .ranges .into_iter() .map(|range| format!("{}/{}", range.anchor, range.head)) .collect::<Vec<String>>() .join(","); assert_eq!(res, "8/10,10/12,12/12"); } #[test] fn test_contains() { let range = Range::new(10, 12); 
assert!(!range.contains(9)); assert!(range.contains(10)); assert!(range.contains(11)); assert!(!range.contains(12)); assert!(!range.contains(13)); let range = Range::new(9, 6); assert!(!range.contains(9)); assert!(range.contains(7)); assert!(range.contains(6)); } #[test] fn test_overlaps() { fn overlaps(a: (usize, usize), b: (usize, usize)) -> bool { Range::new(a.0, a.1).overlaps(&Range::new(b.0, b.1)) } // Two non-zero-width ranges, no overlap. assert!(!overlaps((0, 3), (3, 6))); assert!(!overlaps((0, 3), (6, 3))); assert!(!overlaps((3, 0), (3, 6))); assert!(!overlaps((3, 0), (6, 3))); assert!(!overlaps((3, 6), (0, 3))); assert!(!overlaps((3, 6), (3, 0))); assert!(!overlaps((6, 3), (0, 3))); assert!(!overlaps((6, 3), (3, 0))); // Two non-zero-width ranges, overlap. assert!(overlaps((0, 4), (3, 6))); assert!(overlaps((0, 4), (6, 3))); assert!(overlaps((4, 0), (3, 6))); assert!(overlaps((4, 0), (6, 3))); assert!(overlaps((3, 6), (0, 4))); assert!(overlaps((3, 6), (4, 0))); assert!(overlaps((6, 3), (0, 4))); assert!(overlaps((6, 3), (4, 0))); // Zero-width and non-zero-width range, no overlap. assert!(!overlaps((0, 3), (3, 3))); assert!(!overlaps((3, 0), (3, 3))); assert!(!overlaps((3, 3), (0, 3))); assert!(!overlaps((3, 3), (3, 0))); // Zero-width and non-zero-width range, overlap. assert!(overlaps((1, 4), (1, 1))); assert!(overlaps((4, 1), (1, 1))); assert!(overlaps((1, 1), (1, 4))); assert!(overlaps((1, 1), (4, 1))); assert!(overlaps((1, 4), (3, 3))); assert!(overlaps((4, 1), (3, 3))); assert!(overlaps((3, 3), (1, 4))); assert!(overlaps((3, 3), (4, 1))); // Two zero-width ranges, no overlap. assert!(!overlaps((0, 0), (1, 1))); assert!(!overlaps((1, 1), (0, 0))); // Two zero-width ranges, overlap. assert!(overlaps((1, 1), (1, 1))); } #[test] fn test_grapheme_aligned() { let r = Rope::from_str("\r\nHi\r\n"); let s = r.slice(..); // Zero-width. 
assert_eq!(Range::new(0, 0).grapheme_aligned(s), Range::new(0, 0)); assert_eq!(Range::new(1, 1).grapheme_aligned(s), Range::new(0, 0)); assert_eq!(Range::new(2, 2).grapheme_aligned(s), Range::new(2, 2)); assert_eq!(Range::new(3, 3).grapheme_aligned(s), Range::new(3, 3)); assert_eq!(Range::new(4, 4).grapheme_aligned(s), Range::new(4, 4)); assert_eq!(Range::new(5, 5).grapheme_aligned(s), Range::new(4, 4)); assert_eq!(Range::new(6, 6).grapheme_aligned(s), Range::new(6, 6)); // Forward. assert_eq!(Range::new(0, 1).grapheme_aligned(s), Range::new(0, 2)); assert_eq!(Range::new(1, 2).grapheme_aligned(s), Range::new(0, 2)); assert_eq!(Range::new(2, 3).grapheme_aligned(s), Range::new(2, 3)); assert_eq!(Range::new(3, 4).grapheme_aligned(s), Range::new(3, 4)); assert_eq!(Range::new(4, 5).grapheme_aligned(s), Range::new(4, 6)); assert_eq!(Range::new(5, 6).grapheme_aligned(s), Range::new(4, 6)); assert_eq!(Range::new(0, 2).grapheme_aligned(s), Range::new(0, 2)); assert_eq!(Range::new(1, 3).grapheme_aligned(s), Range::new(0, 3)); assert_eq!(Range::new(2, 4).grapheme_aligned(s), Range::new(2, 4)); assert_eq!(Range::new(3, 5).grapheme_aligned(s), Range::new(3, 6)); assert_eq!(Range::new(4, 6).grapheme_aligned(s), Range::new(4, 6)); // Reverse. 
assert_eq!(Range::new(1, 0).grapheme_aligned(s), Range::new(2, 0)); assert_eq!(Range::new(2, 1).grapheme_aligned(s), Range::new(2, 0)); assert_eq!(Range::new(3, 2).grapheme_aligned(s), Range::new(3, 2)); assert_eq!(Range::new(4, 3).grapheme_aligned(s), Range::new(4, 3)); assert_eq!(Range::new(5, 4).grapheme_aligned(s), Range::new(6, 4)); assert_eq!(Range::new(6, 5).grapheme_aligned(s), Range::new(6, 4)); assert_eq!(Range::new(2, 0).grapheme_aligned(s), Range::new(2, 0)); assert_eq!(Range::new(3, 1).grapheme_aligned(s), Range::new(3, 0)); assert_eq!(Range::new(4, 2).grapheme_aligned(s), Range::new(4, 2)); assert_eq!(Range::new(5, 3).grapheme_aligned(s), Range::new(6, 3)); assert_eq!(Range::new(6, 4).grapheme_aligned(s), Range::new(6, 4)); } #[test] fn test_min_width_1() { let r = Rope::from_str("\r\nHi\r\n"); let s = r.slice(..); // Zero-width. assert_eq!(Range::new(0, 0).min_width_1(s), Range::new(0, 2)); assert_eq!(Range::new(1, 1).min_width_1(s), Range::new(1, 2)); assert_eq!(Range::new(2, 2).min_width_1(s), Range::new(2, 3)); assert_eq!(Range::new(3, 3).min_width_1(s), Range::new(3, 4)); assert_eq!(Range::new(4, 4).min_width_1(s), Range::new(4, 6)); assert_eq!(Range::new(5, 5).min_width_1(s), Range::new(5, 6)); assert_eq!(Range::new(6, 6).min_width_1(s), Range::new(6, 6)); // Forward. assert_eq!(Range::new(0, 1).min_width_1(s), Range::new(0, 1)); assert_eq!(Range::new(1, 2).min_width_1(s), Range::new(1, 2)); assert_eq!(Range::new(2, 3).min_width_1(s), Range::new(2, 3)); assert_eq!(Range::new(3, 4).min_width_1(s), Range::new(3, 4)); assert_eq!(Range::new(4, 5).min_width_1(s), Range::new(4, 5)); assert_eq!(Range::new(5, 6).min_width_1(s), Range::new(5, 6)); // Reverse. 
assert_eq!(Range::new(1, 0).min_width_1(s), Range::new(1, 0)); assert_eq!(Range::new(2, 1).min_width_1(s), Range::new(2, 1)); assert_eq!(Range::new(3, 2).min_width_1(s), Range::new(3, 2)); assert_eq!(Range::new(4, 3).min_width_1(s), Range::new(4, 3)); assert_eq!(Range::new(5, 4).min_width_1(s), Range::new(5, 4)); assert_eq!(Range::new(6, 5).min_width_1(s), Range::new(6, 5)); } #[test] fn test_select_on_matches() { use crate::regex::{Regex, RegexBuilder}; let r = Rope::from_str("Nobody expects the Spanish inquisition"); let s = r.slice(..); let selection = Selection::single(0, r.len_chars()); assert_eq!( select_on_matches(s, &selection, &Regex::new(r"[A-Z][a-z]*").unwrap()), Some(Selection::new( smallvec![Range::new(0, 6), Range::new(19, 26)], 0 )) ); let r = Rope::from_str("This\nString\n\ncontains multiple\nlines"); let s = r.slice(..); let start_of_line = RegexBuilder::new(r"^").multi_line(true).build().unwrap(); let end_of_line = RegexBuilder::new(r"$").multi_line(true).build().unwrap(); // line without ending assert_eq!( select_on_matches(s, &Selection::single(0, 4), &start_of_line), Some(Selection::single(0, 0)) ); assert_eq!( select_on_matches(s, &Selection::single(0, 4), &end_of_line), None ); // line with ending assert_eq!( select_on_matches(s, &Selection::single(0, 5), &start_of_line), Some(Selection::single(0, 0)) ); assert_eq!( select_on_matches(s, &Selection::single(0, 5), &end_of_line), Some(Selection::single(4, 4)) ); // line with start of next line assert_eq!( select_on_matches(s, &Selection::single(0, 6), &start_of_line), Some(Selection::new( smallvec![Range::point(0), Range::point(5)], 0 )) ); assert_eq!( select_on_matches(s, &Selection::single(0, 6), &end_of_line), Some(Selection::single(4, 4)) ); // multiple lines assert_eq!( select_on_matches( s, &Selection::single(0, s.len_chars()), &RegexBuilder::new(r"^[a-z ]*$") .multi_line(true) .build() .unwrap() ), Some(Selection::new( smallvec![Range::point(12), Range::new(13, 30), Range::new(31, 36)], 0 
)) ); } #[test] fn test_line_range() { let r = Rope::from_str("\r\nHi\r\nthere!"); let s = r.slice(..); // Zero-width ranges. assert_eq!(Range::new(0, 0).line_range(s), (0, 0)); assert_eq!(Range::new(1, 1).line_range(s), (0, 0)); assert_eq!(Range::new(2, 2).line_range(s), (1, 1)); assert_eq!(Range::new(3, 3).line_range(s), (1, 1)); // Forward ranges. assert_eq!(Range::new(0, 1).line_range(s), (0, 0)); assert_eq!(Range::new(0, 2).line_range(s), (0, 0)); assert_eq!(Range::new(0, 3).line_range(s), (0, 1)); assert_eq!(Range::new(1, 2).line_range(s), (0, 0)); assert_eq!(Range::new(2, 3).line_range(s), (1, 1)); assert_eq!(Range::new(3, 8).line_range(s), (1, 2)); assert_eq!(Range::new(0, 12).line_range(s), (0, 2)); // Reverse ranges. assert_eq!(Range::new(1, 0).line_range(s), (0, 0)); assert_eq!(Range::new(2, 0).line_range(s), (0, 0)); assert_eq!(Range::new(3, 0).line_range(s), (0, 1)); assert_eq!(Range::new(2, 1).line_range(s), (0, 0)); assert_eq!(Range::new(3, 2).line_range(s), (1, 1)); assert_eq!(Range::new(8, 3).line_range(s), (1, 2)); assert_eq!(Range::new(12, 0).line_range(s), (0, 2)); } #[test] fn test_cursor() { let r = Rope::from_str("\r\nHi\r\nthere!"); let s = r.slice(..); // Zero-width ranges. assert_eq!(Range::new(0, 0).cursor(s), 0); assert_eq!(Range::new(2, 2).cursor(s), 2); assert_eq!(Range::new(3, 3).cursor(s), 3); // Forward ranges. assert_eq!(Range::new(0, 2).cursor(s), 0); assert_eq!(Range::new(0, 3).cursor(s), 2); assert_eq!(Range::new(3, 6).cursor(s), 4); // Reverse ranges. assert_eq!(Range::new(2, 0).cursor(s), 0); assert_eq!(Range::new(6, 2).cursor(s), 2); assert_eq!(Range::new(6, 3).cursor(s), 3); } #[test] fn test_put_cursor() { let r = Rope::from_str("\r\nHi\r\nthere!"); let s = r.slice(..); // Zero-width ranges. 
assert_eq!(Range::new(0, 0).put_cursor(s, 0, true), Range::new(0, 2)); assert_eq!(Range::new(0, 0).put_cursor(s, 2, true), Range::new(0, 3)); assert_eq!(Range::new(2, 3).put_cursor(s, 4, true), Range::new(2, 6)); assert_eq!(Range::new(2, 8).put_cursor(s, 4, true), Range::new(2, 6)); assert_eq!(Range::new(8, 8).put_cursor(s, 4, true), Range::new(9, 4)); // Forward ranges. assert_eq!(Range::new(3, 6).put_cursor(s, 0, true), Range::new(4, 0)); assert_eq!(Range::new(3, 6).put_cursor(s, 2, true), Range::new(4, 2)); assert_eq!(Range::new(3, 6).put_cursor(s, 3, true), Range::new(3, 4)); assert_eq!(Range::new(3, 6).put_cursor(s, 4, true), Range::new(3, 6)); assert_eq!(Range::new(3, 6).put_cursor(s, 6, true), Range::new(3, 7)); assert_eq!(Range::new(3, 6).put_cursor(s, 8, true), Range::new(3, 9)); // Reverse ranges. assert_eq!(Range::new(6, 3).put_cursor(s, 0, true), Range::new(6, 0)); assert_eq!(Range::new(6, 3).put_cursor(s, 2, true), Range::new(6, 2)); assert_eq!(Range::new(6, 3).put_cursor(s, 3, true), Range::new(6, 3)); assert_eq!(Range::new(6, 3).put_cursor(s, 4, true), Range::new(6, 4)); assert_eq!(Range::new(6, 3).put_cursor(s, 6, true), Range::new(4, 7)); assert_eq!(Range::new(6, 3).put_cursor(s, 8, true), Range::new(4, 9)); } #[test] fn test_split_on_matches() { use crate::regex::Regex; let text = Rope::from(" abcd efg wrs xyz 123 456"); let selection = Selection::new(smallvec![Range::new(0, 9), Range::new(11, 20),], 0); let result = split_on_matches(text.slice(..), &selection, &Regex::new(r"\s+").unwrap()); assert_eq!( result.ranges(), &[ // TODO: rather than this behavior, maybe we want it // to be based on which side is the anchor? // // We get a leading zero-width range when there's // a leading match because ranges are inclusive on // the left. Imagine, for example, if the entire // selection range were matched: you'd still want // at least one range to remain after the split. 
Range::new(0, 0), Range::new(1, 5), Range::new(6, 9), Range::new(11, 13), Range::new(16, 19), // In contrast to the comment above, there is no // _trailing_ zero-width range despite the trailing // match, because ranges are exclusive on the right. ] ); assert_eq!( result.fragments(text.slice(..)).collect::<Vec<_>>(), &["", "abcd", "efg", "rs", "xyz"] ); } #[test] fn test_selection_contains() { fn contains(a: Vec<(usize, usize)>, b: Vec<(usize, usize)>) -> bool { let sela = Selection::new(a.iter().map(|a| Range::new(a.0, a.1)).collect(), 0); let selb = Selection::new(b.iter().map(|b| Range::new(b.0, b.1)).collect(), 0); sela.contains(&selb) } // exact match assert!(contains(vec!((1, 1)), vec!((1, 1)))); // larger set contains smaller assert!(contains(vec!((1, 1), (2, 2), (3, 3)), vec!((2, 2)))); // multiple matches assert!(contains(vec!((1, 1), (2, 2)), vec!((1, 1), (2, 2)))); // smaller set can't contain bigger assert!(!contains(vec!((1, 1)), vec!((1, 1), (2, 2)))); assert!(contains( vec!((1, 1), (2, 4), (5, 6), (7, 9), (10, 13)), vec!((3, 4), (7, 9)) )); assert!(!contains(vec!((1, 1), (5, 6)), vec!((1, 6)))); } }