2022-03-03 12:41:39 +04:00
|
|
|
use std::borrow::Cow;
|
|
|
|
|
2021-03-18 08:39:34 +04:00
|
|
|
use crate::{
|
2021-06-21 02:09:10 +04:00
|
|
|
chars::char_is_line_ending,
|
2022-03-03 12:41:39 +04:00
|
|
|
graphemes::{ensure_grapheme_boundary_prev, grapheme_width, RopeGraphemes},
|
2021-07-21 05:15:34 +04:00
|
|
|
line_ending::line_end_char_index,
|
2021-07-01 23:24:22 +04:00
|
|
|
RopeSlice,
|
2021-03-18 08:39:34 +04:00
|
|
|
};
|
|
|
|
|
2020-09-17 09:57:49 +04:00
|
|
|
/// Represents a single point in a text buffer. Zero indexed.
|
|
|
|
#[derive(Debug, Default, Clone, Copy, PartialEq, Eq, PartialOrd, Ord)]
|
|
|
|
pub struct Position {
|
|
|
|
pub row: usize,
|
|
|
|
pub col: usize,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Position {
|
|
|
|
pub const fn new(row: usize, col: usize) -> Self {
|
|
|
|
Self { row, col }
|
|
|
|
}
|
|
|
|
|
|
|
|
pub const fn is_zero(self) -> bool {
|
|
|
|
self.row == 0 && self.col == 0
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO: generalize
|
|
|
|
pub fn traverse(self, text: &crate::Tendril) -> Self {
|
|
|
|
let Self { mut row, mut col } = self;
|
|
|
|
// TODO: there should be a better way here
|
2021-06-21 02:09:10 +04:00
|
|
|
let mut chars = text.chars().peekable();
|
|
|
|
while let Some(ch) = chars.next() {
|
|
|
|
if char_is_line_ending(ch) && !(ch == '\r' && chars.peek() == Some(&'\n')) {
|
2020-09-17 09:57:49 +04:00
|
|
|
row += 1;
|
|
|
|
col = 0;
|
|
|
|
} else {
|
|
|
|
col += 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Self { row, col }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl From<(usize, usize)> for Position {
|
|
|
|
fn from(tuple: (usize, usize)) -> Self {
|
2021-03-24 09:52:13 +04:00
|
|
|
Self {
|
2020-09-17 09:57:49 +04:00
|
|
|
row: tuple.0,
|
|
|
|
col: tuple.1,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-01-19 11:16:15 +04:00
|
|
|
impl From<Position> for tree_sitter::Point {
|
|
|
|
fn from(pos: Position) -> Self {
|
|
|
|
Self::new(pos.row, pos.col)
|
2020-09-17 09:57:49 +04:00
|
|
|
}
|
|
|
|
}
|
2021-03-18 08:39:34 +04:00
|
|
|
/// Convert a character index to (line, column) coordinates.
|
2021-07-21 05:15:34 +04:00
|
|
|
///
|
2021-11-03 07:02:29 +04:00
|
|
|
/// column in `char` count which can be used for row:column display in
|
|
|
|
/// status line. See [`visual_coords_at_pos`] for a visual one.
|
2021-03-18 08:39:34 +04:00
|
|
|
pub fn coords_at_pos(text: RopeSlice, pos: usize) -> Position {
|
|
|
|
let line = text.char_to_line(pos);
|
2021-07-21 05:15:34 +04:00
|
|
|
|
2021-03-18 08:39:34 +04:00
|
|
|
let line_start = text.line_to_char(line);
|
2021-07-21 05:15:34 +04:00
|
|
|
let pos = ensure_grapheme_boundary_prev(text, pos);
|
2021-07-23 00:21:44 +04:00
|
|
|
let col = RopeGraphemes::new(text.slice(line_start..pos)).count();
|
2021-07-21 05:15:34 +04:00
|
|
|
|
2021-03-18 08:39:34 +04:00
|
|
|
Position::new(line, col)
|
|
|
|
}
|
|
|
|
|
2021-11-03 07:02:29 +04:00
|
|
|
/// Convert a character index to (line, column) coordinates visually.
|
|
|
|
///
|
|
|
|
/// Takes \t, double-width characters (CJK) into account as well as text
|
|
|
|
/// not in the document in the future.
|
|
|
|
/// See [`coords_at_pos`] for an "objective" one.
|
|
|
|
pub fn visual_coords_at_pos(text: RopeSlice, pos: usize, tab_width: usize) -> Position {
|
|
|
|
let line = text.char_to_line(pos);
|
|
|
|
|
|
|
|
let line_start = text.line_to_char(line);
|
|
|
|
let pos = ensure_grapheme_boundary_prev(text, pos);
|
2022-03-03 12:41:39 +04:00
|
|
|
|
|
|
|
let mut col = 0;
|
|
|
|
|
|
|
|
for grapheme in RopeGraphemes::new(text.slice(line_start..pos)) {
|
|
|
|
if grapheme == "\t" {
|
2022-03-04 06:01:33 +04:00
|
|
|
col += tab_width - (col % tab_width);
|
2022-03-03 12:41:39 +04:00
|
|
|
} else {
|
|
|
|
let grapheme = Cow::from(grapheme);
|
|
|
|
col += grapheme_width(&grapheme);
|
|
|
|
}
|
|
|
|
}
|
2021-11-03 07:02:29 +04:00
|
|
|
|
|
|
|
Position::new(line, col)
|
|
|
|
}
|
|
|
|
|
2021-03-18 08:39:34 +04:00
|
|
|
/// Convert (line, column) coordinates to a character index.
|
2021-07-21 05:15:34 +04:00
|
|
|
///
|
2021-08-08 02:34:01 +04:00
|
|
|
/// If the `line` coordinate is beyond the end of the file, the EOF
|
|
|
|
/// position will be returned.
|
|
|
|
///
|
|
|
|
/// If the `column` coordinate is past the end of the given line, the
|
|
|
|
/// line-end position will be returned. What constitutes the "line-end
|
|
|
|
/// position" depends on the parameter `limit_before_line_ending`. If it's
|
|
|
|
/// `true`, the line-end position will be just *before* the line ending
|
|
|
|
/// character. If `false` it will be just *after* the line ending
|
|
|
|
/// character--on the border between the current line and the next.
|
|
|
|
///
|
|
|
|
/// Usually you only want `limit_before_line_ending` to be `true` if you're working
|
|
|
|
/// with left-side block-cursor positions, as this prevents the the block cursor
|
|
|
|
/// from jumping to the next line. Otherwise you typically want it to be `false`,
|
|
|
|
/// such as when dealing with raw anchor/head positions.
|
2021-07-23 00:21:44 +04:00
|
|
|
///
|
|
|
|
/// TODO: this should be changed to work in terms of visual row/column, not
|
|
|
|
/// graphemes.
|
2021-08-08 02:34:01 +04:00
|
|
|
pub fn pos_at_coords(text: RopeSlice, coords: Position, limit_before_line_ending: bool) -> usize {
|
2022-01-23 11:54:03 +04:00
|
|
|
let Position { mut row, col } = coords;
|
|
|
|
if limit_before_line_ending {
|
|
|
|
row = row.min(text.len_lines() - 1);
|
|
|
|
};
|
2021-03-18 08:39:34 +04:00
|
|
|
let line_start = text.line_to_char(row);
|
2021-08-08 02:34:01 +04:00
|
|
|
let line_end = if limit_before_line_ending {
|
2021-07-21 05:15:34 +04:00
|
|
|
line_end_char_index(&text, row)
|
|
|
|
} else {
|
|
|
|
text.line_to_char((row + 1).min(text.len_lines()))
|
|
|
|
};
|
|
|
|
|
|
|
|
let mut col_char_offset = 0;
|
2021-07-23 00:21:44 +04:00
|
|
|
for (i, g) in RopeGraphemes::new(text.slice(line_start..line_end)).enumerate() {
|
|
|
|
if i == col {
|
2021-07-21 05:15:34 +04:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
col_char_offset += g.chars().count();
|
|
|
|
}
|
|
|
|
|
|
|
|
line_start + col_char_offset
|
2021-03-18 08:39:34 +04:00
|
|
|
}
|
2020-09-17 09:57:49 +04:00
|
|
|
|
|
|
|
#[cfg(test)]
|
|
|
|
mod test {
|
|
|
|
use super::*;
|
2021-07-01 23:24:22 +04:00
|
|
|
use crate::Rope;
|
2020-09-17 09:57:49 +04:00
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn test_ordering() {
|
|
|
|
// (0, 5) is less than (1, 0)
|
|
|
|
assert!(Position::new(0, 5) < Position::new(1, 0));
|
|
|
|
}
|
2021-03-18 08:39:34 +04:00
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn test_coords_at_pos() {
|
2021-07-21 05:15:34 +04:00
|
|
|
let text = Rope::from("ḧëḷḷö\nẅöṛḷḋ");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(coords_at_pos(slice, 0), (0, 0).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 5), (0, 5).into()); // position on \n
|
|
|
|
assert_eq!(coords_at_pos(slice, 6), (1, 0).into()); // position on w
|
|
|
|
assert_eq!(coords_at_pos(slice, 7), (1, 1).into()); // position on o
|
|
|
|
assert_eq!(coords_at_pos(slice, 10), (1, 4).into()); // position on d
|
|
|
|
|
|
|
|
// Test with wide characters.
|
|
|
|
let text = Rope::from("今日はいい\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(coords_at_pos(slice, 0), (0, 0).into());
|
2021-07-23 00:21:44 +04:00
|
|
|
assert_eq!(coords_at_pos(slice, 1), (0, 1).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 2), (0, 2).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 3), (0, 3).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 4), (0, 4).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 5), (0, 5).into());
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(coords_at_pos(slice, 6), (1, 0).into());
|
2021-03-18 08:39:34 +04:00
|
|
|
|
2021-07-23 00:21:44 +04:00
|
|
|
// Test with grapheme clusters.
|
2021-03-18 08:39:34 +04:00
|
|
|
let text = Rope::from("a̐éö̲\r\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(coords_at_pos(slice, 0), (0, 0).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 2), (0, 1).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 4), (0, 2).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 7), (0, 3).into());
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(coords_at_pos(slice, 9), (1, 0).into());
|
2021-03-18 08:39:34 +04:00
|
|
|
|
2021-07-23 00:21:44 +04:00
|
|
|
// Test with wide-character grapheme clusters.
|
2021-07-21 05:15:34 +04:00
|
|
|
let text = Rope::from("किमपि\n");
|
2021-03-18 08:39:34 +04:00
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(coords_at_pos(slice, 0), (0, 0).into());
|
2021-07-23 00:21:44 +04:00
|
|
|
assert_eq!(coords_at_pos(slice, 2), (0, 1).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 3), (0, 2).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 5), (0, 3).into());
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(coords_at_pos(slice, 6), (1, 0).into());
|
2021-07-23 00:21:44 +04:00
|
|
|
|
|
|
|
// Test with tabs.
|
|
|
|
let text = Rope::from("\tHello\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(coords_at_pos(slice, 0), (0, 0).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 1), (0, 1).into());
|
|
|
|
assert_eq!(coords_at_pos(slice, 2), (0, 2).into());
|
2021-03-18 08:39:34 +04:00
|
|
|
}
|
|
|
|
|
2021-11-03 07:02:29 +04:00
|
|
|
#[test]
|
|
|
|
fn test_visual_coords_at_pos() {
|
|
|
|
let text = Rope::from("ḧëḷḷö\nẅöṛḷḋ");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 0, 8), (0, 0).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 5, 8), (0, 5).into()); // position on \n
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 6, 8), (1, 0).into()); // position on w
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 7, 8), (1, 1).into()); // position on o
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 10, 8), (1, 4).into()); // position on d
|
|
|
|
|
|
|
|
// Test with wide characters.
|
|
|
|
let text = Rope::from("今日はいい\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 0, 8), (0, 0).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 1, 8), (0, 2).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 2, 8), (0, 4).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 3, 8), (0, 6).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 4, 8), (0, 8).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 5, 8), (0, 10).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 6, 8), (1, 0).into());
|
|
|
|
|
|
|
|
// Test with grapheme clusters.
|
|
|
|
let text = Rope::from("a̐éö̲\r\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 0, 8), (0, 0).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 2, 8), (0, 1).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 4, 8), (0, 2).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 7, 8), (0, 3).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 9, 8), (1, 0).into());
|
|
|
|
|
|
|
|
// Test with wide-character grapheme clusters.
|
|
|
|
// TODO: account for cluster.
|
|
|
|
let text = Rope::from("किमपि\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 0, 8), (0, 0).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 2, 8), (0, 2).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 3, 8), (0, 3).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 5, 8), (0, 5).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 6, 8), (1, 0).into());
|
|
|
|
|
|
|
|
// Test with tabs.
|
|
|
|
let text = Rope::from("\tHello\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 0, 8), (0, 0).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 1, 8), (0, 8).into());
|
|
|
|
assert_eq!(visual_coords_at_pos(slice, 2, 8), (0, 9).into());
|
|
|
|
}
|
|
|
|
|
2021-03-18 08:39:34 +04:00
|
|
|
#[test]
|
|
|
|
fn test_pos_at_coords() {
|
|
|
|
let text = Rope::from("ḧëḷḷö\nẅöṛḷḋ");
|
|
|
|
let slice = text.slice(..);
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(pos_at_coords(slice, (0, 0).into(), false), 0);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 5).into(), false), 5); // position on \n
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 6).into(), false), 6); // position after \n
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 6).into(), true), 5); // position after \n
|
|
|
|
assert_eq!(pos_at_coords(slice, (1, 0).into(), false), 6); // position on w
|
|
|
|
assert_eq!(pos_at_coords(slice, (1, 1).into(), false), 7); // position on o
|
|
|
|
assert_eq!(pos_at_coords(slice, (1, 4).into(), false), 10); // position on d
|
|
|
|
|
|
|
|
// Test with wide characters.
|
2021-07-23 00:21:44 +04:00
|
|
|
// TODO: account for character width.
|
2021-07-21 05:15:34 +04:00
|
|
|
let text = Rope::from("今日はいい\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 0).into(), false), 0);
|
2021-07-23 00:21:44 +04:00
|
|
|
assert_eq!(pos_at_coords(slice, (0, 1).into(), false), 1);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 2).into(), false), 2);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 3).into(), false), 3);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 4).into(), false), 4);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 5).into(), false), 5);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 6).into(), false), 6);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 6).into(), true), 5);
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(pos_at_coords(slice, (1, 0).into(), false), 6);
|
2021-03-18 08:39:34 +04:00
|
|
|
|
2021-07-23 00:21:44 +04:00
|
|
|
// Test with grapheme clusters.
|
2021-03-18 08:39:34 +04:00
|
|
|
let text = Rope::from("a̐éö̲\r\n");
|
|
|
|
let slice = text.slice(..);
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(pos_at_coords(slice, (0, 0).into(), false), 0);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 1).into(), false), 2);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 2).into(), false), 4);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 3).into(), false), 7); // \r\n is one char here
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 4).into(), false), 9);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 4).into(), true), 7);
|
|
|
|
assert_eq!(pos_at_coords(slice, (1, 0).into(), false), 9);
|
|
|
|
|
2021-07-23 00:21:44 +04:00
|
|
|
// Test with wide-character grapheme clusters.
|
|
|
|
// TODO: account for character width.
|
2021-03-18 08:39:34 +04:00
|
|
|
let text = Rope::from("किमपि");
|
|
|
|
// 2 - 1 - 2 codepoints
|
|
|
|
// TODO: delete handling as per https://news.ycombinator.com/item?id=20058454
|
|
|
|
let slice = text.slice(..);
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(pos_at_coords(slice, (0, 0).into(), false), 0);
|
2021-07-23 00:21:44 +04:00
|
|
|
assert_eq!(pos_at_coords(slice, (0, 1).into(), false), 2);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 2).into(), false), 3);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 3).into(), false), 5);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 3).into(), true), 5);
|
|
|
|
|
|
|
|
// Test with tabs.
|
|
|
|
// Todo: account for tab stops.
|
|
|
|
let text = Rope::from("\tHello\n");
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 0).into(), false), 0);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 1).into(), false), 1);
|
2021-07-21 05:15:34 +04:00
|
|
|
assert_eq!(pos_at_coords(slice, (0, 2).into(), false), 2);
|
2022-01-23 11:54:03 +04:00
|
|
|
|
|
|
|
// Test out of bounds.
|
|
|
|
let text = Rope::new();
|
|
|
|
let slice = text.slice(..);
|
|
|
|
assert_eq!(pos_at_coords(slice, (10, 0).into(), true), 0);
|
|
|
|
assert_eq!(pos_at_coords(slice, (0, 10).into(), true), 0);
|
|
|
|
assert_eq!(pos_at_coords(slice, (10, 10).into(), true), 0);
|
2021-03-18 08:39:34 +04:00
|
|
|
}
|
2020-09-17 09:57:49 +04:00
|
|
|
}
|