commit cda2ec7e06c28cf78b1944b169fe5463c96c1c35 · nonbinary.computer/weaver

-17

Cargo.lock

··· 4990 ] 4991 4992 [[package]] 4993 - name = "jumprope" 4994 - version = "1.1.2" 4995 - source = "registry+https://github.com/rust-lang/crates.io-index" 4996 - checksum = "829c74fe88dda0d2a5425b022b44921574a65c4eb78e6e39a61b40eb416a4ef8" 4997 - dependencies = [ 4998 - "rand 0.8.5", 4999 - "str_indices", 5000 - ] 5001 - 5002 - [[package]] 5003 name = "k256" 5004 version = "0.13.4" 5005 source = "registry+https://github.com/rust-lang/crates.io-index" ··· 8349 checksum = "a2eb9349b6444b326872e140eb1cf5e7c522154d69e7a0ffb0fb81c06b37543f" 8350 8351 [[package]] 8352 - name = "str_indices" 8353 - version = "0.4.4" 8354 - source = "registry+https://github.com/rust-lang/crates.io-index" 8355 - checksum = "d08889ec5408683408db66ad89e0e1f93dff55c73a4ccc71c427d5b277ee47e6" 8356 - 8357 - [[package]] 8358 name = "string_cache" 8359 version = "0.8.9" 8360 source = "registry+https://github.com/rust-lang/crates.io-index" ··· 9963 "jacquard-identity", 9964 "jacquard-lexicon", 9965 "js-sys", 9966 - "jumprope", 9967 "lol_alloc", 9968 "loro", 9969 "markdown-weaver",

··· 4990 ] 4991 4992 [[package]] 4993 name = "k256" 4994 version = "0.13.4" 4995 source = "registry+https://github.com/rust-lang/crates.io-index" ··· 8339 checksum = "a2eb9349b6444b326872e140eb1cf5e7c522154d69e7a0ffb0fb81c06b37543f" 8340 8341 [[package]] 8342 name = "string_cache" 8343 version = "0.8.9" 8344 source = "registry+https://github.com/rust-lang/crates.io-index" ··· 9947 "jacquard-identity", 9948 "jacquard-lexicon", 9949 "js-sys", 9950 "lol_alloc", 9951 "loro", 9952 "markdown-weaver",

-1

crates/weaver-app/Cargo.toml

··· 49 serde_html_form = "0.2.8" 50 tracing.workspace = true 51 serde_ipld_dagcbor = { version = "0.6" } 52 - jumprope = { version = "1.1", features = ["wchar_conversion"] } 53 loro = "1.9.1" 54 markdown-weaver-escape = { workspace = true } 55

··· 49 serde_html_form = "0.2.8" 50 tracing.workspace = true 51 serde_ipld_dagcbor = { version = "0.6" } 52 loro = "1.9.1" 53 markdown-weaver-escape = { workspace = true } 54

+9 -11

crates/weaver-app/src/components/editor/cursor.rs

··· 8 //! 4. Setting cursor with web_sys Selection API 9 10 use super::offset_map::{find_mapping_for_char, OffsetMapping}; 11 - use jumprope::JumpRopeBuf; 12 13 #[cfg(all(target_family = "wasm", target_os = "unknown"))] 14 use wasm_bindgen::JsCast; ··· 16 /// Restore cursor position in the DOM after re-render. 17 /// 18 /// # Arguments 19 - /// - `rope`: The document content (for length bounds checking) 20 - /// - `char_offset`: Cursor position as char offset in rope 21 /// - `offset_map`: Mappings from source to DOM positions 22 /// - `editor_id`: DOM ID of the contenteditable element 23 /// ··· 28 /// 4. Set cursor with Selection API 29 #[cfg(all(target_family = "wasm", target_os = "unknown"))] 30 pub fn restore_cursor_position( 31 - rope: &JumpRopeBuf, 32 char_offset: usize, 33 offset_map: &[OffsetMapping], 34 editor_id: &str, 35 ) -> Result<(), wasm_bindgen::JsValue> { 36 - // Bounds check 37 - let max_offset = rope.len_chars(); 38 - if char_offset > max_offset { 39 - return Err(format!("cursor offset {} > document length {}", char_offset, max_offset).into()); 40 } 41 42 - // Empty document - no cursor to restore 43 - if offset_map.is_empty() || max_offset == 0 { 44 return Ok(()); 45 } 46 ··· 159 /// Non-WASM stub for testing 160 #[cfg(not(all(target_family = "wasm", target_os = "unknown")))] 161 pub fn restore_cursor_position( 162 - _rope: &JumpRopeBuf, 163 _char_offset: usize, 164 _offset_map: &[OffsetMapping], 165 _editor_id: &str,

··· 8 //! 4. Setting cursor with web_sys Selection API 9 10 use super::offset_map::{find_mapping_for_char, OffsetMapping}; 11 12 #[cfg(all(target_family = "wasm", target_os = "unknown"))] 13 use wasm_bindgen::JsCast; ··· 15 /// Restore cursor position in the DOM after re-render. 16 /// 17 /// # Arguments 18 + /// - `char_offset`: Cursor position as char offset in document 19 /// - `offset_map`: Mappings from source to DOM positions 20 /// - `editor_id`: DOM ID of the contenteditable element 21 /// ··· 26 /// 4. Set cursor with Selection API 27 #[cfg(all(target_family = "wasm", target_os = "unknown"))] 28 pub fn restore_cursor_position( 29 char_offset: usize, 30 offset_map: &[OffsetMapping], 31 editor_id: &str, 32 ) -> Result<(), wasm_bindgen::JsValue> { 33 + // Empty document - no cursor to restore 34 + if offset_map.is_empty() { 35 + return Ok(()); 36 } 37 38 + // Bounds check using offset map 39 + let max_offset = offset_map.iter().map(|m| m.char_range.end).max().unwrap_or(0); 40 + if char_offset > max_offset { 41 + tracing::warn!("cursor offset {} > max mapping offset {}", char_offset, max_offset); 42 + // Don't error, just skip restoration - this can happen during edits 43 return Ok(()); 44 } 45 ··· 158 /// Non-WASM stub for testing 159 #[cfg(not(all(target_family = "wasm", target_os = "unknown")))] 160 pub fn restore_cursor_position( 161 _char_offset: usize, 162 _offset_map: &[OffsetMapping], 163 _editor_id: &str,

+129 -32

crates/weaver-app/src/components/editor/document.rs

··· 1 //! Core data structures for the markdown editor. 2 3 - use jumprope::JumpRopeBuf; 4 5 /// Single source of truth for editor state. 6 /// 7 - /// Contains the document text, cursor position, selection, and IME composition state. 8 - #[derive(Clone, Debug)] 9 pub struct EditorDocument { 10 - /// The rope storing document text (uses char offsets, not bytes). 11 - /// Uses JumpRopeBuf to batch consecutive edits for performance. 12 - pub rope: JumpRopeBuf, 13 14 /// Current cursor position (char offset) 15 pub cursor: CursorState, ··· 28 /// Cursor state including position and affinity. 29 #[derive(Clone, Debug, Copy)] 30 pub struct CursorState { 31 - /// Character offset in rope (NOT byte offset!) 32 pub offset: usize, 33 34 /// Prefer left/right when at boundary (for vertical cursor movement) ··· 85 return true; 86 } 87 88 - // Find distance from previous newline by scanning forward and tracking last newline 89 - let rope = self.rope.borrow(); 90 let mut last_newline_pos: Option<usize> = None; 91 92 - for (i, c) in rope.slice_chars(0..pos).enumerate() { 93 if c == '\n' { 94 last_newline_pos = Some(i); 95 } 96 } 97 98 let chars_from_line_start = match last_newline_pos { 99 - Some(nl_pos) => pos - nl_pos - 1, // -1 because newline itself is not part of current line 100 - None => pos, // No newline found, distance is from document start 101 }; 102 103 chars_from_line_start <= BLOCK_SYNTAX_ZONE ··· 105 106 /// Create a new editor document with the given content. 107 pub fn new(content: String) -> Self { 108 Self { 109 - rope: JumpRopeBuf::from(content.as_str()), 110 cursor: CursorState { 111 offset: 0, 112 affinity: Affinity::Before, ··· 117 } 118 } 119 120 /// Convert the document to a string. 121 pub fn to_string(&self) -> String { 122 - self.rope.to_string() 123 } 124 125 /// Get the length of the document in characters. 126 pub fn len_chars(&self) -> usize { 127 - self.rope.len_chars() 128 } 129 130 /// Check if the document is empty. 131 pub fn is_empty(&self) -> bool { 132 - self.rope.len_chars() == 0 133 } 134 135 /// Insert text and record edit info for incremental rendering. 136 - pub fn insert_tracked(&mut self, pos: usize, text: &str) { 137 let in_block_syntax_zone = self.is_in_block_syntax_zone(pos); 138 self.last_edit = Some(EditInfo { 139 edit_char_pos: pos, ··· 142 contains_newline: text.contains('\n'), 143 in_block_syntax_zone, 144 }); 145 - self.rope.insert(pos, text); 146 } 147 148 /// Remove text range and record edit info for incremental rendering. 149 - pub fn remove_tracked(&mut self, range: std::ops::Range<usize>) { 150 - // Check if deleted region contains newline - borrow inner JumpRope 151 - let contains_newline = self.rope.borrow().slice_chars(range.clone()).any(|c| c == '\n'); 152 - let in_block_syntax_zone = self.is_in_block_syntax_zone(range.start); 153 self.last_edit = Some(EditInfo { 154 - edit_char_pos: range.start, 155 inserted_len: 0, 156 - deleted_len: range.end - range.start, 157 contains_newline, 158 in_block_syntax_zone, 159 }); 160 - self.rope.remove(range); 161 } 162 163 /// Replace text (delete then insert) and record combined edit info. 164 - pub fn replace_tracked(&mut self, range: std::ops::Range<usize>, text: &str) { 165 - let delete_has_newline = self.rope.borrow().slice_chars(range.clone()).any(|c| c == '\n'); 166 - let in_block_syntax_zone = self.is_in_block_syntax_zone(range.start); 167 self.last_edit = Some(EditInfo { 168 - edit_char_pos: range.start, 169 inserted_len: text.chars().count(), 170 - deleted_len: range.end - range.start, 171 contains_newline: delete_has_newline || text.contains('\n'), 172 in_block_syntax_zone, 173 }); 174 - self.rope.remove(range); 175 - self.rope.insert(self.last_edit.as_ref().unwrap().edit_char_pos, text); 176 } 177 }

··· 1 //! Core data structures for the markdown editor. 2 + //! 3 + //! Uses Loro CRDT for text storage with built-in undo/redo support. 4 5 + use loro::{LoroDoc, LoroResult, LoroText, UndoManager}; 6 7 /// Single source of truth for editor state. 8 /// 9 + /// Contains the document text (backed by Loro CRDT), cursor position, 10 + /// selection, and IME composition state. 11 + #[derive(Debug)] 12 pub struct EditorDocument { 13 + /// The Loro document containing all editor state. 14 + /// Using full LoroDoc (not just LoroText) to support future 15 + /// expansion to blobs, metadata, etc. 16 + doc: LoroDoc, 17 + 18 + /// Handle to the text container within the doc. 19 + text: LoroText, 20 + 21 + /// Undo manager for the document. 22 + undo_mgr: UndoManager, 23 24 /// Current cursor position (char offset) 25 pub cursor: CursorState, ··· 38 /// Cursor state including position and affinity. 39 #[derive(Clone, Debug, Copy)] 40 pub struct CursorState { 41 + /// Character offset in text (NOT byte offset!) 42 pub offset: usize, 43 44 /// Prefer left/right when at boundary (for vertical cursor movement) ··· 95 return true; 96 } 97 98 + let content = self.text.to_string(); 99 let mut last_newline_pos: Option<usize> = None; 100 101 + for (i, c) in content.chars().take(pos).enumerate() { 102 if c == '\n' { 103 last_newline_pos = Some(i); 104 } 105 } 106 107 let chars_from_line_start = match last_newline_pos { 108 + Some(nl_pos) => pos - nl_pos - 1, 109 + None => pos, 110 }; 111 112 chars_from_line_start <= BLOCK_SYNTAX_ZONE ··· 114 115 /// Create a new editor document with the given content. 116 pub fn new(content: String) -> Self { 117 + let doc = LoroDoc::new(); 118 + let text = doc.get_text("content"); 119 + 120 + // Insert initial content if any 121 + if !content.is_empty() { 122 + text.insert(0, &content).expect("failed to insert initial content"); 123 + } 124 + 125 + // Set up undo manager with merge interval for batching keystrokes 126 + let mut undo_mgr = UndoManager::new(&doc); 127 + undo_mgr.set_merge_interval(300); // 300ms merge window 128 + undo_mgr.set_max_undo_steps(100); 129 + 130 Self { 131 + doc, 132 + text, 133 + undo_mgr, 134 cursor: CursorState { 135 offset: 0, 136 affinity: Affinity::Before, ··· 141 } 142 } 143 144 + /// Get the underlying LoroText for read operations. 145 + pub fn loro_text(&self) -> &LoroText { 146 + &self.text 147 + } 148 + 149 /// Convert the document to a string. 150 pub fn to_string(&self) -> String { 151 + self.text.to_string() 152 } 153 154 /// Get the length of the document in characters. 155 pub fn len_chars(&self) -> usize { 156 + self.text.len_unicode() 157 + } 158 + 159 + /// Get the length of the document in UTF-8 bytes. 160 + pub fn len_bytes(&self) -> usize { 161 + self.text.len_utf8() 162 + } 163 + 164 + /// Get the length of the document in UTF-16 code units. 165 + pub fn len_utf16(&self) -> usize { 166 + self.text.len_utf16() 167 } 168 169 /// Check if the document is empty. 170 pub fn is_empty(&self) -> bool { 171 + self.text.len_unicode() == 0 172 } 173 174 /// Insert text and record edit info for incremental rendering. 175 + pub fn insert_tracked(&mut self, pos: usize, text: &str) -> LoroResult<()> { 176 let in_block_syntax_zone = self.is_in_block_syntax_zone(pos); 177 self.last_edit = Some(EditInfo { 178 edit_char_pos: pos, ··· 181 contains_newline: text.contains('\n'), 182 in_block_syntax_zone, 183 }); 184 + self.text.insert(pos, text) 185 } 186 187 /// Remove text range and record edit info for incremental rendering. 188 + pub fn remove_tracked(&mut self, start: usize, len: usize) -> LoroResult<()> { 189 + let content = self.text.to_string(); 190 + let end = start + len; 191 + let contains_newline = content 192 + .chars() 193 + .skip(start) 194 + .take(len) 195 + .any(|c| c == '\n'); 196 + let in_block_syntax_zone = self.is_in_block_syntax_zone(start); 197 + 198 self.last_edit = Some(EditInfo { 199 + edit_char_pos: start, 200 inserted_len: 0, 201 + deleted_len: len, 202 contains_newline, 203 in_block_syntax_zone, 204 }); 205 + self.text.delete(start, len) 206 } 207 208 /// Replace text (delete then insert) and record combined edit info. 209 + pub fn replace_tracked(&mut self, start: usize, len: usize, text: &str) -> LoroResult<()> { 210 + let content = self.text.to_string(); 211 + let delete_has_newline = content 212 + .chars() 213 + .skip(start) 214 + .take(len) 215 + .any(|c| c == '\n'); 216 + let in_block_syntax_zone = self.is_in_block_syntax_zone(start); 217 + 218 self.last_edit = Some(EditInfo { 219 + edit_char_pos: start, 220 inserted_len: text.chars().count(), 221 + deleted_len: len, 222 contains_newline: delete_has_newline || text.contains('\n'), 223 in_block_syntax_zone, 224 }); 225 + 226 + // Use splice for atomic replace 227 + self.text.splice(start, len, text)?; 228 + Ok(()) 229 + } 230 + 231 + /// Undo the last operation. 232 + /// Returns true if an undo was performed. 233 + pub fn undo(&mut self) -> LoroResult<bool> { 234 + self.undo_mgr.undo() 235 + } 236 + 237 + /// Redo the last undone operation. 238 + /// Returns true if a redo was performed. 239 + pub fn redo(&mut self) -> LoroResult<bool> { 240 + self.undo_mgr.redo() 241 + } 242 + 243 + /// Check if undo is available. 244 + pub fn can_undo(&self) -> bool { 245 + self.undo_mgr.can_undo() 246 + } 247 + 248 + /// Check if redo is available. 249 + pub fn can_redo(&self) -> bool { 250 + self.undo_mgr.can_redo() 251 + } 252 + 253 + /// Get a slice of the document text. 254 + /// Returns None if the range is invalid. 255 + pub fn slice(&self, start: usize, end: usize) -> Option<String> { 256 + self.text.slice(start, end).ok() 257 + } 258 + } 259 + 260 + // EditorDocument can't derive Clone because LoroDoc/LoroText/UndoManager don't implement Clone. 261 + // This is intentional - the document should be the single source of truth. 262 + 263 + impl Clone for EditorDocument { 264 + fn clone(&self) -> Self { 265 + // Create a new document with the same content 266 + let content = self.to_string(); 267 + let mut new_doc = Self::new(content); 268 + new_doc.cursor = self.cursor; 269 + new_doc.selection = self.selection; 270 + new_doc.composition = self.composition.clone(); 271 + new_doc.last_edit = self.last_edit.clone(); 272 + new_doc 273 } 274 }

+60 -55

crates/weaver-app/src/components/editor/formatting.rs

··· 21 /// 22 /// Expands to whitespace boundaries. Used when applying formatting 23 /// without a selection. 24 - pub fn find_word_boundaries(rope: &jumprope::JumpRopeBuf, offset: usize) -> (usize, usize) { 25 - let rope = rope.borrow(); 26 let mut start = 0; 27 - let mut end = rope.len_chars(); 28 - 29 - // Find start by scanning backwards 30 - let mut char_pos = 0; 31 - for substr in rope.slice_substrings(0..offset) { 32 - for c in substr.chars() { 33 - if c.is_whitespace() { 34 - start = char_pos + 1; 35 } 36 - char_pos += 1; 37 } 38 } 39 40 - // Find end by scanning forwards 41 - char_pos = offset; 42 - let byte_len = rope.len_bytes(); 43 - for substr in rope.slice_substrings(offset..byte_len) { 44 - for c in substr.chars() { 45 - if c.is_whitespace() { 46 - end = char_pos; 47 - return (start, end); 48 } 49 - char_pos += 1; 50 } 51 } 52 ··· 62 (sel.anchor.min(sel.head), sel.anchor.max(sel.head)) 63 } else { 64 // Expand to word 65 - find_word_boundaries(&doc.rope, doc.cursor.offset) 66 }; 67 68 match action { 69 FormatAction::Bold => { 70 - doc.rope.insert(end, "**"); 71 - doc.rope.insert(start, "**"); 72 doc.cursor.offset = end + 4; 73 doc.selection = None; 74 } 75 FormatAction::Italic => { 76 - doc.rope.insert(end, "*"); 77 - doc.rope.insert(start, "*"); 78 doc.cursor.offset = end + 2; 79 doc.selection = None; 80 } 81 FormatAction::Strikethrough => { 82 - doc.rope.insert(end, "~~"); 83 - doc.rope.insert(start, "~~"); 84 doc.cursor.offset = end + 4; 85 doc.selection = None; 86 } 87 FormatAction::Code => { 88 - doc.rope.insert(end, "`"); 89 - doc.rope.insert(start, "`"); 90 doc.cursor.offset = end + 2; 91 doc.selection = None; 92 } 93 FormatAction::Link => { 94 // Insert [selected text](url) 95 - doc.rope.insert(end, "](url)"); 96 - doc.rope.insert(start, "["); 97 doc.cursor.offset = end + 8; // Position cursor after ](url) 98 doc.selection = None; 99 } 100 FormatAction::Image => { 101 // Insert ![alt text](url) 102 - doc.rope.insert(end, "](url)"); 103 - doc.rope.insert(start, "!["); 104 doc.cursor.offset = end + 9; 105 doc.selection = None; 106 } 107 FormatAction::Heading(level) => { 108 // Find start of current line 109 - let line_start = find_line_start(&doc.rope, doc.cursor.offset); 110 let prefix = "#".repeat(level as usize) + " "; 111 - doc.rope.insert(line_start, &prefix); 112 doc.cursor.offset += prefix.len(); 113 doc.selection = None; 114 } 115 FormatAction::BulletList => { 116 - let line_start = find_line_start(&doc.rope, doc.cursor.offset); 117 - doc.rope.insert(line_start, "- "); 118 doc.cursor.offset += 2; 119 doc.selection = None; 120 } 121 FormatAction::NumberedList => { 122 - let line_start = find_line_start(&doc.rope, doc.cursor.offset); 123 - doc.rope.insert(line_start, "1. "); 124 doc.cursor.offset += 3; 125 doc.selection = None; 126 } 127 FormatAction::Quote => { 128 - let line_start = find_line_start(&doc.rope, doc.cursor.offset); 129 - doc.rope.insert(line_start, "> "); 130 doc.cursor.offset += 2; 131 doc.selection = None; 132 } 133 } 134 } 135 136 - /// Find start of line containing offset (same as in mod.rs) 137 - fn find_line_start(rope: &jumprope::JumpRopeBuf, offset: usize) -> usize { 138 - let mut char_pos = 0; 139 - let mut last_newline_pos = None; 140 - 141 - let rope = rope.borrow(); 142 - for substr in rope.slice_substrings(0..offset) { 143 - for c in substr.chars() { 144 - if c == '\n' { 145 - last_newline_pos = Some(char_pos); 146 - } 147 - char_pos += 1; 148 - } 149 } 150 151 - last_newline_pos.map(|pos| pos + 1).unwrap_or(0) 152 }

··· 21 /// 22 /// Expands to whitespace boundaries. Used when applying formatting 23 /// without a selection. 24 + pub fn find_word_boundaries(text: &loro::LoroText, offset: usize) -> (usize, usize) { 25 + let len = text.len_unicode(); 26 + 27 + // Find start by scanning backwards using char_at 28 let mut start = 0; 29 + for i in (0..offset).rev() { 30 + match text.char_at(i) { 31 + Ok(c) if c.is_whitespace() => { 32 + start = i + 1; 33 + break; 34 } 35 + Ok(_) => continue, 36 + Err(_) => break, 37 } 38 } 39 40 + // Find end by scanning forwards using char_at 41 + let mut end = len; 42 + for i in offset..len { 43 + match text.char_at(i) { 44 + Ok(c) if c.is_whitespace() => { 45 + end = i; 46 + break; 47 } 48 + Ok(_) => continue, 49 + Err(_) => break, 50 } 51 } 52 ··· 62 (sel.anchor.min(sel.head), sel.anchor.max(sel.head)) 63 } else { 64 // Expand to word 65 + find_word_boundaries(doc.loro_text(), doc.cursor.offset) 66 }; 67 68 match action { 69 FormatAction::Bold => { 70 + // Insert end marker first so start position stays valid 71 + let _ = doc.insert_tracked(end, "**"); 72 + let _ = doc.insert_tracked(start, "**"); 73 doc.cursor.offset = end + 4; 74 doc.selection = None; 75 } 76 FormatAction::Italic => { 77 + let _ = doc.insert_tracked(end, "*"); 78 + let _ = doc.insert_tracked(start, "*"); 79 doc.cursor.offset = end + 2; 80 doc.selection = None; 81 } 82 FormatAction::Strikethrough => { 83 + let _ = doc.insert_tracked(end, "~~"); 84 + let _ = doc.insert_tracked(start, "~~"); 85 doc.cursor.offset = end + 4; 86 doc.selection = None; 87 } 88 FormatAction::Code => { 89 + let _ = doc.insert_tracked(end, "`"); 90 + let _ = doc.insert_tracked(start, "`"); 91 doc.cursor.offset = end + 2; 92 doc.selection = None; 93 } 94 FormatAction::Link => { 95 // Insert [selected text](url) 96 + let _ = doc.insert_tracked(end, "](url)"); 97 + let _ = doc.insert_tracked(start, "["); 98 doc.cursor.offset = end + 8; // Position cursor after ](url) 99 doc.selection = None; 100 } 101 FormatAction::Image => { 102 // Insert ![alt text](url) 103 + let _ = doc.insert_tracked(end, "](url)"); 104 + let _ = doc.insert_tracked(start, "!["); 105 doc.cursor.offset = end + 9; 106 doc.selection = None; 107 } 108 FormatAction::Heading(level) => { 109 // Find start of current line 110 + let line_start = find_line_start(doc.loro_text(), doc.cursor.offset); 111 let prefix = "#".repeat(level as usize) + " "; 112 + let _ = doc.insert_tracked(line_start, &prefix); 113 doc.cursor.offset += prefix.len(); 114 doc.selection = None; 115 } 116 FormatAction::BulletList => { 117 + let line_start = find_line_start(doc.loro_text(), doc.cursor.offset); 118 + let _ = doc.insert_tracked(line_start, "- "); 119 doc.cursor.offset += 2; 120 doc.selection = None; 121 } 122 FormatAction::NumberedList => { 123 + let line_start = find_line_start(doc.loro_text(), doc.cursor.offset); 124 + let _ = doc.insert_tracked(line_start, "1. "); 125 doc.cursor.offset += 3; 126 doc.selection = None; 127 } 128 FormatAction::Quote => { 129 + let line_start = find_line_start(doc.loro_text(), doc.cursor.offset); 130 + let _ = doc.insert_tracked(line_start, "> "); 131 doc.cursor.offset += 2; 132 doc.selection = None; 133 } 134 } 135 } 136 137 + /// Find start of line containing offset 138 + fn find_line_start(text: &loro::LoroText, offset: usize) -> usize { 139 + if offset == 0 { 140 + return 0; 141 } 142 143 + // Get text up to offset 144 + let prefix = match text.slice(0, offset) { 145 + Ok(s) => s, 146 + Err(_) => return 0, 147 + }; 148 + 149 + // Find last newline 150 + prefix 151 + .chars() 152 + .enumerate() 153 + .filter(|(_, c)| *c == '\n') 154 + .last() 155 + .map(|(pos, _)| pos + 1) 156 + .unwrap_or(0) 157 }

+118 -156

crates/weaver-app/src/components/editor/mod.rs

··· 10 mod offset_map; 11 mod paragraph; 12 mod render; 13 - mod rope_writer; 14 mod storage; 15 mod toolbar; 16 mod visibility; ··· 24 pub use offset_map::{OffsetMapping, RenderResult, find_mapping_for_byte}; 25 pub use paragraph::ParagraphRender; 26 pub use render::{RenderCache, render_paragraphs_incremental}; 27 - pub use rope_writer::RopeWriter; 28 pub use storage::{EditorSnapshot, clear_storage, load_from_storage, save_to_storage}; 29 pub use toolbar::EditorToolbar; 30 pub use visibility::VisibilityState; ··· 38 /// - `initial_content`: Optional initial markdown content 39 /// 40 /// # Features 41 - /// - JumpRope-based text storage for efficient editing 42 /// - Event interception for full control over editing operations 43 /// - Toolbar formatting buttons 44 /// - LocalStorage auto-save with debouncing ··· 75 let edit = doc.last_edit.as_ref(); 76 77 let (paras, new_cache) = 78 - render::render_paragraphs_incremental(&doc.rope, Some(&cache), edit); 79 80 // Update cache for next render (write-only via spawn to avoid reactive loop) 81 dioxus::prelude::spawn(async move { ··· 107 // Update DOM when paragraphs change (incremental rendering) 108 #[cfg(all(target_arch = "wasm32", target_os = "unknown"))] 109 use_effect(move || { 110 let new_paras = paragraphs(); 111 - let cursor_offset = document().cursor.offset; 112 113 // Use peek() to avoid creating reactive dependency on cached_paragraphs 114 let prev = cached_paragraphs.peek().clone(); ··· 120 use wasm_bindgen::JsCast; 121 use wasm_bindgen::prelude::*; 122 123 - let rope = document().rope.clone(); 124 - let map = offset_map(); 125 - 126 // Use requestAnimationFrame to wait for browser paint 127 if let Some(window) = web_sys::window() { 128 let closure = Closure::once(move || { 129 if let Err(e) = 130 - cursor::restore_cursor_position(&rope, cursor_offset, &map, editor_id) 131 { 132 tracing::warn!("Cursor restoration failed: {:?}", e); 133 } ··· 142 cached_paragraphs.set(new_paras.clone()); 143 144 // Update syntax visibility after DOM changes 145 - let doc = document(); 146 - let spans = syntax_spans(); 147 update_syntax_visibility( 148 - doc.cursor.offset, 149 - doc.selection.as_ref(), 150 &spans, 151 &new_paras, 152 ); ··· 155 // Auto-save with debounce 156 #[cfg(all(target_arch = "wasm32", target_os = "unknown"))] 157 use_effect(move || { 158 let doc = document(); 159 160 // Save after 500ms of no typing 161 let timer = gloo_timers::callback::Timeout::new(500, move || { 162 - let _ = storage::save_to_storage(&doc.to_string(), doc.cursor.offset); 163 }); 164 timer.forget(); 165 }); ··· 213 }, 214 215 onclick: move |_evt| { 216 - // After mouse click, sync cursor from DOM 217 - let paras = cached_paragraphs(); 218 - sync_cursor_from_dom(&mut document, editor_id, &paras); 219 - // Update syntax visibility after cursor sync 220 - let doc = document(); 221 - let spans = syntax_spans(); 222 - update_syntax_visibility( 223 - doc.cursor.offset, 224 - doc.selection.as_ref(), 225 - &spans, 226 - &paras, 227 - ); 228 - }, 229 - 230 - onmouseup: move |_evt| { 231 - // After drag selection, sync cursor/selection from DOM 232 let paras = cached_paragraphs(); 233 sync_cursor_from_dom(&mut document, editor_id, &paras); 234 // Update syntax visibility after cursor sync ··· 528 // Delete selection if present 529 if let Some(sel) = doc.selection { 530 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 531 - doc.rope.remove(start..end); 532 doc.cursor.offset = start; 533 doc.selection = None; 534 } 535 536 // Insert pasted text 537 - doc.rope.insert(doc.cursor.offset, &text); 538 doc.cursor.offset += text.chars().count(); 539 }); 540 } ··· 545 } 546 } 547 548 - /// Handle cut events - extract text, write to clipboard, then delete from rope 549 fn handle_cut(evt: Event<ClipboardData>, document: &mut Signal<EditorDocument>) { 550 tracing::info!("[CUT] handle_cut called"); 551 ··· 560 if let Some(sel) = doc.selection { 561 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 562 if start != end { 563 - // Extract text from rope 564 - let selected_text = extract_rope_slice(&doc.rope, start, end); 565 tracing::info!( 566 "[CUT] Extracted {} chars: {:?}", 567 selected_text.len(), ··· 575 } 576 } 577 578 - // Now delete from rope 579 - doc.rope.remove(start..end); 580 doc.cursor.offset = start; 581 doc.selection = None; 582 } ··· 591 } 592 } 593 594 - /// Handle copy events - extract text from rope, clean it up, write to clipboard 595 fn handle_copy(evt: Event<ClipboardData>, document: &Signal<EditorDocument>) { 596 tracing::info!("[COPY] handle_copy called"); 597 ··· 606 if let Some(sel) = doc.selection { 607 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 608 if start != end { 609 - // Extract text from rope 610 - let selected_text = extract_rope_slice(&doc.rope, start, end); 611 612 // Strip zero-width chars used for gap handling 613 let clean_text = selected_text ··· 640 } 641 } 642 643 - /// Extract a slice of text from the rope as a String 644 - fn extract_rope_slice(rope: &jumprope::JumpRopeBuf, start: usize, end: usize) -> String { 645 - let mut result = String::new(); 646 - let rope_ref = rope.borrow(); 647 - for substr in rope_ref.slice_substrings(start..end) { 648 - result.push_str(substr); 649 - } 650 - result 651 } 652 653 /// Handle keyboard events and update document state ··· 675 } 676 } 677 678 - // Insert character at cursor 679 - if doc.selection.is_some() { 680 - // Delete selection first 681 - let sel = doc.selection.unwrap(); 682 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 683 - doc.rope.remove(start..end); 684 - doc.cursor.offset = start; 685 - doc.selection = None; 686 } 687 - 688 - doc.rope.insert(doc.cursor.offset, &ch); 689 - doc.cursor.offset += ch.chars().count(); 690 } 691 692 Key::Backspace => { 693 if let Some(sel) = doc.selection { 694 // Delete selection 695 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 696 - doc.rope.remove(start..end); 697 doc.cursor.offset = start; 698 doc.selection = None; 699 } else if doc.cursor.offset > 0 { 700 // Check if we're about to delete a newline 701 - let prev_char = get_char_at(&doc.rope, doc.cursor.offset - 1); 702 703 if prev_char == Some('\n') { 704 let newline_pos = doc.cursor.offset - 1; ··· 708 // Check if there's another newline before this one (empty paragraph) 709 // If so, delete both newlines to merge paragraphs 710 if newline_pos > 0 { 711 - let prev_prev_char = get_char_at(&doc.rope, newline_pos - 1); 712 if prev_prev_char == Some('\n') { 713 // Empty paragraph case: delete both newlines 714 delete_start = newline_pos - 1; ··· 716 } 717 718 // Also check if there's a zero-width char after cursor (inserted by Shift+Enter) 719 - if let Some(ch) = get_char_at(&doc.rope, delete_end) { 720 if ch == '\u{200C}' || ch == '\u{200B}' { 721 delete_end += 1; 722 } ··· 724 725 // Scan backwards through whitespace before the newline(s) 726 while delete_start > 0 { 727 - let ch = get_char_at(&doc.rope, delete_start - 1); 728 match ch { 729 Some(' ') | Some('\t') | Some('\u{200C}') | Some('\u{200B}') => { 730 delete_start -= 1; ··· 735 } 736 737 // Delete from where we stopped to end (including any trailing zero-width) 738 - doc.rope.remove(delete_start..delete_end); 739 doc.cursor.offset = delete_start; 740 } else { 741 // Normal backspace - delete one char 742 let prev = doc.cursor.offset - 1; 743 - doc.rope.remove(prev..doc.cursor.offset); 744 doc.cursor.offset = prev; 745 } 746 } 747 } 748 749 Key::Delete => { 750 - if let Some(sel) = doc.selection { 751 // Delete selection 752 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 753 - doc.rope.remove(start..end); 754 doc.cursor.offset = start; 755 - doc.selection = None; 756 } else if doc.cursor.offset < doc.len_chars() { 757 // Delete next char 758 - doc.rope.remove(doc.cursor.offset..doc.cursor.offset + 1); 759 } 760 } 761 ··· 765 } 766 767 Key::Enter => { 768 - if doc.selection.is_some() { 769 - let sel = doc.selection.unwrap(); 770 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 771 - doc.rope.remove(start..end); 772 doc.cursor.offset = start; 773 - doc.selection = None; 774 } 775 776 if mods.shift() { 777 // Shift+Enter: hard line break (soft break) 778 - doc.rope.insert(doc.cursor.offset, " \n\u{200C}"); 779 doc.cursor.offset += 3; 780 - } else if let Some(ctx) = detect_list_context(&doc.rope, doc.cursor.offset) { 781 // We're in a list item 782 tracing::debug!("[ENTER] List context detected: {:?}", ctx); 783 tracing::debug!( 784 - "[ENTER] Cursor at {}, rope len {}", 785 doc.cursor.offset, 786 - doc.rope.len_chars() 787 ); 788 - if is_list_item_empty(&doc.rope, doc.cursor.offset, &ctx) { 789 tracing::debug!("[ENTER] Item is empty, exiting list"); 790 // Empty item - exit list by removing marker and inserting paragraph break 791 - let line_start = find_line_start(&doc.rope, doc.cursor.offset); 792 - let line_end = find_line_end(&doc.rope, doc.cursor.offset); 793 794 // Delete the empty list item line INCLUDING its trailing newline 795 // line_end points to the newline, so +1 to include it 796 - let delete_end = (line_end + 1).min(doc.rope.len_chars()); 797 798 - doc.rope.remove(line_start..delete_end); 799 - doc.cursor.offset = line_start; 800 - 801 - // Insert two newlines, a zero-width whitespace character, and then another 802 - // newline to properly split the list (TODO: clean up the weird whitespace 803 - // char once that new paragraph has content) 804 - doc.rope.insert(doc.cursor.offset, "\n\n\u{200C}\n"); 805 - doc.cursor.offset += 2; 806 } else { 807 // Non-empty item - continue list 808 let continuation = match ctx { ··· 814 } 815 }; 816 let len = continuation.chars().count(); 817 - doc.rope.insert(doc.cursor.offset, &continuation); 818 doc.cursor.offset += len; 819 } 820 } else { 821 // Not in a list - normal paragraph break 822 - doc.rope.insert(doc.cursor.offset, "\n\n"); 823 doc.cursor.offset += 2; 824 } 825 } ··· 846 /// Detect if cursor is in a list item and return context for continuation. 847 /// 848 /// Scans backwards to find start of current line, then checks for list marker. 849 - fn detect_list_context(rope: &jumprope::JumpRopeBuf, cursor_offset: usize) -> Option<ListContext> { 850 // Find start of current line 851 - let line_start = find_line_start(rope, cursor_offset); 852 853 // Get the line content from start to cursor 854 - let line_end = find_line_end(rope, cursor_offset); 855 if line_start >= line_end { 856 return None; 857 } 858 859 // Extract line text 860 - let mut line = String::new(); 861 - let rope_ref = rope.borrow(); 862 - for substr in rope_ref.slice_substrings(line_start..line_end) { 863 - line.push_str(substr); 864 - } 865 866 // Parse indentation 867 let indent: String = line ··· 901 /// 902 /// Used to determine whether Enter should continue the list or exit it. 903 fn is_list_item_empty( 904 - rope: &jumprope::JumpRopeBuf, 905 cursor_offset: usize, 906 ctx: &ListContext, 907 ) -> bool { 908 - let line_start = find_line_start(rope, cursor_offset); 909 - let line_end = find_line_end(rope, cursor_offset); 910 911 // Get line content 912 - let mut line = String::new(); 913 - let rope_ref = rope.borrow(); 914 - for substr in rope_ref.slice_substrings(line_start..line_end) { 915 - line.push_str(substr); 916 - } 917 918 // Calculate expected marker length 919 let marker_len = match ctx { ··· 935 line.len() <= marker_len 936 } 937 938 - /// Get character at the given offset in the rope 939 - fn get_char_at(rope: &jumprope::JumpRopeBuf, offset: usize) -> Option<char> { 940 - if offset >= rope.len_chars() { 941 - return None; 942 - } 943 - 944 - let rope = rope.borrow(); 945 - let mut current = 0; 946 - for substr in rope.slice_substrings(offset..offset + 1) { 947 - for c in substr.chars() { 948 - if current == 0 { 949 - return Some(c); 950 - } 951 - current += 1; 952 - } 953 - } 954 - None 955 } 956 957 /// Find start of line containing offset 958 - fn find_line_start(rope: &jumprope::JumpRopeBuf, offset: usize) -> usize { 959 - // Search backwards from cursor for newline 960 - let mut char_pos = 0; 961 - let mut last_newline_pos = None; 962 - 963 - let rope = rope.borrow(); 964 - for substr in rope.slice_substrings(0..offset) { 965 - // TODO: make more efficient 966 - for c in substr.chars() { 967 - if c == '\n' { 968 - last_newline_pos = Some(char_pos); 969 - } 970 - char_pos += 1; 971 - } 972 } 973 - 974 - last_newline_pos.map(|pos| pos + 1).unwrap_or(0) 975 } 976 977 /// Find end of line containing offset 978 - fn find_line_end(rope: &jumprope::JumpRopeBuf, offset: usize) -> usize { 979 - // Search forwards from cursor for newline 980 - let mut char_pos = offset; 981 - 982 - let rope = rope.borrow(); 983 - let byte_len = rope.len_bytes() - 1; 984 - for substr in rope.slice_substrings(offset..byte_len) { 985 - // TODO: make more efficient 986 - for c in substr.chars() { 987 - if c == '\n' { 988 - return char_pos; 989 - } 990 - char_pos += 1; 991 - } 992 } 993 - 994 - rope.len_chars() 995 } 996 997 /// Update paragraph DOM elements incrementally.

··· 10 mod offset_map; 11 mod paragraph; 12 mod render; 13 mod storage; 14 mod toolbar; 15 mod visibility; ··· 23 pub use offset_map::{OffsetMapping, RenderResult, find_mapping_for_byte}; 24 pub use paragraph::ParagraphRender; 25 pub use render::{RenderCache, render_paragraphs_incremental}; 26 pub use storage::{EditorSnapshot, clear_storage, load_from_storage, save_to_storage}; 27 pub use toolbar::EditorToolbar; 28 pub use visibility::VisibilityState; ··· 36 /// - `initial_content`: Optional initial markdown content 37 /// 38 /// # Features 39 + /// - Loro CRDT-based text storage with undo/redo support 40 /// - Event interception for full control over editing operations 41 /// - Toolbar formatting buttons 42 /// - LocalStorage auto-save with debouncing ··· 73 let edit = doc.last_edit.as_ref(); 74 75 let (paras, new_cache) = 76 + render::render_paragraphs_incremental(doc.loro_text(), Some(&cache), edit); 77 78 // Update cache for next render (write-only via spawn to avoid reactive loop) 79 dioxus::prelude::spawn(async move { ··· 105 // Update DOM when paragraphs change (incremental rendering) 106 #[cfg(all(target_arch = "wasm32", target_os = "unknown"))] 107 use_effect(move || { 108 + // Read document once to avoid multiple borrows 109 + let doc = document(); 110 + let cursor_offset = doc.cursor.offset; 111 + let selection = doc.selection; 112 + drop(doc); // Release borrow before other operations 113 + 114 let new_paras = paragraphs(); 115 + let map = offset_map(); 116 + let spans = syntax_spans(); 117 118 // Use peek() to avoid creating reactive dependency on cached_paragraphs 119 let prev = cached_paragraphs.peek().clone(); ··· 125 use wasm_bindgen::JsCast; 126 use wasm_bindgen::prelude::*; 127 128 // Use requestAnimationFrame to wait for browser paint 129 if let Some(window) = web_sys::window() { 130 let closure = Closure::once(move || { 131 if let Err(e) = 132 + cursor::restore_cursor_position(cursor_offset, &map, editor_id) 133 { 134 tracing::warn!("Cursor restoration failed: {:?}", e); 135 } ··· 144 cached_paragraphs.set(new_paras.clone()); 145 146 // Update syntax visibility after DOM changes 147 + // Debug: log what syntax spans we have 148 + for span in spans.iter() { 149 + tracing::debug!( 150 + "[VISIBILITY_INPUT] span {} char_range {:?} formatted_range {:?}", 151 + span.syn_id, 152 + span.char_range, 153 + span.formatted_range 154 + ); 155 + } 156 update_syntax_visibility( 157 + cursor_offset, 158 + selection.as_ref(), 159 &spans, 160 &new_paras, 161 ); ··· 164 // Auto-save with debounce 165 #[cfg(all(target_arch = "wasm32", target_os = "unknown"))] 166 use_effect(move || { 167 + // Read document once and extract what we need 168 let doc = document(); 169 + let content = doc.to_string(); 170 + let cursor = doc.cursor.offset; 171 + drop(doc); 172 173 // Save after 500ms of no typing 174 let timer = gloo_timers::callback::Timeout::new(500, move || { 175 + let _ = storage::save_to_storage(&content, cursor); 176 }); 177 timer.forget(); 178 }); ··· 226 }, 227 228 onclick: move |_evt| { 229 + // After mouse click or drag selection, sync cursor from DOM 230 + // (click fires after mouseup, so this handles both cases) 231 let paras = cached_paragraphs(); 232 sync_cursor_from_dom(&mut document, editor_id, &paras); 233 // Update syntax visibility after cursor sync ··· 527 // Delete selection if present 528 if let Some(sel) = doc.selection { 529 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 530 + let _ = doc.remove_tracked(start, end.saturating_sub(start)); 531 doc.cursor.offset = start; 532 doc.selection = None; 533 } 534 535 // Insert pasted text 536 + let _ = doc.insert_tracked(doc.cursor.offset, &text); 537 doc.cursor.offset += text.chars().count(); 538 }); 539 } ··· 544 } 545 } 546 547 + /// Handle cut events - extract text, write to clipboard, then delete 548 fn handle_cut(evt: Event<ClipboardData>, document: &mut Signal<EditorDocument>) { 549 tracing::info!("[CUT] handle_cut called"); 550 ··· 559 if let Some(sel) = doc.selection { 560 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 561 if start != end { 562 + // Extract text 563 + let selected_text = doc.slice(start, end).unwrap_or_default(); 564 tracing::info!( 565 "[CUT] Extracted {} chars: {:?}", 566 selected_text.len(), ··· 574 } 575 } 576 577 + // Now delete 578 + let _ = doc.remove_tracked(start, end.saturating_sub(start)); 579 doc.cursor.offset = start; 580 doc.selection = None; 581 } ··· 590 } 591 } 592 593 + /// Handle copy events - extract text, clean it up, write to clipboard 594 fn handle_copy(evt: Event<ClipboardData>, document: &Signal<EditorDocument>) { 595 tracing::info!("[COPY] handle_copy called"); 596 ··· 605 if let Some(sel) = doc.selection { 606 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 607 if start != end { 608 + // Extract text 609 + let selected_text = doc.slice(start, end).unwrap_or_default(); 610 611 // Strip zero-width chars used for gap handling 612 let clean_text = selected_text ··· 639 } 640 } 641 642 + /// Extract a slice of text from a string by char indices 643 + fn extract_text_slice(text: &str, start: usize, end: usize) -> String { 644 + text.chars().skip(start).take(end.saturating_sub(start)).collect() 645 } 646 647 /// Handle keyboard events and update document state ··· 669 } 670 } 671 672 + // Insert character at cursor (replacing selection if any) 673 + if let Some(sel) = doc.selection.take() { 674 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 675 + let _ = doc.replace_tracked(start, end.saturating_sub(start), &ch); 676 + doc.cursor.offset = start + ch.chars().count(); 677 + } else { 678 + let _ = doc.insert_tracked(doc.cursor.offset, &ch); 679 + doc.cursor.offset += ch.chars().count(); 680 } 681 } 682 683 Key::Backspace => { 684 if let Some(sel) = doc.selection { 685 // Delete selection 686 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 687 + let _ = doc.remove_tracked(start, end.saturating_sub(start)); 688 doc.cursor.offset = start; 689 doc.selection = None; 690 } else if doc.cursor.offset > 0 { 691 // Check if we're about to delete a newline 692 + let prev_char = get_char_at(doc.loro_text(), doc.cursor.offset - 1); 693 694 if prev_char == Some('\n') { 695 let newline_pos = doc.cursor.offset - 1; ··· 699 // Check if there's another newline before this one (empty paragraph) 700 // If so, delete both newlines to merge paragraphs 701 if newline_pos > 0 { 702 + let prev_prev_char = get_char_at(doc.loro_text(), newline_pos - 1); 703 if prev_prev_char == Some('\n') { 704 // Empty paragraph case: delete both newlines 705 delete_start = newline_pos - 1; ··· 707 } 708 709 // Also check if there's a zero-width char after cursor (inserted by Shift+Enter) 710 + if let Some(ch) = get_char_at(doc.loro_text(), delete_end) { 711 if ch == '\u{200C}' || ch == '\u{200B}' { 712 delete_end += 1; 713 } ··· 715 716 // Scan backwards through whitespace before the newline(s) 717 while delete_start > 0 { 718 + let ch = get_char_at(doc.loro_text(), delete_start - 1); 719 match ch { 720 Some(' ') | Some('\t') | Some('\u{200C}') | Some('\u{200B}') => { 721 delete_start -= 1; ··· 726 } 727 728 // Delete from where we stopped to end (including any trailing zero-width) 729 + let _ = doc.remove_tracked(delete_start, delete_end.saturating_sub(delete_start)); 730 doc.cursor.offset = delete_start; 731 } else { 732 // Normal backspace - delete one char 733 let prev = doc.cursor.offset - 1; 734 + let _ = doc.remove_tracked(prev, 1); 735 doc.cursor.offset = prev; 736 } 737 } 738 } 739 740 Key::Delete => { 741 + if let Some(sel) = doc.selection.take() { 742 // Delete selection 743 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 744 + let _ = doc.remove_tracked(start, end.saturating_sub(start)); 745 doc.cursor.offset = start; 746 } else if doc.cursor.offset < doc.len_chars() { 747 // Delete next char 748 + let _ = doc.remove_tracked(doc.cursor.offset, 1); 749 } 750 } 751 ··· 755 } 756 757 Key::Enter => { 758 + if let Some(sel) = doc.selection.take() { 759 let (start, end) = (sel.anchor.min(sel.head), sel.anchor.max(sel.head)); 760 + let _ = doc.remove_tracked(start, end.saturating_sub(start)); 761 doc.cursor.offset = start; 762 } 763 764 if mods.shift() { 765 // Shift+Enter: hard line break (soft break) 766 + let _ = doc.insert_tracked(doc.cursor.offset, " \n\u{200C}"); 767 doc.cursor.offset += 3; 768 + } else if let Some(ctx) = detect_list_context(doc.loro_text(), doc.cursor.offset) { 769 // We're in a list item 770 tracing::debug!("[ENTER] List context detected: {:?}", ctx); 771 tracing::debug!( 772 + "[ENTER] Cursor at {}, doc len {}", 773 doc.cursor.offset, 774 + doc.len_chars() 775 ); 776 + if is_list_item_empty(doc.loro_text(), doc.cursor.offset, &ctx) { 777 tracing::debug!("[ENTER] Item is empty, exiting list"); 778 // Empty item - exit list by removing marker and inserting paragraph break 779 + let line_start = find_line_start(doc.loro_text(), doc.cursor.offset); 780 + let line_end = find_line_end(doc.loro_text(), doc.cursor.offset); 781 782 // Delete the empty list item line INCLUDING its trailing newline 783 // line_end points to the newline, so +1 to include it 784 + let delete_end = (line_end + 1).min(doc.len_chars()); 785 786 + // Use replace_tracked to atomically delete line and insert paragraph break 787 + let _ = doc.replace_tracked(line_start, delete_end.saturating_sub(line_start), "\n\n\u{200C}\n"); 788 + doc.cursor.offset = line_start + 2; 789 } else { 790 // Non-empty item - continue list 791 let continuation = match ctx { ··· 797 } 798 }; 799 let len = continuation.chars().count(); 800 + let _ = doc.insert_tracked(doc.cursor.offset, &continuation); 801 doc.cursor.offset += len; 802 } 803 } else { 804 // Not in a list - normal paragraph break 805 + let _ = doc.insert_tracked(doc.cursor.offset, "\n\n"); 806 doc.cursor.offset += 2; 807 } 808 } ··· 829 /// Detect if cursor is in a list item and return context for continuation. 830 /// 831 /// Scans backwards to find start of current line, then checks for list marker. 832 + fn detect_list_context(text: &loro::LoroText, cursor_offset: usize) -> Option<ListContext> { 833 // Find start of current line 834 + let line_start = find_line_start(text, cursor_offset); 835 836 // Get the line content from start to cursor 837 + let line_end = find_line_end(text, cursor_offset); 838 if line_start >= line_end { 839 return None; 840 } 841 842 // Extract line text 843 + let line = text.slice(line_start, line_end).ok()?; 844 845 // Parse indentation 846 let indent: String = line ··· 880 /// 881 /// Used to determine whether Enter should continue the list or exit it. 882 fn is_list_item_empty( 883 + text: &loro::LoroText, 884 cursor_offset: usize, 885 ctx: &ListContext, 886 ) -> bool { 887 + let line_start = find_line_start(text, cursor_offset); 888 + let line_end = find_line_end(text, cursor_offset); 889 890 // Get line content 891 + let line = match text.slice(line_start, line_end) { 892 + Ok(s) => s, 893 + Err(_) => return false, 894 + }; 895 896 // Calculate expected marker length 897 let marker_len = match ctx { ··· 913 line.len() <= marker_len 914 } 915 916 + /// Get character at the given offset in LoroText 917 + fn get_char_at(text: &loro::LoroText, offset: usize) -> Option<char> { 918 + text.char_at(offset).ok() 919 } 920 921 /// Find start of line containing offset 922 + fn find_line_start(text: &loro::LoroText, offset: usize) -> usize { 923 + if offset == 0 { 924 + return 0; 925 } 926 + // Only slice the portion before cursor 927 + let prefix = match text.slice(0, offset) { 928 + Ok(s) => s, 929 + Err(_) => return 0, 930 + }; 931 + prefix 932 + .chars() 933 + .enumerate() 934 + .filter(|(_, c)| *c == '\n') 935 + .last() 936 + .map(|(pos, _)| pos + 1) 937 + .unwrap_or(0) 938 } 939 940 /// Find end of line containing offset 941 + fn find_line_end(text: &loro::LoroText, offset: usize) -> usize { 942 + let char_len = text.len_unicode(); 943 + if offset >= char_len { 944 + return char_len; 945 } 946 + // Only slice from cursor to end 947 + let suffix = match text.slice(offset, char_len) { 948 + Ok(s) => s, 949 + Err(_) => return char_len, 950 + }; 951 + suffix 952 + .chars() 953 + .enumerate() 954 + .find(|(_, c)| *c == '\n') 955 + .map(|(i, _)| offset + i) 956 + .unwrap_or(char_len) 957 } 958 959 /// Update paragraph DOM elements incrementally.

+4 -11

crates/weaver-app/src/components/editor/paragraph.rs

··· 5 6 use super::offset_map::OffsetMapping; 7 use super::writer::SyntaxSpanInfo; 8 - use jumprope::JumpRopeBuf; 9 use std::ops::Range; 10 11 /// A rendered paragraph with its source range and offset mappings. ··· 40 hasher.finish() 41 } 42 43 - /// Extract substring from rope as String 44 - pub fn rope_slice_to_string(rope: &JumpRopeBuf, range: Range<usize>) -> String { 45 - let rope_borrow = rope.borrow(); 46 - let mut result = String::new(); 47 - 48 - for substr in rope_borrow.slice_substrings(range) { 49 - result.push_str(substr); 50 - } 51 - 52 - result 53 } 54

··· 5 6 use super::offset_map::OffsetMapping; 7 use super::writer::SyntaxSpanInfo; 8 + use loro::LoroText; 9 use std::ops::Range; 10 11 /// A rendered paragraph with its source range and offset mappings. ··· 40 hasher.finish() 41 } 42 43 + /// Extract substring from LoroText as String 44 + pub fn text_slice_to_string(text: &LoroText, range: Range<usize>) -> String { 45 + text.slice(range.start, range.end).unwrap_or_default() 46 } 47

+15 -12

crates/weaver-app/src/components/editor/render.rs

··· 6 7 use super::document::EditInfo; 8 use super::offset_map::{OffsetMapping, RenderResult}; 9 - use super::paragraph::{ParagraphRender, hash_source, rope_slice_to_string}; 10 use super::writer::{EditorWriter, SyntaxSpanInfo}; 11 - use jumprope::JumpRopeBuf; 12 use markdown_weaver::Parser; 13 use std::ops::Range; 14 ··· 105 /// # Returns 106 /// Tuple of (rendered paragraphs, updated cache) 107 pub fn render_paragraphs_incremental( 108 - rope: &JumpRopeBuf, 109 cache: Option<&RenderCache>, 110 edit: Option<&EditInfo>, 111 ) -> (Vec<ParagraphRender>, RenderCache) { 112 - let source = rope.to_string(); 113 114 // Handle empty document 115 if source.is_empty() { ··· 190 191 match EditorWriter::<_, _, ()>::new_boundary_only( 192 &source, 193 - rope, 194 parser, 195 &mut scratch_output, 196 ) ··· 213 let mut syn_id_offset = cache.map(|c| c.next_syn_id).unwrap_or(0); 214 215 for (idx, (byte_range, char_range)) in paragraph_ranges.iter().enumerate() { 216 - let para_source = rope_slice_to_string(rope, char_range.clone()); 217 let source_hash = hash_source(&para_source); 218 219 tracing::debug!( ··· 250 251 (cached.html.clone(), adjusted_map, adjusted_syntax) 252 } else { 253 - // Fresh render needed 254 - let para_rope = JumpRopeBuf::from(para_source.as_str()); 255 let parser = Parser::new_ext(&para_source, weaver_renderer::default_md_options()) 256 .into_offset_iter(); 257 let mut output = String::new(); ··· 259 let (mut offset_map, mut syntax_spans) = 260 match EditorWriter::<_, _, ()>::new_with_offsets( 261 &para_source, 262 - &para_rope, 263 parser, 264 &mut output, 265 node_id_offset, ··· 374 utf16_len: 1, 375 }], 376 syntax_spans: vec![], 377 - source_hash: hash_source(&rope_slice_to_string(rope, gap_start_char..gap_end_char)), 378 }); 379 } 380 ··· 386 // Add trailing gap if needed 387 let has_trailing_newlines = source.ends_with("\n\n") || source.ends_with("\n"); 388 if has_trailing_newlines { 389 - let doc_end_char = rope.len_chars(); 390 - let doc_end_byte = rope.len_bytes(); 391 392 if doc_end_char > prev_end_char { 393 // Position-based ID for trailing gap

··· 6 7 use super::document::EditInfo; 8 use super::offset_map::{OffsetMapping, RenderResult}; 9 + use super::paragraph::{ParagraphRender, hash_source, text_slice_to_string}; 10 use super::writer::{EditorWriter, SyntaxSpanInfo}; 11 + use loro::LoroText; 12 use markdown_weaver::Parser; 13 use std::ops::Range; 14 ··· 105 /// # Returns 106 /// Tuple of (rendered paragraphs, updated cache) 107 pub fn render_paragraphs_incremental( 108 + text: &LoroText, 109 cache: Option<&RenderCache>, 110 edit: Option<&EditInfo>, 111 ) -> (Vec<ParagraphRender>, RenderCache) { 112 + let source = text.to_string(); 113 114 // Handle empty document 115 if source.is_empty() { ··· 190 191 match EditorWriter::<_, _, ()>::new_boundary_only( 192 &source, 193 + text, 194 parser, 195 &mut scratch_output, 196 ) ··· 213 let mut syn_id_offset = cache.map(|c| c.next_syn_id).unwrap_or(0); 214 215 for (idx, (byte_range, char_range)) in paragraph_ranges.iter().enumerate() { 216 + let para_source = text_slice_to_string(text, char_range.clone()); 217 let source_hash = hash_source(&para_source); 218 219 tracing::debug!( ··· 250 251 (cached.html.clone(), adjusted_map, adjusted_syntax) 252 } else { 253 + // Fresh render needed - create detached LoroDoc for this paragraph 254 + let para_doc = loro::LoroDoc::new(); 255 + let para_text = para_doc.get_text("content"); 256 + let _ = para_text.insert(0, &para_source); 257 + 258 let parser = Parser::new_ext(&para_source, weaver_renderer::default_md_options()) 259 .into_offset_iter(); 260 let mut output = String::new(); ··· 262 let (mut offset_map, mut syntax_spans) = 263 match EditorWriter::<_, _, ()>::new_with_offsets( 264 &para_source, 265 + &para_text, 266 parser, 267 &mut output, 268 node_id_offset, ··· 377 utf16_len: 1, 378 }], 379 syntax_spans: vec![], 380 + source_hash: hash_source(&text_slice_to_string(text, gap_start_char..gap_end_char)), 381 }); 382 } 383 ··· 389 // Add trailing gap if needed 390 let has_trailing_newlines = source.ends_with("\n\n") || source.ends_with("\n"); 391 if has_trailing_newlines { 392 + let doc_end_char = text.len_unicode(); 393 + let doc_end_byte = text.len_utf8(); 394 395 if doc_end_char > prev_end_char { 396 // Position-based ID for trailing gap

-81

crates/weaver-app/src/components/editor/rope_writer.rs

··· 1 - //! StrWrite wrapper for JumpRopeBuf to enable efficient HTML rendering. 2 - 3 - use jumprope::JumpRopeBuf; 4 - use markdown_weaver_escape::StrWrite; 5 - 6 - /// Wrapper around JumpRopeBuf that implements StrWrite. 7 - /// 8 - /// This allows rendering HTML directly into a rope structure, enabling: 9 - /// - O(log n) insertions instead of O(n) string reallocation 10 - /// - Efficient splicing for incremental rendering 11 - /// - Fast paragraph replacement in cached output 12 - pub struct RopeWriter { 13 - rope: JumpRopeBuf, 14 - } 15 - 16 - impl RopeWriter { 17 - pub fn new() -> Self { 18 - Self { 19 - rope: JumpRopeBuf::new(), 20 - } 21 - } 22 - 23 - pub fn from_rope(rope: JumpRopeBuf) -> Self { 24 - Self { rope } 25 - } 26 - 27 - pub fn into_rope(self) -> JumpRopeBuf { 28 - self.rope 29 - } 30 - 31 - pub fn as_rope(&self) -> &JumpRopeBuf { 32 - &self.rope 33 - } 34 - 35 - pub fn to_string(&self) -> String { 36 - self.rope.to_string() 37 - } 38 - } 39 - 40 - impl Default for RopeWriter { 41 - fn default() -> Self { 42 - Self::new() 43 - } 44 - } 45 - 46 - impl StrWrite for RopeWriter { 47 - type Error = std::convert::Infallible; 48 - 49 - fn write_str(&mut self, s: &str) -> Result<(), Self::Error> { 50 - let offset = self.rope.len_chars(); 51 - self.rope.insert(offset, s); 52 - Ok(()) 53 - } 54 - 55 - fn write_fmt(&mut self, args: std::fmt::Arguments<'_>) -> Result<(), Self::Error> { 56 - let mut temp = String::new(); 57 - std::fmt::Write::write_fmt(&mut temp, args).unwrap(); 58 - self.write_str(&temp) 59 - } 60 - } 61 - 62 - #[cfg(test)] 63 - mod tests { 64 - use super::*; 65 - 66 - #[test] 67 - fn test_rope_writer_basic() { 68 - let mut writer = RopeWriter::new(); 69 - writer.write_str("hello ").unwrap(); 70 - writer.write_str("world").unwrap(); 71 - assert_eq!(writer.to_string(), "hello world"); 72 - } 73 - 74 - #[test] 75 - fn test_rope_writer_fmt() { 76 - use std::fmt::Write; 77 - let mut writer = RopeWriter::new(); 78 - write!(&mut writer, "number: {}", 42).unwrap(); 79 - assert_eq!(writer.to_string(), "number: 42"); 80 - } 81 - }

···

+14 -4

crates/weaver-app/src/components/editor/snapshots/weaver_app__components__editor__tests__bold.snap

··· 8 char_range: 9 - 0 10 - 18 11 - html: "Some **bold** text\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 31 child_index: ~ 32 utf16_len: 5 33 - byte_range: 34 - 7 35 - 11 36 char_range: 37 - 7 38 - 11 39 node_id: n0 40 - char_offset_in_node: 5 41 child_index: ~ 42 utf16_len: 4 43 - byte_range: ··· 47 - 11 48 - 13 49 node_id: n0 50 - char_offset_in_node: 9 51 child_index: ~ 52 utf16_len: 2 53 - byte_range: ··· 57 - 13 58 - 18 59 node_id: n0 60 - char_offset_in_node: 11 61 child_index: ~ 62 utf16_len: 5 63 source_hash: 3007541947422346271

··· 8 char_range: 9 - 0 10 - 18 11 + html: "Some **bold** text\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 31 child_index: ~ 32 utf16_len: 5 33 - byte_range: 34 + - 5 35 + - 7 36 + char_range: 37 + - 5 38 + - 7 39 + node_id: n0 40 + char_offset_in_node: 5 41 + child_index: ~ 42 + utf16_len: 2 43 + - byte_range: 44 - 7 45 - 11 46 char_range: 47 - 7 48 - 11 49 node_id: n0 50 + char_offset_in_node: 7 51 child_index: ~ 52 utf16_len: 4 53 - byte_range: ··· 57 - 11 58 - 13 59 node_id: n0 60 + char_offset_in_node: 11 61 child_index: ~ 62 utf16_len: 2 63 - byte_range: ··· 67 - 13 68 - 18 69 node_id: n0 70 + char_offset_in_node: 13 71 child_index: ~ 72 utf16_len: 5 73 source_hash: 3007541947422346271

+25 -5

crates/weaver-app/src/components/editor/snapshots/weaver_app__components__editor__tests__bold_italic.snap

··· 8 char_range: 9 - 0 10 - 27 11 - html: "Some ***bold italic*** text\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 31 child_index: ~ 32 utf16_len: 5 33 - byte_range: 34 - 8 35 - 19 36 char_range: 37 - 8 38 - 19 39 node_id: n0 40 - char_offset_in_node: 5 41 child_index: ~ 42 utf16_len: 11 43 - byte_range: ··· 47 - 19 48 - 21 49 node_id: n0 50 - char_offset_in_node: 16 51 child_index: ~ 52 utf16_len: 2 53 - byte_range: ··· 57 - 21 58 - 22 59 node_id: n0 60 - char_offset_in_node: 18 61 child_index: ~ 62 utf16_len: 1 63 - byte_range: ··· 67 - 22 68 - 27 69 node_id: n0 70 - char_offset_in_node: 19 71 child_index: ~ 72 utf16_len: 5 73 source_hash: 17839597501764990486

··· 8 char_range: 9 - 0 10 - 27 11 + html: "Some ***bold italic*** text\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 31 child_index: ~ 32 utf16_len: 5 33 - byte_range: 34 + - 5 35 + - 6 36 + char_range: 37 + - 5 38 + - 6 39 + node_id: n0 40 + char_offset_in_node: 5 41 + child_index: ~ 42 + utf16_len: 1 43 + - byte_range: 44 + - 6 45 + - 8 46 + char_range: 47 + - 6 48 + - 8 49 + node_id: n0 50 + char_offset_in_node: 6 51 + child_index: ~ 52 + utf16_len: 2 53 + - byte_range: 54 - 8 55 - 19 56 char_range: 57 - 8 58 - 19 59 node_id: n0 60 + char_offset_in_node: 8 61 child_index: ~ 62 utf16_len: 11 63 - byte_range: ··· 67 - 19 68 - 21 69 node_id: n0 70 + char_offset_in_node: 19 71 child_index: ~ 72 utf16_len: 2 73 - byte_range: ··· 77 - 21 78 - 22 79 node_id: n0 80 + char_offset_in_node: 21 81 child_index: ~ 82 utf16_len: 1 83 - byte_range: ··· 87 - 22 88 - 27 89 node_id: n0 90 + char_offset_in_node: 22 91 child_index: ~ 92 utf16_len: 5 93 source_hash: 17839597501764990486

+2 -2

crates/weaver-app/src/components/editor/snapshots/weaver_app__components__editor__tests__inline_code.snap

··· 39 node_id: n0 40 char_offset_in_node: 5 41 child_index: ~ 42 - utf16_len: 4 43 - byte_range: 44 - 11 45 - 16 ··· 47 - 11 48 - 16 49 node_id: n0 50 - char_offset_in_node: 9 51 child_index: ~ 52 utf16_len: 5 53 source_hash: 10489263388249723293

··· 39 node_id: n0 40 char_offset_in_node: 5 41 child_index: ~ 42 + utf16_len: 6 43 - byte_range: 44 - 11 45 - 16 ··· 47 - 11 48 - 16 49 node_id: n0 50 + char_offset_in_node: 11 51 child_index: ~ 52 utf16_len: 5 53 source_hash: 10489263388249723293

+14 -4

crates/weaver-app/src/components/editor/snapshots/weaver_app__components__editor__tests__italic.snap

··· 8 char_range: 9 - 0 10 - 18 11 - html: "Some *italic* text\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 31 child_index: ~ 32 utf16_len: 5 33 - byte_range: 34 - 6 35 - 12 36 char_range: 37 - 6 38 - 12 39 node_id: n0 40 - char_offset_in_node: 5 41 child_index: ~ 42 utf16_len: 6 43 - byte_range: ··· 47 - 12 48 - 13 49 node_id: n0 50 - char_offset_in_node: 11 51 child_index: ~ 52 utf16_len: 1 53 - byte_range: ··· 57 - 13 58 - 18 59 node_id: n0 60 - char_offset_in_node: 12 61 child_index: ~ 62 utf16_len: 5 63 source_hash: 4363411941421262428

··· 8 char_range: 9 - 0 10 - 18 11 + html: "Some *italic* text\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 31 child_index: ~ 32 utf16_len: 5 33 - byte_range: 34 + - 5 35 + - 6 36 + char_range: 37 + - 5 38 + - 6 39 + node_id: n0 40 + char_offset_in_node: 5 41 + child_index: ~ 42 + utf16_len: 1 43 + - byte_range: 44 - 6 45 - 12 46 char_range: 47 - 6 48 - 12 49 node_id: n0 50 + char_offset_in_node: 6 51 child_index: ~ 52 utf16_len: 6 53 - byte_range: ··· 57 - 12 58 - 13 59 node_id: n0 60 + char_offset_in_node: 12 61 child_index: ~ 62 utf16_len: 1 63 - byte_range: ··· 67 - 13 68 - 18 69 node_id: n0 70 + char_offset_in_node: 13 71 child_index: ~ 72 utf16_len: 5 73 source_hash: 4363411941421262428

+29 -9

crates/weaver-app/src/components/editor/snapshots/weaver_app__components__editor__tests__multiple_inline_formats.snap

··· 8 char_range: 9 - 0 10 - 32 11 - html: "**Bold** and *italic* and `<code>code</code>`\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 21 child_index: 0 22 utf16_len: 0 23 - byte_range: 24 - 2 25 - 6 26 char_range: 27 - 2 28 - 6 29 node_id: n0 30 - char_offset_in_node: 0 31 child_index: ~ 32 utf16_len: 4 33 - byte_range: ··· 37 - 6 38 - 8 39 node_id: n0 40 - char_offset_in_node: 4 41 child_index: ~ 42 utf16_len: 2 43 - byte_range: ··· 47 - 8 48 - 13 49 node_id: n0 50 - char_offset_in_node: 6 51 child_index: ~ 52 utf16_len: 5 53 - byte_range: 54 - 14 55 - 20 56 char_range: 57 - 14 58 - 20 59 node_id: n0 60 - char_offset_in_node: 11 61 child_index: ~ 62 utf16_len: 6 63 - byte_range: ··· 67 - 20 68 - 21 69 node_id: n0 70 - char_offset_in_node: 17 71 child_index: ~ 72 utf16_len: 1 73 - byte_range: ··· 77 - 21 78 - 26 79 node_id: n0 80 - char_offset_in_node: 18 81 child_index: ~ 82 utf16_len: 5 83 - byte_range: ··· 87 - 27 88 - 31 89 node_id: n0 90 - char_offset_in_node: 23 91 child_index: ~ 92 - utf16_len: 4 93 source_hash: 17988102203032347642

··· 8 char_range: 9 - 0 10 - 32 11 + html: "**Bold** and *italic* and `<code>code</code>`\n" 12 offset_map: 13 - byte_range: 14 - 0 ··· 21 child_index: 0 22 utf16_len: 0 23 - byte_range: 24 + - 0 25 + - 2 26 + char_range: 27 + - 0 28 + - 2 29 + node_id: n0 30 + char_offset_in_node: 0 31 + child_index: ~ 32 + utf16_len: 2 33 + - byte_range: 34 - 2 35 - 6 36 char_range: 37 - 2 38 - 6 39 node_id: n0 40 + char_offset_in_node: 2 41 child_index: ~ 42 utf16_len: 4 43 - byte_range: ··· 47 - 6 48 - 8 49 node_id: n0 50 + char_offset_in_node: 6 51 child_index: ~ 52 utf16_len: 2 53 - byte_range: ··· 57 - 8 58 - 13 59 node_id: n0 60 + char_offset_in_node: 8 61 child_index: ~ 62 utf16_len: 5 63 - byte_range: 64 + - 13 65 + - 14 66 + char_range: 67 + - 13 68 + - 14 69 + node_id: n0 70 + char_offset_in_node: 13 71 + child_index: ~ 72 + utf16_len: 1 73 + - byte_range: 74 - 14 75 - 20 76 char_range: 77 - 14 78 - 20 79 node_id: n0 80 + char_offset_in_node: 14 81 child_index: ~ 82 utf16_len: 6 83 - byte_range: ··· 87 - 20 88 - 21 89 node_id: n0 90 + char_offset_in_node: 20 91 child_index: ~ 92 utf16_len: 1 93 - byte_range: ··· 97 - 21 98 - 26 99 node_id: n0 100 + char_offset_in_node: 21 101 child_index: ~ 102 utf16_len: 5 103 - byte_range: ··· 107 - 27 108 - 31 109 node_id: n0 110 + char_offset_in_node: 26 111 child_index: ~ 112 + utf16_len: 6 113 source_hash: 17988102203032347642

+10 -40

crates/weaver-app/src/components/editor/snapshots/weaver_app__components__editor__tests__ordered_list.snap

··· 8 char_range: 9 - 0 10 - 27 11 - html: "<ol>\n<li data-node-id=\"n0\">1. First\n</li>\n<li data-node-id=\"n1\">2. Second\n</li>\n<li data-node-id=\"n2\">3. Third</li>\n</ol>\n" 12 offset_map: 13 - byte_range: 14 - 0 15 - - 2 16 char_range: 17 - 0 18 - - 2 19 node_id: n0 20 char_offset_in_node: 0 21 child_index: ~ 22 - utf16_len: 2 23 - - byte_range: 24 - - 2 25 - - 3 26 - char_range: 27 - - 2 28 - - 3 29 - node_id: n0 30 - char_offset_in_node: 2 31 - child_index: ~ 32 - utf16_len: 1 33 - byte_range: 34 - 3 35 - 8 ··· 52 utf16_len: 1 53 - byte_range: 54 - 9 55 - - 11 56 - char_range: 57 - - 9 58 - - 11 59 - node_id: n1 60 - char_offset_in_node: 0 61 - child_index: ~ 62 - utf16_len: 2 63 - - byte_range: 64 - - 11 65 - 12 66 char_range: 67 - - 11 68 - 12 69 node_id: n1 70 - char_offset_in_node: 2 71 child_index: ~ 72 - utf16_len: 1 73 - byte_range: 74 - 12 75 - 18 ··· 92 utf16_len: 1 93 - byte_range: 94 - 19 95 - - 21 96 char_range: 97 - 19 98 - - 21 99 node_id: n2 100 char_offset_in_node: 0 101 child_index: ~ 102 - utf16_len: 2 103 - - byte_range: 104 - - 21 105 - - 22 106 - char_range: 107 - - 21 108 - - 22 109 - node_id: n2 110 - char_offset_in_node: 2 111 - child_index: ~ 112 - utf16_len: 1 113 - byte_range: 114 - 22 115 - 27

··· 8 char_range: 9 - 0 10 - 27 11 + html: "<ol>\n<li data-node-id=\"n0\">1. First\n</li>\n<li data-node-id=\"n1\">2. Second\n</li>\n<li data-node-id=\"n2\">3. Third</li>\n</ol>\n" 12 offset_map: 13 - byte_range: 14 - 0 15 + - 3 16 char_range: 17 - 0 18 + - 3 19 node_id: n0 20 char_offset_in_node: 0 21 child_index: ~ 22 + utf16_len: 3 23 - byte_range: 24 - 3 25 - 8 ··· 42 utf16_len: 1 43 - byte_range: 44 - 9 45 - 12 46 char_range: 47 + - 9 48 - 12 49 node_id: n1 50 + char_offset_in_node: 0 51 child_index: ~ 52 + utf16_len: 3 53 - byte_range: 54 - 12 55 - 18 ··· 72 utf16_len: 1 73 - byte_range: 74 - 19 75 + - 22 76 char_range: 77 - 19 78 + - 22 79 node_id: n2 80 char_offset_in_node: 0 81 child_index: ~ 82 + utf16_len: 3 83 - byte_range: 84 - 22 85 - 27

+18 -10

crates/weaver-app/src/components/editor/tests.rs

··· 3 use super::offset_map::{OffsetMapping, find_mapping_for_char}; 4 use super::paragraph::ParagraphRender; 5 use super::render::render_paragraphs_incremental; 6 - use jumprope::JumpRopeBuf; 7 use serde::Serialize; 8 9 /// Serializable version of ParagraphRender for snapshot testing. ··· 54 55 /// Helper: render markdown and convert to serializable test output. 56 fn render_test(input: &str) -> Vec<TestParagraph> { 57 - let rope = JumpRopeBuf::from(input); 58 - let (paragraphs, _cache) = render_paragraphs_incremental(&rope, None, None); 59 paragraphs.iter().map(TestParagraph::from).collect() 60 } 61 ··· 434 // cursor snaps to adjacent paragraphs for standard breaks. 435 // Only EXTRA whitespace beyond \n\n gets gap elements. 436 let input = "Hello\n\nWorld"; 437 - let rope = JumpRopeBuf::from(input); 438 - let (paragraphs, _cache) = render_paragraphs_incremental(&rope, None, None); 439 440 // With standard \n\n break, we expect 2 paragraphs (no gap element) 441 // Paragraph ranges include some trailing whitespace from markdown parsing ··· 453 // Extra whitespace beyond MIN_PARAGRAPH_BREAK (2) gets gap elements 454 // Plain paragraphs don't consume trailing newlines like headings do 455 let input = "Hello\n\n\n\nWorld"; // 4 newlines = gap of 4 > 2 456 - let rope = JumpRopeBuf::from(input); 457 - let (paragraphs, _cache) = render_paragraphs_incremental(&rope, None, None); 458 459 // With extra newlines, we expect 3 elements: para, gap, para 460 assert_eq!(paragraphs.len(), 3, "Expected 3 elements with extra whitespace"); ··· 542 fn test_incremental_cache_reuse() { 543 // Verify cache is populated and can be reused 544 let input = "First para\n\nSecond para"; 545 - let rope = JumpRopeBuf::from(input); 546 547 - let (paras1, cache1) = render_paragraphs_incremental(&rope, None, None); 548 assert!(!cache1.paragraphs.is_empty(), "Cache should be populated"); 549 550 // Second render with same content should reuse cache 551 - let (paras2, _cache2) = render_paragraphs_incremental(&rope, Some(&cache1), None); 552 553 // Should produce identical output 554 assert_eq!(paras1.len(), paras2.len());

··· 3 use super::offset_map::{OffsetMapping, find_mapping_for_char}; 4 use super::paragraph::ParagraphRender; 5 use super::render::render_paragraphs_incremental; 6 + use loro::LoroDoc; 7 use serde::Serialize; 8 9 /// Serializable version of ParagraphRender for snapshot testing. ··· 54 55 /// Helper: render markdown and convert to serializable test output. 56 fn render_test(input: &str) -> Vec<TestParagraph> { 57 + let doc = LoroDoc::new(); 58 + let text = doc.get_text("content"); 59 + text.insert(0, input).unwrap(); 60 + let (paragraphs, _cache) = render_paragraphs_incremental(&text, None, None); 61 paragraphs.iter().map(TestParagraph::from).collect() 62 } 63 ··· 436 // cursor snaps to adjacent paragraphs for standard breaks. 437 // Only EXTRA whitespace beyond \n\n gets gap elements. 438 let input = "Hello\n\nWorld"; 439 + let doc = LoroDoc::new(); 440 + let text = doc.get_text("content"); 441 + text.insert(0, input).unwrap(); 442 + let (paragraphs, _cache) = render_paragraphs_incremental(&text, None, None); 443 444 // With standard \n\n break, we expect 2 paragraphs (no gap element) 445 // Paragraph ranges include some trailing whitespace from markdown parsing ··· 457 // Extra whitespace beyond MIN_PARAGRAPH_BREAK (2) gets gap elements 458 // Plain paragraphs don't consume trailing newlines like headings do 459 let input = "Hello\n\n\n\nWorld"; // 4 newlines = gap of 4 > 2 460 + let doc = LoroDoc::new(); 461 + let text = doc.get_text("content"); 462 + text.insert(0, input).unwrap(); 463 + let (paragraphs, _cache) = render_paragraphs_incremental(&text, None, None); 464 465 // With extra newlines, we expect 3 elements: para, gap, para 466 assert_eq!(paragraphs.len(), 3, "Expected 3 elements with extra whitespace"); ··· 548 fn test_incremental_cache_reuse() { 549 // Verify cache is populated and can be reused 550 let input = "First para\n\nSecond para"; 551 + let doc = LoroDoc::new(); 552 + let text = doc.get_text("content"); 553 + text.insert(0, input).unwrap(); 554 555 + let (paras1, cache1) = render_paragraphs_incremental(&text, None, None); 556 assert!(!cache1.paragraphs.is_empty(), "Cache should be populated"); 557 558 // Second render with same content should reuse cache 559 + let (paras2, _cache2) = render_paragraphs_incremental(&text, Some(&cache1), None); 560 561 // Should produce identical output 562 assert_eq!(paras1.len(), paras2.len());

+108 -9

crates/weaver-app/src/components/editor/visibility.rs

··· 33 let mut visible = HashSet::new(); 34 35 for span in syntax_spans { 36 let should_show = match span.syntax_type { 37 SyntaxType::Inline => { 38 // Show if cursor within formatted span content OR adjacent to markers 39 - // "Adjacent" means within 1 char of the syntax boundaries 40 - let extended_range = span.char_range.start.saturating_sub(1) 41 - ..span.char_range.end.saturating_add(1); 42 43 // Also show if cursor is anywhere in the formatted_range 44 // (the region between paired opening/closing markers) 45 let in_formatted_region = span 46 .formatted_range 47 .as_ref() 48 - .map(|r| r.contains(&cursor_offset)) 49 .unwrap_or(false); 50 51 - extended_range.contains(&cursor_offset) 52 || in_formatted_region 53 || selection_overlaps(selection, &span.char_range) 54 || span 55 .formatted_range 56 .as_ref() 57 .map(|r| selection_overlaps(selection, r)) 58 - .unwrap_or(false) 59 } 60 SyntaxType::Block => { 61 // Show if cursor anywhere in same paragraph ··· 116 false 117 } 118 119 #[cfg(test)] 120 mod tests { 121 use super::*; ··· 197 198 #[test] 199 fn test_inline_visibility_cursor_adjacent() { 200 let spans = vec![ 201 make_span("s0", 5, 7, SyntaxType::Inline), // ** at positions 5-6 202 ]; 203 - let paras = vec![make_para(0, 20, spans.clone())]; 204 205 // Cursor at position 4 (one before ** which starts at 5) 206 let vis = VisibilityState::calculate(4, None, &spans, &paras); ··· 216 let spans = vec![ 217 make_span("s0", 10, 12, SyntaxType::Inline), 218 ]; 219 - let paras = vec![make_para(0, 30, spans.clone())]; 220 221 // Cursor at position 0 (far from **) 222 let vis = VisibilityState::calculate(0, None, &spans, &paras); ··· 259 let spans = vec![ 260 make_span("s0", 5, 7, SyntaxType::Inline), 261 ]; 262 - let paras = vec![make_para(0, 20, spans.clone())]; 263 264 // Selection overlaps the syntax span 265 let selection = Selection { anchor: 3, head: 10 }; 266 let vis = VisibilityState::calculate(10, Some(&selection), &spans, &paras); 267 assert!(vis.is_visible("s0"), "** should be visible when selection overlaps"); 268 } 269 }

··· 33 let mut visible = HashSet::new(); 34 35 for span in syntax_spans { 36 + // Find the paragraph containing this span for boundary clamping 37 + let para_bounds = find_paragraph_bounds(&span.char_range, paragraphs); 38 + 39 let should_show = match span.syntax_type { 40 SyntaxType::Inline => { 41 // Show if cursor within formatted span content OR adjacent to markers 42 + // "Adjacent" means within 1 char of the syntax boundaries, 43 + // clamped to paragraph bounds (paragraphs are split by newlines, 44 + // so clamping to para bounds prevents cross-line extension) 45 + let extended_start = 46 + safe_extend_left(span.char_range.start, 1, para_bounds.as_ref()); 47 + let extended_end = 48 + safe_extend_right(span.char_range.end, 1, para_bounds.as_ref()); 49 + let extended_range = extended_start..extended_end; 50 51 // Also show if cursor is anywhere in the formatted_range 52 // (the region between paired opening/closing markers) 53 + // Extend by 1 char on BOTH sides for symmetric "approaching" behavior, 54 + // clamped to paragraph bounds. 55 let in_formatted_region = span 56 .formatted_range 57 .as_ref() 58 + .map(|r| { 59 + let ext_start = safe_extend_left(r.start, 1, para_bounds.as_ref()); 60 + let ext_end = safe_extend_right(r.end, 1, para_bounds.as_ref()); 61 + cursor_offset >= ext_start && cursor_offset <= ext_end 62 + }) 63 .unwrap_or(false); 64 65 + let in_extended = extended_range.contains(&cursor_offset); 66 + let result = in_extended 67 || in_formatted_region 68 || selection_overlaps(selection, &span.char_range) 69 || span 70 .formatted_range 71 .as_ref() 72 .map(|r| selection_overlaps(selection, r)) 73 + .unwrap_or(false); 74 + 75 + tracing::debug!( 76 + "[VISIBILITY] span {} char_range {:?} formatted_range {:?} cursor {} -> in_extended={} in_formatted={} visible={}", 77 + span.syn_id, 78 + span.char_range, 79 + span.formatted_range, 80 + cursor_offset, 81 + in_extended, 82 + in_formatted_region, 83 + result 84 + ); 85 + 86 + result 87 } 88 SyntaxType::Block => { 89 // Show if cursor anywhere in same paragraph ··· 144 false 145 } 146 147 + /// Find the paragraph bounds containing a syntax span. 148 + fn find_paragraph_bounds( 149 + syntax_range: &Range<usize>, 150 + paragraphs: &[ParagraphRender], 151 + ) -> Option<Range<usize>> { 152 + for para in paragraphs { 153 + // Skip gap paragraphs 154 + if para.syntax_spans.is_empty() && !para.char_range.is_empty() { 155 + continue; 156 + } 157 + 158 + if para.char_range.start <= syntax_range.start && syntax_range.end <= para.char_range.end { 159 + return Some(para.char_range.clone()); 160 + } 161 + } 162 + None 163 + } 164 + 165 + /// Safely extend a position leftward by `amount` chars, clamped to paragraph bounds. 166 + /// 167 + /// Paragraphs are already split by newlines, so clamping to paragraph bounds 168 + /// naturally prevents extending across line boundaries. 169 + fn safe_extend_left(pos: usize, amount: usize, para_bounds: Option<&Range<usize>>) -> usize { 170 + let min_pos = para_bounds.map(|p| p.start).unwrap_or(0); 171 + pos.saturating_sub(amount).max(min_pos) 172 + } 173 + 174 + /// Safely extend a position rightward by `amount` chars, clamped to paragraph bounds. 175 + /// 176 + /// Paragraphs are already split by newlines, so clamping to paragraph bounds 177 + /// naturally prevents extending across line boundaries. 178 + fn safe_extend_right(pos: usize, amount: usize, para_bounds: Option<&Range<usize>>) -> usize { 179 + let max_pos = para_bounds.map(|p| p.end).unwrap_or(usize::MAX); 180 + pos.saturating_add(amount).min(max_pos) 181 + } 182 + 183 #[cfg(test)] 184 mod tests { 185 use super::*; ··· 261 262 #[test] 263 fn test_inline_visibility_cursor_adjacent() { 264 + // "test **bold** after" 265 + // 5 7 266 let spans = vec![ 267 make_span("s0", 5, 7, SyntaxType::Inline), // ** at positions 5-6 268 ]; 269 + let paras = vec![make_para(0, 19, spans.clone())]; 270 271 // Cursor at position 4 (one before ** which starts at 5) 272 let vis = VisibilityState::calculate(4, None, &spans, &paras); ··· 282 let spans = vec![ 283 make_span("s0", 10, 12, SyntaxType::Inline), 284 ]; 285 + let paras = vec![make_para(0, 33, spans.clone())]; 286 287 // Cursor at position 0 (far from **) 288 let vis = VisibilityState::calculate(0, None, &spans, &paras); ··· 325 let spans = vec![ 326 make_span("s0", 5, 7, SyntaxType::Inline), 327 ]; 328 + let paras = vec![make_para(0, 24, spans.clone())]; 329 330 // Selection overlaps the syntax span 331 let selection = Selection { anchor: 3, head: 10 }; 332 let vis = VisibilityState::calculate(10, Some(&selection), &spans, &paras); 333 assert!(vis.is_visible("s0"), "** should be visible when selection overlaps"); 334 + } 335 + 336 + #[test] 337 + fn test_paragraph_boundary_blocks_extension() { 338 + // Cursor in paragraph 2 should NOT reveal syntax in paragraph 1, 339 + // even if cursor is only 1 char after the paragraph boundary 340 + // (paragraph bounds clamp the extension) 341 + let spans = vec![ 342 + make_span_with_range("s0", 0, 2, SyntaxType::Inline, 0..8), // opening ** 343 + make_span_with_range("s1", 6, 8, SyntaxType::Inline, 0..8), // closing ** 344 + ]; 345 + let paras = vec![ 346 + make_para(0, 8, spans.clone()), // "**bold**" 347 + make_para(9, 13, vec![]), // "text" (after newline) 348 + ]; 349 + 350 + // Cursor at position 9 (start of second paragraph) 351 + // Should NOT reveal the closing ** because para bounds clamp extension 352 + let vis = VisibilityState::calculate(9, None, &spans, &paras); 353 + assert!(!vis.is_visible("s1"), "closing ** should NOT be visible when cursor is in next paragraph"); 354 + } 355 + 356 + #[test] 357 + fn test_extension_clamps_to_paragraph() { 358 + // Syntax at very start of paragraph - extension left should stop at para start 359 + let spans = vec![ 360 + make_span_with_range("s0", 0, 2, SyntaxType::Inline, 0..8), 361 + ]; 362 + let paras = vec![make_para(0, 8, spans.clone())]; 363 + 364 + // Cursor at position 0 - should still see the opening ** 365 + let vis = VisibilityState::calculate(0, None, &spans, &paras); 366 + assert!(vis.is_visible("s0"), "** at start should be visible when cursor at position 0"); 367 } 368 }

+95 -26

crates/weaver-app/src/components/editor/writer.rs

··· 7 //! represent consumed formatting characters. 8 9 use super::offset_map::{OffsetMapping, RenderResult}; 10 - use jumprope::JumpRopeBuf; 11 use markdown_weaver::{ 12 Alignment, BlockQuoteKind, CodeBlockKind, CowStr, EmbedType, Event, LinkType, Tag, 13 }; ··· 109 /// and emits them as styled spans for visibility in the editor. 110 pub struct EditorWriter<'a, I: Iterator<Item = (Event<'a>, Range<usize>)>, W: StrWrite, E = ()> { 111 source: &'a str, 112 - source_rope: &'a JumpRopeBuf, 113 events: I, 114 writer: W, 115 last_byte_offset: usize, ··· 141 current_node_id: Option<String>, // node ID for current text container 142 current_node_char_offset: usize, // UTF-16 offset within current node 143 current_node_child_count: usize, // number of child elements/text nodes in current container 144 145 // Paragraph boundary tracking for incremental rendering 146 paragraph_ranges: Vec<(Range<usize>, Range<usize>)>, // (byte_range, char_range) ··· 170 impl<'a, I: Iterator<Item = (Event<'a>, Range<usize>)>, W: StrWrite, E: EmbedContentProvider> 171 EditorWriter<'a, I, W, E> 172 { 173 - pub fn new(source: &'a str, source_rope: &'a JumpRopeBuf, events: I, writer: W) -> Self { 174 - Self::new_with_node_offset(source, source_rope, events, writer, 0) 175 } 176 177 pub fn new_with_node_offset( 178 source: &'a str, 179 - source_rope: &'a JumpRopeBuf, 180 events: I, 181 writer: W, 182 node_id_offset: usize, 183 ) -> Self { 184 - Self::new_with_offsets(source, source_rope, events, writer, node_id_offset, 0) 185 } 186 187 pub fn new_with_offsets( 188 source: &'a str, 189 - source_rope: &'a JumpRopeBuf, 190 events: I, 191 writer: W, 192 node_id_offset: usize, ··· 194 ) -> Self { 195 Self { 196 source, 197 - source_rope, 198 events, 199 writer, 200 last_byte_offset: 0, ··· 217 current_node_id: None, 218 current_node_char_offset: 0, 219 current_node_child_count: 0, 220 paragraph_ranges: Vec::new(), 221 current_paragraph_start: None, 222 list_depth: 0, ··· 232 /// Used for fast boundary discovery in incremental rendering. 233 pub fn new_boundary_only( 234 source: &'a str, 235 - source_rope: &'a JumpRopeBuf, 236 events: I, 237 writer: W, 238 ) -> Self { 239 Self { 240 source, 241 - source_rope, 242 events, 243 writer, 244 last_byte_offset: 0, ··· 261 current_node_id: None, 262 current_node_char_offset: 0, 263 current_node_child_count: 0, 264 syntax_spans: Vec::new(), 265 next_syn_id: 0, 266 pending_inline_formats: Vec::new(), ··· 276 pub fn with_embed_provider(self, provider: E) -> EditorWriter<'a, I, W, E> { 277 EditorWriter { 278 source: self.source, 279 - source_rope: self.source_rope, 280 events: self.events, 281 writer: self.writer, 282 last_byte_offset: self.last_byte_offset, ··· 299 current_node_id: self.current_node_id, 300 current_node_char_offset: self.current_node_char_offset, 301 current_node_child_count: self.current_node_child_count, 302 paragraph_ranges: self.paragraph_ranges, 303 current_paragraph_start: self.current_paragraph_start, 304 list_depth: self.list_depth, ··· 343 let format_end = self.last_char_offset; 344 let formatted_range = format_start..format_end; 345 346 // Update the opening span's formatted_range 347 if let Some(opening_span) = self 348 .syntax_spans ··· 350 .find(|s| s.syn_id == opening_syn_id) 351 { 352 opening_span.formatted_range = Some(formatted_range.clone()); 353 } 354 355 // Update the closing span's formatted_range (the most recent one) ··· 358 // Only update if it's an inline span (closing syntax should be inline) 359 if closing_span.syntax_type == SyntaxType::Inline { 360 closing_span.formatted_range = Some(formatted_range); 361 } 362 } 363 } ··· 544 self.current_node_child_count = 0; 545 } 546 547 /// Record an offset mapping for the given byte and char ranges. 548 /// 549 - /// Computes UTF-16 length efficiently using the rope's internal indexing. 550 fn record_mapping(&mut self, byte_range: Range<usize>, char_range: Range<usize>) { 551 if let Some(ref node_id) = self.current_node_id { 552 - // Use rope to convert char offsets to UTF-16 (wchar) offsets - O(log n) 553 - let rope = self.source_rope.borrow(); 554 - let wchar_start = rope.chars_to_wchars(char_range.start); 555 - let wchar_end = rope.chars_to_wchars(char_range.end); 556 - let utf16_len = wchar_end - wchar_start; 557 558 let mapping = OffsetMapping { 559 byte_range: byte_range.clone(), ··· 601 602 // For End events, emit any trailing content within the event's range 603 // BEFORE calling end_tag (which calls end_node and clears current_node_id) 604 - if matches!(&event, Event::End(_)) { 605 // Emit gap from last_byte_offset to range.end 606 // (emit_syntax handles char offset tracking) 607 self.emit_gap_before(range.end)?; 608 - } else { 609 // For other events, emit any gap before range.start 610 // (emit_syntax handles char offset tracking) 611 self.emit_gap_before(range.start)?; 612 } 613 614 // Store last_byte before processing 615 let last_byte_before = self.last_byte_offset; ··· 632 // Handle unmapped trailing content (stripped by parser) 633 // This includes trailing spaces that markdown ignores 634 let doc_byte_len = self.source.len(); 635 - let doc_char_len = self.source_rope.len_chars(); 636 637 if self.last_byte_offset < doc_byte_len || self.last_char_offset < doc_char_len { 638 // Emit the trailing content as visible syntax ··· 1173 syntax_type, 1174 formatted_range: None, // Will be updated when closing tag is emitted 1175 }); 1176 1177 // For paired inline syntax (Strong, Emphasis, Strikethrough), 1178 // track the opening span so we can set formatted_range when closing ··· 1990 self.write("</dd>\n") 1991 } 1992 TagEnd::Emphasis => { 1993 self.finalize_paired_inline_format(); 1994 - self.write("") 1995 } 1996 TagEnd::Superscript => self.write(""), 1997 TagEnd::Subscript => self.write(""), 1998 TagEnd::Strong => { 1999 self.finalize_paired_inline_format(); 2000 - self.write("") 2001 } 2002 TagEnd::Strikethrough => { 2003 self.finalize_paired_inline_format(); 2004 - self.write("</s>") 2005 } 2006 TagEnd::Link => self.write("</a>"), 2007 TagEnd::Image => Ok(()), // No-op: raw_text() already consumed the End(Image) event ··· 2019 2020 result?; 2021 2022 - // Note: Closing syntax for inline tags (Strong, Emphasis, etc.) is now handled 2023 - // by emit_gap_before(range.end) which is called before end_tag() in the main loop. 2024 - // No need for manual emission here anymore. 2025 2026 Ok(()) 2027 }

··· 7 //! represent consumed formatting characters. 8 9 use super::offset_map::{OffsetMapping, RenderResult}; 10 + use loro::LoroText; 11 use markdown_weaver::{ 12 Alignment, BlockQuoteKind, CodeBlockKind, CowStr, EmbedType, Event, LinkType, Tag, 13 }; ··· 109 /// and emits them as styled spans for visibility in the editor. 110 pub struct EditorWriter<'a, I: Iterator<Item = (Event<'a>, Range<usize>)>, W: StrWrite, E = ()> { 111 source: &'a str, 112 + source_text: &'a LoroText, 113 events: I, 114 writer: W, 115 last_byte_offset: usize, ··· 141 current_node_id: Option<String>, // node ID for current text container 142 current_node_char_offset: usize, // UTF-16 offset within current node 143 current_node_child_count: usize, // number of child elements/text nodes in current container 144 + 145 + // Incremental UTF-16 offset tracking (replaces rope.chars_to_wchars) 146 + // Maps char_offset -> utf16_offset at checkpoints we've traversed. 147 + // Can be reused for future lookups or passed to subsequent writers. 148 + utf16_checkpoints: Vec<(usize, usize)>, // (char_offset, utf16_offset) 149 150 // Paragraph boundary tracking for incremental rendering 151 paragraph_ranges: Vec<(Range<usize>, Range<usize>)>, // (byte_range, char_range) ··· 175 impl<'a, I: Iterator<Item = (Event<'a>, Range<usize>)>, W: StrWrite, E: EmbedContentProvider> 176 EditorWriter<'a, I, W, E> 177 { 178 + pub fn new(source: &'a str, source_text: &'a LoroText, events: I, writer: W) -> Self { 179 + Self::new_with_node_offset(source, source_text, events, writer, 0) 180 } 181 182 pub fn new_with_node_offset( 183 source: &'a str, 184 + source_text: &'a LoroText, 185 events: I, 186 writer: W, 187 node_id_offset: usize, 188 ) -> Self { 189 + Self::new_with_offsets(source, source_text, events, writer, node_id_offset, 0) 190 } 191 192 pub fn new_with_offsets( 193 source: &'a str, 194 + source_text: &'a LoroText, 195 events: I, 196 writer: W, 197 node_id_offset: usize, ··· 199 ) -> Self { 200 Self { 201 source, 202 + source_text, 203 events, 204 writer, 205 last_byte_offset: 0, ··· 222 current_node_id: None, 223 current_node_char_offset: 0, 224 current_node_child_count: 0, 225 + utf16_checkpoints: vec![(0, 0)], 226 paragraph_ranges: Vec::new(), 227 current_paragraph_start: None, 228 list_depth: 0, ··· 238 /// Used for fast boundary discovery in incremental rendering. 239 pub fn new_boundary_only( 240 source: &'a str, 241 + source_text: &'a LoroText, 242 events: I, 243 writer: W, 244 ) -> Self { 245 Self { 246 source, 247 + source_text, 248 events, 249 writer, 250 last_byte_offset: 0, ··· 267 current_node_id: None, 268 current_node_char_offset: 0, 269 current_node_child_count: 0, 270 + utf16_checkpoints: vec![(0, 0)], 271 syntax_spans: Vec::new(), 272 next_syn_id: 0, 273 pending_inline_formats: Vec::new(), ··· 283 pub fn with_embed_provider(self, provider: E) -> EditorWriter<'a, I, W, E> { 284 EditorWriter { 285 source: self.source, 286 + source_text: self.source_text, 287 events: self.events, 288 writer: self.writer, 289 last_byte_offset: self.last_byte_offset, ··· 306 current_node_id: self.current_node_id, 307 current_node_char_offset: self.current_node_char_offset, 308 current_node_child_count: self.current_node_child_count, 309 + utf16_checkpoints: self.utf16_checkpoints, 310 paragraph_ranges: self.paragraph_ranges, 311 current_paragraph_start: self.current_paragraph_start, 312 list_depth: self.list_depth, ··· 351 let format_end = self.last_char_offset; 352 let formatted_range = format_start..format_end; 353 354 + tracing::debug!( 355 + "[FINALIZE_PAIRED] Setting formatted_range {:?} for opening '{}' and closing (last span)", 356 + formatted_range, 357 + opening_syn_id 358 + ); 359 + 360 // Update the opening span's formatted_range 361 if let Some(opening_span) = self 362 .syntax_spans ··· 364 .find(|s| s.syn_id == opening_syn_id) 365 { 366 opening_span.formatted_range = Some(formatted_range.clone()); 367 + tracing::debug!("[FINALIZE_PAIRED] Updated opening span {}", opening_syn_id); 368 + } else { 369 + tracing::warn!("[FINALIZE_PAIRED] Could not find opening span {}", opening_syn_id); 370 } 371 372 // Update the closing span's formatted_range (the most recent one) ··· 375 // Only update if it's an inline span (closing syntax should be inline) 376 if closing_span.syntax_type == SyntaxType::Inline { 377 closing_span.formatted_range = Some(formatted_range); 378 + tracing::debug!("[FINALIZE_PAIRED] Updated closing span {}", closing_span.syn_id); 379 } 380 } 381 } ··· 562 self.current_node_child_count = 0; 563 } 564 565 + /// Compute UTF-16 length for a text slice with fast path for ASCII. 566 + #[inline] 567 + fn utf16_len_for_slice(text: &str) -> usize { 568 + let byte_len = text.len(); 569 + let char_len = text.chars().count(); 570 + 571 + // Fast path: if byte_len == char_len, all ASCII, so utf16_len == char_len 572 + if byte_len == char_len { 573 + char_len 574 + } else { 575 + // Slow path: has multi-byte chars, need to count UTF-16 code units 576 + text.encode_utf16().count() 577 + } 578 + } 579 + 580 /// Record an offset mapping for the given byte and char ranges. 581 /// 582 + /// Builds up utf16_checkpoints incrementally for efficient lookups. 583 fn record_mapping(&mut self, byte_range: Range<usize>, char_range: Range<usize>) { 584 if let Some(ref node_id) = self.current_node_id { 585 + // Get UTF-16 length using fast path 586 + let text_slice = &self.source[byte_range.clone()]; 587 + let utf16_len = Self::utf16_len_for_slice(text_slice); 588 + 589 + // Record checkpoint at end of this range for future lookups 590 + let last_checkpoint = self.utf16_checkpoints.last().copied().unwrap_or((0, 0)); 591 + let new_utf16_offset = last_checkpoint.1 + utf16_len; 592 + 593 + // Only add checkpoint if we've advanced 594 + if char_range.end > last_checkpoint.0 { 595 + self.utf16_checkpoints.push((char_range.end, new_utf16_offset)); 596 + } 597 598 let mapping = OffsetMapping { 599 byte_range: byte_range.clone(), ··· 641 642 // For End events, emit any trailing content within the event's range 643 // BEFORE calling end_tag (which calls end_node and clears current_node_id) 644 + // 645 + // EXCEPTION: For inline formatting tags (Strong, Emphasis, Strikethrough), 646 + // the closing syntax must be emitted AFTER the closing HTML tag, not before. 647 + // Otherwise the closing `**` span ends up INSIDE the element. 648 + // These tags handle their own closing syntax in end_tag(). 649 + use markdown_weaver::TagEnd; 650 + let is_inline_format_end = matches!( 651 + &event, 652 + Event::End(TagEnd::Strong | TagEnd::Emphasis | TagEnd::Strikethrough) 653 + ); 654 + 655 + if matches!(&event, Event::End(_)) && !is_inline_format_end { 656 // Emit gap from last_byte_offset to range.end 657 // (emit_syntax handles char offset tracking) 658 self.emit_gap_before(range.end)?; 659 + } else if !matches!(&event, Event::End(_)) { 660 // For other events, emit any gap before range.start 661 // (emit_syntax handles char offset tracking) 662 self.emit_gap_before(range.start)?; 663 } 664 + // For inline format End events, gap is emitted inside end_tag() AFTER the closing HTML 665 666 // Store last_byte before processing 667 let last_byte_before = self.last_byte_offset; ··· 684 // Handle unmapped trailing content (stripped by parser) 685 // This includes trailing spaces that markdown ignores 686 let doc_byte_len = self.source.len(); 687 + let doc_char_len = self.source_text.len_unicode(); 688 689 if self.last_byte_offset < doc_byte_len || self.last_char_offset < doc_char_len { 690 // Emit the trailing content as visible syntax ··· 1225 syntax_type, 1226 formatted_range: None, // Will be updated when closing tag is emitted 1227 }); 1228 + 1229 + // Record offset mapping for cursor positioning 1230 + // This is critical - without it, current_node_char_offset is wrong 1231 + // and all subsequent cursor positions are shifted 1232 + let byte_start = range.start; 1233 + let byte_end = range.start + syntax_byte_len; 1234 + self.record_mapping(byte_start..byte_end, char_start..char_end); 1235 1236 // For paired inline syntax (Strong, Emphasis, Strikethrough), 1237 // track the opening span so we can set formatted_range when closing ··· 2049 self.write("</dd>\n") 2050 } 2051 TagEnd::Emphasis => { 2052 + // Write closing tag FIRST, then emit closing syntax OUTSIDE the tag 2053 + self.write("")?; 2054 + self.emit_gap_before(range.end)?; 2055 self.finalize_paired_inline_format(); 2056 + Ok(()) 2057 } 2058 TagEnd::Superscript => self.write(""), 2059 TagEnd::Subscript => self.write(""), 2060 TagEnd::Strong => { 2061 + // Write closing tag FIRST, then emit closing syntax OUTSIDE the tag 2062 + self.write("")?; 2063 + self.emit_gap_before(range.end)?; 2064 self.finalize_paired_inline_format(); 2065 + Ok(()) 2066 } 2067 TagEnd::Strikethrough => { 2068 + // Write closing tag FIRST, then emit closing syntax OUTSIDE the tag 2069 + self.write("</s>")?; 2070 + self.emit_gap_before(range.end)?; 2071 self.finalize_paired_inline_format(); 2072 + Ok(()) 2073 } 2074 TagEnd::Link => self.write("</a>"), 2075 TagEnd::Image => Ok(()), // No-op: raw_text() already consumed the End(Image) event ··· 2087 2088 result?; 2089 2090 + // Note: Closing syntax for inline formatting tags (Strong, Emphasis, Strikethrough) 2091 + // is handled INSIDE their respective match arms above, AFTER writing the closing HTML. 2092 + // This ensures the closing syntax span appears OUTSIDE the formatted element. 2093 + // Other End events have their closing syntax emitted by emit_gap_before() in the main loop. 2094 2095 Ok(()) 2096 }