Add efficient serialisation for diffs #21
18 changed files with 533 additions and 70 deletions
38
Cargo.lock
generated
38
Cargo.lock
generated
|
|
@ -124,6 +124,12 @@ version = "0.4.27"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "13dc2df351e3202783a1fe0d44375f7295ffb4049267b0f3018346dc122a1d94"
|
checksum = "13dc2df351e3202783a1fe0d44375f7295ffb4049267b0f3018346dc122a1d94"
|
||||||
|
|
||||||
|
[[package]]
|
||||||
|
name = "memchr"
|
||||||
|
version = "2.7.6"
|
||||||
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
|
checksum = "f52b00d39961fc5b2736ea853c9cc86238e165017a493d1d5c8eac6bdc4cc273"
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "memory_units"
|
name = "memory_units"
|
||||||
version = "0.4.0"
|
version = "0.4.0"
|
||||||
|
|
@ -182,6 +188,7 @@ dependencies = [
|
||||||
"insta",
|
"insta",
|
||||||
"pretty_assertions",
|
"pretty_assertions",
|
||||||
"serde",
|
"serde",
|
||||||
|
"serde_json",
|
||||||
"serde_yaml",
|
"serde_yaml",
|
||||||
"test-case",
|
"test-case",
|
||||||
"wasm-bindgen",
|
"wasm-bindgen",
|
||||||
|
|
@ -212,24 +219,47 @@ dependencies = [
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "serde"
|
name = "serde"
|
||||||
version = "1.0.219"
|
version = "1.0.228"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "5f0e2c6ed6606019b4e29e69dbaba95b11854410e5347d525002456dbbb786b6"
|
checksum = "9a8e94ea7f378bd32cbbd37198a4a91436180c5bb472411e48b5ec2e2124ae9e"
|
||||||
|
dependencies = [
|
||||||
|
"serde_core",
|
||||||
|
"serde_derive",
|
||||||
|
]
|
||||||
|
|
||||||
|
[[package]]
|
||||||
|
name = "serde_core"
|
||||||
|
version = "1.0.228"
|
||||||
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
|
checksum = "41d385c7d4ca58e59fc732af25c3983b67ac852c1a25000afe1175de458b67ad"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"serde_derive",
|
"serde_derive",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "serde_derive"
|
name = "serde_derive"
|
||||||
version = "1.0.219"
|
version = "1.0.228"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "5b0276cf7f2c73365f7157c8123c21cd9a50fbbd844757af28ca1f5925fc2a00"
|
checksum = "d540f220d3187173da220f885ab66608367b6574e925011a9353e4badda91d79"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"proc-macro2",
|
"proc-macro2",
|
||||||
"quote",
|
"quote",
|
||||||
"syn",
|
"syn",
|
||||||
]
|
]
|
||||||
|
|
||||||
|
[[package]]
|
||||||
|
name = "serde_json"
|
||||||
|
version = "1.0.145"
|
||||||
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
|
checksum = "402a6f66d8c709116cf22f558eab210f5a50187f702eb4d7e5ef38d9a7f1c79c"
|
||||||
|
dependencies = [
|
||||||
|
"itoa",
|
||||||
|
"memchr",
|
||||||
|
"ryu",
|
||||||
|
"serde",
|
||||||
|
"serde_core",
|
||||||
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "serde_yaml"
|
name = "serde_yaml"
|
||||||
version = "0.9.34+deprecated"
|
version = "0.9.34+deprecated"
|
||||||
|
|
|
||||||
|
|
@ -24,6 +24,7 @@ path = "examples/merge-file.rs"
|
||||||
serde = { version = "1.0.219", optional = true, features = ["derive"] }
|
serde = { version = "1.0.219", optional = true, features = ["derive"] }
|
||||||
|
|
||||||
wasm-bindgen = { version = "0.2.99", optional = true }
|
wasm-bindgen = { version = "0.2.99", optional = true }
|
||||||
|
serde_json = { version = "1.0.145", optional = true }
|
||||||
|
|
||||||
# The `console_error_panic_hook` crate provides better debugging of panics by
|
# The `console_error_panic_hook` crate provides better debugging of panics by
|
||||||
# logging them with `console.error`. This is great for development, but requires
|
# logging them with `console.error`. This is great for development, but requires
|
||||||
|
|
@ -36,8 +37,9 @@ wee_alloc = { version = "0.4.2", optional = true }
|
||||||
[features]
|
[features]
|
||||||
default = []
|
default = []
|
||||||
serde = [ "dep:serde" ]
|
serde = [ "dep:serde" ]
|
||||||
wasm = [ "dep:wasm-bindgen", "dep:wee_alloc" ]
|
wasm = [ "dep:wasm-bindgen", "dep:wee_alloc", "dep:serde_json", "serde" ]
|
||||||
console_error_panic_hook = [ "dep:console_error_panic_hook" ]
|
console_error_panic_hook = [ "dep:console_error_panic_hook" ]
|
||||||
|
all = [ "wasm", "console_error_panic_hook" ]
|
||||||
|
|
||||||
[dev-dependencies]
|
[dev-dependencies]
|
||||||
insta = "1.42.2"
|
insta = "1.42.2"
|
||||||
|
|
|
||||||
|
|
@ -24,6 +24,7 @@ A Rust and TypeScript library for merging conflicting text edits without manual
|
||||||
### Rust
|
### Rust
|
||||||
|
|
||||||
Install via crates.io:
|
Install via crates.io:
|
||||||
|
|
||||||
```sh
|
```sh
|
||||||
cargo add reconcile-text
|
cargo add reconcile-text
|
||||||
```
|
```
|
||||||
|
|
|
||||||
2
reconcile-js/package-lock.json
generated
2
reconcile-js/package-lock.json
generated
|
|
@ -24,7 +24,7 @@
|
||||||
},
|
},
|
||||||
"../pkg": {
|
"../pkg": {
|
||||||
"name": "reconcile-text",
|
"name": "reconcile-text",
|
||||||
"version": "0.4.10",
|
"version": "0.5.0",
|
||||||
"dev": true,
|
"dev": true,
|
||||||
"license": "MIT"
|
"license": "MIT"
|
||||||
},
|
},
|
||||||
|
|
|
||||||
|
|
@ -5,6 +5,7 @@ import {
|
||||||
SpanWithHistory as wasmSpanWithHistory,
|
SpanWithHistory as wasmSpanWithHistory,
|
||||||
reconcileWithHistory as wasmReconcileWithHistory,
|
reconcileWithHistory as wasmReconcileWithHistory,
|
||||||
isBinary as wasmIsBinary,
|
isBinary as wasmIsBinary,
|
||||||
|
getCompactDiff as wasmGetCompactDiff,
|
||||||
initSync,
|
initSync,
|
||||||
} from 'reconcile-text';
|
} from 'reconcile-text';
|
||||||
|
|
||||||
|
|
@ -179,6 +180,40 @@ export function reconcile(
|
||||||
return jsResult;
|
return jsResult;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Generates a compact diff representation between an original and changed text.
|
||||||
|
*
|
||||||
|
* The result can be parsed and unpacked using the Rust crate's `EditedText::from_change_set`.
|
||||||
|
*
|
||||||
|
* This function computes the differences between two versions of text and returns
|
||||||
|
* a compact string representation of those changes. The returned format is
|
||||||
|
* serialised JSON.
|
||||||
|
*
|
||||||
|
* @param original - The original/base version of the text
|
||||||
|
* @param changed - The modified version of the text (either string or TextWithCursors with cursor positions)
|
||||||
|
* @param tokenizer - The tokenisation strategy, which is the same as used in `reconcile`.
|
||||||
|
* @returns A compact string representation of the diff between original and changed text
|
||||||
|
*/
|
||||||
|
export function getCompactDiff(
|
||||||
|
original: string,
|
||||||
|
changed: string | TextWithOptionalCursors,
|
||||||
|
tokenizer: BuiltinTokenizer = 'Word'
|
||||||
|
): string {
|
||||||
|
init();
|
||||||
|
|
||||||
|
if (!BUILTIN_TOKENIZERS.includes(tokenizer)) {
|
||||||
|
throw new Error(UNSUPPORTED_TOKENIZER_ERROR);
|
||||||
|
}
|
||||||
|
|
||||||
|
const changedWasm = toWasmTextWithCursors(changed);
|
||||||
|
|
||||||
|
const result = wasmGetCompactDiff(original, changedWasm, tokenizer);
|
||||||
|
|
||||||
|
changedWasm.free();
|
||||||
|
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Merges three versions of text and returns detailed provenance information.
|
* Merges three versions of text and returns detailed provenance information.
|
||||||
*
|
*
|
||||||
|
|
|
||||||
|
|
@ -3,9 +3,8 @@
|
||||||
set -e
|
set -e
|
||||||
|
|
||||||
wasm-pack build --target web --features wasm
|
wasm-pack build --target web --features wasm
|
||||||
cargo test --verbose -- --include-ignored
|
cargo test --verbose --features serde -- --include-ignored
|
||||||
cargo test --features serde
|
cargo test --features serde,wasm
|
||||||
cargo test --features wasm
|
|
||||||
wasm-pack test --node --features wasm
|
wasm-pack test --node --features wasm
|
||||||
|
|
||||||
cd reconcile-js
|
cd reconcile-js
|
||||||
|
|
|
||||||
44
src/lib.rs
44
src/lib.rs
|
|
@ -151,6 +151,48 @@
|
||||||
//! ]
|
//! ]
|
||||||
//! );
|
//! );
|
||||||
//! ```
|
//! ```
|
||||||
|
//! ## Efficiently serialize changes
|
||||||
|
//!
|
||||||
|
//! The edits can be serialized into a compact representation without the full
|
||||||
|
//! original text, so that its size depends only on the changes made.
|
||||||
|
//!
|
||||||
|
//! ```rust
|
||||||
|
//! use reconcile_text::{EditedText, BuiltinTokenizer};
|
||||||
|
//! use serde_yaml;
|
||||||
|
//! use pretty_assertions::assert_eq;
|
||||||
|
//!
|
||||||
|
//!
|
||||||
|
//! let original = "Merging text is hard!";
|
||||||
|
//! let changes = "Merging text is easy with reconcile!";
|
||||||
|
//!
|
||||||
|
//! let result = EditedText::from_strings(
|
||||||
|
//! original,
|
||||||
|
//! &changes.into()
|
||||||
|
//! );
|
||||||
|
//!
|
||||||
|
//! let serialized = serde_yaml::to_string(&result.to_change_set()).unwrap();
|
||||||
|
//! assert_eq!(
|
||||||
|
//! serialized,
|
||||||
|
//! concat!(
|
||||||
|
//! "operations:\n",
|
||||||
|
//! "- 15\n",
|
||||||
|
//! "- -6\n",
|
||||||
|
//! "- ' easy with reconcile!'\n",
|
||||||
|
//! "cursors: []\n"
|
||||||
|
//! )
|
||||||
|
//! );
|
||||||
|
//!
|
||||||
|
//! let deserialized = serde_yaml::from_str(&serialized).unwrap();
|
||||||
|
//! let reconstructed = EditedText::from_change_set(
|
||||||
|
//! original,
|
||||||
|
//! deserialized,
|
||||||
|
//! &*BuiltinTokenizer::Word
|
||||||
|
//! );
|
||||||
|
//! assert_eq!(
|
||||||
|
//! reconstructed.apply().text(),
|
||||||
|
//! "Merging text is easy with reconcile!"
|
||||||
|
//! );
|
||||||
|
//! ```
|
||||||
//!
|
//!
|
||||||
//! ## Error handling
|
//! ## Error handling
|
||||||
//!
|
//!
|
||||||
|
|
@ -169,7 +211,7 @@ mod tokenizer;
|
||||||
mod types;
|
mod types;
|
||||||
mod utils;
|
mod utils;
|
||||||
|
|
||||||
pub use operation_transformation::{EditedText, reconcile};
|
pub use operation_transformation::{ChangeSet, EditedText, reconcile};
|
||||||
pub use tokenizer::{BuiltinTokenizer, Tokenizer, token::Token};
|
pub use tokenizer::{BuiltinTokenizer, Tokenizer, token::Token};
|
||||||
pub use types::{
|
pub use types::{
|
||||||
cursor_position::CursorPosition, history::History, side::Side,
|
cursor_position::CursorPosition, history::History, side::Side,
|
||||||
|
|
|
||||||
|
|
@ -1,15 +1,14 @@
|
||||||
mod edited_text;
|
mod edited_text;
|
||||||
mod operation;
|
mod operation;
|
||||||
|
mod transport;
|
||||||
mod utils;
|
mod utils;
|
||||||
use std::fmt::Debug;
|
use std::fmt::Debug;
|
||||||
|
|
||||||
pub use edited_text::EditedText;
|
pub use edited_text::EditedText;
|
||||||
pub use operation::Operation;
|
pub use operation::Operation;
|
||||||
|
pub use transport::ChangeSet;
|
||||||
|
|
||||||
use crate::{
|
use crate::{Tokenizer, types::text_with_cursors::TextWithCursors};
|
||||||
Tokenizer,
|
|
||||||
types::{side::Side, text_with_cursors::TextWithCursors},
|
|
||||||
};
|
|
||||||
|
|
||||||
/// Given an `original` document and two concurrent edits to it,
|
/// Given an `original` document and two concurrent edits to it,
|
||||||
/// return a document containing all changes from both `left`
|
/// return a document containing all changes from both `left`
|
||||||
|
|
@ -48,10 +47,8 @@ pub fn reconcile<'a, T>(
|
||||||
where
|
where
|
||||||
T: PartialEq + Clone + Debug,
|
T: PartialEq + Clone + Debug,
|
||||||
{
|
{
|
||||||
let left_operations =
|
let left_operations = EditedText::from_strings_with_tokenizer(original, left, tokenizer);
|
||||||
EditedText::from_strings_with_tokenizer(original, left, tokenizer, Side::Left);
|
let right_operations = EditedText::from_strings_with_tokenizer(original, right, tokenizer);
|
||||||
let right_operations =
|
|
||||||
EditedText::from_strings_with_tokenizer(original, right, tokenizer, Side::Right);
|
|
||||||
|
|
||||||
left_operations.merge(right_operations)
|
left_operations.merge(right_operations)
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -1,12 +1,13 @@
|
||||||
use std::fmt::Debug;
|
use std::{fmt::Debug, vec};
|
||||||
|
|
||||||
#[cfg(feature = "serde")]
|
#[cfg(feature = "serde")]
|
||||||
use serde::{Deserialize, Serialize};
|
use serde::{Deserialize, Serialize};
|
||||||
|
|
||||||
use crate::{
|
use crate::{
|
||||||
BuiltinTokenizer, CursorPosition, TextWithCursors,
|
BuiltinTokenizer, ChangeSet, CursorPosition, TextWithCursors,
|
||||||
operation_transformation::{
|
operation_transformation::{
|
||||||
Operation,
|
Operation,
|
||||||
|
transport::SimpleOperation,
|
||||||
utils::{cook_operations::cook_operations, elongate_operations::elongate_operations},
|
utils::{cook_operations::cook_operations, elongate_operations::elongate_operations},
|
||||||
},
|
},
|
||||||
raw_operation::RawOperation,
|
raw_operation::RawOperation,
|
||||||
|
|
@ -35,6 +36,7 @@ where
|
||||||
{
|
{
|
||||||
text: &'a str,
|
text: &'a str,
|
||||||
operations: Vec<Operation<T>>,
|
operations: Vec<Operation<T>>,
|
||||||
|
operation_sides: Vec<Side>,
|
||||||
cursors: Vec<CursorPosition>,
|
cursors: Vec<CursorPosition>,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
@ -46,8 +48,8 @@ impl<'a> EditedText<'a, String> {
|
||||||
/// word tokenizer is used to tokenize the text which splits the text on
|
/// word tokenizer is used to tokenize the text which splits the text on
|
||||||
/// whitespaces.
|
/// whitespaces.
|
||||||
#[must_use]
|
#[must_use]
|
||||||
pub fn from_strings(original: &'a str, updated: &TextWithCursors, side: Side) -> Self {
|
pub fn from_strings(original: &'a str, updated: &TextWithCursors) -> Self {
|
||||||
Self::from_strings_with_tokenizer(original, updated, &*BuiltinTokenizer::Word, side)
|
Self::from_strings_with_tokenizer(original, updated, &*BuiltinTokenizer::Word)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
@ -64,16 +66,18 @@ where
|
||||||
original: &'a str,
|
original: &'a str,
|
||||||
updated: &TextWithCursors,
|
updated: &TextWithCursors,
|
||||||
tokenizer: &Tokenizer<T>,
|
tokenizer: &Tokenizer<T>,
|
||||||
side: Side,
|
|
||||||
) -> Self {
|
) -> Self {
|
||||||
let original_tokens = (tokenizer)(original);
|
let original_tokens = (tokenizer)(original);
|
||||||
let updated_tokens = (tokenizer)(&updated.text());
|
let updated_tokens = (tokenizer)(&updated.text());
|
||||||
|
|
||||||
let diff: Vec<RawOperation<T>> = RawOperation::vec_from(&original_tokens, &updated_tokens);
|
let diff: Vec<RawOperation<T>> = RawOperation::vec_from(&original_tokens, &updated_tokens);
|
||||||
|
let operations: Vec<Operation<T>> = cook_operations(elongate_operations(diff)).collect();
|
||||||
|
let operation_count = operations.len();
|
||||||
|
|
||||||
Self::new(
|
Self::new(
|
||||||
original,
|
original,
|
||||||
cook_operations(elongate_operations(diff), side).collect(),
|
operations,
|
||||||
|
vec![Side::Left; operation_count],
|
||||||
updated.cursors(),
|
updated.cursors(),
|
||||||
)
|
)
|
||||||
}
|
}
|
||||||
|
|
@ -81,12 +85,18 @@ where
|
||||||
/// Create a new `EditedText` with the given operations.
|
/// Create a new `EditedText` with the given operations.
|
||||||
/// The operations must be in the order in which they are meant to be
|
/// The operations must be in the order in which they are meant to be
|
||||||
/// applied. The operations must not overlap.
|
/// applied. The operations must not overlap.
|
||||||
fn new(text: &'a str, operations: Vec<Operation<T>>, mut cursors: Vec<CursorPosition>) -> Self {
|
fn new(
|
||||||
|
text: &'a str,
|
||||||
|
operations: Vec<Operation<T>>,
|
||||||
|
operation_sides: Vec<Side>,
|
||||||
|
mut cursors: Vec<CursorPosition>,
|
||||||
|
) -> Self {
|
||||||
cursors.sort_by_key(|cursor| cursor.char_index);
|
cursors.sort_by_key(|cursor| cursor.char_index);
|
||||||
|
|
||||||
Self {
|
Self {
|
||||||
text,
|
text,
|
||||||
operations,
|
operations,
|
||||||
|
operation_sides,
|
||||||
cursors,
|
cursors,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
@ -109,6 +119,8 @@ where
|
||||||
|
|
||||||
let mut merged_operations: Vec<Operation<T>> =
|
let mut merged_operations: Vec<Operation<T>> =
|
||||||
Vec::with_capacity(self.operations.len() + other.operations.len());
|
Vec::with_capacity(self.operations.len() + other.operations.len());
|
||||||
|
let mut merged_operation_sides: Vec<Side> =
|
||||||
|
Vec::with_capacity(self.operations.len() + other.operations.len());
|
||||||
|
|
||||||
let mut left_iter = self.operations.into_iter();
|
let mut left_iter = self.operations.into_iter();
|
||||||
let mut right_iter = other.operations.into_iter();
|
let mut right_iter = other.operations.into_iter();
|
||||||
|
|
@ -149,7 +161,7 @@ where
|
||||||
);
|
);
|
||||||
|
|
||||||
let original_length = operation.len();
|
let original_length = operation.len();
|
||||||
let result = match side {
|
let (side, result) = match side {
|
||||||
Side::Left => {
|
Side::Left => {
|
||||||
let result = operation.merge_operations(&mut last_other_op);
|
let result = operation.merge_operations(&mut last_other_op);
|
||||||
|
|
||||||
|
|
@ -181,7 +193,7 @@ where
|
||||||
maybe_left_op = left_iter.next();
|
maybe_left_op = left_iter.next();
|
||||||
last_left_op = Some(result.clone());
|
last_left_op = Some(result.clone());
|
||||||
|
|
||||||
result
|
(Side::Left, result)
|
||||||
}
|
}
|
||||||
Side::Right => {
|
Side::Right => {
|
||||||
let result = operation.merge_operations(&mut last_other_op);
|
let result = operation.merge_operations(&mut last_other_op);
|
||||||
|
|
@ -214,7 +226,7 @@ where
|
||||||
maybe_right_op = right_iter.next();
|
maybe_right_op = right_iter.next();
|
||||||
last_right_op = Some(result.clone());
|
last_right_op = Some(result.clone());
|
||||||
|
|
||||||
result
|
(Side::Right, result)
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
@ -227,13 +239,21 @@ where
|
||||||
}
|
}
|
||||||
|
|
||||||
merged_operations.push(result);
|
merged_operations.push(result);
|
||||||
|
merged_operation_sides.push(side);
|
||||||
}
|
}
|
||||||
|
|
||||||
for cursor in left_cursors.chain(right_cursors) {
|
for cursor in left_cursors.chain(right_cursors) {
|
||||||
merged_cursors.push(cursor.with_index(merged_length));
|
merged_cursors.push(cursor.with_index(merged_length));
|
||||||
}
|
}
|
||||||
|
|
||||||
Self::new(self.text, merged_operations, merged_cursors)
|
debug_assert_eq!(merged_operations.len(), merged_operation_sides.len());
|
||||||
|
|
||||||
|
Self::new(
|
||||||
|
self.text,
|
||||||
|
merged_operations,
|
||||||
|
merged_operation_sides,
|
||||||
|
merged_cursors,
|
||||||
|
)
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Apply the operations to the text and return the resulting text.
|
/// Apply the operations to the text and return the resulting text.
|
||||||
|
|
@ -288,14 +308,14 @@ where
|
||||||
|
|
||||||
let mut history = Vec::with_capacity(self.operations.len());
|
let mut history = Vec::with_capacity(self.operations.len());
|
||||||
|
|
||||||
for operation in &self.operations {
|
for (operation, side) in self.operations.iter().zip(self.operation_sides.iter()) {
|
||||||
builder = operation.apply(builder);
|
builder = operation.apply(builder);
|
||||||
|
|
||||||
match operation {
|
match operation {
|
||||||
Operation::Equal { .. } => {
|
Operation::Equal { .. } => {
|
||||||
history.push(SpanWithHistory::new(builder.take(), History::Unchanged));
|
history.push(SpanWithHistory::new(builder.take(), History::Unchanged));
|
||||||
}
|
}
|
||||||
Operation::Insert { side, .. } => match side {
|
Operation::Insert { .. } => match side {
|
||||||
Side::Left => {
|
Side::Left => {
|
||||||
history.push(SpanWithHistory::new(builder.take(), History::AddedFromLeft));
|
history.push(SpanWithHistory::new(builder.take(), History::AddedFromLeft));
|
||||||
}
|
}
|
||||||
|
|
@ -307,7 +327,6 @@ where
|
||||||
Operation::Delete {
|
Operation::Delete {
|
||||||
deleted_character_count,
|
deleted_character_count,
|
||||||
order,
|
order,
|
||||||
side,
|
|
||||||
..
|
..
|
||||||
} => {
|
} => {
|
||||||
let deleted = self.text[*order..*order + *deleted_character_count].to_string();
|
let deleted = self.text[*order..*order + *deleted_character_count].to_string();
|
||||||
|
|
@ -325,6 +344,37 @@ where
|
||||||
|
|
||||||
history
|
history
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Serialize the `EditedText` as a `ChangeSet`, which contains only
|
||||||
|
/// the operations and cursor positions, but without the original text.
|
||||||
|
/// This is useful for sending changes over the network if there's
|
||||||
|
/// a clear consensus on the original text.
|
||||||
|
#[must_use]
|
||||||
|
pub fn to_change_set(&self) -> ChangeSet {
|
||||||
|
ChangeSet::new(
|
||||||
|
SimpleOperation::from_operations(&self.operations),
|
||||||
|
self.cursors.clone(),
|
||||||
|
)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Deserialize an `EditedText` from a `ChangeSet` and the original text.
|
||||||
|
/// This is useful for reconstructing the `EditedText` on the receiving
|
||||||
|
/// end after sending only the `ChangeSet` over the network.
|
||||||
|
#[must_use]
|
||||||
|
pub fn from_change_set(
|
||||||
|
text: &'a str,
|
||||||
|
change_set: ChangeSet,
|
||||||
|
tokenizer: &Tokenizer<T>,
|
||||||
|
) -> EditedText<'a, T> {
|
||||||
|
let operations = SimpleOperation::to_operations(change_set.operations, text, tokenizer);
|
||||||
|
let operation_count = operations.len();
|
||||||
|
EditedText::new(
|
||||||
|
text,
|
||||||
|
operations,
|
||||||
|
vec![Side::Left; operation_count],
|
||||||
|
change_set.cursors,
|
||||||
|
)
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#[cfg(test)]
|
#[cfg(test)]
|
||||||
|
|
@ -339,7 +389,7 @@ mod tests {
|
||||||
let left = "hello world! How are you? Adam";
|
let left = "hello world! How are you? Adam";
|
||||||
let right = "Hello, my friend! How are you doing? Albert";
|
let right = "Hello, my friend! How are you doing? Albert";
|
||||||
|
|
||||||
let operations = EditedText::from_strings(left, &right.into(), Side::Right);
|
let operations = EditedText::from_strings(left, &right.into());
|
||||||
|
|
||||||
insta::assert_debug_snapshot!(operations);
|
insta::assert_debug_snapshot!(operations);
|
||||||
|
|
||||||
|
|
@ -351,7 +401,7 @@ mod tests {
|
||||||
fn test_calculate_operations_with_no_diff() {
|
fn test_calculate_operations_with_no_diff() {
|
||||||
let text = "hello world!";
|
let text = "hello world!";
|
||||||
|
|
||||||
let operations = EditedText::from_strings(text, &text.into(), Side::Right);
|
let operations = EditedText::from_strings(text, &text.into());
|
||||||
|
|
||||||
assert_debug_snapshot!(operations);
|
assert_debug_snapshot!(operations);
|
||||||
|
|
||||||
|
|
@ -366,10 +416,42 @@ mod tests {
|
||||||
let right = "Hello world! How are you?";
|
let right = "Hello world! How are you?";
|
||||||
let expected = "Hello world! How are you? I'm Andras.";
|
let expected = "Hello world! How are you? I'm Andras.";
|
||||||
|
|
||||||
let operations_1 = EditedText::from_strings(original, &left.into(), Side::Left);
|
let operations_1 = EditedText::from_strings(original, &left.into());
|
||||||
let operations_2 = EditedText::from_strings(original, &right.into(), Side::Right);
|
let operations_2 = EditedText::from_strings(original, &right.into());
|
||||||
|
|
||||||
let operations = operations_1.merge(operations_2);
|
let operations = operations_1.merge(operations_2);
|
||||||
assert_eq!(operations.apply().text(), expected);
|
assert_eq!(operations.apply().text(), expected);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_change_set_deserialisation() {
|
||||||
|
let original = "Merging text is hard!";
|
||||||
|
let changes = "Merging text is easy with reconcile!";
|
||||||
|
let result = EditedText::from_strings(original, &changes.into());
|
||||||
|
let serialized = serde_yaml::to_string(&result.to_change_set()).unwrap();
|
||||||
|
|
||||||
|
let expected = concat!(
|
||||||
|
"operations:\n",
|
||||||
|
"- 15\n",
|
||||||
|
"- -6\n",
|
||||||
|
"- ' easy with reconcile!'\n",
|
||||||
|
"cursors: []\n"
|
||||||
|
);
|
||||||
|
|
||||||
|
assert_eq!(serialized, expected);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_change_set_serialization() {
|
||||||
|
let original = "The quick brown fox jumps over the lazy dog.";
|
||||||
|
let updated = "The quick red fox jumped over the very lazy dog!";
|
||||||
|
|
||||||
|
let edited_text = EditedText::from_strings(original, &updated.into());
|
||||||
|
|
||||||
|
let change_set = edited_text.to_change_set();
|
||||||
|
let deserialized_edited_text =
|
||||||
|
EditedText::from_change_set(original, change_set, &*BuiltinTokenizer::Word);
|
||||||
|
|
||||||
|
assert_eq!(deserialized_edited_text.apply().text(), updated);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -4,7 +4,7 @@ use core::fmt::{Debug, Display};
|
||||||
use serde::{Deserialize, Serialize};
|
use serde::{Deserialize, Serialize};
|
||||||
|
|
||||||
use crate::{
|
use crate::{
|
||||||
Side, Token,
|
Token,
|
||||||
utils::{
|
utils::{
|
||||||
find_longest_prefix_contained_within::find_longest_prefix_contained_within,
|
find_longest_prefix_contained_within::find_longest_prefix_contained_within,
|
||||||
string_builder::StringBuilder,
|
string_builder::StringBuilder,
|
||||||
|
|
@ -23,23 +23,21 @@ where
|
||||||
length: usize,
|
length: usize,
|
||||||
|
|
||||||
#[cfg(debug_assertions)]
|
#[cfg(debug_assertions)]
|
||||||
|
#[cfg_attr(feature = "serde", serde(skip_serializing))]
|
||||||
text: Option<String>,
|
text: Option<String>,
|
||||||
},
|
},
|
||||||
|
|
||||||
Insert {
|
Insert {
|
||||||
side: Side,
|
|
||||||
|
|
||||||
order: usize,
|
order: usize,
|
||||||
text: Vec<Token<T>>,
|
text: Vec<Token<T>>,
|
||||||
},
|
},
|
||||||
|
|
||||||
Delete {
|
Delete {
|
||||||
side: Side,
|
|
||||||
|
|
||||||
order: usize,
|
order: usize,
|
||||||
deleted_character_count: usize,
|
deleted_character_count: usize,
|
||||||
|
|
||||||
#[cfg(debug_assertions)]
|
#[cfg(debug_assertions)]
|
||||||
|
#[cfg_attr(feature = "serde", serde(skip_serializing))]
|
||||||
deleted_text: Option<String>,
|
deleted_text: Option<String>,
|
||||||
},
|
},
|
||||||
}
|
}
|
||||||
|
|
@ -72,15 +70,14 @@ where
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Creates an insert operation with the given index and text.
|
/// Creates an insert operation with the given index and text.
|
||||||
pub fn create_insert(order: usize, text: Vec<Token<T>>, side: Side) -> Self {
|
pub fn create_insert(order: usize, text: Vec<Token<T>>) -> Self {
|
||||||
Operation::Insert { side, order, text }
|
Operation::Insert { order, text }
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Creates a delete operation with the given index and number of
|
/// Creates a delete operation with the given index and number of
|
||||||
/// to-be-deleted characters.
|
/// to-be-deleted characters.
|
||||||
pub fn create_delete(order: usize, deleted_character_count: usize, side: Side) -> Self {
|
pub fn create_delete(order: usize, deleted_character_count: usize) -> Self {
|
||||||
Operation::Delete {
|
Operation::Delete {
|
||||||
side,
|
|
||||||
order,
|
order,
|
||||||
deleted_character_count,
|
deleted_character_count,
|
||||||
|
|
||||||
|
|
@ -89,9 +86,8 @@ where
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn create_delete_with_text(order: usize, text: String, side: Side) -> Self {
|
pub fn create_delete_with_text(order: usize, text: String) -> Self {
|
||||||
Operation::Delete {
|
Operation::Delete {
|
||||||
side,
|
|
||||||
order,
|
order,
|
||||||
deleted_character_count: text.chars().count(),
|
deleted_character_count: text.chars().count(),
|
||||||
|
|
||||||
|
|
@ -206,7 +202,7 @@ where
|
||||||
|
|
||||||
match (operation, previous_operation) {
|
match (operation, previous_operation) {
|
||||||
(
|
(
|
||||||
Operation::Insert { side, order, text },
|
Operation::Insert { order, text },
|
||||||
Some(Operation::Insert {
|
Some(Operation::Insert {
|
||||||
text: previous_inserted_text,
|
text: previous_inserted_text,
|
||||||
..
|
..
|
||||||
|
|
@ -218,12 +214,11 @@ where
|
||||||
let offset_in_tokens =
|
let offset_in_tokens =
|
||||||
find_longest_prefix_contained_within(previous_inserted_text, &text);
|
find_longest_prefix_contained_within(previous_inserted_text, &text);
|
||||||
|
|
||||||
Operation::create_insert(order, text[offset_in_tokens..].to_vec(), side)
|
Operation::create_insert(order, text[offset_in_tokens..].to_vec())
|
||||||
}
|
}
|
||||||
|
|
||||||
(
|
(
|
||||||
Operation::Delete {
|
Operation::Delete {
|
||||||
side,
|
|
||||||
order,
|
order,
|
||||||
deleted_character_count,
|
deleted_character_count,
|
||||||
|
|
||||||
|
|
@ -247,20 +242,19 @@ where
|
||||||
|
|
||||||
#[cfg(debug_assertions)]
|
#[cfg(debug_assertions)]
|
||||||
let updated_delete = deleted_text.as_ref().map_or_else(
|
let updated_delete = deleted_text.as_ref().map_or_else(
|
||||||
|| Operation::create_delete(order + overlap, new_length, side),
|
|| Operation::create_delete(order + overlap, new_length),
|
||||||
|text| {
|
|text| {
|
||||||
Operation::create_delete_with_text(
|
Operation::create_delete_with_text(
|
||||||
order + overlap,
|
order + overlap,
|
||||||
text.chars()
|
text.chars()
|
||||||
.skip(deleted_character_count - new_length)
|
.skip(deleted_character_count - new_length)
|
||||||
.collect::<String>(),
|
.collect::<String>(),
|
||||||
side,
|
|
||||||
)
|
)
|
||||||
},
|
},
|
||||||
);
|
);
|
||||||
|
|
||||||
#[cfg(not(debug_assertions))]
|
#[cfg(not(debug_assertions))]
|
||||||
let updated_delete = Operation::create_delete(order + overlap, new_length, side);
|
let updated_delete = Operation::create_delete(order + overlap, new_length);
|
||||||
|
|
||||||
updated_delete
|
updated_delete
|
||||||
}
|
}
|
||||||
|
|
@ -405,8 +399,7 @@ mod tests {
|
||||||
#[test]
|
#[test]
|
||||||
fn test_apply_delete_with_create() {
|
fn test_apply_delete_with_create() {
|
||||||
let builder = StringBuilder::new("hello world");
|
let builder = StringBuilder::new("hello world");
|
||||||
let delete_operation =
|
let delete_operation = Operation::<()>::create_delete_with_text(0, "hello ".to_owned());
|
||||||
Operation::<()>::create_delete_with_text(0, "hello ".to_owned(), Side::Left);
|
|
||||||
let retain_operation = Operation::<()>::create_equal(6, 5);
|
let retain_operation = Operation::<()>::create_equal(6, 5);
|
||||||
|
|
||||||
let mut builder = delete_operation.apply(builder);
|
let mut builder = delete_operation.apply(builder);
|
||||||
|
|
@ -420,7 +413,7 @@ mod tests {
|
||||||
let builder = StringBuilder::new("hello");
|
let builder = StringBuilder::new("hello");
|
||||||
|
|
||||||
let retain_operation = Operation::<()>::create_equal(0, 5);
|
let retain_operation = Operation::<()>::create_equal(0, 5);
|
||||||
let insert_operation = Operation::create_insert(5, vec![" my friend".into()], Side::Right);
|
let insert_operation = Operation::create_insert(5, vec![" my friend".into()]);
|
||||||
|
|
||||||
let mut builder = retain_operation.apply(builder);
|
let mut builder = retain_operation.apply(builder);
|
||||||
builder = insert_operation.apply(builder);
|
builder = insert_operation.apply(builder);
|
||||||
|
|
|
||||||
|
|
@ -1,7 +1,6 @@
|
||||||
---
|
---
|
||||||
source: src/operation_transformation/edited_text.rs
|
source: src/operation_transformation/edited_text.rs
|
||||||
expression: operations
|
expression: operations
|
||||||
snapshot_kind: text
|
|
||||||
---
|
---
|
||||||
EditedText {
|
EditedText {
|
||||||
text: "hello world! How are you? Adam",
|
text: "hello world! How are you? Adam",
|
||||||
|
|
@ -15,5 +14,15 @@ EditedText {
|
||||||
<delete ' you? Adam' from 20>,
|
<delete ' you? Adam' from 20>,
|
||||||
<insert ' you doing? Albert' at 31>,
|
<insert ' you doing? Albert' at 31>,
|
||||||
],
|
],
|
||||||
|
operation_sides: [
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
],
|
||||||
cursors: [],
|
cursors: [],
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -1,7 +1,6 @@
|
||||||
---
|
---
|
||||||
source: src/operation_transformation/edited_text.rs
|
source: src/operation_transformation/edited_text.rs
|
||||||
expression: operations
|
expression: operations
|
||||||
snapshot_kind: text
|
|
||||||
---
|
---
|
||||||
EditedText {
|
EditedText {
|
||||||
text: "hello world!",
|
text: "hello world!",
|
||||||
|
|
@ -10,5 +9,10 @@ EditedText {
|
||||||
<equal ' ' from 5>,
|
<equal ' ' from 5>,
|
||||||
<equal 'world!' from 6>,
|
<equal 'world!' from 6>,
|
||||||
],
|
],
|
||||||
|
operation_sides: [
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
Left,
|
||||||
|
],
|
||||||
cursors: [],
|
cursors: [],
|
||||||
}
|
}
|
||||||
|
|
|
||||||
204
src/operation_transformation/transport.rs
Normal file
204
src/operation_transformation/transport.rs
Normal file
|
|
@ -0,0 +1,204 @@
|
||||||
|
use std::fmt::Debug;
|
||||||
|
|
|||||||
|
|
||||||
|
#[cfg(feature = "serde")]
|
||||||
|
use serde::{
|
||||||
|
Deserialize, Serialize,
|
||||||
|
de::{self, Deserializer, Visitor},
|
||||||
|
ser::Serializer,
|
||||||
|
};
|
||||||
|
|
||||||
|
use crate::{CursorPosition, Tokenizer, operation_transformation::Operation};
|
||||||
|
|
||||||
|
/// A compact, position-free edit step used for transporting diffs.
///
/// A sequence of these is applied to the original text from left to right:
/// each step either keeps, inserts, or removes text at the current position.
#[derive(Clone, PartialEq, Eq, Debug)]
pub enum SimpleOperation {
    /// Keep the next `length` characters of the original text unchanged.
    Equal { length: usize },
    /// Insert `text` at the current position.
    Insert { text: String },
    /// Remove the next `length` characters of the original text.
    Delete { length: usize },
}
|
||||||
|
|
||||||
|
impl SimpleOperation {
|
||||||
|
pub fn from_operations<T>(operation: &Vec<Operation<T>>) -> Vec<Self>
|
||||||
|
where
|
||||||
|
T: PartialEq + Clone + Debug,
|
||||||
|
{
|
||||||
|
let mut result: Vec<Self> = Vec::with_capacity(operation.len());
|
||||||
|
let mut previous_equal: Option<usize> = None;
|
||||||
|
|
||||||
|
for operation in operation {
|
||||||
|
match operation {
|
||||||
|
Operation::Equal { length, .. } => {
|
||||||
|
if let Some(prev_length) = previous_equal {
|
||||||
|
previous_equal = Some(prev_length + *length);
|
||||||
|
} else {
|
||||||
|
previous_equal = Some(*length);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Operation::Insert { text, .. } => {
|
||||||
|
if let Some(prev_length) = previous_equal {
|
||||||
|
result.push(SimpleOperation::Equal {
|
||||||
|
length: prev_length,
|
||||||
|
});
|
||||||
|
previous_equal = None;
|
||||||
|
}
|
||||||
|
|
||||||
|
let text: String = text
|
||||||
|
.iter()
|
||||||
|
.map(super::super::tokenizer::token::Token::original)
|
||||||
|
.collect();
|
||||||
|
result.push(SimpleOperation::Insert { text });
|
||||||
|
}
|
||||||
|
|
||||||
|
Operation::Delete {
|
||||||
|
deleted_character_count,
|
||||||
|
..
|
||||||
|
} => {
|
||||||
|
if let Some(prev_length) = previous_equal {
|
||||||
|
result.push(SimpleOperation::Equal {
|
||||||
|
length: prev_length,
|
||||||
|
});
|
||||||
|
previous_equal = None;
|
||||||
|
}
|
||||||
|
|
||||||
|
result.push(SimpleOperation::Delete {
|
||||||
|
length: *deleted_character_count,
|
||||||
|
});
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if let Some(prev_length) = previous_equal {
|
||||||
|
result.push(SimpleOperation::Equal {
|
||||||
|
length: prev_length,
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
result
|
||||||
|
}
|
||||||
|
|
||||||
|
// This is similar to `crate::operation_transformation::utils::cook_operations`
|
||||||
|
pub fn to_operations<T>(
|
||||||
|
simple_operations: Vec<Self>,
|
||||||
|
original_text: &str,
|
||||||
|
tokenizer: &Tokenizer<T>,
|
||||||
|
) -> Vec<Operation<T>>
|
||||||
|
where
|
||||||
|
T: PartialEq + Clone + Debug,
|
||||||
|
{
|
||||||
|
let mut operations: Vec<Operation<T>> = Vec::with_capacity(simple_operations.len());
|
||||||
|
let mut order = 0;
|
||||||
|
|
||||||
|
for simple_operation in simple_operations {
|
||||||
|
match simple_operation {
|
||||||
|
SimpleOperation::Equal { length } => {
|
||||||
|
let original_characters: String =
|
||||||
|
original_text.chars().skip(order).take(length).collect();
|
||||||
|
|
||||||
|
let original_tokens = tokenizer(&original_characters);
|
||||||
|
for token in original_tokens {
|
||||||
|
operations
|
||||||
|
.push(Operation::create_equal(order, token.get_original_length()));
|
||||||
|
order += token.get_original_length();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
SimpleOperation::Insert { text } => {
|
||||||
|
let tokens = tokenizer(&text);
|
||||||
|
operations.push(Operation::create_insert(order, tokens));
|
||||||
|
}
|
||||||
|
|
||||||
|
SimpleOperation::Delete { length } => {
|
||||||
|
operations.push(Operation::create_delete(order, length));
|
||||||
|
order += length;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
operations
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[cfg(feature = "serde")]
impl Serialize for SimpleOperation {
    /// Serialize as a bare scalar: a non-negative integer for `Equal`, a
    /// string for `Insert`, and a negated integer for `Delete`.
    ///
    /// Fails with a serializer error when a delete length cannot be
    /// represented as a signed 64-bit integer, rather than silently writing a
    /// different length.
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where
        S: Serializer,
    {
        // neat idea from https://github.com/spebern/operational-transform-rs/blob/9faa17f0a2b282ac2e09dbb2d29fdaf2ae0bbb4a/operational-transform/src/serde.rs#L14
        match self {
            SimpleOperation::Equal { length } => serializer.serialize_u64(*length as u64),
            SimpleOperation::Insert { text } => serializer.serialize_str(text),
            SimpleOperation::Delete { length } => {
                let magnitude = i64::try_from(*length).map_err(|_| {
                    <S::Error as serde::ser::Error>::custom(
                        "delete length does not fit in a signed 64-bit integer",
                    )
                })?;
                serializer.serialize_i64(-magnitude)
            }
        }
    }
}
|
||||||
|
|
||||||
|
#[cfg(feature = "serde")]
impl<'de> Deserialize<'de> for SimpleOperation {
    /// Deserialize from a bare scalar: a non-negative integer becomes
    /// `Equal`, a negative integer becomes `Delete` with the integer's
    /// magnitude as length, and a string becomes `Insert`.
    ///
    /// Integers whose magnitude does not fit in `usize` are rejected with an
    /// "invalid value" error.
    fn deserialize<D>(deserializer: D) -> Result<SimpleOperation, D::Error>
    where
        D: Deserializer<'de>,
    {
        use std::fmt;

        struct OperationVisitor;

        impl Visitor<'_> for OperationVisitor {
            type Value = SimpleOperation;

            fn expecting(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
                formatter.write_str("an integer between -2^63 and 2^64-1 or a string")
            }

            fn visit_u64<E>(self, value: u64) -> Result<Self::Value, E>
            where
                E: de::Error,
            {
                usize::try_from(value)
                    .map(|length| SimpleOperation::Equal { length })
                    .map_err(|_| E::invalid_value(de::Unexpected::Unsigned(value), &self))
            }

            fn visit_i64<E>(self, value: i64) -> Result<Self::Value, E>
            where
                E: de::Error,
            {
                // Some data formats report every integer through `visit_i64`;
                // a non-negative value is still an `Equal`, not a `Delete`.
                if value >= 0 {
                    return self.visit_u64(value.unsigned_abs());
                }

                // `unsigned_abs` cannot overflow, unlike `-value` for `i64::MIN`.
                usize::try_from(value.unsigned_abs())
                    .map(|length| SimpleOperation::Delete { length })
                    .map_err(|_| E::invalid_value(de::Unexpected::Signed(value), &self))
            }

            fn visit_str<E>(self, value: &str) -> Result<Self::Value, E>
            where
                E: de::Error,
            {
                Ok(SimpleOperation::Insert {
                    text: value.to_owned(),
                })
            }
        }

        deserializer.deserialize_any(OperationVisitor)
    }
}
|
||||||
|
|
||||||
|
/// A serializable representation of the changes made to a text document
|
||||||
|
/// without the original text.
|
||||||
|
#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
|
||||||
|
#[derive(Debug, Clone, PartialEq, Default)]
|
||||||
|
pub struct ChangeSet {
|
||||||
|
pub operations: Vec<SimpleOperation>,
|
||||||
|
pub cursors: Vec<CursorPosition>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl ChangeSet {
|
||||||
|
#[must_use]
|
||||||
|
pub fn new(operations: Vec<SimpleOperation>, cursors: Vec<CursorPosition>) -> Self {
|
||||||
|
Self {
|
||||||
|
operations,
|
||||||
|
cursors,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
@ -1,10 +1,10 @@
|
||||||
use std::fmt::Debug;
|
use std::fmt::Debug;
|
||||||
|
|
||||||
use crate::{operation_transformation::Operation, raw_operation::RawOperation, types::side::Side};
|
use crate::{operation_transformation::Operation, raw_operation::RawOperation};
|
||||||
|
|
||||||
/// Turn raw operations into ordered operations while keeping track of the
|
/// Turn raw operations into ordered operations while keeping track of the
|
||||||
/// original token's indexes.
|
/// original token's indexes.
|
||||||
pub fn cook_operations<I, T>(raw_operations: I, side: Side) -> impl Iterator<Item = Operation<T>>
|
pub fn cook_operations<I, T>(raw_operations: I) -> impl Iterator<Item = Operation<T>>
|
||||||
where
|
where
|
||||||
I: IntoIterator<Item = RawOperation<T>>,
|
I: IntoIterator<Item = RawOperation<T>>,
|
||||||
T: PartialEq + Clone + Debug,
|
T: PartialEq + Clone + Debug,
|
||||||
|
|
@ -29,18 +29,15 @@ where
|
||||||
|
|
||||||
op
|
op
|
||||||
}
|
}
|
||||||
RawOperation::Insert(tokens) => {
|
RawOperation::Insert(tokens) => Operation::create_insert(original_text_index, tokens),
|
||||||
Operation::create_insert(original_text_index, tokens, side)
|
|
||||||
}
|
|
||||||
RawOperation::Delete(..) => {
|
RawOperation::Delete(..) => {
|
||||||
let op = if cfg!(debug_assertions) {
|
let op = if cfg!(debug_assertions) {
|
||||||
Operation::create_delete_with_text(
|
Operation::create_delete_with_text(
|
||||||
original_text_index,
|
original_text_index,
|
||||||
raw_operation.get_original_text(),
|
raw_operation.get_original_text(),
|
||||||
side,
|
|
||||||
)
|
)
|
||||||
} else {
|
} else {
|
||||||
Operation::create_delete(original_text_index, length, side)
|
Operation::create_delete(original_text_index, length)
|
||||||
};
|
};
|
||||||
|
|
||||||
original_text_index += length;
|
original_text_index += length;
|
||||||
|
|
|
||||||
|
|
@ -1,4 +1,4 @@
|
||||||
use std::iter::Iterator;
|
use std::{fmt, iter::Iterator};
|
||||||
|
|
||||||
/// A helper for building a string in-order based on an original string and a
|
/// A helper for building a string in-order based on an original string and a
|
||||||
/// series of insertions, deletions, and copies applied to it. It is safe to use
|
/// series of insertions, deletions, and copies applied to it. It is safe to use
|
||||||
|
|
@ -12,6 +12,18 @@ pub struct StringBuilder<'a> {
|
||||||
remaining: String,
|
remaining: String,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
impl fmt::Debug for StringBuilder<'_> {
|
||||||
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
||||||
|
let mut debug_struct = f.debug_struct("StringBuilder");
|
||||||
|
debug_struct.field("buffer", &self.buffer);
|
||||||
|
|
||||||
|
#[cfg(debug_assertions)]
|
||||||
|
debug_struct.field("remaining", &self.remaining);
|
||||||
|
|
||||||
|
debug_struct.finish_non_exhaustive()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
impl StringBuilder<'_> {
|
impl StringBuilder<'_> {
|
||||||
pub fn new(original: &str) -> StringBuilder<'_> {
|
pub fn new(original: &str) -> StringBuilder<'_> {
|
||||||
StringBuilder {
|
StringBuilder {
|
||||||
|
|
|
||||||
19
src/wasm.rs
19
src/wasm.rs
|
|
@ -87,6 +87,25 @@ pub fn generic_reconcile(
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// WASM wrapper around getting a compact diff representation as a JSON string
|
||||||
|
///
|
||||||
|
/// # Panics
|
||||||
|
///
|
||||||
|
/// If serialization to JSON fails which should not happen
|
||||||
|
#[wasm_bindgen(js_name = getCompactDiff)]
|
||||||
|
#[must_use]
|
||||||
|
pub fn get_compact_diff(
|
||||||
|
parent: &str,
|
||||||
|
changed: &TextWithCursors,
|
||||||
|
tokenizer: BuiltinTokenizer,
|
||||||
|
) -> String {
|
||||||
|
set_panic_hook();
|
||||||
|
let edited_text = crate::EditedText::from_strings_with_tokenizer(parent, changed, &*tokenizer);
|
||||||
|
let change_set = edited_text.to_change_set();
|
||||||
|
|
||||||
|
serde_json::to_string(&change_set).expect("Failed to serialize change set")
|
||||||
|
}
|
||||||
|
|
||||||
/// Heuristically determine if the given data is a binary or a text file's
|
/// Heuristically determine if the given data is a binary or a text file's
|
||||||
/// content.
|
/// content.
|
||||||
#[wasm_bindgen(js_name = isBinary)]
|
#[wasm_bindgen(js_name = isBinary)]
|
||||||
|
|
|
||||||
|
|
@ -3,7 +3,7 @@ mod example_document;
|
||||||
use std::{fs, path::Path};
|
use std::{fs, path::Path};
|
||||||
|
|
||||||
use example_document::ExampleDocument;
|
use example_document::ExampleDocument;
|
||||||
use reconcile_text::{BuiltinTokenizer, reconcile};
|
use reconcile_text::{BuiltinTokenizer, EditedText, reconcile};
|
||||||
use serde::Deserialize;
|
use serde::Deserialize;
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
|
|
@ -34,6 +34,35 @@ fn test_document_one_way_with_cursors() {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Merging must give the expected document even after both sides' change sets
/// have been round-tripped through YAML.
#[test]
fn test_document_one_way_with_cursors_and_serialisation() {
    for doc in &get_all_documents() {
        let parent = doc.parent();
        let left_operations =
            EditedText::from_strings_with_tokenizer(&parent, &doc.left(), &*BuiltinTokenizer::Word);
        let right_operations = EditedText::from_strings_with_tokenizer(
            &parent,
            &doc.right(),
            &*BuiltinTokenizer::Word,
        );

        // Serialize each change set to YAML and immediately parse it back.
        let serialised_left =
            serde_yaml::from_str(&serde_yaml::to_string(&left_operations.to_change_set()).unwrap())
                .unwrap();
        let serialised_right = serde_yaml::from_str(
            &serde_yaml::to_string(&right_operations.to_change_set()).unwrap(),
        )
        .unwrap();

        // Rebuild the edited texts from the parsed change sets and the parent.
        let restored_left_operations =
            EditedText::from_change_set(&parent, serialised_left, &*BuiltinTokenizer::Word);
        let restored_right_operations =
            EditedText::from_change_set(&parent, serialised_right, &*BuiltinTokenizer::Word);

        doc.assert_eq(&restored_left_operations.merge(restored_right_operations));
    }
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_document_inverse_way_without_cursors() {
|
fn test_document_inverse_way_without_cursors() {
|
||||||
for doc in &get_all_documents() {
|
for doc in &get_all_documents() {
|
||||||
|
|
|
||||||
|
|
@ -46,7 +46,7 @@ fn test_merge_text_with_cursors() {
|
||||||
}
|
}
|
||||||
|
|
||||||
#[wasm_bindgen_test(unsupported = test)]
|
#[wasm_bindgen_test(unsupported = test)]
|
||||||
fn merge_binary() {
|
fn test_merge_binary() {
|
||||||
let left = [0, 1, 2];
|
let left = [0, 1, 2];
|
||||||
let right = [3, 4, 5];
|
let right = [3, 4, 5];
|
||||||
assert_eq!(
|
assert_eq!(
|
||||||
|
|
@ -62,6 +62,14 @@ fn test_is_binary() {
|
||||||
assert!(!is_binary(b"hello"));
|
assert!(!is_binary(b"hello"));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[wasm_bindgen_test(unsupported = test)]
|
||||||
|
fn test_get_compact_diff() {
|
||||||
|
let parent = "hello ";
|
||||||
|
let changed = "world";
|
||||||
|
let result = get_compact_diff(parent, &changed.into(), BuiltinTokenizer::Word);
|
||||||
|
assert_eq!(result, "{\"operations\":[-6,\"world\"],\"cursors\":[]}");
|
||||||
|
}
|
||||||
|
|
||||||
#[wasm_bindgen_test(unsupported = test)]
|
#[wasm_bindgen_test(unsupported = test)]
|
||||||
fn test_is_binary_empty() {
|
fn test_is_binary_empty() {
|
||||||
assert!(!is_binary(b""));
|
assert!(!is_binary(b""));
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue
The range description is incorrect. The actual range is -2^63 to 2^64-1 (i64::MIN to u64::MAX). The message should read 'an integer between -2^63 and 2^64-1 or a string'.