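//! Operational-transformation `Delta`: an ordered list of insert, retain and
//! delete operations, together with the `compose`, `transform`, `apply` and
//! `invert` algorithms that work on it.
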
use crate::{
2021-08-04 15:09:04 +08:00
core::{attributes::*, operation::*, Interval},
2021-08-04 07:55:54 +08:00
errors::OTError,
};
2021-07-31 20:53:45 +08:00
use bytecount::num_chars;
2021-08-03 23:13:20 +08:00
use std::{cmp::Ordering, fmt, iter::FromIterator, str::FromStr};
2021-07-31 20:53:45 +08:00
/// An ordered sequence of operations plus the character counts it expects
/// and produces.
///
/// `Default` yields a delta with no operations and both lengths at zero.
#[derive(Clone, Debug, Default, PartialEq)]
pub struct Delta {
    /// Operations in application order.
    pub ops: Vec<Operation>,
    /// Number of characters consumed from the input; grown by `delete` and
    /// `retain`.
    pub base_len: usize,
    /// Number of characters in the output; grown by `insert` and `retain`.
    pub target_len: usize,
}
2021-08-01 10:45:15 +08:00
impl FromStr for Delta {
    type Err = ();

    /// Builds a delta consisting of a single insertion of `s`.
    ///
    /// The insertion is routed through `Delta::add`; this function itself
    /// never returns `Err`.
    fn from_str(s: &str) -> Result<Delta, Self::Err> {
        let insertion = Operation::Insert(s.into());
        let mut parsed = Delta::with_capacity(1);
        parsed.add(insertion);
        Ok(parsed)
    }
}
impl<T: AsRef<str>> From<T> for Delta {
    /// Converts anything string-like into a delta via `Delta::from_str`.
    fn from(s: T) -> Delta {
        let text: &str = s.as_ref();
        // `from_str` only ever returns `Ok`, so this unwrap cannot fail.
        Delta::from_str(text).unwrap()
    }
}
2021-08-03 23:13:20 +08:00
impl fmt::Display for Delta {
    /// Writes the delta as its JSON serialization.
    ///
    /// If serialization fails, an empty string is written instead of
    /// reporting an error.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        // `unwrap_or_default` only builds the fallback on failure.
        let json = serde_json::to_string(self).unwrap_or_default();
        f.write_str(&json)
    }
}
2021-08-01 10:45:15 +08:00
impl FromIterator<Operation> for Delta {
    /// Collects operations into a delta, feeding each one through
    /// `Delta::add` in iteration order.
    fn from_iter<T: IntoIterator<Item = Operation>>(ops: T) -> Self {
        ops.into_iter().fold(Delta::default(), |mut delta, op| {
            delta.add(op);
            delta
        })
    }
}
2021-07-31 20:53:45 +08:00
impl Delta {
/// Creates an empty delta whose operation list is pre-allocated for
/// `capacity` operations. Both lengths start at zero.
#[inline]
pub fn with_capacity(capacity: usize) -> Self {
    let ops = Vec::with_capacity(capacity);
    Self {
        ops,
        base_len: 0,
        target_len: 0,
    }
}
2021-08-01 14:39:30 +08:00
pub fn add(&mut self, op: Operation) {
2021-08-01 10:45:15 +08:00
match op {
Operation::Delete(i) => self.delete(i),
2021-08-01 14:39:30 +08:00
Operation::Insert(i) => self.insert(&i.s, i.attributes),
2021-08-04 15:09:04 +08:00
Operation::Retain(r) => self.retain(r.n, r.attributes),
2021-08-01 10:45:15 +08:00
}
}
2021-07-31 20:53:45 +08:00
pub fn delete(&mut self, n: u64) {
if n == 0 {
return;
}
self.base_len += n as usize;
2021-08-01 10:45:15 +08:00
if let Some(Operation::Delete(n_last)) = self.ops.last_mut() {
*n_last += n;
} else {
self.ops.push(OpBuilder::delete(n).build());
2021-07-31 20:53:45 +08:00
}
}
2021-08-03 16:20:25 +08:00
pub fn insert(&mut self, s: &str, attrs: Attributes) {
2021-07-31 20:53:45 +08:00
if s.is_empty() {
return;
}
2021-08-01 10:45:15 +08:00
2021-08-01 16:39:32 +08:00
self.target_len += num_chars(s.as_bytes());
2021-08-01 10:45:15 +08:00
let new_last = match self.ops.as_mut_slice() {
[.., Operation::Insert(insert)] => {
2021-08-01 16:39:32 +08:00
//
2021-08-04 15:09:04 +08:00
insert.merge_or_new_op(s, attrs)
2021-07-31 20:53:45 +08:00
},
[.., Operation::Insert(pre_insert), Operation::Delete(_)] => {
2021-08-01 16:39:32 +08:00
//
2021-08-04 15:09:04 +08:00
pre_insert.merge_or_new_op(s, attrs)
2021-07-31 20:53:45 +08:00
},
2021-08-01 10:45:15 +08:00
[.., op_last @ Operation::Delete(_)] => {
2021-07-31 20:53:45 +08:00
let new_last = op_last.clone();
2021-08-01 16:39:32 +08:00
*op_last = OpBuilder::insert(s).attributes(attrs).build();
Some(new_last)
2021-07-31 20:53:45 +08:00
},
2021-08-01 16:39:32 +08:00
_ => Some(OpBuilder::insert(s).attributes(attrs).build()),
2021-07-31 20:53:45 +08:00
};
2021-08-01 16:39:32 +08:00
match new_last {
None => {},
Some(new_last) => self.ops.push(new_last),
}
2021-07-31 20:53:45 +08:00
}
2021-08-03 16:20:25 +08:00
pub fn retain(&mut self, n: u64, attrs: Attributes) {
2021-07-31 20:53:45 +08:00
if n == 0 {
return;
}
self.base_len += n as usize;
self.target_len += n as usize;
if let Some(Operation::Retain(retain)) = self.ops.last_mut() {
2021-08-04 15:09:04 +08:00
if let Some(new_op) = retain.merge_or_new_op(n, attrs) {
self.ops.push(new_op);
2021-08-01 16:39:32 +08:00
}
2021-08-01 10:45:15 +08:00
} else {
self.ops
2021-08-01 14:39:30 +08:00
.push(OpBuilder::retain(n).attributes(attrs).build());
2021-07-31 20:53:45 +08:00
}
}
/// Merges the operation with `other` into one operation while preserving
/// the changes of both. Or, in other words, for each input string S and a
/// pair of consecutive operations A and B.
/// `apply(apply(S, A), B) = apply(S, compose(A, B))`
/// must hold.
///
/// # Error
///
/// Returns an `OTError` if the operations are not composable due to length
/// conflicts.
pub fn compose(&self, other: &Self) -> Result<Self, OTError> {
if self.target_len != other.base_len {
return Err(OTError);
}
let mut new_delta = Delta::default();
let mut ops1 = self.ops.iter().cloned();
let mut ops2 = other.ops.iter().cloned();
2021-08-01 10:45:15 +08:00
let mut next_op1 = ops1.next();
let mut next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
loop {
2021-08-01 10:45:15 +08:00
match (&next_op1, &next_op2) {
2021-07-31 20:53:45 +08:00
(None, None) => break,
2021-08-01 10:45:15 +08:00
(Some(Operation::Delete(i)), _) => {
2021-07-31 20:53:45 +08:00
new_delta.delete(*i);
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
(_, Some(Operation::Insert(o_insert))) => {
2021-08-03 16:20:25 +08:00
new_delta.insert(
&o_insert.s,
attributes_from(&next_op2).unwrap_or(Attributes::Empty),
);
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
(None, _) | (_, None) => {
return Err(OTError);
},
(Some(Operation::Retain(retain)), Some(Operation::Retain(o_retain))) => {
2021-08-03 16:20:25 +08:00
let composed_attrs = compose_attributes(&next_op1, &next_op2);
2021-08-02 23:08:24 +08:00
log::debug!(
"[retain:{} - retain:{}]: {:?}",
2021-08-04 15:09:04 +08:00
retain.n,
o_retain.n,
2021-08-02 23:08:24 +08:00
composed_attrs
);
match retain.cmp(&o_retain) {
2021-07-31 23:22:17 +08:00
Ordering::Less => {
2021-08-04 15:09:04 +08:00
new_delta.retain(retain.n, composed_attrs);
next_op2 = Some(OpBuilder::retain(o_retain.n - retain.n).build());
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 23:22:17 +08:00
},
std::cmp::Ordering::Equal => {
2021-08-04 15:09:04 +08:00
new_delta.retain(retain.n, composed_attrs);
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
next_op2 = ops2.next();
2021-07-31 23:22:17 +08:00
},
std::cmp::Ordering::Greater => {
2021-08-04 15:09:04 +08:00
new_delta.retain(o_retain.n, composed_attrs);
next_op1 = Some(OpBuilder::retain(retain.n - o_retain.n).build());
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 23:22:17 +08:00
},
}
2021-07-31 20:53:45 +08:00
},
(Some(Operation::Insert(insert)), Some(Operation::Delete(o_num))) => {
match (num_chars(insert.as_bytes()) as u64).cmp(o_num) {
2021-07-31 20:53:45 +08:00
Ordering::Less => {
2021-08-01 10:45:15 +08:00
next_op2 = Some(
OpBuilder::delete(*o_num - num_chars(insert.as_bytes()) as u64)
2021-08-03 16:20:25 +08:00
.attributes(insert.attributes.clone())
.build(),
2021-07-31 20:53:45 +08:00
);
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Equal => {
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Greater => {
2021-08-01 10:45:15 +08:00
next_op1 = Some(
2021-08-01 16:39:32 +08:00
OpBuilder::insert(
&insert.chars().skip(*o_num as usize).collect::<String>(),
2021-08-01 16:39:32 +08:00
)
.build(),
2021-07-31 20:53:45 +08:00
);
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
}
},
(Some(Operation::Insert(insert)), Some(Operation::Retain(o_retain))) => {
2021-08-03 16:20:25 +08:00
let composed_attrs = compose_attributes(&next_op1, &next_op2);
2021-08-02 23:08:24 +08:00
log::debug!(
"[insert:{} - retain:{}]: {:?}",
insert.s,
2021-08-04 15:09:04 +08:00
o_retain.n,
2021-08-02 23:08:24 +08:00
composed_attrs
);
match (insert.num_chars()).cmp(o_retain) {
2021-07-31 20:53:45 +08:00
Ordering::Less => {
new_delta.insert(&insert.s, composed_attrs.clone());
next_op2 = Some(
2021-08-04 15:09:04 +08:00
OpBuilder::retain(o_retain.n - insert.num_chars())
.attributes(composed_attrs.clone())
.build(),
);
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Equal => {
new_delta.insert(&insert.s, composed_attrs);
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Greater => {
2021-08-01 10:45:15 +08:00
let chars = &mut insert.chars();
new_delta.insert(
2021-08-04 15:09:04 +08:00
&chars.take(o_retain.n as usize).collect::<String>(),
composed_attrs,
);
2021-08-03 16:20:25 +08:00
next_op1 = Some(
OpBuilder::insert(&chars.collect::<String>())
.attributes(Attributes::Empty)
.build(),
);
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
}
},
(Some(Operation::Retain(retain)), Some(Operation::Delete(o_num))) => {
match retain.cmp(&o_num) {
Ordering::Less => {
2021-08-04 15:09:04 +08:00
new_delta.delete(retain.n);
next_op2 = Some(OpBuilder::delete(*o_num - retain.n).build());
next_op1 = ops1.next();
},
Ordering::Equal => {
new_delta.delete(*o_num);
next_op2 = ops2.next();
next_op1 = ops1.next();
},
Ordering::Greater => {
new_delta.delete(*o_num);
2021-08-04 15:09:04 +08:00
next_op1 = Some(OpBuilder::retain(retain.n - *o_num).build());
next_op2 = ops2.next();
},
}
2021-07-31 20:53:45 +08:00
},
};
}
Ok(new_delta)
}
/// Transforms two operations A and B that happened concurrently and
/// produces two operations A' and B' (in an array) such that
/// `apply(apply(S, A), B') = apply(apply(S, B), A')`.
/// This function is the heart of OT.
///
/// # Error
///
/// Returns an `OTError` if the operations cannot be transformed due to
/// length conflicts.
pub fn transform(&self, other: &Self) -> Result<(Self, Self), OTError> {
if self.base_len != other.base_len {
return Err(OTError);
}
let mut a_prime = Delta::default();
let mut b_prime = Delta::default();
let mut ops1 = self.ops.iter().cloned();
let mut ops2 = other.ops.iter().cloned();
2021-08-01 10:45:15 +08:00
let mut next_op1 = ops1.next();
let mut next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
loop {
2021-08-01 10:45:15 +08:00
match (&next_op1, &next_op2) {
2021-07-31 20:53:45 +08:00
(None, None) => break,
2021-08-01 10:45:15 +08:00
(Some(Operation::Insert(insert)), _) => {
// let composed_attrs = transform_attributes(&next_op1, &next_op2, true);
a_prime.insert(&insert.s, insert.attributes.clone());
b_prime.retain(insert.num_chars(), insert.attributes.clone());
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
(_, Some(Operation::Insert(o_insert))) => {
let composed_attrs = transform_attributes(&next_op1, &next_op2, true);
a_prime.retain(o_insert.num_chars(), composed_attrs.clone());
2021-08-03 16:20:25 +08:00
b_prime.insert(&o_insert.s, composed_attrs);
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
(None, _) => {
return Err(OTError);
},
(_, None) => {
return Err(OTError);
},
(Some(Operation::Retain(retain)), Some(Operation::Retain(o_retain))) => {
let composed_attrs = transform_attributes(&next_op1, &next_op2, true);
match retain.cmp(&o_retain) {
2021-07-31 20:53:45 +08:00
Ordering::Less => {
2021-08-04 15:09:04 +08:00
a_prime.retain(retain.n, composed_attrs.clone());
b_prime.retain(retain.n, composed_attrs.clone());
next_op2 = Some(OpBuilder::retain(o_retain.n - retain.n).build());
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Equal => {
2021-08-04 15:09:04 +08:00
a_prime.retain(retain.n, composed_attrs.clone());
b_prime.retain(retain.n, composed_attrs.clone());
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Greater => {
2021-08-04 15:09:04 +08:00
a_prime.retain(o_retain.n, composed_attrs.clone());
b_prime.retain(o_retain.n, composed_attrs.clone());
next_op1 = Some(OpBuilder::retain(retain.n - o_retain.n).build());
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
};
},
2021-08-01 10:45:15 +08:00
(Some(Operation::Delete(i)), Some(Operation::Delete(j))) => match i.cmp(&j) {
2021-07-31 20:53:45 +08:00
Ordering::Less => {
2021-08-01 10:45:15 +08:00
next_op2 = Some(OpBuilder::delete(*j - *i).build());
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Equal => {
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Greater => {
2021-08-01 10:45:15 +08:00
next_op1 = Some(OpBuilder::delete(*i - *j).build());
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
},
(Some(Operation::Delete(i)), Some(Operation::Retain(o_retain))) => {
match i.cmp(&o_retain) {
2021-07-31 20:53:45 +08:00
Ordering::Less => {
a_prime.delete(*i);
2021-08-04 15:09:04 +08:00
next_op2 = Some(OpBuilder::retain(o_retain.n - *i).build());
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Equal => {
a_prime.delete(*i);
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Greater => {
2021-08-04 15:09:04 +08:00
a_prime.delete(o_retain.n);
next_op1 = Some(OpBuilder::delete(*i - o_retain.n).build());
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
};
},
(Some(Operation::Retain(retain)), Some(Operation::Delete(j))) => {
match retain.cmp(&j) {
2021-07-31 20:53:45 +08:00
Ordering::Less => {
2021-08-04 15:09:04 +08:00
b_prime.delete(retain.n);
next_op2 = Some(OpBuilder::delete(*j - retain.n).build());
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Equal => {
2021-08-04 15:09:04 +08:00
b_prime.delete(retain.n);
2021-08-01 10:45:15 +08:00
next_op1 = ops1.next();
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
Ordering::Greater => {
b_prime.delete(*j);
2021-08-04 15:09:04 +08:00
next_op1 = Some(OpBuilder::retain(retain.n - *j).build());
2021-08-01 10:45:15 +08:00
next_op2 = ops2.next();
2021-07-31 20:53:45 +08:00
},
};
},
}
}
Ok((a_prime, b_prime))
}
/// Applies an operation to a string, returning a new string.
///
/// # Error
///
/// Returns an error if the operation cannot be applied due to length
/// conflicts.
pub fn apply(&self, s: &str) -> Result<String, OTError> {
if num_chars(s.as_bytes()) != self.base_len {
return Err(OTError);
}
let mut new_s = String::new();
let chars = &mut s.chars();
for op in &self.ops {
2021-08-01 10:45:15 +08:00
match &op {
Operation::Retain(retain) => {
2021-08-04 15:09:04 +08:00
for c in chars.take(retain.n as usize) {
2021-07-31 20:53:45 +08:00
new_s.push(c);
}
},
2021-08-01 10:45:15 +08:00
Operation::Delete(delete) => {
2021-07-31 20:53:45 +08:00
for _ in 0..*delete {
chars.next();
}
},
2021-08-01 10:45:15 +08:00
Operation::Insert(insert) => {
new_s += &insert.s;
2021-07-31 20:53:45 +08:00
},
}
}
Ok(new_s)
}
/// Computes the inverse of an operation. The inverse of an operation is the
/// operation that reverts the effects of the operation
pub fn invert(&self, s: &str) -> Self {
2021-08-01 10:45:15 +08:00
let mut inverted = Delta::default();
2021-07-31 20:53:45 +08:00
let chars = &mut s.chars();
for op in &self.ops {
2021-08-01 10:45:15 +08:00
match &op {
Operation::Retain(retain) => {
2021-08-04 15:09:04 +08:00
inverted.retain(retain.n, Attributes::Follow);
// TODO: use advance_by instead, but it's unstable now
// chars.advance_by(retain.num)
for _ in 0..retain.n {
2021-07-31 20:53:45 +08:00
chars.next();
}
},
2021-08-01 10:45:15 +08:00
Operation::Insert(insert) => {
inverted.delete(insert.num_chars());
2021-07-31 20:53:45 +08:00
},
2021-08-01 10:45:15 +08:00
Operation::Delete(delete) => {
inverted.insert(
2021-07-31 23:22:17 +08:00
&chars.take(*delete as usize).collect::<String>(),
op.get_attributes(),
2021-07-31 23:22:17 +08:00
);
2021-07-31 20:53:45 +08:00
},
}
}
2021-08-01 10:45:15 +08:00
inverted
2021-07-31 20:53:45 +08:00
}
2021-08-04 15:09:04 +08:00
/// Builds a delta that undoes `self`, using `other` as the source of the
/// operations to restore.
///
/// Returns an empty delta when `other` has no operations. Otherwise each
/// operation of `self` is visited while tracking `index`, the running
/// length of the deletes and retains seen so far:
///
/// * delete: the operations of `other` selected for the current position
///   are added to the result;
/// * plain retain: a retain of the same length with `Attributes::Empty`;
/// * non-plain retain: `other` is consulted, but nothing is emitted yet;
/// * insert: a delete of the same length.
pub fn invert_delta(&self, other: &Delta) -> Delta {
    let mut inverted = Delta::default();
    if other.is_empty() {
        return inverted;
    }

    let invert_from_other =
        |inverted: &mut Delta, op: &Operation, index: usize, op_len: usize| {
            // NOTE(review): `Interval::new` receives `(index, op_len)`. If its
            // second argument is an end position rather than a length, this
            // should probably be `index + op_len` — confirm against
            // `Interval`.
            let ops = other.ops_in_interval(Interval::new(index, op_len));
            for other_op in ops {
                match op {
                    Operation::Delete(_) => {
                        inverted.add(other_op);
                    },
                    Operation::Retain(_) => {},
                    Operation::Insert(_) => {
                        if !op.is_plain() {
                            let inverted_attrs = invert_attributes(
                                op.get_attributes(),
                                other_op.get_attributes(),
                            );
                            inverted.retain(other_op.length(), inverted_attrs);
                        }
                    },
                }
            }
        };

    let mut index = 0;
    for op in &self.ops {
        let op_len: usize = op.length() as usize;
        match op {
            Operation::Delete(_) => {
                invert_from_other(&mut inverted, op, index, op_len);
                index += op_len;
            },
            Operation::Retain(_) => {
                if op.is_plain() {
                    inverted.retain(op_len as u64, Attributes::Empty);
                } else {
                    invert_from_other(&mut inverted, op, index, op_len);
                }
                index += op_len;
            },
            // Inserted text is not counted in `index`, so it stays put.
            Operation::Insert(_) => {
                inverted.delete(op_len as u64);
            },
        }
    }
    inverted
}
2021-07-31 20:53:45 +08:00
/// Checks if this operation has no effect.
#[inline]
pub fn is_noop(&self) -> bool {
2021-08-01 10:45:15 +08:00
match self.ops.as_slice() {
2021-07-31 20:53:45 +08:00
[] => true,
2021-08-01 10:45:15 +08:00
[Operation::Retain(_)] => true,
2021-07-31 20:53:45 +08:00
_ => false,
}
}
2021-08-01 10:45:15 +08:00
/// Returns `true` when the delta contains no operations.
pub fn is_empty(&self) -> bool { self.ops.is_empty() }
2021-07-31 23:22:17 +08:00
2021-08-04 15:09:04 +08:00
/// Returns clones of the operations that start inside `interval`.
///
/// `offset` is the summed `length()` of all preceding operations. An
/// operation is returned when its offset lies in
/// `[interval.start, interval.end)`. Operations are never split: one that
/// begins before `interval.start` is skipped entirely, and one that begins
/// inside the interval is returned whole even if it extends past
/// `interval.end`.
pub fn ops_in_interval(&self, interval: Interval) -> Vec<Operation> {
    let mut ops: Vec<Operation> = Vec::with_capacity(self.ops.len());
    let mut offset: usize = 0;
    for op in &self.ops {
        if offset >= interval.end {
            break;
        }
        if offset >= interval.start {
            ops.push(op.clone());
        }
        offset += op.length() as usize;
    }
    ops
}
2021-08-04 15:09:04 +08:00
/// Collects the custom attributes of the inserts covered by `interval`.
///
/// Each insert occupies the character range `[offset, offset + len)`,
/// where `offset` is the total length of the inserts before it. When
/// `interval.contains_range` accepts that range and the insert has
/// `Attributes::Custom` data, the data is merged into the result. Deletes
/// are ignored.
///
/// Returns `Attributes::Empty` when nothing was collected, otherwise
/// `Attributes::Custom` with the merged data.
///
/// # Panics
///
/// Panics with `unimplemented!()` as soon as a retain is encountered.
pub fn attributes_in_interval(&self, interval: Interval) -> Attributes {
    let mut attributes_data = AttributesData::new();
    let mut offset: usize = 0;

    for op in &self.ops {
        match op {
            Operation::Delete(_) => {},
            Operation::Retain(_) => {
                // TODO: merge the `Attributes::Custom` data of retains that
                // fall inside `interval`.
                unimplemented!()
            },
            Operation::Insert(insert) => {
                let len = insert.num_chars() as usize;
                if let Attributes::Custom(data) = &insert.attributes {
                    if interval.contains_range(offset, offset + len) {
                        attributes_data.extend(data.clone());
                    }
                }
                // Advance past every insert, not only the ones with custom
                // attributes; otherwise later inserts are range-checked
                // against the wrong position.
                offset += len;
            },
        }
    }

    if attributes_data.is_plain() {
        Attributes::Empty
    } else {
        Attributes::Custom(attributes_data)
    }
}
}