2011-05-30 16:53:11 +02:00
/ *
* This is the Changeset library copied from the old Etherpad with some modifications to use it in node . js
* Can be found in https : //github.com/ether/pad/blob/master/infrastructure/ace/www/easysync2.js
2012-01-17 11:47:46 +01:00
* /
2011-05-30 16:53:11 +02:00
2011-12-04 16:33:56 +01:00
/ * *
2012-01-17 11:47:46 +01:00
* This code is mostly from the old Etherpad . Please help us to comment this code .
2011-12-04 16:33:56 +01:00
* This helps other people to understand this code better and helps them to improve it .
* TL ; DR COMMENTS ON THIS FILE ARE HIGHLY APPRECIATED
* /
2011-05-30 16:53:11 +02:00
/ *
2011-08-11 16:26:41 +02:00
* Copyright 2009 Google Inc . , 2011 Peter 'Pita' Martischka ( Primary Technology Ltd )
2011-03-26 14:10:41 +01:00
*
* Licensed under the Apache License , Version 2.0 ( the "License" ) ;
* you may not use this file except in compliance with the License .
* You may obtain a copy of the License at
*
* http : //www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing , software
* distributed under the License is distributed on an "AS-IS" BASIS ,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND , either express or implied .
* See the License for the specific language governing permissions and
* limitations under the License .
* /
2012-03-18 09:05:46 +01:00
var AttributePool = require ( "./AttributePool" ) ;
2011-03-26 14:10:41 +01:00
2012-02-26 12:22:46 +01:00
/ * *
* === === === === === === == General Util Functions === === === === === === === ==
* /
2012-02-26 11:27:56 +01:00
2012-02-26 12:22:46 +01:00
/ * *
* This method is called whenever there is an error in the sync process
* @ param msg { string } Just some message
* /
2011-03-26 14:10:41 +01:00
exports . error = function error ( msg ) {
var e = new Error ( msg ) ;
e . easysync = true ;
throw e ;
} ;
2012-02-26 11:27:56 +01:00
2012-02-26 12:22:46 +01:00
/ * *
* This method is user for assertions with Messages
* if assert fails , the error function called .
* @ param b { boolean } assertion condition
* @ param msgParts { string } error to be passed if it fails
* /
2011-03-26 14:10:41 +01:00
exports . assert = function assert ( b , msgParts ) {
if ( ! b ) {
var msg = Array . prototype . slice . call ( arguments , 1 ) . join ( '' ) ;
exports . error ( "exports: " + msg ) ;
}
} ;
2012-02-26 12:22:46 +01:00
/ * *
* Parses a number from string base 36
* @ param str { string } string of the number in base 36
* @ returns { int } number
* /
2011-03-26 14:10:41 +01:00
exports . parseNum = function ( str ) {
return parseInt ( str , 36 ) ;
} ;
2012-02-26 11:27:56 +01:00
2012-02-26 12:22:46 +01:00
/ * *
* Writes a number in base 36 and puts it in a string
* @ param num { int } number
* @ returns { string } string
* /
2011-03-26 14:10:41 +01:00
exports . numToString = function ( num ) {
return num . toString ( 36 ) . toLowerCase ( ) ;
} ;
2012-02-26 11:27:56 +01:00
2012-02-26 12:22:46 +01:00
/ * *
* Converts stuff before $ to base 10
* @ obsolete not really used anywhere ? ?
* @ param cs { string } the string
* @ return integer
* /
2011-03-26 14:10:41 +01:00
exports . toBaseTen = function ( cs ) {
var dollarIndex = cs . indexOf ( '$' ) ;
var beforeDollar = cs . substring ( 0 , dollarIndex ) ;
var fromDollar = cs . substring ( dollarIndex ) ;
return beforeDollar . replace ( /[0-9a-z]+/g , function ( s ) {
return String ( exports . parseNum ( s ) ) ;
} ) + fromDollar ;
} ;
2012-02-26 11:27:56 +01:00
2012-02-26 12:22:46 +01:00
/ * *
* === === === === === === == Changeset Functions === === === === === === === ==
* /
2012-02-26 11:27:56 +01:00
2012-02-26 12:22:46 +01:00
/ * *
* returns the required length of the text before changeset
* can be applied
* @ param cs { string } String representation of the Changeset
* /
2011-03-26 14:10:41 +01:00
exports . oldLen = function ( cs ) {
return exports . unpack ( cs ) . oldLen ;
} ;
2012-02-26 12:22:46 +01:00
/ * *
* returns the length of the text after changeset is applied
* @ param cs { string } String representation of the Changeset
* /
2011-03-26 14:10:41 +01:00
exports . newLen = function ( cs ) {
return exports . unpack ( cs ) . newLen ;
} ;
2012-02-26 12:22:46 +01:00
/ * *
* this function creates an iterator which decodes string changeset operations
* @ param opsStr { string } String encoding of the change operations to be performed
* @ param optStartIndex { int } from where in the string should the iterator start
* @ return { Op } type object iterator
* /
2011-03-26 14:10:41 +01:00
exports . opIterator = function ( opsStr , optStartIndex ) {
//print(opsStr);
var regex = /((?:\*[0-9a-z]+)*)(?:\|([0-9a-z]+))?([-+=])([0-9a-z]+)|\?|/g ;
var startIndex = ( optStartIndex || 0 ) ;
var curIndex = startIndex ;
var prevIndex = curIndex ;
function nextRegexMatch ( ) {
prevIndex = curIndex ;
var result ;
2012-07-08 11:51:04 +02:00
regex . lastIndex = curIndex ;
result = regex . exec ( opsStr ) ;
curIndex = regex . lastIndex ;
if ( result [ 0 ] == '?' ) {
exports . error ( "Hit error opcode in op stream" ) ;
2011-03-26 14:10:41 +01:00
}
2012-07-08 11:51:04 +02:00
2011-03-26 14:10:41 +01:00
return result ;
}
var regexResult = nextRegexMatch ( ) ;
var obj = exports . newOp ( ) ;
function next ( optObj ) {
var op = ( optObj || obj ) ;
2012-07-08 11:51:04 +02:00
if ( regexResult [ 0 ] ) {
2011-03-26 14:10:41 +01:00
op . attribs = regexResult [ 1 ] ;
op . lines = exports . parseNum ( regexResult [ 2 ] || 0 ) ;
op . opcode = regexResult [ 3 ] ;
op . chars = exports . parseNum ( regexResult [ 4 ] ) ;
regexResult = nextRegexMatch ( ) ;
} else {
exports . clearOp ( op ) ;
}
return op ;
}
function hasNext ( ) {
2012-07-08 11:51:04 +02:00
return ! ! ( regexResult [ 0 ] ) ;
2011-03-26 14:10:41 +01:00
}
function lastIndex ( ) {
return prevIndex ;
}
return {
next : next ,
hasNext : hasNext ,
lastIndex : lastIndex
} ;
} ;
2012-02-26 12:34:06 +01:00
/ * *
* Cleans an Op object
* @ param { Op } object to be cleared
* /
2011-03-26 14:10:41 +01:00
exports . clearOp = function ( op ) {
op . opcode = '' ;
op . chars = 0 ;
op . lines = 0 ;
op . attribs = '' ;
} ;
2012-02-26 12:34:06 +01:00
/ * *
* Creates a new Op object
* @ param optOpcode the type operation of the Op object
* /
2011-03-26 14:10:41 +01:00
exports . newOp = function ( optOpcode ) {
return {
opcode : ( optOpcode || '' ) ,
chars : 0 ,
lines : 0 ,
attribs : ''
} ;
} ;
2012-02-26 12:34:06 +01:00
/ * *
* Clones an Op
* @ param op Op to be cloned
* /
2011-03-26 14:10:41 +01:00
exports . cloneOp = function ( op ) {
return {
opcode : op . opcode ,
chars : op . chars ,
lines : op . lines ,
attribs : op . attribs
} ;
} ;
2012-02-26 12:34:06 +01:00
/ * *
* Copies op1 to op2
* @ param op1 src Op
* @ param op2 dest Op
* /
2011-03-26 14:10:41 +01:00
exports . copyOp = function ( op1 , op2 ) {
op2 . opcode = op1 . opcode ;
op2 . chars = op1 . chars ;
op2 . lines = op1 . lines ;
op2 . attribs = op1 . attribs ;
} ;
2012-02-26 12:34:06 +01:00
/ * *
* Writes the Op in a string the way that changesets need it
* /
2011-03-26 14:10:41 +01:00
exports . opString = function ( op ) {
// just for debugging
if ( ! op . opcode ) return 'null' ;
var assem = exports . opAssembler ( ) ;
assem . append ( op ) ;
return assem . toString ( ) ;
} ;
2012-02-26 12:34:06 +01:00
/ * *
* Used just for debugging
* /
2011-03-26 14:10:41 +01:00
exports . stringOp = function ( str ) {
// just for debugging
return exports . opIterator ( str ) . next ( ) ;
} ;
2012-02-26 12:34:06 +01:00
/ * *
* Used to check if a Changeset if valid
* @ param cs { Changeset } Changeset to be checked
* /
2011-03-26 14:10:41 +01:00
exports . checkRep = function ( cs ) {
// doesn't check things that require access to attrib pool (e.g. attribute order)
// or original string (e.g. newline positions)
var unpacked = exports . unpack ( cs ) ;
var oldLen = unpacked . oldLen ;
var newLen = unpacked . newLen ;
var ops = unpacked . ops ;
var charBank = unpacked . charBank ;
var assem = exports . smartOpAssembler ( ) ;
var oldPos = 0 ;
var calcNewLen = 0 ;
var numInserted = 0 ;
var iter = exports . opIterator ( ops ) ;
while ( iter . hasNext ( ) ) {
var o = iter . next ( ) ;
switch ( o . opcode ) {
case '=' :
oldPos += o . chars ;
calcNewLen += o . chars ;
break ;
case '-' :
oldPos += o . chars ;
exports . assert ( oldPos < oldLen , oldPos , " >= " , oldLen , " in " , cs ) ;
break ;
case '+' :
{
calcNewLen += o . chars ;
numInserted += o . chars ;
exports . assert ( calcNewLen < newLen , calcNewLen , " >= " , newLen , " in " , cs ) ;
break ;
}
}
assem . append ( o ) ;
}
calcNewLen += oldLen - oldPos ;
charBank = charBank . substring ( 0 , numInserted ) ;
while ( charBank . length < numInserted ) {
charBank += "?" ;
}
assem . endDocument ( ) ;
var normalized = exports . pack ( oldLen , calcNewLen , assem . toString ( ) , charBank ) ;
exports . assert ( normalized == cs , normalized , ' != ' , cs ) ;
return cs ;
}
2012-02-26 12:34:06 +01:00
/ * *
2012-02-26 13:18:17 +01:00
* === === === === === === == Util Functions === === === === === === === ==
* /
/ * *
* creates an object that allows you to append operations ( type Op ) and also
* compresses them if possible
2012-02-26 12:34:06 +01:00
* /
2011-03-26 14:10:41 +01:00
exports . smartOpAssembler = function ( ) {
// Like opAssembler but able to produce conforming exportss
// from slightly looser input, at the cost of speed.
// Specifically:
// - merges consecutive operations that can be merged
// - strips final "="
// - ignores 0-length changes
// - reorders consecutive + and - (which margingOpAssembler doesn't do)
var minusAssem = exports . mergingOpAssembler ( ) ;
var plusAssem = exports . mergingOpAssembler ( ) ;
var keepAssem = exports . mergingOpAssembler ( ) ;
var assem = exports . stringAssembler ( ) ;
var lastOpcode = '' ;
var lengthChange = 0 ;
function flushKeeps ( ) {
assem . append ( keepAssem . toString ( ) ) ;
keepAssem . clear ( ) ;
}
function flushPlusMinus ( ) {
assem . append ( minusAssem . toString ( ) ) ;
minusAssem . clear ( ) ;
assem . append ( plusAssem . toString ( ) ) ;
plusAssem . clear ( ) ;
}
function append ( op ) {
if ( ! op . opcode ) return ;
if ( ! op . chars ) return ;
if ( op . opcode == '-' ) {
if ( lastOpcode == '=' ) {
flushKeeps ( ) ;
}
minusAssem . append ( op ) ;
lengthChange -= op . chars ;
} else if ( op . opcode == '+' ) {
if ( lastOpcode == '=' ) {
flushKeeps ( ) ;
}
plusAssem . append ( op ) ;
lengthChange += op . chars ;
} else if ( op . opcode == '=' ) {
if ( lastOpcode != '=' ) {
flushPlusMinus ( ) ;
}
keepAssem . append ( op ) ;
}
lastOpcode = op . opcode ;
}
function appendOpWithText ( opcode , text , attribs , pool ) {
var op = exports . newOp ( opcode ) ;
op . attribs = exports . makeAttribsString ( opcode , attribs , pool ) ;
var lastNewlinePos = text . lastIndexOf ( '\n' ) ;
if ( lastNewlinePos < 0 ) {
op . chars = text . length ;
op . lines = 0 ;
append ( op ) ;
} else {
op . chars = lastNewlinePos + 1 ;
op . lines = text . match ( /\n/g ) . length ;
append ( op ) ;
op . chars = text . length - ( lastNewlinePos + 1 ) ;
op . lines = 0 ;
append ( op ) ;
}
}
function toString ( ) {
flushPlusMinus ( ) ;
flushKeeps ( ) ;
return assem . toString ( ) ;
}
function clear ( ) {
minusAssem . clear ( ) ;
plusAssem . clear ( ) ;
keepAssem . clear ( ) ;
assem . clear ( ) ;
lengthChange = 0 ;
}
function endDocument ( ) {
keepAssem . endDocument ( ) ;
}
function getLengthChange ( ) {
return lengthChange ;
}
return {
append : append ,
toString : toString ,
clear : clear ,
endDocument : endDocument ,
appendOpWithText : appendOpWithText ,
getLengthChange : getLengthChange
} ;
} ;
2012-07-08 11:51:04 +02:00
exports . mergingOpAssembler = function ( ) {
// This assembler can be used in production; it efficiently
// merges consecutive operations that are mergeable, ignores
// no-ops, and drops final pure "keeps". It does not re-order
// operations.
var assem = exports . opAssembler ( ) ;
var bufOp = exports . newOp ( ) ;
// If we get, for example, insertions [xxx\n,yyy], those don't merge,
// but if we get [xxx\n,yyy,zzz\n], that merges to [xxx\nyyyzzz\n].
// This variable stores the length of yyy and any other newline-less
// ops immediately after it.
var bufOpAdditionalCharsAfterNewline = 0 ;
function flush ( isEndDocument ) {
if ( bufOp . opcode ) {
if ( isEndDocument && bufOp . opcode == '=' && ! bufOp . attribs ) {
// final merged keep, leave it implicit
} else {
assem . append ( bufOp ) ;
if ( bufOpAdditionalCharsAfterNewline ) {
bufOp . chars = bufOpAdditionalCharsAfterNewline ;
bufOp . lines = 0 ;
2011-03-26 14:10:41 +01:00
assem . append ( bufOp ) ;
2012-07-08 11:51:04 +02:00
bufOpAdditionalCharsAfterNewline = 0 ;
2011-03-26 14:10:41 +01:00
}
}
2012-07-08 11:51:04 +02:00
bufOp . opcode = '' ;
2011-03-26 14:10:41 +01:00
}
2012-07-08 11:51:04 +02:00
}
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
function append ( op ) {
if ( op . chars > 0 ) {
if ( bufOp . opcode == op . opcode && bufOp . attribs == op . attribs ) {
if ( op . lines > 0 ) {
// bufOp and additional chars are all mergeable into a multi-line op
bufOp . chars += bufOpAdditionalCharsAfterNewline + op . chars ;
bufOp . lines += op . lines ;
bufOpAdditionalCharsAfterNewline = 0 ;
} else if ( bufOp . lines == 0 ) {
// both bufOp and op are in-line
bufOp . chars += op . chars ;
2011-03-26 14:10:41 +01:00
} else {
2012-07-08 11:51:04 +02:00
// append in-line text to multi-line bufOp
bufOpAdditionalCharsAfterNewline += op . chars ;
2011-03-26 14:10:41 +01:00
}
2012-07-08 11:51:04 +02:00
} else {
flush ( ) ;
exports . copyOp ( op , bufOp ) ;
2011-03-26 14:10:41 +01:00
}
}
2012-07-08 11:51:04 +02:00
}
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
function endDocument ( ) {
flush ( true ) ;
}
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
function toString ( ) {
flush ( ) ;
return assem . toString ( ) ;
}
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
function clear ( ) {
assem . clear ( ) ;
exports . clearOp ( bufOp ) ;
}
return {
append : append ,
toString : toString ,
clear : clear ,
endDocument : endDocument
2011-03-26 14:10:41 +01:00
} ;
2012-07-08 11:51:04 +02:00
} ;
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
exports . opAssembler = function ( ) {
var pieces = [ ] ;
// this function allows op to be mutated later (doesn't keep a ref)
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
function append ( op ) {
pieces . push ( op . attribs ) ;
if ( op . lines ) {
pieces . push ( '|' , exports . numToString ( op . lines ) ) ;
2011-03-26 14:10:41 +01:00
}
2012-07-08 11:51:04 +02:00
pieces . push ( op . opcode ) ;
pieces . push ( exports . numToString ( op . chars ) ) ;
}
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
function toString ( ) {
return pieces . join ( '' ) ;
}
2011-03-26 14:10:41 +01:00
2012-07-08 11:51:04 +02:00
function clear ( ) {
pieces . length = 0 ;
}
return {
append : append ,
toString : toString ,
clear : clear
2011-03-26 14:10:41 +01:00
} ;
2012-07-08 11:51:04 +02:00
} ;
2011-03-26 14:10:41 +01:00
2012-02-26 13:18:17 +01:00
/ * *
* A custom made String Iterator
* @ param str { string } String to be iterated over
* /
2011-03-26 14:10:41 +01:00
exports . stringIterator = function ( str ) {
var curIndex = 0 ;
function assertRemaining ( n ) {
exports . assert ( n <= remaining ( ) , "!(" , n , " <= " , remaining ( ) , ")" ) ;
}
function take ( n ) {
assertRemaining ( n ) ;
var s = str . substr ( curIndex , n ) ;
curIndex += n ;
return s ;
}
function peek ( n ) {
assertRemaining ( n ) ;
var s = str . substr ( curIndex , n ) ;
return s ;
}
function skip ( n ) {
assertRemaining ( n ) ;
curIndex += n ;
}
function remaining ( ) {
return str . length - curIndex ;
}
return {
take : take ,
skip : skip ,
remaining : remaining ,
peek : peek
} ;
} ;
2012-02-26 13:18:17 +01:00
/ * *
* A custom made StringBuffer
* /
2011-03-26 14:10:41 +01:00
exports . stringAssembler = function ( ) {
var pieces = [ ] ;
function append ( x ) {
pieces . push ( String ( x ) ) ;
}
function toString ( ) {
return pieces . join ( '' ) ;
}
return {
append : append ,
toString : toString
} ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* This class allows to iterate and modify texts which have several lines
* It is used for applying Changesets on arrays of lines
* Note from prev docs : "lines" need not be an array as long as it supports certain calls ( lines _foo inside ) .
* /
2011-03-26 14:10:41 +01:00
exports . textLinesMutator = function ( lines ) {
// Mutates lines, an array of strings, in place.
// Mutation operations have the same constraints as exports operations
// with respect to newlines, but not the other additional constraints
// (i.e. ins/del ordering, forbidden no-ops, non-mergeability, final newline).
// Can be used to mutate lists of strings where the last char of each string
// is not actually a newline, but for the purposes of N and L values,
// the caller should pretend it is, and for things to work right in that case, the input
// to insert() should be a single line with no newlines.
var curSplice = [ 0 , 0 ] ;
var inSplice = false ;
// position in document after curSplice is applied:
var curLine = 0 ,
curCol = 0 ;
// invariant: if (inSplice) then (curLine is in curSplice[0] + curSplice.length - {2,3}) &&
// curLine >= curSplice[0]
// invariant: if (inSplice && (curLine >= curSplice[0] + curSplice.length - 2)) then
// curCol == 0
function lines _applySplice ( s ) {
lines . splice . apply ( lines , s ) ;
}
function lines _toSource ( ) {
return lines . toSource ( ) ;
}
function lines _get ( idx ) {
if ( lines . get ) {
return lines . get ( idx ) ;
} else {
return lines [ idx ] ;
}
}
// can be unimplemented if removeLines's return value not needed
function lines _slice ( start , end ) {
if ( lines . slice ) {
return lines . slice ( start , end ) ;
} else {
return [ ] ;
}
}
function lines _length ( ) {
if ( ( typeof lines . length ) == "number" ) {
return lines . length ;
} else {
return lines . length ( ) ;
}
}
function enterSplice ( ) {
curSplice [ 0 ] = curLine ;
curSplice [ 1 ] = 0 ;
if ( curCol > 0 ) {
putCurLineInSplice ( ) ;
}
inSplice = true ;
}
function leaveSplice ( ) {
lines _applySplice ( curSplice ) ;
curSplice . length = 2 ;
curSplice [ 0 ] = curSplice [ 1 ] = 0 ;
inSplice = false ;
}
function isCurLineInSplice ( ) {
return ( curLine - curSplice [ 0 ] < ( curSplice . length - 2 ) ) ;
}
function debugPrint ( typ ) {
print ( typ + ": " + curSplice . toSource ( ) + " / " + curLine + "," + curCol + " / " + lines _toSource ( ) ) ;
}
function putCurLineInSplice ( ) {
if ( ! isCurLineInSplice ( ) ) {
curSplice . push ( lines _get ( curSplice [ 0 ] + curSplice [ 1 ] ) ) ;
curSplice [ 1 ] ++ ;
}
return 2 + curLine - curSplice [ 0 ] ;
}
function skipLines ( L , includeInSplice ) {
if ( L ) {
if ( includeInSplice ) {
if ( ! inSplice ) {
enterSplice ( ) ;
}
for ( var i = 0 ; i < L ; i ++ ) {
curCol = 0 ;
putCurLineInSplice ( ) ;
curLine ++ ;
}
} else {
if ( inSplice ) {
if ( L > 1 ) {
leaveSplice ( ) ;
} else {
putCurLineInSplice ( ) ;
}
}
curLine += L ;
curCol = 0 ;
}
//print(inSplice+" / "+isCurLineInSplice()+" / "+curSplice[0]+" / "+curSplice[1]+" / "+lines.length);
/ * i f ( i n S p l i c e & & ( ! i s C u r L i n e I n S p l i c e ( ) ) & & ( c u r S p l i c e [ 0 ] + c u r S p l i c e [ 1 ] < l i n e s . l e n g t h ) ) {
print ( "BLAH" ) ;
putCurLineInSplice ( ) ;
} * /
// tests case foo in remove(), which isn't otherwise covered in current impl
}
//debugPrint("skip");
}
function skip ( N , L , includeInSplice ) {
if ( N ) {
if ( L ) {
skipLines ( L , includeInSplice ) ;
} else {
if ( includeInSplice && ! inSplice ) {
enterSplice ( ) ;
}
if ( inSplice ) {
putCurLineInSplice ( ) ;
}
curCol += N ;
//debugPrint("skip");
}
}
}
function removeLines ( L ) {
var removed = '' ;
if ( L ) {
if ( ! inSplice ) {
enterSplice ( ) ;
}
function nextKLinesText ( k ) {
var m = curSplice [ 0 ] + curSplice [ 1 ] ;
return lines _slice ( m , m + k ) . join ( '' ) ;
}
if ( isCurLineInSplice ( ) ) {
//print(curCol);
if ( curCol == 0 ) {
removed = curSplice [ curSplice . length - 1 ] ;
// print("FOO"); // case foo
curSplice . length -- ;
removed += nextKLinesText ( L - 1 ) ;
curSplice [ 1 ] += L - 1 ;
} else {
removed = nextKLinesText ( L - 1 ) ;
curSplice [ 1 ] += L - 1 ;
var sline = curSplice . length - 1 ;
removed = curSplice [ sline ] . substring ( curCol ) + removed ;
curSplice [ sline ] = curSplice [ sline ] . substring ( 0 , curCol ) + lines _get ( curSplice [ 0 ] + curSplice [ 1 ] ) ;
curSplice [ 1 ] += 1 ;
}
} else {
removed = nextKLinesText ( L ) ;
curSplice [ 1 ] += L ;
}
//debugPrint("remove");
}
return removed ;
}
function remove ( N , L ) {
var removed = '' ;
if ( N ) {
if ( L ) {
return removeLines ( L ) ;
} else {
if ( ! inSplice ) {
enterSplice ( ) ;
}
var sline = putCurLineInSplice ( ) ;
removed = curSplice [ sline ] . substring ( curCol , curCol + N ) ;
curSplice [ sline ] = curSplice [ sline ] . substring ( 0 , curCol ) + curSplice [ sline ] . substring ( curCol + N ) ;
//debugPrint("remove");
}
}
return removed ;
}
function insert ( text , L ) {
if ( text ) {
if ( ! inSplice ) {
enterSplice ( ) ;
}
if ( L ) {
var newLines = exports . splitTextLines ( text ) ;
if ( isCurLineInSplice ( ) ) {
//if (curCol == 0) {
//curSplice.length--;
//curSplice[1]--;
//Array.prototype.push.apply(curSplice, newLines);
//curLine += newLines.length;
//}
//else {
var sline = curSplice . length - 1 ;
var theLine = curSplice [ sline ] ;
var lineCol = curCol ;
curSplice [ sline ] = theLine . substring ( 0 , lineCol ) + newLines [ 0 ] ;
curLine ++ ;
newLines . splice ( 0 , 1 ) ;
Array . prototype . push . apply ( curSplice , newLines ) ;
curLine += newLines . length ;
curSplice . push ( theLine . substring ( lineCol ) ) ;
curCol = 0 ;
//}
} else {
Array . prototype . push . apply ( curSplice , newLines ) ;
curLine += newLines . length ;
}
} else {
var sline = putCurLineInSplice ( ) ;
curSplice [ sline ] = curSplice [ sline ] . substring ( 0 , curCol ) + text + curSplice [ sline ] . substring ( curCol ) ;
curCol += text . length ;
}
//debugPrint("insert");
}
}
function hasMore ( ) {
//print(lines.length+" / "+inSplice+" / "+(curSplice.length - 2)+" / "+curSplice[1]);
var docLines = lines _length ( ) ;
if ( inSplice ) {
docLines += curSplice . length - 2 - curSplice [ 1 ] ;
}
return curLine < docLines ;
}
function close ( ) {
if ( inSplice ) {
leaveSplice ( ) ;
}
//debugPrint("close");
}
var self = {
skip : skip ,
remove : remove ,
insert : insert ,
close : close ,
hasMore : hasMore ,
removeLines : removeLines ,
skipLines : skipLines
} ;
return self ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Function allowing iterating over two Op strings .
* @ params in1 { string } first Op string
* @ params idx1 { int } integer where 1 st iterator should start
* @ params in2 { string } second Op string
* @ params idx2 { int } integer where 2 nd iterator should start
* @ params func { function } which decides how 1 st or 2 nd iterator
* advances . When opX . opcode = 0 , iterator X advances to
* next element
* func has signature f ( op1 , op2 , opOut )
* op1 - current operation of the first iterator
* op2 - current operation of the second iterator
* opOut - result operator to be put into Changeset
* @ return { string } the integrated changeset
* /
2011-03-26 14:10:41 +01:00
exports . applyZip = function ( in1 , idx1 , in2 , idx2 , func ) {
var iter1 = exports . opIterator ( in1 , idx1 ) ;
var iter2 = exports . opIterator ( in2 , idx2 ) ;
var assem = exports . smartOpAssembler ( ) ;
var op1 = exports . newOp ( ) ;
var op2 = exports . newOp ( ) ;
var opOut = exports . newOp ( ) ;
while ( op1 . opcode || iter1 . hasNext ( ) || op2 . opcode || iter2 . hasNext ( ) ) {
if ( ( ! op1 . opcode ) && iter1 . hasNext ( ) ) iter1 . next ( op1 ) ;
if ( ( ! op2 . opcode ) && iter2 . hasNext ( ) ) iter2 . next ( op2 ) ;
func ( op1 , op2 , opOut ) ;
if ( opOut . opcode ) {
//print(opOut.toSource());
assem . append ( opOut ) ;
opOut . opcode = '' ;
}
}
assem . endDocument ( ) ;
return assem . toString ( ) ;
} ;
2012-02-26 13:18:17 +01:00
/ * *
* Unpacks a string encoded Changeset into a proper Changeset object
* @ params cs { string } String encoded Changeset
* @ returns { Changeset } a Changeset class
* /
2011-03-26 14:10:41 +01:00
exports . unpack = function ( cs ) {
var headerRegex = /Z:([0-9a-z]+)([><])([0-9a-z]+)|/ ;
var headerMatch = headerRegex . exec ( cs ) ;
if ( ( ! headerMatch ) || ( ! headerMatch [ 0 ] ) ) {
exports . error ( "Not a exports: " + cs ) ;
}
var oldLen = exports . parseNum ( headerMatch [ 1 ] ) ;
var changeSign = ( headerMatch [ 2 ] == '>' ) ? 1 : - 1 ;
var changeMag = exports . parseNum ( headerMatch [ 3 ] ) ;
var newLen = oldLen + changeSign * changeMag ;
var opsStart = headerMatch [ 0 ] . length ;
var opsEnd = cs . indexOf ( "$" ) ;
if ( opsEnd < 0 ) opsEnd = cs . length ;
return {
oldLen : oldLen ,
newLen : newLen ,
ops : cs . substring ( opsStart , opsEnd ) ,
charBank : cs . substring ( opsEnd + 1 )
} ;
} ;
2012-02-26 13:18:17 +01:00
/ * *
* Packs Changeset object into a string
* @ params oldLen { int } Old length of the Changeset
* @ params newLen { int ] New length of the Changeset
* @ params opsStr { string } String encoding of the changes to be made
* @ params bank { string } Charbank of the Changeset
* @ returns { Changeset } a Changeset class
* /
2011-03-26 14:10:41 +01:00
exports . pack = function ( oldLen , newLen , opsStr , bank ) {
var lenDiff = newLen - oldLen ;
var lenDiffStr = ( lenDiff >= 0 ? '>' + exports . numToString ( lenDiff ) : '<' + exports . numToString ( - lenDiff ) ) ;
var a = [ ] ;
a . push ( 'Z:' , exports . numToString ( oldLen ) , lenDiffStr , opsStr , '$' , bank ) ;
return a . join ( '' ) ;
} ;
2012-02-26 13:18:17 +01:00
/ * *
* Applies a Changeset to a string
* @ params cs { string } String encoded Changeset
* @ params str { string } String to which a Changeset should be applied
* /
2011-03-26 14:10:41 +01:00
exports . applyToText = function ( cs , str ) {
var unpacked = exports . unpack ( cs ) ;
exports . assert ( str . length == unpacked . oldLen , "mismatched apply: " , str . length , " / " , unpacked . oldLen ) ;
var csIter = exports . opIterator ( unpacked . ops ) ;
var bankIter = exports . stringIterator ( unpacked . charBank ) ;
var strIter = exports . stringIterator ( str ) ;
var assem = exports . stringAssembler ( ) ;
while ( csIter . hasNext ( ) ) {
var op = csIter . next ( ) ;
switch ( op . opcode ) {
case '+' :
assem . append ( bankIter . take ( op . chars ) ) ;
break ;
case '-' :
strIter . skip ( op . chars ) ;
break ;
case '=' :
assem . append ( strIter . take ( op . chars ) ) ;
break ;
}
}
assem . append ( strIter . take ( strIter . remaining ( ) ) ) ;
return assem . toString ( ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* applies a changeset on an array of lines
* @ param CS { Changeset } the changeset to be applied
* @ param lines The lines to which the changeset needs to be applied
* /
2011-03-26 14:10:41 +01:00
exports . mutateTextLines = function ( cs , lines ) {
var unpacked = exports . unpack ( cs ) ;
var csIter = exports . opIterator ( unpacked . ops ) ;
var bankIter = exports . stringIterator ( unpacked . charBank ) ;
var mut = exports . textLinesMutator ( lines ) ;
while ( csIter . hasNext ( ) ) {
var op = csIter . next ( ) ;
switch ( op . opcode ) {
case '+' :
mut . insert ( bankIter . take ( op . chars ) , op . lines ) ;
break ;
case '-' :
mut . remove ( op . chars , op . lines ) ;
break ;
case '=' :
mut . skip ( op . chars , op . lines , ( ! ! op . attribs ) ) ;
break ;
}
}
mut . close ( ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Composes two attribute strings ( see below ) into one .
* @ param att1 { string } first attribute string
* @ param att2 { string } second attribue string
* @ param resultIsMutaton { boolean }
* @ param pool { AttribPool } attribute pool
* /
2011-03-26 14:10:41 +01:00
exports . composeAttributes = function ( att1 , att2 , resultIsMutation , pool ) {
// att1 and att2 are strings like "*3*f*1c", asMutation is a boolean.
// Sometimes attribute (key,value) pairs are treated as attribute presence
// information, while other times they are treated as operations that
// mutate a set of attributes, and this affects whether an empty value
// is a deletion or a change.
// Examples, of the form (att1Items, att2Items, resultIsMutation) -> result
// ([], [(bold, )], true) -> [(bold, )]
// ([], [(bold, )], false) -> []
// ([], [(bold, true)], true) -> [(bold, true)]
// ([], [(bold, true)], false) -> [(bold, true)]
// ([(bold, true)], [(bold, )], true) -> [(bold, )]
// ([(bold, true)], [(bold, )], false) -> []
// pool can be null if att2 has no attributes.
if ( ( ! att1 ) && resultIsMutation ) {
// In the case of a mutation (i.e. composing two exportss),
// an att2 composed with an empy att1 is just att2. If att1
// is part of an attribution string, then att2 may remove
// attributes that are already gone, so don't do this optimization.
return att2 ;
}
if ( ! att2 ) return att1 ;
var atts = [ ] ;
att1 . replace ( /\*([0-9a-z]+)/g , function ( _ , a ) {
atts . push ( pool . getAttrib ( exports . parseNum ( a ) ) ) ;
return '' ;
} ) ;
att2 . replace ( /\*([0-9a-z]+)/g , function ( _ , a ) {
var pair = pool . getAttrib ( exports . parseNum ( a ) ) ;
var found = false ;
for ( var i = 0 ; i < atts . length ; i ++ ) {
var oldPair = atts [ i ] ;
if ( oldPair [ 0 ] == pair [ 0 ] ) {
if ( pair [ 1 ] || resultIsMutation ) {
oldPair [ 1 ] = pair [ 1 ] ;
} else {
atts . splice ( i , 1 ) ;
}
found = true ;
break ;
}
}
if ( ( ! found ) && ( pair [ 1 ] || resultIsMutation ) ) {
atts . push ( pair ) ;
}
return '' ;
} ) ;
atts . sort ( ) ;
var buf = exports . stringAssembler ( ) ;
for ( var i = 0 ; i < atts . length ; i ++ ) {
buf . append ( '*' ) ;
buf . append ( exports . numToString ( pool . putAttrib ( atts [ i ] ) ) ) ;
}
//print(att1+" / "+att2+" / "+buf.toString());
return buf . toString ( ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Function used as parameter for applyZip to apply a Changeset to an
* attribute
* /
2011-03-26 14:10:41 +01:00
exports . _slicerZipperFunc = function ( attOp , csOp , opOut , pool ) {
// attOp is the op from the sequence that is being operated on, either an
// attribution string or the earlier of two exportss being composed.
// pool can be null if definitely not needed.
//print(csOp.toSource()+" "+attOp.toSource()+" "+opOut.toSource());
if ( attOp . opcode == '-' ) {
exports . copyOp ( attOp , opOut ) ;
attOp . opcode = '' ;
} else if ( ! attOp . opcode ) {
exports . copyOp ( csOp , opOut ) ;
csOp . opcode = '' ;
} else {
switch ( csOp . opcode ) {
case '-' :
{
if ( csOp . chars <= attOp . chars ) {
// delete or delete part
if ( attOp . opcode == '=' ) {
opOut . opcode = '-' ;
opOut . chars = csOp . chars ;
opOut . lines = csOp . lines ;
opOut . attribs = '' ;
}
attOp . chars -= csOp . chars ;
attOp . lines -= csOp . lines ;
csOp . opcode = '' ;
if ( ! attOp . chars ) {
attOp . opcode = '' ;
}
} else {
// delete and keep going
if ( attOp . opcode == '=' ) {
opOut . opcode = '-' ;
opOut . chars = attOp . chars ;
opOut . lines = attOp . lines ;
opOut . attribs = '' ;
}
csOp . chars -= attOp . chars ;
csOp . lines -= attOp . lines ;
attOp . opcode = '' ;
}
break ;
}
case '+' :
{
// insert
exports . copyOp ( csOp , opOut ) ;
csOp . opcode = '' ;
break ;
}
case '=' :
{
if ( csOp . chars <= attOp . chars ) {
// keep or keep part
opOut . opcode = attOp . opcode ;
opOut . chars = csOp . chars ;
opOut . lines = csOp . lines ;
opOut . attribs = exports . composeAttributes ( attOp . attribs , csOp . attribs , attOp . opcode == '=' , pool ) ;
csOp . opcode = '' ;
attOp . chars -= csOp . chars ;
attOp . lines -= csOp . lines ;
if ( ! attOp . chars ) {
attOp . opcode = '' ;
}
} else {
// keep and keep going
opOut . opcode = attOp . opcode ;
opOut . chars = attOp . chars ;
opOut . lines = attOp . lines ;
opOut . attribs = exports . composeAttributes ( attOp . attribs , csOp . attribs , attOp . opcode == '=' , pool ) ;
attOp . opcode = '' ;
csOp . chars -= attOp . chars ;
csOp . lines -= attOp . lines ;
}
break ;
}
case '' :
{
exports . copyOp ( attOp , opOut ) ;
attOp . opcode = '' ;
break ;
}
}
}
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Applies a Changeset to the attribs string of a AText .
* @ param cs { string } Changeset
* @ param astr { string } the attribs string of a AText
* @ param pool { AttribsPool } the attibutes pool
* /
2011-03-26 14:10:41 +01:00
exports . applyToAttribution = function ( cs , astr , pool ) {
var unpacked = exports . unpack ( cs ) ;
return exports . applyZip ( astr , 0 , unpacked . ops , 0 , function ( op1 , op2 , opOut ) {
return exports . _slicerZipperFunc ( op1 , op2 , opOut , pool ) ;
} ) ;
} ;
/ * e x p o r t s . o n e I n s e r t e d L i n e A t A T i m e O p I t e r a t o r = f u n c t i o n ( o p s S t r , o p t S t a r t I n d e x , c h a r B a n k ) {
var iter = exports . opIterator ( opsStr , optStartIndex ) ;
var bankIndex = 0 ;
} ; * /
exports . mutateAttributionLines = function ( cs , lines , pool ) {
//dmesg(cs);
//dmesg(lines.toSource()+" ->");
var unpacked = exports . unpack ( cs ) ;
var csIter = exports . opIterator ( unpacked . ops ) ;
var csBank = unpacked . charBank ;
var csBankIndex = 0 ;
// treat the attribution lines as text lines, mutating a line at a time
var mut = exports . textLinesMutator ( lines ) ;
var lineIter = null ;
function isNextMutOp ( ) {
return ( lineIter && lineIter . hasNext ( ) ) || mut . hasMore ( ) ;
}
function nextMutOp ( destOp ) {
if ( ( ! ( lineIter && lineIter . hasNext ( ) ) ) && mut . hasMore ( ) ) {
var line = mut . removeLines ( 1 ) ;
lineIter = exports . opIterator ( line ) ;
}
if ( lineIter && lineIter . hasNext ( ) ) {
lineIter . next ( destOp ) ;
} else {
destOp . opcode = '' ;
}
}
var lineAssem = null ;
function outputMutOp ( op ) {
//print("outputMutOp: "+op.toSource());
if ( ! lineAssem ) {
lineAssem = exports . mergingOpAssembler ( ) ;
}
lineAssem . append ( op ) ;
if ( op . lines > 0 ) {
exports . assert ( op . lines == 1 , "Can't have op.lines of " , op . lines , " in attribution lines" ) ;
// ship it to the mut
mut . insert ( lineAssem . toString ( ) , 1 ) ;
lineAssem = null ;
}
}
var csOp = exports . newOp ( ) ;
var attOp = exports . newOp ( ) ;
var opOut = exports . newOp ( ) ;
while ( csOp . opcode || csIter . hasNext ( ) || attOp . opcode || isNextMutOp ( ) ) {
if ( ( ! csOp . opcode ) && csIter . hasNext ( ) ) {
csIter . next ( csOp ) ;
}
//print(csOp.toSource()+" "+attOp.toSource()+" "+opOut.toSource());
//print(csOp.opcode+"/"+csOp.lines+"/"+csOp.attribs+"/"+lineAssem+"/"+lineIter+"/"+(lineIter?lineIter.hasNext():null));
//print("csOp: "+csOp.toSource());
if ( ( ! csOp . opcode ) && ( ! attOp . opcode ) && ( ! lineAssem ) && ( ! ( lineIter && lineIter . hasNext ( ) ) ) ) {
break ; // done
} else if ( csOp . opcode == '=' && csOp . lines > 0 && ( ! csOp . attribs ) && ( ! attOp . opcode ) && ( ! lineAssem ) && ( ! ( lineIter && lineIter . hasNext ( ) ) ) ) {
// skip multiple lines; this is what makes small changes not order of the document size
mut . skipLines ( csOp . lines ) ;
//print("skipped: "+csOp.lines);
csOp . opcode = '' ;
} else if ( csOp . opcode == '+' ) {
if ( csOp . lines > 1 ) {
var firstLineLen = csBank . indexOf ( '\n' , csBankIndex ) + 1 - csBankIndex ;
exports . copyOp ( csOp , opOut ) ;
csOp . chars -= firstLineLen ;
csOp . lines -- ;
opOut . lines = 1 ;
opOut . chars = firstLineLen ;
} else {
exports . copyOp ( csOp , opOut ) ;
csOp . opcode = '' ;
}
outputMutOp ( opOut ) ;
csBankIndex += opOut . chars ;
opOut . opcode = '' ;
} else {
if ( ( ! attOp . opcode ) && isNextMutOp ( ) ) {
nextMutOp ( attOp ) ;
}
//print("attOp: "+attOp.toSource());
exports . _slicerZipperFunc ( attOp , csOp , opOut , pool ) ;
if ( opOut . opcode ) {
outputMutOp ( opOut ) ;
opOut . opcode = '' ;
}
}
}
exports . assert ( ! lineAssem , "line assembler not finished" ) ;
mut . close ( ) ;
//dmesg("-> "+lines.toSource());
} ;
2012-02-26 19:59:11 +01:00
/ * *
* joins several Attribution lines
* @ param theAlines collection of Attribution lines
* @ returns { string } joined Attribution lines
* /
2011-03-26 14:10:41 +01:00
exports . joinAttributionLines = function ( theAlines ) {
var assem = exports . mergingOpAssembler ( ) ;
for ( var i = 0 ; i < theAlines . length ; i ++ ) {
var aline = theAlines [ i ] ;
var iter = exports . opIterator ( aline ) ;
while ( iter . hasNext ( ) ) {
assem . append ( iter . next ( ) ) ;
}
}
return assem . toString ( ) ;
} ;
exports . splitAttributionLines = function ( attrOps , text ) {
var iter = exports . opIterator ( attrOps ) ;
var assem = exports . mergingOpAssembler ( ) ;
var lines = [ ] ;
var pos = 0 ;
function appendOp ( op ) {
assem . append ( op ) ;
if ( op . lines > 0 ) {
lines . push ( assem . toString ( ) ) ;
assem . clear ( ) ;
}
pos += op . chars ;
}
while ( iter . hasNext ( ) ) {
var op = iter . next ( ) ;
var numChars = op . chars ;
var numLines = op . lines ;
while ( numLines > 1 ) {
var newlineEnd = text . indexOf ( '\n' , pos ) + 1 ;
exports . assert ( newlineEnd > 0 , "newlineEnd <= 0 in splitAttributionLines" ) ;
op . chars = newlineEnd - pos ;
op . lines = 1 ;
appendOp ( op ) ;
numChars -= op . chars ;
numLines -= op . lines ;
}
if ( numLines == 1 ) {
op . chars = numChars ;
op . lines = 1 ;
}
appendOp ( op ) ;
}
return lines ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* splits text into lines
* @ param { string } text to be splitted
* /
2011-03-26 14:10:41 +01:00
exports . splitTextLines = function ( text ) {
return text . match ( /[^\n]*(?:\n|[^\n]$)/g ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* compose two Changesets
* @ param cs1 { Changeset } first Changeset
* @ param cs2 { Changeset } second Changeset
* @ param pool { AtribsPool } Attribs pool
* /
2011-03-26 14:10:41 +01:00
exports . compose = function ( cs1 , cs2 , pool ) {
var unpacked1 = exports . unpack ( cs1 ) ;
var unpacked2 = exports . unpack ( cs2 ) ;
var len1 = unpacked1 . oldLen ;
var len2 = unpacked1 . newLen ;
exports . assert ( len2 == unpacked2 . oldLen , "mismatched composition" ) ;
var len3 = unpacked2 . newLen ;
var bankIter1 = exports . stringIterator ( unpacked1 . charBank ) ;
var bankIter2 = exports . stringIterator ( unpacked2 . charBank ) ;
var bankAssem = exports . stringAssembler ( ) ;
var newOps = exports . applyZip ( unpacked1 . ops , 0 , unpacked2 . ops , 0 , function ( op1 , op2 , opOut ) {
//var debugBuilder = exports.stringAssembler();
//debugBuilder.append(exports.opString(op1));
//debugBuilder.append(',');
//debugBuilder.append(exports.opString(op2));
//debugBuilder.append(' / ');
var op1code = op1 . opcode ;
var op2code = op2 . opcode ;
if ( op1code == '+' && op2code == '-' ) {
bankIter1 . skip ( Math . min ( op1 . chars , op2 . chars ) ) ;
}
exports . _slicerZipperFunc ( op1 , op2 , opOut , pool ) ;
if ( opOut . opcode == '+' ) {
if ( op2code == '+' ) {
bankAssem . append ( bankIter2 . take ( opOut . chars ) ) ;
} else {
bankAssem . append ( bankIter1 . take ( opOut . chars ) ) ;
}
}
//debugBuilder.append(exports.opString(op1));
//debugBuilder.append(',');
//debugBuilder.append(exports.opString(op2));
//debugBuilder.append(' -> ');
//debugBuilder.append(exports.opString(opOut));
//print(debugBuilder.toString());
} ) ;
return exports . pack ( len1 , len3 , newOps , bankAssem . toString ( ) ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* returns a function that tests if a string of attributes
* ( e . g . * 3 * 4 ) contains a given attribute key , value that
* is already present in the pool .
* @ param attribPair array [ key , value ] of the attribute
* @ param pool { AttribPool } Attribute pool
* /
2011-03-26 14:10:41 +01:00
exports . attributeTester = function ( attribPair , pool ) {
if ( ! pool ) {
return never ;
}
var attribNum = pool . putAttrib ( attribPair , true ) ;
if ( attribNum < 0 ) {
return never ;
} else {
var re = new RegExp ( '\\*' + exports . numToString ( attribNum ) + '(?!\\w)' ) ;
return function ( attribs ) {
return re . test ( attribs ) ;
} ;
}
function never ( attribs ) {
return false ;
}
} ;
2012-02-26 19:59:11 +01:00
/ * *
* creates the identity Changeset of length N
* @ param N { int } length of the identity changeset
* /
2011-03-26 14:10:41 +01:00
exports . identity = function ( N ) {
return exports . pack ( N , N , "" , "" ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* creates a Changeset which works on oldFullText and removes text
* from spliceStart to spliceStart + numRemoved and inserts newText
* instead . Also gives possibility to add attributes optNewTextAPairs
* for the new text .
* @ param oldFullText { string } old text
* @ param spliecStart { int } where splicing starts
* @ param numRemoved { int } number of characters to be removed
* @ param newText { string } string to be inserted
* @ param optNewTextAPairs { string } new pairs to be inserted
* @ param pool { AttribPool } Attribution Pool
* /
2011-03-26 14:10:41 +01:00
exports . makeSplice = function ( oldFullText , spliceStart , numRemoved , newText , optNewTextAPairs , pool ) {
var oldLen = oldFullText . length ;
if ( spliceStart >= oldLen ) {
spliceStart = oldLen - 1 ;
}
if ( numRemoved > oldFullText . length - spliceStart - 1 ) {
numRemoved = oldFullText . length - spliceStart - 1 ;
}
var oldText = oldFullText . substring ( spliceStart , spliceStart + numRemoved ) ;
var newLen = oldLen + newText . length - oldText . length ;
var assem = exports . smartOpAssembler ( ) ;
assem . appendOpWithText ( '=' , oldFullText . substring ( 0 , spliceStart ) ) ;
assem . appendOpWithText ( '-' , oldText ) ;
assem . appendOpWithText ( '+' , newText , optNewTextAPairs , pool ) ;
assem . endDocument ( ) ;
return exports . pack ( oldLen , newLen , assem . toString ( ) , newText ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Transforms a changeset into a list of splices in the form
* [ startChar , endChar , newText ] meaning replace text from
* startChar to endChar with newText
* @ param cs Changeset
* /
2011-03-26 14:10:41 +01:00
exports . toSplices = function ( cs ) {
2012-02-26 19:59:11 +01:00
//
2011-03-26 14:10:41 +01:00
var unpacked = exports . unpack ( cs ) ;
var splices = [ ] ;
var oldPos = 0 ;
var iter = exports . opIterator ( unpacked . ops ) ;
var charIter = exports . stringIterator ( unpacked . charBank ) ;
var inSplice = false ;
while ( iter . hasNext ( ) ) {
var op = iter . next ( ) ;
if ( op . opcode == '=' ) {
oldPos += op . chars ;
inSplice = false ;
} else {
if ( ! inSplice ) {
splices . push ( [ oldPos , oldPos , "" ] ) ;
inSplice = true ;
}
if ( op . opcode == '-' ) {
oldPos += op . chars ;
splices [ splices . length - 1 ] [ 1 ] += op . chars ;
} else if ( op . opcode == '+' ) {
splices [ splices . length - 1 ] [ 2 ] += charIter . take ( op . chars ) ;
}
}
}
return splices ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
*
* /
2011-03-26 14:10:41 +01:00
exports . characterRangeFollow = function ( cs , startChar , endChar , insertionsAfter ) {
var newStartChar = startChar ;
var newEndChar = endChar ;
var splices = exports . toSplices ( cs ) ;
var lengthChangeSoFar = 0 ;
for ( var i = 0 ; i < splices . length ; i ++ ) {
var splice = splices [ i ] ;
var spliceStart = splice [ 0 ] + lengthChangeSoFar ;
var spliceEnd = splice [ 1 ] + lengthChangeSoFar ;
var newTextLength = splice [ 2 ] . length ;
var thisLengthChange = newTextLength - ( spliceEnd - spliceStart ) ;
if ( spliceStart <= newStartChar && spliceEnd >= newEndChar ) {
// splice fully replaces/deletes range
// (also case that handles insertion at a collapsed selection)
if ( insertionsAfter ) {
newStartChar = newEndChar = spliceStart ;
} else {
newStartChar = newEndChar = spliceStart + newTextLength ;
}
} else if ( spliceEnd <= newStartChar ) {
// splice is before range
newStartChar += thisLengthChange ;
newEndChar += thisLengthChange ;
} else if ( spliceStart >= newEndChar ) {
// splice is after range
} else if ( spliceStart >= newStartChar && spliceEnd <= newEndChar ) {
// splice is inside range
newEndChar += thisLengthChange ;
} else if ( spliceEnd < newEndChar ) {
// splice overlaps beginning of range
newStartChar = spliceStart + newTextLength ;
newEndChar += thisLengthChange ;
} else {
// splice overlaps end of range
newEndChar = spliceStart ;
}
lengthChangeSoFar += thisLengthChange ;
}
return [ newStartChar , newEndChar ] ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Iterate over attributes in a changeset and move them from
* oldPool to newPool
* @ param cs { Changeset } Chageset / attribution string to be iterated over
* @ param oldPool { AttribPool } old attributes pool
* @ param newPool { AttribPool } new attributes pool
* @ return { string } the new Changeset
* /
2011-03-26 14:10:41 +01:00
exports . moveOpsToNewPool = function ( cs , oldPool , newPool ) {
// works on exports or attribution string
var dollarPos = cs . indexOf ( '$' ) ;
if ( dollarPos < 0 ) {
dollarPos = cs . length ;
}
var upToDollar = cs . substring ( 0 , dollarPos ) ;
var fromDollar = cs . substring ( dollarPos ) ;
// order of attribs stays the same
return upToDollar . replace ( /\*([0-9a-z]+)/g , function ( _ , a ) {
var oldNum = exports . parseNum ( a ) ;
var pair = oldPool . getAttrib ( oldNum ) ;
var newNum = newPool . putAttrib ( pair ) ;
return '*' + exports . numToString ( newNum ) ;
} ) + fromDollar ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* create an attribution inserting a text
* @ param text { string } text to be inserted
* /
2011-03-26 14:10:41 +01:00
exports . makeAttribution = function ( text ) {
var assem = exports . smartOpAssembler ( ) ;
assem . appendOpWithText ( '+' , text ) ;
return assem . toString ( ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Iterates over attributes in exports , attribution string , or attribs property of an op
* and runs function func on them
* @ param cs { Changeset } changeset
* @ param func { function } function to be called
* /
2011-03-26 14:10:41 +01:00
exports . eachAttribNumber = function ( cs , func ) {
var dollarPos = cs . indexOf ( '$' ) ;
if ( dollarPos < 0 ) {
dollarPos = cs . length ;
}
var upToDollar = cs . substring ( 0 , dollarPos ) ;
upToDollar . replace ( /\*([0-9a-z]+)/g , function ( _ , a ) {
func ( exports . parseNum ( a ) ) ;
return '' ;
} ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Filter attributes which should remain in a Changeset
* callable on a exports , attribution string , or attribs property of an op ,
* though it may easily create adjacent ops that can be merged .
* @ param cs { Changeset } changeset to be filtered
* @ param filter { function } fnc which returns true if an
* attribute X ( int ) should be kept in the Changeset
* /
2011-03-26 14:10:41 +01:00
exports . filterAttribNumbers = function ( cs , filter ) {
return exports . mapAttribNumbers ( cs , filter ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* does exactly the same as exports . filterAttribNumbers
* /
2011-03-26 14:10:41 +01:00
exports . mapAttribNumbers = function ( cs , func ) {
var dollarPos = cs . indexOf ( '$' ) ;
if ( dollarPos < 0 ) {
dollarPos = cs . length ;
}
var upToDollar = cs . substring ( 0 , dollarPos ) ;
var newUpToDollar = upToDollar . replace ( /\*([0-9a-z]+)/g , function ( s , a ) {
var n = func ( exports . parseNum ( a ) ) ;
if ( n === true ) {
return s ;
} else if ( ( typeof n ) === "number" ) {
return '*' + exports . numToString ( n ) ;
} else {
return '' ;
}
} ) ;
return newUpToDollar + cs . substring ( dollarPos ) ;
} ;
2012-02-26 13:18:17 +01:00
/ * *
* Create a Changeset going from Identity to a certain state
* @ params text { string } text of the final change
* @ attribs attribs { string } optional , operations which insert
* the text and also puts the right attributes
* /
2011-03-26 14:10:41 +01:00
exports . makeAText = function ( text , attribs ) {
return {
text : text ,
attribs : ( attribs || exports . makeAttribution ( text ) )
} ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Apply a Changeset to a AText
* @ param cs { Changeset } Changeset to be applied
* @ param atext { AText }
* @ param pool { AttribPool } Attribute Pool to add to
* /
2011-03-26 14:10:41 +01:00
exports . applyToAText = function ( cs , atext , pool ) {
return {
text : exports . applyToText ( cs , atext . text ) ,
attribs : exports . applyToAttribution ( cs , atext . attribs , pool )
} ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Clones a AText structure
* @ param atext { AText }
* /
2011-03-26 14:10:41 +01:00
exports . cloneAText = function ( atext ) {
return {
text : atext . text ,
attribs : atext . attribs
} ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Copies a AText structure from atext1 to atext2
* @ param atext { AText }
* /
2011-03-26 14:10:41 +01:00
exports . copyAText = function ( atext1 , atext2 ) {
atext2 . text = atext1 . text ;
atext2 . attribs = atext1 . attribs ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Append the set of operations from atext to an assembler
* @ param atext { AText }
* @ param assem Assembler like smartOpAssembler
* /
2011-03-26 14:10:41 +01:00
exports . appendATextToAssembler = function ( atext , assem ) {
// intentionally skips last newline char of atext
var iter = exports . opIterator ( atext . attribs ) ;
var op = exports . newOp ( ) ;
while ( iter . hasNext ( ) ) {
iter . next ( op ) ;
if ( ! iter . hasNext ( ) ) {
// last op, exclude final newline
if ( op . lines <= 1 ) {
op . lines = 0 ;
op . chars -- ;
if ( op . chars ) {
assem . append ( op ) ;
}
} else {
var nextToLastNewlineEnd =
atext . text . lastIndexOf ( '\n' , atext . text . length - 2 ) + 1 ;
var lastLineLength = atext . text . length - nextToLastNewlineEnd - 1 ;
op . lines -- ;
op . chars -= ( lastLineLength + 1 ) ;
assem . append ( op ) ;
op . lines = 0 ;
op . chars = lastLineLength ;
if ( op . chars ) {
assem . append ( op ) ;
}
}
} else {
assem . append ( op ) ;
}
}
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Creates a clone of a Changeset and it ' s APool
* @ param cs { Changeset }
* @ param pool { AtributePool }
* /
2013-04-08 20:46:45 +02:00
var lastEvent = null ; // This is just a temporary measure to ensure we don't send the exact same changeset twice
// Documentation for this is available at https://github.com/ether/etherpad-lite/issues/1652
2011-03-26 14:10:41 +01:00
exports . prepareForWire = function ( cs , pool ) {
2013-04-08 20:46:45 +02:00
if ( cs == lastEvent ) {
throw new Error ( "Not sending the same event twice..." ) ;
return false ;
}
2012-03-18 09:05:46 +01:00
var newPool = new AttributePool ( ) ;
2011-03-26 14:10:41 +01:00
var newCs = exports . moveOpsToNewPool ( cs , pool , newPool ) ;
2013-04-08 20:46:45 +02:00
lastEvent = cs ;
2011-03-26 14:10:41 +01:00
return {
translated : newCs ,
2013-04-08 20:46:45 +02:00
pool : newPool
2011-03-26 14:10:41 +01:00
} ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Checks if a changeset s the identity changeset
* /
2011-03-26 14:10:41 +01:00
exports . isIdentity = function ( cs ) {
var unpacked = exports . unpack ( cs ) ;
return unpacked . ops == "" && unpacked . oldLen == unpacked . newLen ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* returns all the values of attributes with a certain key
* in an Op attribs string
* @ param attribs { string } Attribute string of a Op
* @ param key { string } string to be seached for
* @ param pool { AttribPool } attribute pool
* /
2011-03-26 14:10:41 +01:00
exports . opAttributeValue = function ( op , key , pool ) {
return exports . attribsAttributeValue ( op . attribs , key , pool ) ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* returns all the values of attributes with a certain key
* in an attribs string
* @ param attribs { string } Attribute string
* @ param key { string } string to be seached for
* @ param pool { AttribPool } attribute pool
* /
2011-03-26 14:10:41 +01:00
exports . attribsAttributeValue = function ( attribs , key , pool ) {
var value = '' ;
if ( attribs ) {
exports . eachAttribNumber ( attribs , function ( n ) {
if ( pool . getAttribKey ( n ) == key ) {
value = pool . getAttribValue ( n ) ;
}
} ) ;
}
return value ;
} ;
2012-02-26 19:59:11 +01:00
/ * *
* Creates a Changeset builder for a string with initial
* length oldLen . Allows to add / remove parts of it
* @ param oldLen { int } Old length
* /
2011-03-26 14:10:41 +01:00
exports . builder = function ( oldLen ) {
var assem = exports . smartOpAssembler ( ) ;
var o = exports . newOp ( ) ;
var charBank = exports . stringAssembler ( ) ;
var self = {
// attribs are [[key1,value1],[key2,value2],...] or '*0*1...' (no pool needed in latter case)
keep : function ( N , L , attribs , pool ) {
o . opcode = '=' ;
o . attribs = ( attribs && exports . makeAttribsString ( '=' , attribs , pool ) ) || '' ;
o . chars = N ;
o . lines = ( L || 0 ) ;
assem . append ( o ) ;
return self ;
} ,
keepText : function ( text , attribs , pool ) {
assem . appendOpWithText ( '=' , text , attribs , pool ) ;
return self ;
} ,
insert : function ( text , attribs , pool ) {
assem . appendOpWithText ( '+' , text , attribs , pool ) ;
charBank . append ( text ) ;
return self ;
} ,
remove : function ( N , L ) {
o . opcode = '-' ;
o . attribs = '' ;
o . chars = N ;
o . lines = ( L || 0 ) ;
assem . append ( o ) ;
return self ;
} ,
toString : function ( ) {
assem . endDocument ( ) ;
var newLen = oldLen + assem . getLengthChange ( ) ;
return exports . pack ( oldLen , newLen , assem . toString ( ) , charBank . toString ( ) ) ;
}
} ;
return self ;
} ;
exports . makeAttribsString = function ( opcode , attribs , pool ) {
// makeAttribsString(opcode, '*3') or makeAttribsString(opcode, [['foo','bar']], myPool) work
if ( ! attribs ) {
return '' ;
} else if ( ( typeof attribs ) == "string" ) {
return attribs ;
} else if ( pool && attribs && attribs . length ) {
if ( attribs . length > 1 ) {
attribs = attribs . slice ( ) ;
attribs . sort ( ) ;
}
var result = [ ] ;
for ( var i = 0 ; i < attribs . length ; i ++ ) {
var pair = attribs [ i ] ;
if ( opcode == '=' || ( opcode == '+' && pair [ 1 ] ) ) {
result . push ( '*' + exports . numToString ( pool . putAttrib ( pair ) ) ) ;
}
}
return result . join ( '' ) ;
}
} ;
// like "substring" but on a single-line attribution string
exports . subattribution = function ( astr , start , optEnd ) {
var iter = exports . opIterator ( astr , 0 ) ;
var assem = exports . smartOpAssembler ( ) ;
var attOp = exports . newOp ( ) ;
var csOp = exports . newOp ( ) ;
var opOut = exports . newOp ( ) ;
function doCsOp ( ) {
if ( csOp . chars ) {
while ( csOp . opcode && ( attOp . opcode || iter . hasNext ( ) ) ) {
if ( ! attOp . opcode ) iter . next ( attOp ) ;
if ( csOp . opcode && attOp . opcode && csOp . chars >= attOp . chars && attOp . lines > 0 && csOp . lines <= 0 ) {
csOp . lines ++ ;
}
exports . _slicerZipperFunc ( attOp , csOp , opOut , null ) ;
if ( opOut . opcode ) {
assem . append ( opOut ) ;
opOut . opcode = '' ;
}
}
}
}
csOp . opcode = '-' ;
csOp . chars = start ;
doCsOp ( ) ;
if ( optEnd === undefined ) {
if ( attOp . opcode ) {
assem . append ( attOp ) ;
}
while ( iter . hasNext ( ) ) {
iter . next ( attOp ) ;
assem . append ( attOp ) ;
}
} else {
csOp . opcode = '=' ;
csOp . chars = optEnd - start ;
doCsOp ( ) ;
}
return assem . toString ( ) ;
} ;
exports . inverse = function ( cs , lines , alines , pool ) {
// lines and alines are what the exports is meant to apply to.
// They may be arrays or objects with .get(i) and .length methods.
// They include final newlines on lines.
function lines _get ( idx ) {
if ( lines . get ) {
return lines . get ( idx ) ;
} else {
return lines [ idx ] ;
}
}
function lines _length ( ) {
if ( ( typeof lines . length ) == "number" ) {
return lines . length ;
} else {
return lines . length ( ) ;
}
}
function alines _get ( idx ) {
if ( alines . get ) {
return alines . get ( idx ) ;
} else {
return alines [ idx ] ;
}
}
function alines _length ( ) {
if ( ( typeof alines . length ) == "number" ) {
return alines . length ;
} else {
return alines . length ( ) ;
}
}
var curLine = 0 ;
var curChar = 0 ;
var curLineOpIter = null ;
var curLineOpIterLine ;
var curLineNextOp = exports . newOp ( '+' ) ;
var unpacked = exports . unpack ( cs ) ;
var csIter = exports . opIterator ( unpacked . ops ) ;
var builder = exports . builder ( unpacked . newLen ) ;
function consumeAttribRuns ( numChars , func /*(len, attribs, endsLine)*/ ) {
if ( ( ! curLineOpIter ) || ( curLineOpIterLine != curLine ) ) {
// create curLineOpIter and advance it to curChar
curLineOpIter = exports . opIterator ( alines _get ( curLine ) ) ;
curLineOpIterLine = curLine ;
var indexIntoLine = 0 ;
var done = false ;
while ( ! done ) {
curLineOpIter . next ( curLineNextOp ) ;
if ( indexIntoLine + curLineNextOp . chars >= curChar ) {
curLineNextOp . chars -= ( curChar - indexIntoLine ) ;
done = true ;
} else {
indexIntoLine += curLineNextOp . chars ;
}
}
}
while ( numChars > 0 ) {
if ( ( ! curLineNextOp . chars ) && ( ! curLineOpIter . hasNext ( ) ) ) {
curLine ++ ;
curChar = 0 ;
curLineOpIterLine = curLine ;
curLineNextOp . chars = 0 ;
curLineOpIter = exports . opIterator ( alines _get ( curLine ) ) ;
}
if ( ! curLineNextOp . chars ) {
curLineOpIter . next ( curLineNextOp ) ;
}
var charsToUse = Math . min ( numChars , curLineNextOp . chars ) ;
func ( charsToUse , curLineNextOp . attribs , charsToUse == curLineNextOp . chars && curLineNextOp . lines > 0 ) ;
numChars -= charsToUse ;
curLineNextOp . chars -= charsToUse ;
curChar += charsToUse ;
}
if ( ( ! curLineNextOp . chars ) && ( ! curLineOpIter . hasNext ( ) ) ) {
curLine ++ ;
curChar = 0 ;
}
}
function skip ( N , L ) {
if ( L ) {
curLine += L ;
curChar = 0 ;
} else {
if ( curLineOpIter && curLineOpIterLine == curLine ) {
consumeAttribRuns ( N , function ( ) { } ) ;
} else {
curChar += N ;
}
}
}
function nextText ( numChars ) {
var len = 0 ;
var assem = exports . stringAssembler ( ) ;
var firstString = lines _get ( curLine ) . substring ( curChar ) ;
len += firstString . length ;
assem . append ( firstString ) ;
var lineNum = curLine + 1 ;
while ( len < numChars ) {
var nextString = lines _get ( lineNum ) ;
len += nextString . length ;
assem . append ( nextString ) ;
lineNum ++ ;
}
return assem . toString ( ) . substring ( 0 , numChars ) ;
}
function cachedStrFunc ( func ) {
var cache = { } ;
return function ( s ) {
if ( ! cache [ s ] ) {
cache [ s ] = func ( s ) ;
}
return cache [ s ] ;
} ;
}
var attribKeys = [ ] ;
var attribValues = [ ] ;
while ( csIter . hasNext ( ) ) {
var csOp = csIter . next ( ) ;
if ( csOp . opcode == '=' ) {
if ( csOp . attribs ) {
attribKeys . length = 0 ;
attribValues . length = 0 ;
exports . eachAttribNumber ( csOp . attribs , function ( n ) {
attribKeys . push ( pool . getAttribKey ( n ) ) ;
attribValues . push ( pool . getAttribValue ( n ) ) ;
} ) ;
var undoBackToAttribs = cachedStrFunc ( function ( attribs ) {
var backAttribs = [ ] ;
for ( var i = 0 ; i < attribKeys . length ; i ++ ) {
var appliedKey = attribKeys [ i ] ;
var appliedValue = attribValues [ i ] ;
var oldValue = exports . attribsAttributeValue ( attribs , appliedKey , pool ) ;
if ( appliedValue != oldValue ) {
backAttribs . push ( [ appliedKey , oldValue ] ) ;
}
}
return exports . makeAttribsString ( '=' , backAttribs , pool ) ;
} ) ;
consumeAttribRuns ( csOp . chars , function ( len , attribs , endsLine ) {
builder . keep ( len , endsLine ? 1 : 0 , undoBackToAttribs ( attribs ) ) ;
} ) ;
} else {
skip ( csOp . chars , csOp . lines ) ;
builder . keep ( csOp . chars , csOp . lines ) ;
}
} else if ( csOp . opcode == '+' ) {
builder . remove ( csOp . chars , csOp . lines ) ;
} else if ( csOp . opcode == '-' ) {
var textBank = nextText ( csOp . chars ) ;
var textBankIndex = 0 ;
consumeAttribRuns ( csOp . chars , function ( len , attribs , endsLine ) {
builder . insert ( textBank . substr ( textBankIndex , len ) , attribs ) ;
textBankIndex += len ;
} ) ;
}
}
return exports . checkRep ( builder . toString ( ) ) ;
} ;
// %CLIENT FILE ENDS HERE%
exports . follow = function ( cs1 , cs2 , reverseInsertOrder , pool ) {
var unpacked1 = exports . unpack ( cs1 ) ;
var unpacked2 = exports . unpack ( cs2 ) ;
var len1 = unpacked1 . oldLen ;
var len2 = unpacked2 . oldLen ;
exports . assert ( len1 == len2 , "mismatched follow" ) ;
var chars1 = exports . stringIterator ( unpacked1 . charBank ) ;
var chars2 = exports . stringIterator ( unpacked2 . charBank ) ;
var oldLen = unpacked1 . newLen ;
var oldPos = 0 ;
var newLen = 0 ;
var hasInsertFirst = exports . attributeTester ( [ 'insertorder' , 'first' ] , pool ) ;
var newOps = exports . applyZip ( unpacked1 . ops , 0 , unpacked2 . ops , 0 , function ( op1 , op2 , opOut ) {
if ( op1 . opcode == '+' || op2 . opcode == '+' ) {
var whichToDo ;
if ( op2 . opcode != '+' ) {
whichToDo = 1 ;
} else if ( op1 . opcode != '+' ) {
whichToDo = 2 ;
} else {
// both +
var firstChar1 = chars1 . peek ( 1 ) ;
var firstChar2 = chars2 . peek ( 1 ) ;
var insertFirst1 = hasInsertFirst ( op1 . attribs ) ;
var insertFirst2 = hasInsertFirst ( op2 . attribs ) ;
if ( insertFirst1 && ! insertFirst2 ) {
whichToDo = 1 ;
} else if ( insertFirst2 && ! insertFirst1 ) {
whichToDo = 2 ;
}
// insert string that doesn't start with a newline first so as not to break up lines
else if ( firstChar1 == '\n' && firstChar2 != '\n' ) {
whichToDo = 2 ;
} else if ( firstChar1 != '\n' && firstChar2 == '\n' ) {
whichToDo = 1 ;
}
// break symmetry:
else if ( reverseInsertOrder ) {
whichToDo = 2 ;
} else {
whichToDo = 1 ;
}
}
if ( whichToDo == 1 ) {
chars1 . skip ( op1 . chars ) ;
opOut . opcode = '=' ;
opOut . lines = op1 . lines ;
opOut . chars = op1 . chars ;
opOut . attribs = '' ;
op1 . opcode = '' ;
} else {
// whichToDo == 2
chars2 . skip ( op2 . chars ) ;
exports . copyOp ( op2 , opOut ) ;
op2 . opcode = '' ;
}
} else if ( op1 . opcode == '-' ) {
if ( ! op2 . opcode ) {
op1 . opcode = '' ;
} else {
if ( op1 . chars <= op2 . chars ) {
op2 . chars -= op1 . chars ;
op2 . lines -= op1 . lines ;
op1 . opcode = '' ;
if ( ! op2 . chars ) {
op2 . opcode = '' ;
}
} else {
op1 . chars -= op2 . chars ;
op1 . lines -= op2 . lines ;
op2 . opcode = '' ;
}
}
} else if ( op2 . opcode == '-' ) {
exports . copyOp ( op2 , opOut ) ;
if ( ! op1 . opcode ) {
op2 . opcode = '' ;
} else if ( op2 . chars <= op1 . chars ) {
// delete part or all of a keep
op1 . chars -= op2 . chars ;
op1 . lines -= op2 . lines ;
op2 . opcode = '' ;
if ( ! op1 . chars ) {
op1 . opcode = '' ;
}
} else {
// delete all of a keep, and keep going
opOut . lines = op1 . lines ;
opOut . chars = op1 . chars ;
op2 . lines -= op1 . lines ;
op2 . chars -= op1 . chars ;
op1 . opcode = '' ;
}
} else if ( ! op1 . opcode ) {
exports . copyOp ( op2 , opOut ) ;
op2 . opcode = '' ;
} else if ( ! op2 . opcode ) {
exports . copyOp ( op1 , opOut ) ;
op1 . opcode = '' ;
} else {
// both keeps
opOut . opcode = '=' ;
opOut . attribs = exports . followAttributes ( op1 . attribs , op2 . attribs , pool ) ;
if ( op1 . chars <= op2 . chars ) {
opOut . chars = op1 . chars ;
opOut . lines = op1 . lines ;
op2 . chars -= op1 . chars ;
op2 . lines -= op1 . lines ;
op1 . opcode = '' ;
if ( ! op2 . chars ) {
op2 . opcode = '' ;
}
} else {
opOut . chars = op2 . chars ;
opOut . lines = op2 . lines ;
op1 . chars -= op2 . chars ;
op1 . lines -= op2 . lines ;
op2 . opcode = '' ;
}
}
switch ( opOut . opcode ) {
case '=' :
oldPos += opOut . chars ;
newLen += opOut . chars ;
break ;
case '-' :
oldPos += opOut . chars ;
break ;
case '+' :
newLen += opOut . chars ;
break ;
}
} ) ;
newLen += oldLen - oldPos ;
return exports . pack ( oldLen , newLen , newOps , unpacked2 . charBank ) ;
} ;
exports . followAttributes = function ( att1 , att2 , pool ) {
// The merge of two sets of attribute changes to the same text
// takes the lexically-earlier value if there are two values
// for the same key. Otherwise, all key/value changes from
// both attribute sets are taken. This operation is the "follow",
// so a set of changes is produced that can be applied to att1
// to produce the merged set.
if ( ( ! att2 ) || ( ! pool ) ) return '' ;
if ( ! att1 ) return att2 ;
var atts = [ ] ;
att2 . replace ( /\*([0-9a-z]+)/g , function ( _ , a ) {
atts . push ( pool . getAttrib ( exports . parseNum ( a ) ) ) ;
return '' ;
} ) ;
att1 . replace ( /\*([0-9a-z]+)/g , function ( _ , a ) {
var pair1 = pool . getAttrib ( exports . parseNum ( a ) ) ;
for ( var i = 0 ; i < atts . length ; i ++ ) {
var pair2 = atts [ i ] ;
if ( pair1 [ 0 ] == pair2 [ 0 ] ) {
if ( pair1 [ 1 ] <= pair2 [ 1 ] ) {
// winner of merge is pair1, delete this attribute
atts . splice ( i , 1 ) ;
}
break ;
}
}
return '' ;
} ) ;
// we've only removed attributes, so they're already sorted
var buf = exports . stringAssembler ( ) ;
for ( var i = 0 ; i < atts . length ; i ++ ) {
buf . append ( '*' ) ;
buf . append ( exports . numToString ( pool . putAttrib ( atts [ i ] ) ) ) ;
}
return buf . toString ( ) ;
} ;
2013-01-27 16:40:37 +01:00
exports . composeWithDeletions = function ( cs1 , cs2 , pool ) {
var unpacked1 = exports . unpack ( cs1 ) ;
var unpacked2 = exports . unpack ( cs2 ) ;
var len1 = unpacked1 . oldLen ;
var len2 = unpacked1 . newLen ;
exports . assert ( len2 == unpacked2 . oldLen , "mismatched composition" ) ;
var len3 = unpacked2 . newLen ;
var bankIter1 = exports . stringIterator ( unpacked1 . charBank ) ;
var bankIter2 = exports . stringIterator ( unpacked2 . charBank ) ;
var bankAssem = exports . stringAssembler ( ) ;
var newOps = exports . applyZip ( unpacked1 . ops , 0 , unpacked2 . ops , 0 , function ( op1 , op2 , opOut ) {
var op1code = op1 . opcode ;
var op2code = op2 . opcode ;
if ( op1code == '+' && op2code == '-' ) {
bankIter1 . skip ( Math . min ( op1 . chars , op2 . chars ) ) ;
}
exports . _slicerZipperFuncWithDeletions ( op1 , op2 , opOut , pool ) ;
if ( opOut . opcode == '+' ) {
if ( op2code == '+' ) {
bankAssem . append ( bankIter2 . take ( opOut . chars ) ) ;
} else {
bankAssem . append ( bankIter1 . take ( opOut . chars ) ) ;
}
}
} ) ;
return exports . pack ( len1 , len3 , newOps , bankAssem . toString ( ) ) ;
} ;
// This function is 95% like _slicerZipperFunc, we just changed two lines to ensure it merges the attribs of deletions properly.
// This is necassary for correct paddiff. But to ensure these changes doesn't affect anything else, we've created a seperate function only used for paddiffs
exports . _slicerZipperFuncWithDeletions = function ( attOp , csOp , opOut , pool ) {
// attOp is the op from the sequence that is being operated on, either an
// attribution string or the earlier of two exportss being composed.
// pool can be null if definitely not needed.
//print(csOp.toSource()+" "+attOp.toSource()+" "+opOut.toSource());
if ( attOp . opcode == '-' ) {
exports . copyOp ( attOp , opOut ) ;
attOp . opcode = '' ;
} else if ( ! attOp . opcode ) {
exports . copyOp ( csOp , opOut ) ;
csOp . opcode = '' ;
} else {
switch ( csOp . opcode ) {
case '-' :
{
if ( csOp . chars <= attOp . chars ) {
// delete or delete part
if ( attOp . opcode == '=' ) {
opOut . opcode = '-' ;
opOut . chars = csOp . chars ;
opOut . lines = csOp . lines ;
opOut . attribs = csOp . attribs ; //changed by yammer
}
attOp . chars -= csOp . chars ;
attOp . lines -= csOp . lines ;
csOp . opcode = '' ;
if ( ! attOp . chars ) {
attOp . opcode = '' ;
}
} else {
// delete and keep going
if ( attOp . opcode == '=' ) {
opOut . opcode = '-' ;
opOut . chars = attOp . chars ;
opOut . lines = attOp . lines ;
opOut . attribs = csOp . attribs ; //changed by yammer
}
csOp . chars -= attOp . chars ;
csOp . lines -= attOp . lines ;
attOp . opcode = '' ;
}
break ;
}
case '+' :
{
// insert
exports . copyOp ( csOp , opOut ) ;
csOp . opcode = '' ;
break ;
}
case '=' :
{
if ( csOp . chars <= attOp . chars ) {
// keep or keep part
opOut . opcode = attOp . opcode ;
opOut . chars = csOp . chars ;
opOut . lines = csOp . lines ;
opOut . attribs = exports . composeAttributes ( attOp . attribs , csOp . attribs , attOp . opcode == '=' , pool ) ;
csOp . opcode = '' ;
attOp . chars -= csOp . chars ;
attOp . lines -= csOp . lines ;
if ( ! attOp . chars ) {
attOp . opcode = '' ;
}
} else {
// keep and keep going
opOut . opcode = attOp . opcode ;
opOut . chars = attOp . chars ;
opOut . lines = attOp . lines ;
opOut . attribs = exports . composeAttributes ( attOp . attribs , csOp . attribs , attOp . opcode == '=' , pool ) ;
attOp . opcode = '' ;
csOp . chars -= attOp . chars ;
csOp . lines -= attOp . lines ;
}
break ;
}
case '' :
{
exports . copyOp ( attOp , opOut ) ;
attOp . opcode = '' ;
break ;
}
}
}
} ;