From 83c03f88a24e0b93e963553c4f97f26bf8435877 Mon Sep 17 00:00:00 2001
From: "Shane F. Carr" <shane.carr@wustl.edu>
Date: Tue, 22 May 2018 06:59:46 -0700
Subject: [PATCH 1/2] Initial commit of utf32_string plumbing.  Changes all
 string operations to use functions instead of operators that coerce arguments
 to primitive types.  Checks or converts to utf32_string at the API boundary. 
 Changes unit test suite to be run twice, once with standard string and once
 with forced utf32_string.

---
 javascript/diff_match_patch_uncompressed.js | 466 ++++++++++++++++----
 javascript/tests/diff_match_patch_test.html |  29 +-
 javascript/tests/diff_match_patch_test.js   | 252 +++++++----
 3 files changed, 552 insertions(+), 195 deletions(-)

diff --git a/javascript/diff_match_patch_uncompressed.js b/javascript/diff_match_patch_uncompressed.js
index d56f2e7d..1830629d 100644
--- a/javascript/diff_match_patch_uncompressed.js
+++ b/javascript/diff_match_patch_uncompressed.js
@@ -101,13 +101,19 @@ diff_match_patch.prototype.diff_main = function(text1, text2, opt_checklines,
   }
 
   // Check for equality (speedup).
-  if (text1 == text2) {
+  if (text1.toString() == text2.toString()) {
     if (text1) {
       return [[DIFF_EQUAL, text1]];
     }
     return [];
   }
 
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(text1) || diff_match_patch.utf32_string.hasSupplemental(text2)) {
+    text1 = diff_match_patch.utf32_string.from(text1);
+    text2 = diff_match_patch.utf32_string.from(text2);
+  }
+
   if (typeof opt_checklines == 'undefined') {
     opt_checklines = true;
   }
@@ -129,10 +135,10 @@ diff_match_patch.prototype.diff_main = function(text1, text2, opt_checklines,
   var diffs = this.diff_compute_(text1, text2, checklines, deadline);
 
   // Restore the prefix and suffix.
-  if (commonprefix) {
+  if (commonprefix.length) {
     diffs.unshift([DIFF_EQUAL, commonprefix]);
   }
-  if (commonsuffix) {
+  if (commonsuffix.length) {
     diffs.push([DIFF_EQUAL, commonsuffix]);
   }
   this.diff_cleanupMerge(diffs);
@@ -154,14 +160,17 @@ diff_match_patch.prototype.diff_main = function(text1, text2, opt_checklines,
  */
 diff_match_patch.prototype.diff_compute_ = function(text1, text2, checklines,
     deadline) {
+  this.assertSafe_(text1);
+  this.assertSafe_(text2);
+
   var diffs;
 
-  if (!text1) {
+  if (!text1.length) {
     // Just add some text (speedup).
     return [[DIFF_INSERT, text2]];
   }
 
-  if (!text2) {
+  if (!text2.length) {
     // Just delete some text (speedup).
     return [[DIFF_DELETE, text1]];
   }
@@ -222,6 +231,9 @@ diff_match_patch.prototype.diff_compute_ = function(text1, text2, checklines,
  * @private
  */
 diff_match_patch.prototype.diff_lineMode_ = function(text1, text2, deadline) {
+  this.assertSafe_(text1);
+  this.assertSafe_(text2);
+
   // Scan the text on a line-by-line basis first.
   var a = this.diff_linesToChars_(text1, text2);
   text1 = a.chars1;
@@ -247,11 +259,11 @@ diff_match_patch.prototype.diff_lineMode_ = function(text1, text2, deadline) {
     switch (diffs[pointer][0]) {
       case DIFF_INSERT:
         count_insert++;
-        text_insert += diffs[pointer][1];
+        text_insert = text_insert.concat(diffs[pointer][1]);
         break;
       case DIFF_DELETE:
         count_delete++;
-        text_delete += diffs[pointer][1];
+        text_delete = text_delete.concat(diffs[pointer][1]);
         break;
       case DIFF_EQUAL:
         // Upon reaching an equality, check for prior redundancies.
@@ -291,6 +303,9 @@ diff_match_patch.prototype.diff_lineMode_ = function(text1, text2, deadline) {
  * @private
  */
 diff_match_patch.prototype.diff_bisect_ = function(text1, text2, deadline) {
+  this.assertSafe_(text1);
+  this.assertSafe_(text2);
+
   // Cache the text lengths to prevent multiple calls.
   var text1_length = text1.length;
   var text2_length = text2.length;
@@ -415,6 +430,9 @@ diff_match_patch.prototype.diff_bisect_ = function(text1, text2, deadline) {
  */
 diff_match_patch.prototype.diff_bisectSplit_ = function(text1, text2, x, y,
     deadline) {
+  this.assertSafe_(text1);
+  this.assertSafe_(text2);
+
   var text1a = text1.substring(0, x);
   var text2a = text2.substring(0, y);
   var text1b = text1.substring(x);
@@ -440,12 +458,15 @@ diff_match_patch.prototype.diff_bisectSplit_ = function(text1, text2, x, y,
  * @private
  */
 diff_match_patch.prototype.diff_linesToChars_ = function(text1, text2) {
+  this.assertSafe_(text1);
+  this.assertSafe_(text2);
+
   var lineArray = [];  // e.g. lineArray[4] == 'Hello\n'
   var lineHash = {};   // e.g. lineHash['Hello\n'] == 4
 
   // '\x00' is a valid character, but various debuggers don't like it.
   // So we'll insert a junk entry to avoid generating a null character.
-  lineArray[0] = '';
+  lineArray[0] = text1.substring(0, 0);
 
   /**
    * Split a text into an array of strings.  Reduce the texts to a string of
@@ -470,14 +491,15 @@ diff_match_patch.prototype.diff_linesToChars_ = function(text1, text2) {
         lineEnd = text.length - 1;
       }
       var line = text.substring(lineStart, lineEnd + 1);
+      var lineKey = line.toString();
       lineStart = lineEnd + 1;
 
-      if (lineHash.hasOwnProperty ? lineHash.hasOwnProperty(line) :
-          (lineHash[line] !== undefined)) {
-        chars += String.fromCharCode(lineHash[line]);
+      if (lineHash.hasOwnProperty ? lineHash.hasOwnProperty(lineKey) :
+          (lineHash[lineKey] !== undefined)) {
+        chars += String.fromCharCode(lineHash[lineKey]);
       } else {
         chars += String.fromCharCode(lineArrayLength);
-        lineHash[line] = lineArrayLength;
+        lineHash[lineKey] = lineArrayLength;
         lineArray[lineArrayLength++] = line;
       }
     }
@@ -498,13 +520,21 @@ diff_match_patch.prototype.diff_linesToChars_ = function(text1, text2) {
  * @private
  */
 diff_match_patch.prototype.diff_charsToLines_ = function(diffs, lineArray) {
+  this.assertSafe_(lineArray);
+
   for (var x = 0; x < diffs.length; x++) {
     var chars = diffs[x][1];
-    var text = [];
-    for (var y = 0; y < chars.length; y++) {
-      text[y] = lineArray[chars.charCodeAt(y)];
+    var text;
+    if (chars.length === 0) {
+      // don't lose string type (regular or utf32_string)
+      text = lineArray[0].substring(0, 0);
+    } else {
+      text = lineArray[chars.charCodeAt(0)]
+    }
+    for (var y = 1; y < chars.length; y++) {
+      text = text.concat(lineArray[chars.charCodeAt(y)]);
     }
-    diffs[x][1] = text.join('');
+    diffs[x][1] = text;
   }
 };
 
@@ -521,6 +551,13 @@ diff_match_patch.prototype.diff_commonPrefix = function(text1, text2) {
   if (!text1 || !text2 || text1.charAt(0) != text2.charAt(0)) {
     return 0;
   }
+
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(text1) || diff_match_patch.utf32_string.hasSupplemental(text2)) {
+    text1 = diff_match_patch.utf32_string.from(text1);
+    text2 = diff_match_patch.utf32_string.from(text2);
+  }
+
   // Binary search.
   // Performance analysis: http://neil.fraser.name/news/2007/10/09/
   var pointermin = 0;
@@ -528,8 +565,8 @@ diff_match_patch.prototype.diff_commonPrefix = function(text1, text2) {
   var pointermid = pointermax;
   var pointerstart = 0;
   while (pointermin < pointermid) {
-    if (text1.substring(pointerstart, pointermid) ==
-        text2.substring(pointerstart, pointermid)) {
+    if (text1.substring(pointerstart, pointermid).toString() ==
+        text2.substring(pointerstart, pointermid).toString()) {
       pointermin = pointermid;
       pointerstart = pointermin;
     } else {
@@ -553,6 +590,12 @@ diff_match_patch.prototype.diff_commonSuffix = function(text1, text2) {
       text1.charAt(text1.length - 1) != text2.charAt(text2.length - 1)) {
     return 0;
   }
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(text1) || diff_match_patch.utf32_string.hasSupplemental(text2)) {
+    text1 = diff_match_patch.utf32_string.from(text1);
+    text2 = diff_match_patch.utf32_string.from(text2);
+  }
+
   // Binary search.
   // Performance analysis: http://neil.fraser.name/news/2007/10/09/
   var pointermin = 0;
@@ -560,8 +603,8 @@ diff_match_patch.prototype.diff_commonSuffix = function(text1, text2) {
   var pointermid = pointermax;
   var pointerend = 0;
   while (pointermin < pointermid) {
-    if (text1.substring(text1.length - pointermid, text1.length - pointerend) ==
-        text2.substring(text2.length - pointermid, text2.length - pointerend)) {
+    if (text1.substring(text1.length - pointermid, text1.length - pointerend).toString() ==
+        text2.substring(text2.length - pointermid, text2.length - pointerend).toString()) {
       pointermin = pointermid;
       pointerend = pointermin;
     } else {
@@ -582,6 +625,9 @@ diff_match_patch.prototype.diff_commonSuffix = function(text1, text2) {
  * @private
  */
 diff_match_patch.prototype.diff_commonOverlap_ = function(text1, text2) {
+  this.assertSafe_(text1);
+  this.assertSafe_(text2);
+
   // Cache the text lengths to prevent multiple calls.
   var text1_length = text1.length;
   var text2_length = text2.length;
@@ -597,7 +643,7 @@ diff_match_patch.prototype.diff_commonOverlap_ = function(text1, text2) {
   }
   var text_length = Math.min(text1_length, text2_length);
   // Quick check for the worst case.
-  if (text1 == text2) {
+  if (text1.toString() == text2.toString()) {
     return text_length;
   }
 
@@ -613,8 +659,8 @@ diff_match_patch.prototype.diff_commonOverlap_ = function(text1, text2) {
       return best;
     }
     length += found;
-    if (found == 0 || text1.substring(text_length - length) ==
-        text2.substring(0, length)) {
+    if (found == 0 || text1.substring(text_length - length).toString() ==
+        text2.substring(0, length).toString()) {
       best = length;
       length++;
     }
@@ -634,6 +680,9 @@ diff_match_patch.prototype.diff_commonOverlap_ = function(text1, text2) {
  * @private
  */
 diff_match_patch.prototype.diff_halfMatch_ = function(text1, text2) {
+  this.assertSafe_(text1);
+  this.assertSafe_(text2);
+
   if (this.Diff_Timeout <= 0) {
     // Don't risk returning a non-optimal diff if we have unlimited time.
     return null;
@@ -661,7 +710,7 @@ diff_match_patch.prototype.diff_halfMatch_ = function(text1, text2) {
     // Start with a 1/4 length substring at position i as a seed.
     var seed = longtext.substring(i, i + Math.floor(longtext.length / 4));
     var j = -1;
-    var best_common = '';
+    var best_common = longtext.substring(0, 0);  // retain string type
     var best_longtext_a, best_longtext_b, best_shorttext_a, best_shorttext_b;
     while ((j = shorttext.indexOf(seed, j + 1)) != -1) {
       var prefixLength = dmp.diff_commonPrefix(longtext.substring(i),
@@ -669,8 +718,8 @@ diff_match_patch.prototype.diff_halfMatch_ = function(text1, text2) {
       var suffixLength = dmp.diff_commonSuffix(longtext.substring(0, i),
                                                shorttext.substring(0, j));
       if (best_common.length < suffixLength + prefixLength) {
-        best_common = shorttext.substring(j - suffixLength, j) +
-            shorttext.substring(j, j + prefixLength);
+        best_common = shorttext.substring(j - suffixLength, j).concat(
+            shorttext.substring(j, j + prefixLength));
         best_longtext_a = longtext.substring(0, i - suffixLength);
         best_longtext_b = longtext.substring(i + prefixLength);
         best_shorttext_a = shorttext.substring(0, j - suffixLength);
@@ -726,6 +775,8 @@ diff_match_patch.prototype.diff_halfMatch_ = function(text1, text2) {
  * @param {!Array.<!diff_match_patch.Diff>} diffs Array of diff tuples.
  */
 diff_match_patch.prototype.diff_cleanupSemantic = function(diffs) {
+  this.assertSafe_(diffs);
+
   var changes = false;
   var equalities = [];  // Stack of indices where equalities are found.
   var equalitiesLength = 0;  // Keeping our own length var is faster in JS.
@@ -841,6 +892,8 @@ diff_match_patch.prototype.diff_cleanupSemantic = function(diffs) {
  * @param {!Array.<!diff_match_patch.Diff>} diffs Array of diff tuples.
  */
 diff_match_patch.prototype.diff_cleanupSemanticLossless = function(diffs) {
+  this.assertSafe_(diffs);
+
   /**
    * Given two strings, compute a score representing whether the internal
    * boundary falls on logical boundaries.
@@ -852,7 +905,7 @@ diff_match_patch.prototype.diff_cleanupSemanticLossless = function(diffs) {
    * @private
    */
   function diff_cleanupSemanticScore_(one, two) {
-    if (!one || !two) {
+    if (!one.length || !two.length) {
       // Edges are the best.
       return 6;
     }
@@ -913,8 +966,8 @@ diff_match_patch.prototype.diff_cleanupSemanticLossless = function(diffs) {
       if (commonOffset) {
         var commonString = edit.substring(edit.length - commonOffset);
         equality1 = equality1.substring(0, equality1.length - commonOffset);
-        edit = commonString + edit.substring(0, edit.length - commonOffset);
-        equality2 = commonString + equality2;
+        edit = commonString.concat(edit.substring(0, edit.length - commonOffset));
+        equality2 = commonString.concat(equality2);
       }
 
       // Second, step character by character right, looking for the best fit.
@@ -924,8 +977,8 @@ diff_match_patch.prototype.diff_cleanupSemanticLossless = function(diffs) {
       var bestScore = diff_cleanupSemanticScore_(equality1, edit) +
           diff_cleanupSemanticScore_(edit, equality2);
       while (edit.charAt(0) === equality2.charAt(0)) {
-        equality1 += edit.charAt(0);
-        edit = edit.substring(1) + equality2.charAt(0);
+        equality1 = equality1.concat(edit.charAt(0));
+        edit = edit.substring(1).concat(equality2.charAt(0));
         equality2 = equality2.substring(1);
         var score = diff_cleanupSemanticScore_(equality1, edit) +
             diff_cleanupSemanticScore_(edit, equality2);
@@ -938,16 +991,16 @@ diff_match_patch.prototype.diff_cleanupSemanticLossless = function(diffs) {
         }
       }
 
-      if (diffs[pointer - 1][1] != bestEquality1) {
+      if (diffs[pointer - 1][1].toString() != bestEquality1.toString()) {
         // We have an improvement, save it back to the diff.
-        if (bestEquality1) {
+        if (bestEquality1.length) {
           diffs[pointer - 1][1] = bestEquality1;
         } else {
           diffs.splice(pointer - 1, 1);
           pointer--;
         }
         diffs[pointer][1] = bestEdit;
-        if (bestEquality2) {
+        if (bestEquality2.length) {
           diffs[pointer + 1][1] = bestEquality2;
         } else {
           diffs.splice(pointer + 1, 1);
@@ -971,6 +1024,8 @@ diff_match_patch.blanklineStartRegex_ = /^\r?\n\r?\n/;
  * @param {!Array.<!diff_match_patch.Diff>} diffs Array of diff tuples.
  */
 diff_match_patch.prototype.diff_cleanupEfficiency = function(diffs) {
+  this.assertSafe_(diffs);
+
   var changes = false;
   var equalities = [];  // Stack of indices where equalities are found.
   var equalitiesLength = 0;  // Keeping our own length var is faster in JS.
@@ -1053,23 +1108,27 @@ diff_match_patch.prototype.diff_cleanupEfficiency = function(diffs) {
  * @param {!Array.<!diff_match_patch.Diff>} diffs Array of diff tuples.
  */
 diff_match_patch.prototype.diff_cleanupMerge = function(diffs) {
-  diffs.push([DIFF_EQUAL, '']);  // Add a dummy entry at the end.
+  this.assertSafe_(diffs);
+  // Preserve string type:
+  var emptyString = (diffs.length === 0 ? '' : diffs[0][1].substring(0, 0));
+
+  diffs.push([DIFF_EQUAL, emptyString]);  // Add a dummy entry at the end.
   var pointer = 0;
   var count_delete = 0;
   var count_insert = 0;
-  var text_delete = '';
-  var text_insert = '';
+  var text_delete = emptyString;
+  var text_insert = emptyString;
   var commonlength;
   while (pointer < diffs.length) {
     switch (diffs[pointer][0]) {
       case DIFF_INSERT:
         count_insert++;
-        text_insert += diffs[pointer][1];
+        text_insert = text_insert.concat(diffs[pointer][1]);
         pointer++;
         break;
       case DIFF_DELETE:
         count_delete++;
-        text_delete += diffs[pointer][1];
+        text_delete = text_delete.concat(diffs[pointer][1]);
         pointer++;
         break;
       case DIFF_EQUAL:
@@ -1082,8 +1141,9 @@ diff_match_patch.prototype.diff_cleanupMerge = function(diffs) {
               if ((pointer - count_delete - count_insert) > 0 &&
                   diffs[pointer - count_delete - count_insert - 1][0] ==
                   DIFF_EQUAL) {
-                diffs[pointer - count_delete - count_insert - 1][1] +=
-                    text_insert.substring(0, commonlength);
+                diffs[pointer - count_delete - count_insert - 1][1] =
+                  diffs[pointer - count_delete - count_insert - 1][1].concat(
+                    text_insert.substring(0, commonlength));
               } else {
                 diffs.splice(0, 0, [DIFF_EQUAL,
                                     text_insert.substring(0, commonlength)]);
@@ -1096,7 +1156,7 @@ diff_match_patch.prototype.diff_cleanupMerge = function(diffs) {
             commonlength = this.diff_commonSuffix(text_insert, text_delete);
             if (commonlength !== 0) {
               diffs[pointer][1] = text_insert.substring(text_insert.length -
-                  commonlength) + diffs[pointer][1];
+                  commonlength).concat(diffs[pointer][1]);
               text_insert = text_insert.substring(0, text_insert.length -
                   commonlength);
               text_delete = text_delete.substring(0, text_delete.length -
@@ -1119,19 +1179,19 @@ diff_match_patch.prototype.diff_cleanupMerge = function(diffs) {
                     (count_delete ? 1 : 0) + (count_insert ? 1 : 0) + 1;
         } else if (pointer !== 0 && diffs[pointer - 1][0] == DIFF_EQUAL) {
           // Merge this equality with the previous one.
-          diffs[pointer - 1][1] += diffs[pointer][1];
+          diffs[pointer - 1][1] = diffs[pointer - 1][1].concat(diffs[pointer][1]);
           diffs.splice(pointer, 1);
         } else {
           pointer++;
         }
         count_insert = 0;
         count_delete = 0;
-        text_delete = '';
-        text_insert = '';
+        text_delete = emptyString;
+        text_insert = emptyString;
         break;
     }
   }
-  if (diffs[diffs.length - 1][1] === '') {
+  if (diffs[diffs.length - 1][1].length === 0) {
     diffs.pop();  // Remove the dummy entry at the end.
   }
 
@@ -1146,21 +1206,20 @@ diff_match_patch.prototype.diff_cleanupMerge = function(diffs) {
         diffs[pointer + 1][0] == DIFF_EQUAL) {
       // This is a single edit surrounded by equalities.
       if (diffs[pointer][1].substring(diffs[pointer][1].length -
-          diffs[pointer - 1][1].length) == diffs[pointer - 1][1]) {
+          diffs[pointer - 1][1].length).toString() == diffs[pointer - 1][1].toString()) {
         // Shift the edit over the previous equality.
-        diffs[pointer][1] = diffs[pointer - 1][1] +
+        diffs[pointer][1] = diffs[pointer - 1][1].concat(
             diffs[pointer][1].substring(0, diffs[pointer][1].length -
-                                        diffs[pointer - 1][1].length);
-        diffs[pointer + 1][1] = diffs[pointer - 1][1] + diffs[pointer + 1][1];
+                                        diffs[pointer - 1][1].length));
+        diffs[pointer + 1][1] = diffs[pointer - 1][1].concat(diffs[pointer + 1][1]);
         diffs.splice(pointer - 1, 1);
         changes = true;
-      } else if (diffs[pointer][1].substring(0, diffs[pointer + 1][1].length) ==
-          diffs[pointer + 1][1]) {
+      } else if (diffs[pointer][1].substring(0, diffs[pointer + 1][1].length).toString() ==
+          diffs[pointer + 1][1].toString()) {
         // Shift the edit over the next equality.
-        diffs[pointer - 1][1] += diffs[pointer + 1][1];
+        diffs[pointer - 1][1] = diffs[pointer - 1][1].concat(diffs[pointer + 1][1]);
         diffs[pointer][1] =
-            diffs[pointer][1].substring(diffs[pointer + 1][1].length) +
-            diffs[pointer + 1][1];
+            diffs[pointer][1].substring(diffs[pointer + 1][1].length).concat(            diffs[pointer + 1][1]);
         diffs.splice(pointer + 1, 1);
         changes = true;
       }
@@ -1183,6 +1242,8 @@ diff_match_patch.prototype.diff_cleanupMerge = function(diffs) {
  * @return {number} Location within text2.
  */
 diff_match_patch.prototype.diff_xIndex = function(diffs, loc) {
+  this.assertSafe_(diffs);
+
   var chars1 = 0;
   var chars2 = 0;
   var last_chars1 = 0;
@@ -1216,6 +1277,8 @@ diff_match_patch.prototype.diff_xIndex = function(diffs, loc) {
  * @return {string} HTML representation.
  */
 diff_match_patch.prototype.diff_prettyHtml = function(diffs) {
+  this.assertSafe_(diffs);
+
   var html = [];
   var pattern_amp = /&/g;
   var pattern_lt = /</g;
@@ -1228,13 +1291,13 @@ diff_match_patch.prototype.diff_prettyHtml = function(diffs) {
         .replace(pattern_gt, '&gt;').replace(pattern_para, '&para;<br>');
     switch (op) {
       case DIFF_INSERT:
-        html[x] = '<ins style="background:#e6ffe6;">' + text + '</ins>';
+        html[x] = '<ins style="background:#e6ffe6;">' + text.toString() + '</ins>';
         break;
       case DIFF_DELETE:
-        html[x] = '<del style="background:#ffe6e6;">' + text + '</del>';
+        html[x] = '<del style="background:#ffe6e6;">' + text.toString() + '</del>';
         break;
       case DIFF_EQUAL:
-        html[x] = '<span>' + text + '</span>';
+        html[x] = '<span>' + text.toString() + '</span>';
         break;
     }
   }
@@ -1248,13 +1311,28 @@ diff_match_patch.prototype.diff_prettyHtml = function(diffs) {
  * @return {string} Source text.
  */
 diff_match_patch.prototype.diff_text1 = function(diffs) {
+  return this.diff_text1_(diffs).toString();
+};
+
+
+/**
+ * Same as diff_text1 but might return a utf32_string.
+ * @private
+ */
+diff_match_patch.prototype.diff_text1_ = function(diffs) {
+  this.assertSafe_(diffs);
   var text = [];
   for (var x = 0; x < diffs.length; x++) {
     if (diffs[x][0] !== DIFF_INSERT) {
-      text[x] = diffs[x][1];
+      text[x] = diffs[x][1].toString();
     }
   }
-  return text.join('');
+  var retval = text.join('');
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(retval)) {
+    retval = diff_match_patch.utf32_string.from(retval);
+  }
+  return retval;
 };
 
 
@@ -1264,13 +1342,28 @@ diff_match_patch.prototype.diff_text1 = function(diffs) {
  * @return {string} Destination text.
  */
 diff_match_patch.prototype.diff_text2 = function(diffs) {
+  return this.diff_text2_(diffs).toString();
+};
+
+
+/**
+ * Same as diff_text2 but might return a utf32_string.
+ * @private
+ */
+diff_match_patch.prototype.diff_text2_ = function(diffs) {
+  this.assertSafe_(diffs);
   var text = [];
   for (var x = 0; x < diffs.length; x++) {
     if (diffs[x][0] !== DIFF_DELETE) {
-      text[x] = diffs[x][1];
+      text[x] = diffs[x][1].toString();
     }
   }
-  return text.join('');
+  var retval = text.join('');
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(retval)) {
+    retval = diff_match_patch.utf32_string.from(retval);
+  }
+  return retval;
 };
 
 
@@ -1281,6 +1374,7 @@ diff_match_patch.prototype.diff_text2 = function(diffs) {
  * @return {number} Number of changes.
  */
 diff_match_patch.prototype.diff_levenshtein = function(diffs) {
+  this.assertSafe_(diffs);
   var levenshtein = 0;
   var insertions = 0;
   var deletions = 0;
@@ -1316,6 +1410,7 @@ diff_match_patch.prototype.diff_levenshtein = function(diffs) {
  * @return {string} Delta text.
  */
 diff_match_patch.prototype.diff_toDelta = function(diffs) {
+  this.assertSafe_(diffs);
   var text = [];
   for (var x = 0; x < diffs.length; x++) {
     switch (diffs[x][0]) {
@@ -1343,6 +1438,11 @@ diff_match_patch.prototype.diff_toDelta = function(diffs) {
  * @throws {!Error} If invalid input.
  */
 diff_match_patch.prototype.diff_fromDelta = function(text1, delta) {
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(text1)) {
+    text1 = diff_match_patch.utf32_string.from(text1);
+  }
+
   var diffs = [];
   var diffsLength = 0;  // Keeping our own length var is faster in JS.
   var pointer = 0;  // Cursor in text1
@@ -1406,15 +1506,19 @@ diff_match_patch.prototype.match_main = function(text, pattern, loc) {
   if (text == null || pattern == null || loc == null) {
     throw new Error('Null input. (match_main)');
   }
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(text)) {
+    text = diff_match_patch.utf32_string.from(text);
+  }
 
   loc = Math.max(0, Math.min(loc, text.length));
-  if (text == pattern) {
+  if (text.toString() == pattern.toString()) {
     // Shortcut (potentially not guaranteed by the algorithm)
     return 0;
   } else if (!text.length) {
     // Nothing to match.
     return -1;
-  } else if (text.substring(loc, loc + pattern.length) == pattern) {
+  } else if (text.substring(loc, loc + pattern.length).toString() == pattern.toString()) {
     // Perfect match at the perfect spot!  (Includes case of null pattern)
     return loc;
   } else {
@@ -1434,6 +1538,7 @@ diff_match_patch.prototype.match_main = function(text, pattern, loc) {
  * @private
  */
 diff_match_patch.prototype.match_bitap_ = function(text, pattern, loc) {
+  this.assertSafe_(text);
   if (pattern.length > this.Match_MaxBits) {
     throw new Error('Pattern too long for this browser.');
   }
@@ -1571,6 +1676,7 @@ diff_match_patch.prototype.match_alphabet_ = function(pattern) {
  * @private
  */
 diff_match_patch.prototype.patch_addContext_ = function(patch, text) {
+  this.assertSafe_(text);
   if (text.length == 0) {
     return;
   }
@@ -1591,13 +1697,13 @@ diff_match_patch.prototype.patch_addContext_ = function(patch, text) {
 
   // Add the prefix.
   var prefix = text.substring(patch.start2 - padding, patch.start2);
-  if (prefix) {
+  if (prefix.length) {
     patch.diffs.unshift([DIFF_EQUAL, prefix]);
   }
   // Add the suffix.
   var suffix = text.substring(patch.start2 + patch.length1,
                               patch.start2 + patch.length1 + padding);
-  if (suffix) {
+  if (suffix.length) {
     patch.diffs.push([DIFF_EQUAL, suffix]);
   }
 
@@ -1649,7 +1755,7 @@ diff_match_patch.prototype.patch_make = function(a, opt_b, opt_c) {
     // Method 2: diffs
     // Compute text1 from diffs.
     diffs = /** @type {!Array.<!diff_match_patch.Diff>} */(a);
-    text1 = this.diff_text1(diffs);
+    text1 = this.diff_text1_(diffs);
   } else if (typeof a == 'string' && opt_b && typeof opt_b == 'object' &&
       typeof opt_c == 'undefined') {
     // Method 3: text1, diffs
@@ -1665,6 +1771,11 @@ diff_match_patch.prototype.patch_make = function(a, opt_b, opt_c) {
     throw new Error('Unknown call format to patch_make.');
   }
 
+  this.assertSafe_(diffs);
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(text1)) {
+    text1 = diff_match_patch.utf32_string.from(text1);
+  }
   if (diffs.length === 0) {
     return [];  // Get rid of the null case.
   }
@@ -1692,15 +1803,15 @@ diff_match_patch.prototype.patch_make = function(a, opt_b, opt_c) {
       case DIFF_INSERT:
         patch.diffs[patchDiffLength++] = diffs[x];
         patch.length2 += diff_text.length;
-        postpatch_text = postpatch_text.substring(0, char_count2) + diff_text +
-                         postpatch_text.substring(char_count2);
+        postpatch_text = postpatch_text.substring(0, char_count2).concat(
+                         diff_text, postpatch_text.substring(char_count2));
         break;
       case DIFF_DELETE:
         patch.length1 += diff_text.length;
         patch.diffs[patchDiffLength++] = diffs[x];
-        postpatch_text = postpatch_text.substring(0, char_count2) +
-                         postpatch_text.substring(char_count2 +
-                             diff_text.length);
+        postpatch_text = postpatch_text.substring(0, char_count2).concat(
+                         postpatch_text.substring(
+                          char_count2 + diff_text.length));
         break;
       case DIFF_EQUAL:
         if (diff_text.length <= 2 * this.Patch_Margin &&
@@ -1783,11 +1894,16 @@ diff_match_patch.prototype.patch_apply = function(patches, text) {
     return [text, []];
   }
 
+  // Check for Unicode
+  if (diff_match_patch.utf32_string.hasSupplemental(text)) {
+    text = diff_match_patch.utf32_string.from(text);
+  }
+
   // Deep copy the patches so that no changes are made to originals.
   patches = this.patch_deepCopy(patches);
 
   var nullPadding = this.patch_addPadding(patches);
-  text = nullPadding + text + nullPadding;
+  text = nullPadding.concat(text, nullPadding);
 
   this.patch_splitMax(patches);
   // delta keeps track of the offset between the expected and actual location
@@ -1798,7 +1914,7 @@ diff_match_patch.prototype.patch_apply = function(patches, text) {
   var results = [];
   for (var x = 0; x < patches.length; x++) {
     var expected_loc = patches[x].start2 + delta;
-    var text1 = this.diff_text1(patches[x].diffs);
+    var text1 = this.diff_text1_(patches[x].diffs);
     var start_loc;
     var end_loc = -1;
     if (text1.length > this.Match_MaxBits) {
@@ -1833,11 +1949,11 @@ diff_match_patch.prototype.patch_apply = function(patches, text) {
       } else {
         text2 = text.substring(start_loc, end_loc + this.Match_MaxBits);
       }
-      if (text1 == text2) {
+      if (text1.toString() == text2.toString()) {
         // Perfect match, just shove the replacement text in.
-        text = text.substring(0, start_loc) +
-               this.diff_text2(patches[x].diffs) +
-               text.substring(start_loc + text1.length);
+        text = text.substring(0, start_loc).concat(
+               this.diff_text2_(patches[x].diffs),
+               text.substring(start_loc + text1.length));
       } else {
         // Imperfect match.  Run a diff to get a framework of equivalent
         // indices.
@@ -1857,12 +1973,11 @@ diff_match_patch.prototype.patch_apply = function(patches, text) {
               index2 = this.diff_xIndex(diffs, index1);
             }
             if (mod[0] === DIFF_INSERT) {  // Insertion
-              text = text.substring(0, start_loc + index2) + mod[1] +
-                     text.substring(start_loc + index2);
+              text = text.substring(0, start_loc + index2).concat(
+                     mod[1], text.substring(start_loc + index2));
             } else if (mod[0] === DIFF_DELETE) {  // Deletion
-              text = text.substring(0, start_loc + index2) +
-                     text.substring(start_loc + this.diff_xIndex(diffs,
-                         index1 + mod[1].length));
+              text = text.substring(0, start_loc + index2).concat(
+                     text.substring(start_loc + this.diff_xIndex(diffs, index1 + mod[1].length)));
             }
             if (mod[0] !== DIFF_DELETE) {
               index1 += mod[1].length;
@@ -1890,6 +2005,9 @@ diff_match_patch.prototype.patch_addPadding = function(patches) {
   for (var x = 1; x <= paddingLength; x++) {
     nullPadding += String.fromCharCode(x);
   }
+  if (patches[0].diffs[0][1].codePoints) {
+    nullPadding = diff_match_patch.utf32_string.from(nullPadding);
+  }
 
   // Bump all the patches forward.
   for (var x = 0; x < patches.length; x++) {
@@ -1910,7 +2028,7 @@ diff_match_patch.prototype.patch_addPadding = function(patches) {
   } else if (paddingLength > diffs[0][1].length) {
     // Grow first equality.
     var extraLength = paddingLength - diffs[0][1].length;
-    diffs[0][1] = nullPadding.substring(diffs[0][1].length) + diffs[0][1];
+    diffs[0][1] = nullPadding.substring(diffs[0][1].length).concat(diffs[0][1]);
     patch.start1 -= extraLength;
     patch.start2 -= extraLength;
     patch.length1 += extraLength;
@@ -1928,7 +2046,7 @@ diff_match_patch.prototype.patch_addPadding = function(patches) {
   } else if (paddingLength > diffs[diffs.length - 1][1].length) {
     // Grow last equality.
     var extraLength = paddingLength - diffs[diffs.length - 1][1].length;
-    diffs[diffs.length - 1][1] += nullPadding.substring(0, extraLength);
+    diffs[diffs.length - 1][1] = diffs[diffs.length - 1][1].concat(nullPadding.substring(0, extraLength));
     patch.length1 += extraLength;
     patch.length2 += extraLength;
   }
@@ -1961,7 +2079,7 @@ diff_match_patch.prototype.patch_splitMax = function(patches) {
       var empty = true;
       patch.start1 = start1 - precontext.length;
       patch.start2 = start2 - precontext.length;
-      if (precontext !== '') {
+      if (precontext.toString() !== '') {
         patch.length1 = patch.length2 = precontext.length;
         patch.diffs.push([DIFF_EQUAL, precontext]);
       }
@@ -1997,7 +2115,7 @@ diff_match_patch.prototype.patch_splitMax = function(patches) {
             empty = false;
           }
           patch.diffs.push([diff_type, diff_text]);
-          if (diff_text == bigpatch.diffs[0][1]) {
+          if (diff_text.toString() == bigpatch.diffs[0][1].toString()) {
             bigpatch.diffs.shift();
           } else {
             bigpatch.diffs[0][1] =
@@ -2006,18 +2124,18 @@ diff_match_patch.prototype.patch_splitMax = function(patches) {
         }
       }
       // Compute the head context for the next patch.
-      precontext = this.diff_text2(patch.diffs);
+      precontext = this.diff_text2_(patch.diffs);
       precontext =
           precontext.substring(precontext.length - this.Patch_Margin);
       // Append the end context for this patch.
-      var postcontext = this.diff_text1(bigpatch.diffs)
+      var postcontext = this.diff_text1_(bigpatch.diffs)
                             .substring(0, this.Patch_Margin);
-      if (postcontext !== '') {
+      if (postcontext.toString() !== '') {
         patch.length1 += postcontext.length;
         patch.length2 += postcontext.length;
         if (patch.diffs.length !== 0 &&
             patch.diffs[patch.diffs.length - 1][0] === DIFF_EQUAL) {
-          patch.diffs[patch.diffs.length - 1][1] += postcontext;
+          patch.diffs[patch.diffs.length - 1][1] = patch.diffs[patch.diffs.length - 1][1].concat(postcontext);
         } else {
           patch.diffs.push([DIFF_EQUAL, postcontext]);
         }
@@ -2121,6 +2239,25 @@ diff_match_patch.prototype.patch_fromText = function(textline) {
 };
 
 
+diff_match_patch.prototype.assertSafe_ = function(obj) {
+  // Debug check: no plain string that needs utf32_string conversion may
+  // appear in obj or, for array-likes, in any of its elements.
+  if (obj.codePoints || typeof obj === 'number') {
+    return;
+  }
+  if (typeof obj === 'string') {
+    console.assert(!diff_match_patch.utf32_string.hasSupplemental(obj), obj);
+  } else if (typeof obj === 'object') {
+    for (var i=0; i<obj.length; i++) {
+      this.assertSafe_(obj[i]);
+    }
+  } else {
+    // console.assert only reports when its first argument is falsy.
+    console.assert(false, 'Unknown object type', obj);
+  }
+};
+
+
 /**
  * Class representing one patch operation.
  * @constructor
@@ -2182,6 +2319,272 @@ diff_match_patch.patch_obj.prototype.toString = function() {
 };
 
 
+/** Whether to force the implementation to always use utf32_string. */
+diff_match_patch.force_utf32_string = false;
+
+
+/**
+ * A String-like class that treats each code point as a single character.
+ * None of its methods modify the instance; populated instances are created
+ * with diff_match_patch.utf32_string.from().
+ * @constructor
+ */
+diff_match_patch.utf32_string = function() {
+  /** @type {string} The text as a native UTF-16 string. */
+  this.string = "";
+  /** @type {!Array.<number>} The code points of the text, in order. */
+  this.codePoints = [];
+  /** @type {number} Number of code points (not UTF-16 code units). */
+  this.length = 0;
+};
+
+
+/**
+ * Reports whether a plain string should be converted to a utf32_string.
+ * @param {string|!diff_match_patch.utf32_string} text Text to inspect.
+ * @return {boolean} True if text is a plain string that contains a surrogate
+ *     code unit, or if force_utf32_string is set.  Always false for a
+ *     utf32_string and when the runtime lacks code point support.
+ */
+diff_match_patch.utf32_string.hasSupplemental = function(text) {
+  // Require String.prototype.codePointAt() and String.fromCodePoint(), which
+  // were both introduced in ES2015.
+  if (!String.prototype.codePointAt || !String.fromCodePoint) {
+    return false;
+  }
+  if (text.codePoints) {
+    // Argument is another utf32_string; do not re-convert
+    return false;
+  }
+  if (diff_match_patch.force_utf32_string) {
+    // Override: force utf32_string conversion
+    return true;
+  }
+  for (var i = 0; i < text.length; i++) {
+    var ch = text.charCodeAt(i);
+    if (ch >= 0xD800 && ch <= 0xDFFF) {
+      return true;
+    }
+  }
+  return false;
+};
+
+
+/**
+ * Builds a utf32_string from a plain string.
+ * @param {string|!diff_match_patch.utf32_string} text Text to convert.
+ * @return {!diff_match_patch.utf32_string} The converted text.  A value that
+ *     already is a utf32_string is returned unchanged.
+ */
+diff_match_patch.utf32_string.from = function(text) {
+  if (text.codePoints) {
+    // Already converted.  diff_main converts both texts when either one needs
+    // it, so a utf32_string can arrive here; it has no codePointAt().
+    return text;
+  }
+  var result = new diff_match_patch.utf32_string();
+  for (var i = 0; i < text.length; i++) {
+    var cp = text.codePointAt(i);
+    result.codePoints.push(cp);
+    if (cp > 0xFFFF) {
+      // Supplemental code point: skip over its low surrogate.
+      i++;
+    }
+  }
+  result.string = text;
+  result.length = result.codePoints.length;
+  return result;
+};
+
+
+/**
+ * Converts a code point index into the matching offset within this.string.
+ * @param {number} index Code point index; clamped to [0, this.length].
+ * @return {number} Offset in UTF-16 code units.
+ * @private
+ */
+diff_match_patch.utf32_string.prototype.unitOffset_ = function(index) {
+  var limit = Math.min(Math.max(Math.trunc(index) || 0, 0), this.length);
+  if (this.string.length === this.length) {
+    // No supplemental code points, so both index spaces coincide.
+    return limit;
+  }
+  var offset = 0;
+  for (var i = 0; i < limit; i++) {
+    offset += this.codePoints[i] <= 0xFFFF ? 1 : 2;
+  }
+  return offset;
+};
+
+
+/**
+ * Converts an offset within this.string into a code point index.
+ * @param {number} offset Offset in UTF-16 code units.
+ * @return {number} Number of code points that begin before that offset.
+ * @private
+ */
+diff_match_patch.utf32_string.prototype.codePointIndex_ = function(offset) {
+  if (this.string.length === this.length) {
+    // No supplemental code points, so both index spaces coincide.
+    return offset;
+  }
+  var index = 0;
+  var units = 0;
+  while (index < this.length && units < offset) {
+    units += this.codePoints[index] <= 0xFFFF ? 1 : 2;
+    index++;
+  }
+  return index;
+};
+
+
+/**
+ * Returns the character at a code point index.
+ * @param {number} i Code point index.
+ * @return {string} Native string for that code point, or "" if out of range.
+ */
+diff_match_patch.utf32_string.prototype.charAt = function(i) {
+  if (i < 0 || i >= this.length) {
+    return "";
+  }
+  return String.fromCodePoint(this.codePoints[i]);
+};
+
+
+/**
+ * Returns the code point at an index.
+ * @param {number} i Code point index.
+ * @return {number} The code point, or 0 if out of range (note that
+ *     String.prototype.charCodeAt returns NaN in that case).
+ */
+diff_match_patch.utf32_string.prototype.charCodeAt = function(i) {
+  if (i < 0 || i >= this.length) {
+    return 0;
+  }
+  return this.codePoints[i];
+};
+
+
+/**
+ * Returns the code points between two indices, like String.substring.
+ * @param {number} start Code point index of the first character.
+ * @param {number=} end Code point index just past the last character;
+ *     defaults to this.length.
+ * @return {!diff_match_patch.utf32_string} New string; this is not modified.
+ */
+diff_match_patch.utf32_string.prototype.substring = function(start, end) {
+  // Implemented according to String.substring specification:
+  // https://www.ecma-international.org/ecma-262/5.1/#sec-15.5.4.15
+  var len = this.length;
+  // ToInteger as in the spec: NaN becomes 0 and fractions are truncated, so
+  // that string and codePoints are always cut at the same place.
+  var intStart = Math.trunc(start) || 0;
+  var intEnd = (typeof end === 'undefined') ? len : (Math.trunc(end) || 0);
+  var finalStart = Math.min(Math.max(intStart, 0), len);
+  var finalEnd = Math.min(Math.max(intEnd, 0), len);
+  var from = Math.min(finalStart, finalEnd);
+  var to = Math.max(finalStart, finalEnd);
+
+  // Compute the indices for the actual substring; we must maintain the string
+  // because toString() operations are expected to be fast.
+  var result = new diff_match_patch.utf32_string();
+  result.string = this.string.substring(
+      this.unitOffset_(from), this.unitOffset_(to));
+  result.codePoints = this.codePoints.slice(from, to);
+  result.length = result.codePoints.length;
+  return result;
+};
+
+
+/**
+ * Finds the first occurrence of other at or after a code point index.
+ * @param {string|!diff_match_patch.utf32_string} other Text to search for.
+ * @param {number=} start Code point index to start from; defaults to 0.
+ * @return {number} Code point index of the match, or -1 if there is none.
+ */
+diff_match_patch.utf32_string.prototype.indexOf = function(other, start) {
+  // The native search works in UTF-16 code units, so translate the start
+  // index on the way in and the result on the way out.
+  var unitStart = this.unitOffset_(start);
+  var unitIndex = this.string.indexOf(other.toString(), unitStart);
+  return unitIndex < 0 ? -1 : this.codePointIndex_(unitIndex);
+};
+
+
+/**
+ * Finds the last occurrence of other at or before a code point index.
+ * @param {string|!diff_match_patch.utf32_string} other Text to search for.
+ * @param {number=} start Code point index to search backwards from; defaults
+ *     to the end of the string.
+ * @return {number} Code point index of the match, or -1 if there is none.
+ */
+diff_match_patch.utf32_string.prototype.lastIndexOf = function(other, start) {
+  // As in String.lastIndexOf, a missing or NaN start means "from the end".
+  var unitStart = isNaN(start) ? Infinity : this.unitOffset_(start);
+  var unitIndex = this.string.lastIndexOf(other.toString(), unitStart);
+  return unitIndex < 0 ? -1 : this.codePointIndex_(unitIndex);
+};
+
+
+/**
+ * Appends one or more texts, like String.concat.
+ * Arguments may be plain strings or utf32_strings and are appended in order;
+ * with no arguments the result is a copy of this string.
+ * @return {!diff_match_patch.utf32_string} New string; this is not modified.
+ */
+diff_match_patch.utf32_string.prototype.concat = function() {
+  var result = new diff_match_patch.utf32_string();
+  result.string = this.string;
+  result.codePoints = this.codePoints.slice();
+  for (var i = 0; i < arguments.length; i++) {
+    // from() passes a utf32_string through and converts anything else.
+    var other = diff_match_patch.utf32_string.from(arguments[i]);
+    result.string += other.string;
+    result.codePoints = result.codePoints.concat(other.codePoints);
+  }
+  result.length = result.codePoints.length;
+  return result;
+};
+
+
+/**
+ * Runs String.match on the underlying native string.
+ * @return {Array.<string>} The native match result; any strings and indices
+ *     in it refer to the native string, not to code points.
+ */
+diff_match_patch.utf32_string.prototype.match = function() {
+  return this.string.match.apply(this.string, arguments);
+};
+
+
+/**
+ * Runs String.replace on the underlying native string.
+ * @return {!diff_match_patch.utf32_string} The replaced text, converted back.
+ */
+diff_match_patch.utf32_string.prototype.replace = function() {
+  var replaced = this.string.replace.apply(this.string, arguments);
+  return diff_match_patch.utf32_string.from(replaced);
+};
+
+
+/**
+ * Rejects implicit conversion to a primitive, e.g. by the + operator;
+ * callers must call toString() explicitly.
+ * @throws {Error} Always.
+ */
+diff_match_patch.utf32_string.prototype.valueOf = function() {
+  throw new Error("warning: implicit conversion attempted on utf32_string; use toString instead");
+};
+
+
+/**
+ * @return {string} The text as a native string.
+ */
+diff_match_patch.utf32_string.prototype.toString = function() {
+  return this.string;
+};
+
+
 // Export these global variables so that they survive Google's JS compiler.
 // In a browser, 'this' will be 'window'.
 // Users of node.js should 'require' the uncompressed version since Google's
diff --git a/javascript/tests/diff_match_patch_test.html b/javascript/tests/diff_match_patch_test.html
index 7a7003ca..35af1a51 100644
--- a/javascript/tests/diff_match_patch_test.html
+++ b/javascript/tests/diff_match_patch_test.html
@@ -45,7 +45,7 @@
           // msg is optional.
           actual = expected;
           expected = msg;
-          msg = 'Expected: \'' + expected + '\' Actual: \'' + actual + '\'';
+          msg = 'Expected: \'' + (expected && expected.toString()) + '\' Actual: \'' + (actual && actual.toString()) + '\'';
         }
         if (expected === actual) {
           document.write('<FONT COLOR="#009900">Ok</FONT><BR>');
@@ -78,9 +78,15 @@
         }
       }
 
-      function runTests() {
+      function runTests(force_utf32_string) {
+        diff_match_patch.force_utf32_string = force_utf32_string;
+        if (force_utf32_string) {
+          document.write('<H2>Forced UTF-32 Strings</H2>');
+        } else {
+          document.write('<H2>Normal Strings</H2>');
+        }
         for (var x = 0; x < tests.length; x++) {
-          document.write('<H3>' + tests[x] + ':</H3>');
+          document.write('<H3>' + tests[x] + ' (' + (force_utf32_string ? 'utf32_string' : 'standard string') + '):</H3>');
           eval(tests[x] + '()');
         }
       }
@@ -115,7 +121,10 @@
           'testPatchMake',
           'testPatchSplitMax',
           'testPatchAddPadding',
-          'testPatchApply'];
+          'testPatchApply',
+
+         'testUnicode',
+          ];
 
     </script>
   </head>
@@ -136,11 +145,17 @@
 
     <script type="text/javascript">
       var startTime = (new Date()).getTime();
-      runTests();
+      runTests(false);
       var endTime = (new Date()).getTime();
-      document.write('<H3>Done.</H3>');
+      document.write('<H3>Done with standard string test.</H3>');
       document.write('<P>Tests passed: ' + test_good + '<BR>Tests failed: ' + test_bad + '</P>');
       document.write('<P>Total time: ' + (endTime - startTime) + ' ms</P>');
-    </script>
+
+      var startTime = (new Date()).getTime();
+      runTests(true);
+      var endTime = (new Date()).getTime();
+      document.write('<H3>Done with utf32_string test.</H3>');
+      document.write('<P>Tests passed: ' + test_good + '<BR>Tests failed: ' + test_bad + '</P>');
+      document.write('<P>Total time: ' + (endTime - startTime) + ' ms</P>');    </script>
   </body>
 </html>
diff --git a/javascript/tests/diff_match_patch_test.js b/javascript/tests/diff_match_patch_test.js
index 96521970..d8b2ee3f 100644
--- a/javascript/tests/diff_match_patch_test.js
+++ b/javascript/tests/diff_match_patch_test.js
@@ -23,7 +23,7 @@ function assertEquivalent(msg, expected, actual) {
     // msg is optional.
     actual = expected;
     expected = msg;
-    msg = 'Expected: \'' + expected + '\' Actual: \'' + actual + '\'';
+    msg = 'Expected: \'' + expected.toString() + '\' Actual: \'' + actual.toString() + '\'';
   }
   if (_equivalent(expected, actual)) {
     assertEquals(msg, String.toString(expected), String.toString(actual));
@@ -35,9 +35,15 @@ function assertEquivalent(msg, expected, actual) {
 
 // Are a and b the equivalent? -- Recursive.
 function _equivalent(a, b) {
-  if (a == b) {
+  if (a === b) {
     return true;
   }
+  // utf32_string comparison
+  if (a.codePoints || b.codePoints) {
+    if (a.toString() === b.toString()) {
+      return true;
+    }
+  }
   if (typeof a == 'object' && typeof b == 'object' && a !== null && b !== null) {
     if (a.toString() != b.toString()) {
       return false;
@@ -58,16 +64,34 @@ function _equivalent(a, b) {
 }
 
 
+function u32(text) {
+  // Wrap the text in a utf32_string only when hasSupplemental() asks for it;
+  // otherwise hand the value back untouched.
+  var utf32 = diff_match_patch.utf32_string;
+  var needsWrap = utf32.hasSupplemental(text);
+  return needsWrap ? utf32.from(text) : text;
+}
+
+
+function d32(diffs) {
+  // Copy each [operation, text] tuple, passing its text through u32().
+  return diffs.map(function(tuple) {
+    var op = tuple[0];
+    return [op, u32(tuple[1])];
+  });
+}
+
+
 function diff_rebuildtexts(diffs) {
   // Construct the two texts which made up the diff originally.
   var text1 = '';
   var text2 = '';
   for (var x = 0; x < diffs.length; x++) {
     if (diffs[x][0] != DIFF_INSERT) {
-      text1 += diffs[x][1];
+      text1 += diffs[x][1].toString();
     }
     if (diffs[x][0] != DIFF_DELETE) {
-      text2 += diffs[x][1];
+      text2 += diffs[x][1].toString();
     }
   }
   return [text1, text2];
@@ -106,54 +130,54 @@ function testDiffCommonSuffix() {
 function testDiffCommonOverlap() {
   // Detect any suffix/prefix overlap.
   // Null case.
-  assertEquals(0, dmp.diff_commonOverlap_('', 'abcd'));
+  assertEquals(0, dmp.diff_commonOverlap_(u32(''), u32('abcd')));
 
   // Whole case.
-  assertEquals(3, dmp.diff_commonOverlap_('abc', 'abcd'));
+  assertEquals(3, dmp.diff_commonOverlap_(u32('abc'), u32('abcd')));
 
   // No overlap.
-  assertEquals(0, dmp.diff_commonOverlap_('123456', 'abcd'));
+  assertEquals(0, dmp.diff_commonOverlap_(u32('123456'), u32('abcd')));
 
   // Overlap.
-  assertEquals(3, dmp.diff_commonOverlap_('123456xxx', 'xxxabcd'));
+  assertEquals(3, dmp.diff_commonOverlap_(u32('123456xxx'), u32('xxxabcd')));
 
   // Unicode.
   // Some overly clever languages (C#) may treat ligatures as equal to their
   // component letters.  E.g. U+FB01 == 'fi'
-  assertEquals(0, dmp.diff_commonOverlap_('fi', '\ufb01i'));
+  assertEquals(0, dmp.diff_commonOverlap_(u32('fi'), u32('\ufb01i')));
 }
 
 function testDiffHalfMatch() {
   // Detect a halfmatch.
   dmp.Diff_Timeout = 1;
   // No match.
-  assertEquals(null, dmp.diff_halfMatch_('1234567890', 'abcdef'));
+  assertEquals(null, dmp.diff_halfMatch_(u32('1234567890'), u32('abcdef')));
 
-  assertEquals(null, dmp.diff_halfMatch_('12345', '23'));
+  assertEquals(null, dmp.diff_halfMatch_(u32('12345'), u32('23')));
 
   // Single Match.
-  assertEquivalent(['12', '90', 'a', 'z', '345678'], dmp.diff_halfMatch_('1234567890', 'a345678z'));
+  assertEquivalent(['12', '90', 'a', 'z', '345678'], dmp.diff_halfMatch_(u32('1234567890'), u32('a345678z')));
 
-  assertEquivalent(['a', 'z', '12', '90', '345678'], dmp.diff_halfMatch_('a345678z', '1234567890'));
+  assertEquivalent(['a', 'z', '12', '90', '345678'], dmp.diff_halfMatch_(u32('a345678z'), u32('1234567890')));
 
-  assertEquivalent(['abc', 'z', '1234', '0', '56789'], dmp.diff_halfMatch_('abc56789z', '1234567890'));
+  assertEquivalent(['abc', 'z', '1234', '0', '56789'], dmp.diff_halfMatch_(u32('abc56789z'), u32('1234567890')));
 
-  assertEquivalent(['a', 'xyz', '1', '7890', '23456'], dmp.diff_halfMatch_('a23456xyz', '1234567890'));
+  assertEquivalent(['a', 'xyz', '1', '7890', '23456'], dmp.diff_halfMatch_(u32('a23456xyz'), u32('1234567890')));
 
   // Multiple Matches.
-  assertEquivalent(['12123', '123121', 'a', 'z', '1234123451234'], dmp.diff_halfMatch_('121231234123451234123121', 'a1234123451234z'));
+  assertEquivalent(['12123', '123121', 'a', 'z', '1234123451234'], dmp.diff_halfMatch_(u32('121231234123451234123121'), u32('a1234123451234z')));
 
-  assertEquivalent(['', '-=-=-=-=-=', 'x', '', 'x-=-=-=-=-=-=-='], dmp.diff_halfMatch_('x-=-=-=-=-=-=-=-=-=-=-=-=', 'xx-=-=-=-=-=-=-='));
+  assertEquivalent(['', '-=-=-=-=-=', 'x', '', 'x-=-=-=-=-=-=-='], dmp.diff_halfMatch_(u32('x-=-=-=-=-=-=-=-=-=-=-=-='), u32('xx-=-=-=-=-=-=-=')));
 
-  assertEquivalent(['-=-=-=-=-=', '', '', 'y', '-=-=-=-=-=-=-=y'], dmp.diff_halfMatch_('-=-=-=-=-=-=-=-=-=-=-=-=y', '-=-=-=-=-=-=-=yy'));
+  assertEquivalent(['-=-=-=-=-=', '', '', 'y', '-=-=-=-=-=-=-=y'], dmp.diff_halfMatch_(u32('-=-=-=-=-=-=-=-=-=-=-=-=y'), u32('-=-=-=-=-=-=-=yy')));
 
   // Non-optimal halfmatch.
   // Optimal diff would be -q+x=H-i+e=lloHe+Hu=llo-Hew+y not -qHillo+x=HelloHe-w+Hulloy
-  assertEquivalent(['qHillo', 'w', 'x', 'Hulloy', 'HelloHe'], dmp.diff_halfMatch_('qHilloHelloHew', 'xHelloHeHulloy'));
+  assertEquivalent(['qHillo', 'w', 'x', 'Hulloy', 'HelloHe'], dmp.diff_halfMatch_(u32('qHilloHelloHew'), u32('xHelloHeHulloy')));
 
   // Optimal no halfmatch.
   dmp.Diff_Timeout = 0;
-  assertEquals(null, dmp.diff_halfMatch_('qHilloHelloHew', 'xHelloHeHulloy'));
+  assertEquals(null, dmp.diff_halfMatch_(u32('qHilloHelloHew'), u32('xHelloHeHulloy')));
 }
 
 function testDiffLinesToChars() {
@@ -164,32 +188,32 @@ function testDiffLinesToChars() {
   }
 
   // Convert lines down to characters.
-  assertLinesToCharsResultEquals({chars1: '\x01\x02\x01', chars2: '\x02\x01\x02', lineArray: ['', 'alpha\n', 'beta\n']}, dmp.diff_linesToChars_('alpha\nbeta\nalpha\n', 'beta\nalpha\nbeta\n'));
+  assertLinesToCharsResultEquals({chars1: '\x01\x02\x01', chars2: '\x02\x01\x02', lineArray: ['', 'alpha\n', 'beta\n']}, dmp.diff_linesToChars_(u32('alpha\nbeta\nalpha\n'), u32('beta\nalpha\nbeta\n')));
 
-  assertLinesToCharsResultEquals({chars1: '', chars2: '\x01\x02\x03\x03', lineArray: ['', 'alpha\r\n', 'beta\r\n', '\r\n']}, dmp.diff_linesToChars_('', 'alpha\r\nbeta\r\n\r\n\r\n'));
+  assertLinesToCharsResultEquals({chars1: '', chars2: '\x01\x02\x03\x03', lineArray: ['', 'alpha\r\n', 'beta\r\n', '\r\n']}, dmp.diff_linesToChars_(u32(''), u32('alpha\r\nbeta\r\n\r\n\r\n')));
 
-  assertLinesToCharsResultEquals({chars1: '\x01', chars2: '\x02', lineArray: ['', 'a', 'b']}, dmp.diff_linesToChars_('a', 'b'));
+  assertLinesToCharsResultEquals({chars1: '\x01', chars2: '\x02', lineArray: ['', 'a', 'b']}, dmp.diff_linesToChars_(u32('a'), u32('b')));
 
   // More than 256 to reveal any 8-bit limitations.
   var n = 300;
   var lineList = [];
   var charList = [];
   for (var x = 1; x < n + 1; x++) {
-    lineList[x - 1] = x + '\n';
+    lineList[x - 1] = u32(x + '\n');
     charList[x - 1] = String.fromCharCode(x);
   }
   assertEquals(n, lineList.length);
   var lines = lineList.join('');
   var chars = charList.join('');
   assertEquals(n, chars.length);
-  lineList.unshift('');
-  assertLinesToCharsResultEquals({chars1: chars, chars2: '', lineArray: lineList}, dmp.diff_linesToChars_(lines, ''));
+  lineList.unshift(u32(''));
+  assertLinesToCharsResultEquals({chars1: chars, chars2: '', lineArray: lineList}, dmp.diff_linesToChars_(u32(lines), u32('')));
 }
 
 function testDiffCharsToLines() {
   // Convert chars up to lines.
   var diffs = [[DIFF_EQUAL, '\x01\x02\x01'], [DIFF_INSERT, '\x02\x01\x02']];
-  dmp.diff_charsToLines_(diffs, ['', 'alpha\n', 'beta\n']);
+  dmp.diff_charsToLines_(diffs, [u32(''), u32('alpha\n'), u32('beta\n')]);
   assertEquivalent([[DIFF_EQUAL, 'alpha\nbeta\nalpha\n'], [DIFF_INSERT, 'beta\nalpha\nbeta\n']], diffs);
 
   // More than 256 to reveal any 8-bit limitations.
@@ -197,14 +221,14 @@ function testDiffCharsToLines() {
   var lineList = [];
   var charList = [];
   for (var x = 1; x < n + 1; x++) {
-    lineList[x - 1] = x + '\n';
+    lineList[x - 1] = u32(x + '\n');
     charList[x - 1] = String.fromCharCode(x);
   }
   assertEquals(n, lineList.length);
   var lines = lineList.join('');
   var chars = charList.join('');
   assertEquals(n, chars.length);
-  lineList.unshift('');
+  lineList.unshift(u32(''));
   var diffs = [[DIFF_DELETE, chars]];
   dmp.diff_charsToLines_(diffs, lineList);
   assertEquivalent([[DIFF_DELETE, lines]], diffs);
@@ -213,62 +237,62 @@ function testDiffCharsToLines() {
 function testDiffCleanupMerge() {
   // Cleanup a messy diff.
   // Null case.
-  var diffs = [];
+  var diffs = d32([]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([], diffs);
 
   // No change case.
-  diffs = [[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'b'], [DIFF_INSERT, 'c']];
+  diffs = d32([[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'b'], [DIFF_INSERT, 'c']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'b'], [DIFF_INSERT, 'c']], diffs);
 
   // Merge equalities.
-  diffs = [[DIFF_EQUAL, 'a'], [DIFF_EQUAL, 'b'], [DIFF_EQUAL, 'c']];
+  diffs = d32([[DIFF_EQUAL, 'a'], [DIFF_EQUAL, 'b'], [DIFF_EQUAL, 'c']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_EQUAL, 'abc']], diffs);
 
   // Merge deletions.
-  diffs = [[DIFF_DELETE, 'a'], [DIFF_DELETE, 'b'], [DIFF_DELETE, 'c']];
+  diffs = d32([[DIFF_DELETE, 'a'], [DIFF_DELETE, 'b'], [DIFF_DELETE, 'c']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_DELETE, 'abc']], diffs);
 
   // Merge insertions.
-  diffs = [[DIFF_INSERT, 'a'], [DIFF_INSERT, 'b'], [DIFF_INSERT, 'c']];
+  diffs = d32([[DIFF_INSERT, 'a'], [DIFF_INSERT, 'b'], [DIFF_INSERT, 'c']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_INSERT, 'abc']], diffs);
 
   // Merge interweave.
-  diffs = [[DIFF_DELETE, 'a'], [DIFF_INSERT, 'b'], [DIFF_DELETE, 'c'], [DIFF_INSERT, 'd'], [DIFF_EQUAL, 'e'], [DIFF_EQUAL, 'f']];
+  diffs = d32([[DIFF_DELETE, 'a'], [DIFF_INSERT, 'b'], [DIFF_DELETE, 'c'], [DIFF_INSERT, 'd'], [DIFF_EQUAL, 'e'], [DIFF_EQUAL, 'f']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_DELETE, 'ac'], [DIFF_INSERT, 'bd'], [DIFF_EQUAL, 'ef']], diffs);
 
   // Prefix and suffix detection.
-  diffs = [[DIFF_DELETE, 'a'], [DIFF_INSERT, 'abc'], [DIFF_DELETE, 'dc']];
+  diffs = d32([[DIFF_DELETE, 'a'], [DIFF_INSERT, 'abc'], [DIFF_DELETE, 'dc']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'd'], [DIFF_INSERT, 'b'], [DIFF_EQUAL, 'c']], diffs);
 
   // Prefix and suffix detection with equalities.
-  diffs = [[DIFF_EQUAL, 'x'], [DIFF_DELETE, 'a'], [DIFF_INSERT, 'abc'], [DIFF_DELETE, 'dc'], [DIFF_EQUAL, 'y']];
+  diffs = d32([[DIFF_EQUAL, 'x'], [DIFF_DELETE, 'a'], [DIFF_INSERT, 'abc'], [DIFF_DELETE, 'dc'], [DIFF_EQUAL, 'y']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_EQUAL, 'xa'], [DIFF_DELETE, 'd'], [DIFF_INSERT, 'b'], [DIFF_EQUAL, 'cy']], diffs);
 
   // Slide edit left.
-  diffs = [[DIFF_EQUAL, 'a'], [DIFF_INSERT, 'ba'], [DIFF_EQUAL, 'c']];
+  diffs = d32([[DIFF_EQUAL, 'a'], [DIFF_INSERT, 'ba'], [DIFF_EQUAL, 'c']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_INSERT, 'ab'], [DIFF_EQUAL, 'ac']], diffs);
 
   // Slide edit right.
-  diffs = [[DIFF_EQUAL, 'c'], [DIFF_INSERT, 'ab'], [DIFF_EQUAL, 'a']];
+  diffs = d32([[DIFF_EQUAL, 'c'], [DIFF_INSERT, 'ab'], [DIFF_EQUAL, 'a']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_EQUAL, 'ca'], [DIFF_INSERT, 'ba']], diffs);
 
   // Slide edit left recursive.
-  diffs = [[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'b'], [DIFF_EQUAL, 'c'], [DIFF_DELETE, 'ac'], [DIFF_EQUAL, 'x']];
+  diffs = d32([[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'b'], [DIFF_EQUAL, 'c'], [DIFF_DELETE, 'ac'], [DIFF_EQUAL, 'x']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_DELETE, 'abc'], [DIFF_EQUAL, 'acx']], diffs);
 
   // Slide edit right recursive.
-  diffs = [[DIFF_EQUAL, 'x'], [DIFF_DELETE, 'ca'], [DIFF_EQUAL, 'c'], [DIFF_DELETE, 'b'], [DIFF_EQUAL, 'a']];
+  diffs = d32([[DIFF_EQUAL, 'x'], [DIFF_DELETE, 'ca'], [DIFF_EQUAL, 'c'], [DIFF_DELETE, 'b'], [DIFF_EQUAL, 'a']]);
   dmp.diff_cleanupMerge(diffs);
   assertEquivalent([[DIFF_EQUAL, 'xca'], [DIFF_DELETE, 'cba']], diffs);
 }
@@ -276,42 +300,42 @@ function testDiffCleanupMerge() {
 function testDiffCleanupSemanticLossless() {
   // Slide diffs to match logical boundaries.
   // Null case.
-  var diffs = [];
+  var diffs = d32([]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([], diffs);
 
   // Blank lines.
-  diffs = [[DIFF_EQUAL, 'AAA\r\n\r\nBBB'], [DIFF_INSERT, '\r\nDDD\r\n\r\nBBB'], [DIFF_EQUAL, '\r\nEEE']];
+  diffs = d32([[DIFF_EQUAL, 'AAA\r\n\r\nBBB'], [DIFF_INSERT, '\r\nDDD\r\n\r\nBBB'], [DIFF_EQUAL, '\r\nEEE']]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([[DIFF_EQUAL, 'AAA\r\n\r\n'], [DIFF_INSERT, 'BBB\r\nDDD\r\n\r\n'], [DIFF_EQUAL, 'BBB\r\nEEE']], diffs);
 
   // Line boundaries.
-  diffs = [[DIFF_EQUAL, 'AAA\r\nBBB'], [DIFF_INSERT, ' DDD\r\nBBB'], [DIFF_EQUAL, ' EEE']];
+  diffs = d32([[DIFF_EQUAL, 'AAA\r\nBBB'], [DIFF_INSERT, ' DDD\r\nBBB'], [DIFF_EQUAL, ' EEE']]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([[DIFF_EQUAL, 'AAA\r\n'], [DIFF_INSERT, 'BBB DDD\r\n'], [DIFF_EQUAL, 'BBB EEE']], diffs);
 
   // Word boundaries.
-  diffs = [[DIFF_EQUAL, 'The c'], [DIFF_INSERT, 'ow and the c'], [DIFF_EQUAL, 'at.']];
+  diffs = d32([[DIFF_EQUAL, 'The c'], [DIFF_INSERT, 'ow and the c'], [DIFF_EQUAL, 'at.']]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([[DIFF_EQUAL, 'The '], [DIFF_INSERT, 'cow and the '], [DIFF_EQUAL, 'cat.']], diffs);
 
   // Alphanumeric boundaries.
-  diffs = [[DIFF_EQUAL, 'The-c'], [DIFF_INSERT, 'ow-and-the-c'], [DIFF_EQUAL, 'at.']];
+  diffs = d32([[DIFF_EQUAL, 'The-c'], [DIFF_INSERT, 'ow-and-the-c'], [DIFF_EQUAL, 'at.']]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([[DIFF_EQUAL, 'The-'], [DIFF_INSERT, 'cow-and-the-'], [DIFF_EQUAL, 'cat.']], diffs);
 
   // Hitting the start.
-  diffs = [[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'a'], [DIFF_EQUAL, 'ax']];
+  diffs = d32([[DIFF_EQUAL, 'a'], [DIFF_DELETE, 'a'], [DIFF_EQUAL, 'ax']]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([[DIFF_DELETE, 'a'], [DIFF_EQUAL, 'aax']], diffs);
 
   // Hitting the end.
-  diffs = [[DIFF_EQUAL, 'xa'], [DIFF_DELETE, 'a'], [DIFF_EQUAL, 'a']];
+  diffs = d32([[DIFF_EQUAL, 'xa'], [DIFF_DELETE, 'a'], [DIFF_EQUAL, 'a']]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([[DIFF_EQUAL, 'xaa'], [DIFF_DELETE, 'a']], diffs);
 
   // Sentence boundaries.
-  diffs = [[DIFF_EQUAL, 'The xxx. The '], [DIFF_INSERT, 'zzz. The '], [DIFF_EQUAL, 'yyy.']];
+  diffs = d32([[DIFF_EQUAL, 'The xxx. The '], [DIFF_INSERT, 'zzz. The '], [DIFF_EQUAL, 'yyy.']]);
   dmp.diff_cleanupSemanticLossless(diffs);
   assertEquivalent([[DIFF_EQUAL, 'The xxx.'], [DIFF_INSERT, ' The zzz.'], [DIFF_EQUAL, ' The yyy.']], diffs);
 }
@@ -319,57 +343,57 @@ function testDiffCleanupSemanticLossless() {
 function testDiffCleanupSemantic() {
   // Cleanup semantically trivial equalities.
   // Null case.
-  var diffs = [];
+  var diffs = d32([]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([], diffs);
 
   // No elimination #1.
-  diffs = [[DIFF_DELETE, 'ab'], [DIFF_INSERT, 'cd'], [DIFF_EQUAL, '12'], [DIFF_DELETE, 'e']];
+  diffs = d32([[DIFF_DELETE, 'ab'], [DIFF_INSERT, 'cd'], [DIFF_EQUAL, '12'], [DIFF_DELETE, 'e']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'ab'], [DIFF_INSERT, 'cd'], [DIFF_EQUAL, '12'], [DIFF_DELETE, 'e']], diffs);
 
   // No elimination #2.
-  diffs = [[DIFF_DELETE, 'abc'], [DIFF_INSERT, 'ABC'], [DIFF_EQUAL, '1234'], [DIFF_DELETE, 'wxyz']];
+  diffs = d32([[DIFF_DELETE, 'abc'], [DIFF_INSERT, 'ABC'], [DIFF_EQUAL, '1234'], [DIFF_DELETE, 'wxyz']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'abc'], [DIFF_INSERT, 'ABC'], [DIFF_EQUAL, '1234'], [DIFF_DELETE, 'wxyz']], diffs);
 
   // Simple elimination.
-  diffs = [[DIFF_DELETE, 'a'], [DIFF_EQUAL, 'b'], [DIFF_DELETE, 'c']];
+  diffs = d32([[DIFF_DELETE, 'a'], [DIFF_EQUAL, 'b'], [DIFF_DELETE, 'c']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'abc'], [DIFF_INSERT, 'b']], diffs);
 
   // Backpass elimination.
-  diffs = [[DIFF_DELETE, 'ab'], [DIFF_EQUAL, 'cd'], [DIFF_DELETE, 'e'], [DIFF_EQUAL, 'f'], [DIFF_INSERT, 'g']];
+  diffs = d32([[DIFF_DELETE, 'ab'], [DIFF_EQUAL, 'cd'], [DIFF_DELETE, 'e'], [DIFF_EQUAL, 'f'], [DIFF_INSERT, 'g']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'abcdef'], [DIFF_INSERT, 'cdfg']], diffs);
 
   // Multiple eliminations.
-  diffs = [[DIFF_INSERT, '1'], [DIFF_EQUAL, 'A'], [DIFF_DELETE, 'B'], [DIFF_INSERT, '2'], [DIFF_EQUAL, '_'], [DIFF_INSERT, '1'], [DIFF_EQUAL, 'A'], [DIFF_DELETE, 'B'], [DIFF_INSERT, '2']];
+  diffs = d32([[DIFF_INSERT, '1'], [DIFF_EQUAL, 'A'], [DIFF_DELETE, 'B'], [DIFF_INSERT, '2'], [DIFF_EQUAL, '_'], [DIFF_INSERT, '1'], [DIFF_EQUAL, 'A'], [DIFF_DELETE, 'B'], [DIFF_INSERT, '2']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'AB_AB'], [DIFF_INSERT, '1A2_1A2']], diffs);
 
   // Word boundaries.
-  diffs = [[DIFF_EQUAL, 'The c'], [DIFF_DELETE, 'ow and the c'], [DIFF_EQUAL, 'at.']];
+  diffs = d32([[DIFF_EQUAL, 'The c'], [DIFF_DELETE, 'ow and the c'], [DIFF_EQUAL, 'at.']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_EQUAL, 'The '], [DIFF_DELETE, 'cow and the '], [DIFF_EQUAL, 'cat.']], diffs);
 
   // No overlap elimination.
-  diffs = [[DIFF_DELETE, 'abcxx'], [DIFF_INSERT, 'xxdef']];
+  diffs = d32([[DIFF_DELETE, 'abcxx'], [DIFF_INSERT, 'xxdef']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'abcxx'], [DIFF_INSERT, 'xxdef']], diffs);
 
   // Overlap elimination.
-  diffs = [[DIFF_DELETE, 'abcxxx'], [DIFF_INSERT, 'xxxdef']];
+  diffs = d32([[DIFF_DELETE, 'abcxxx'], [DIFF_INSERT, 'xxxdef']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'abc'], [DIFF_EQUAL, 'xxx'], [DIFF_INSERT, 'def']], diffs);
 
   // Reverse overlap elimination.
-  diffs = [[DIFF_DELETE, 'xxxabc'], [DIFF_INSERT, 'defxxx']];
+  diffs = d32([[DIFF_DELETE, 'xxxabc'], [DIFF_INSERT, 'defxxx']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_INSERT, 'def'], [DIFF_EQUAL, 'xxx'], [DIFF_DELETE, 'abc']], diffs);
 
   // Two overlap eliminations.
-  diffs = [[DIFF_DELETE, 'abcd1212'], [DIFF_INSERT, '1212efghi'], [DIFF_EQUAL, '----'], [DIFF_DELETE, 'A3'], [DIFF_INSERT, '3BC']];
+  diffs = d32([[DIFF_DELETE, 'abcd1212'], [DIFF_INSERT, '1212efghi'], [DIFF_EQUAL, '----'], [DIFF_DELETE, 'A3'], [DIFF_INSERT, '3BC']]);
   dmp.diff_cleanupSemantic(diffs);
   assertEquivalent([[DIFF_DELETE, 'abcd'], [DIFF_EQUAL, '1212'], [DIFF_INSERT, 'efghi'], [DIFF_EQUAL, '----'], [DIFF_DELETE, 'A'], [DIFF_EQUAL, '3'], [DIFF_INSERT, 'BC']], diffs);
 }
@@ -378,33 +402,33 @@ function testDiffCleanupEfficiency() {
   // Cleanup operationally trivial equalities.
   dmp.Diff_EditCost = 4;
   // Null case.
-  var diffs = [];
+  var diffs = d32([]);
   dmp.diff_cleanupEfficiency(diffs);
   assertEquivalent([], diffs);
 
   // No elimination.
-  diffs = [[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'wxyz'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']];
+  diffs = d32([[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'wxyz'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']]);
   dmp.diff_cleanupEfficiency(diffs);
   assertEquivalent([[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'wxyz'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']], diffs);
 
   // Four-edit elimination.
-  diffs = [[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'xyz'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']];
+  diffs = d32([[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'xyz'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']]);
   dmp.diff_cleanupEfficiency(diffs);
   assertEquivalent([[DIFF_DELETE, 'abxyzcd'], [DIFF_INSERT, '12xyz34']], diffs);
 
   // Three-edit elimination.
-  diffs = [[DIFF_INSERT, '12'], [DIFF_EQUAL, 'x'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']];
+  diffs = d32([[DIFF_INSERT, '12'], [DIFF_EQUAL, 'x'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']]);
   dmp.diff_cleanupEfficiency(diffs);
   assertEquivalent([[DIFF_DELETE, 'xcd'], [DIFF_INSERT, '12x34']], diffs);
 
   // Backpass elimination.
-  diffs = [[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'xy'], [DIFF_INSERT, '34'], [DIFF_EQUAL, 'z'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '56']];
+  diffs = d32([[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'xy'], [DIFF_INSERT, '34'], [DIFF_EQUAL, 'z'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '56']]);
   dmp.diff_cleanupEfficiency(diffs);
   assertEquivalent([[DIFF_DELETE, 'abxyzcd'], [DIFF_INSERT, '12xy34z56']], diffs);
 
   // High cost elimination.
   dmp.Diff_EditCost = 5;
-  diffs = [[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'wxyz'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']];
+  diffs = d32([[DIFF_DELETE, 'ab'], [DIFF_INSERT, '12'], [DIFF_EQUAL, 'wxyz'], [DIFF_DELETE, 'cd'], [DIFF_INSERT, '34']]);
   dmp.diff_cleanupEfficiency(diffs);
   assertEquivalent([[DIFF_DELETE, 'abwxyzcd'], [DIFF_INSERT, '12wxyz34']], diffs);
   dmp.Diff_EditCost = 4;
@@ -413,12 +437,12 @@ function testDiffCleanupEfficiency() {
 function testDiffPrettyHtml() {
   // Pretty print.
   var diffs = [[DIFF_EQUAL, 'a\n'], [DIFF_DELETE, '<B>b</B>'], [DIFF_INSERT, 'c&d']];
-  assertEquals('<span>a&para;<br></span><del style="background:#ffe6e6;">&lt;B&gt;b&lt;/B&gt;</del><ins style="background:#e6ffe6;">c&amp;d</ins>', dmp.diff_prettyHtml(diffs));
+  assertEquals('<span>a&para;<br></span><del style="background:#ffe6e6;">&lt;B&gt;b&lt;/B&gt;</del><ins style="background:#e6ffe6;">c&amp;d</ins>', dmp.diff_prettyHtml(d32(diffs)));
 }
 
 function testDiffText() {
   // Compute the source and destination texts.
-  var diffs = [[DIFF_EQUAL, 'jump'], [DIFF_DELETE, 's'], [DIFF_INSERT, 'ed'], [DIFF_EQUAL, ' over '], [DIFF_DELETE, 'the'], [DIFF_INSERT, 'a'], [DIFF_EQUAL, ' lazy']];
+  var diffs = d32([[DIFF_EQUAL, 'jump'], [DIFF_DELETE, 's'], [DIFF_INSERT, 'ed'], [DIFF_EQUAL, ' over '], [DIFF_DELETE, 'the'], [DIFF_INSERT, 'a'], [DIFF_EQUAL, ' lazy']]);
   assertEquals('jumps over the lazy', dmp.diff_text1(diffs));
 
   assertEquals('jumped over a lazy', dmp.diff_text2(diffs));
@@ -426,7 +450,7 @@ function testDiffText() {
 
 function testDiffDelta() {
   // Convert a diff into delta string.
-  var diffs = [[DIFF_EQUAL, 'jump'], [DIFF_DELETE, 's'], [DIFF_INSERT, 'ed'], [DIFF_EQUAL, ' over '], [DIFF_DELETE, 'the'], [DIFF_INSERT, 'a'], [DIFF_EQUAL, ' lazy'], [DIFF_INSERT, 'old dog']];
+  var diffs = d32([[DIFF_EQUAL, 'jump'], [DIFF_DELETE, 's'], [DIFF_INSERT, 'ed'], [DIFF_EQUAL, ' over '], [DIFF_DELETE, 'the'], [DIFF_INSERT, 'a'], [DIFF_EQUAL, ' lazy'], [DIFF_INSERT, 'old dog']]);
   var text1 = dmp.diff_text1(diffs);
   assertEquals('jumps over the lazy', text1);
 
@@ -461,7 +485,7 @@ function testDiffDelta() {
   }
 
   // Test deltas with special characters.
-  diffs = [[DIFF_EQUAL, '\u0680 \x00 \t %'], [DIFF_DELETE, '\u0681 \x01 \n ^'], [DIFF_INSERT, '\u0682 \x02 \\ |']];
+  diffs = d32([[DIFF_EQUAL, '\u0680 \x00 \t %'], [DIFF_DELETE, '\u0681 \x01 \n ^'], [DIFF_INSERT, '\u0682 \x02 \\ |']]);
   text1 = dmp.diff_text1(diffs);
   assertEquals('\u0680 \x00 \t %\u0681 \x01 \n ^', text1);
 
@@ -472,7 +496,7 @@ function testDiffDelta() {
   assertEquivalent(diffs, dmp.diff_fromDelta(text1, delta));
 
   // Verify pool of unchanged characters.
-  diffs = [[DIFF_INSERT, 'A-Z a-z 0-9 - _ . ! ~ * \' ( ) ; / ? : @ & = + $ , # ']];
+  diffs = d32([[DIFF_INSERT, 'A-Z a-z 0-9 - _ . ! ~ * \' ( ) ; / ? : @ & = + $ , # ']]);
   var text2 = dmp.diff_text2(diffs);
   assertEquals('A-Z a-z 0-9 - _ . ! ~ * \' ( ) ; / ? : @ & = + $ , # ', text2);
 
@@ -486,19 +510,19 @@ function testDiffDelta() {
 function testDiffXIndex() {
   // Translate a location in text1 to text2.
   // Translation on equality.
-  assertEquals(5, dmp.diff_xIndex([[DIFF_DELETE, 'a'], [DIFF_INSERT, '1234'], [DIFF_EQUAL, 'xyz']], 2));
+  assertEquals(5, dmp.diff_xIndex(d32([[DIFF_DELETE, 'a'], [DIFF_INSERT, '1234'], [DIFF_EQUAL, 'xyz']]), 2));
 
   // Translation on deletion.
-  assertEquals(1, dmp.diff_xIndex([[DIFF_EQUAL, 'a'], [DIFF_DELETE, '1234'], [DIFF_EQUAL, 'xyz']], 3));
+  assertEquals(1, dmp.diff_xIndex(d32([[DIFF_EQUAL, 'a'], [DIFF_DELETE, '1234'], [DIFF_EQUAL, 'xyz']]), 3));
 }
 
 function testDiffLevenshtein() {
   // Levenshtein with trailing equality.
-  assertEquals(4, dmp.diff_levenshtein([[DIFF_DELETE, 'abc'], [DIFF_INSERT, '1234'], [DIFF_EQUAL, 'xyz']]));
+  assertEquals(4, dmp.diff_levenshtein(d32([[DIFF_DELETE, 'abc'], [DIFF_INSERT, '1234'], [DIFF_EQUAL, 'xyz']])));
   // Levenshtein with leading equality.
-  assertEquals(4, dmp.diff_levenshtein([[DIFF_EQUAL, 'xyz'], [DIFF_DELETE, 'abc'], [DIFF_INSERT, '1234']]));
+  assertEquals(4, dmp.diff_levenshtein(d32([[DIFF_EQUAL, 'xyz'], [DIFF_DELETE, 'abc'], [DIFF_INSERT, '1234']])));
   // Levenshtein with middle equality.
-  assertEquals(7, dmp.diff_levenshtein([[DIFF_DELETE, 'abc'], [DIFF_EQUAL, 'xyz'], [DIFF_INSERT, '1234']]));
+  assertEquals(7, dmp.diff_levenshtein(d32([[DIFF_DELETE, 'abc'], [DIFF_EQUAL, 'xyz'], [DIFF_INSERT, '1234']])));
 }
 
 function testDiffBisect() {
@@ -508,10 +532,10 @@ function testDiffBisect() {
   // Since the resulting diff hasn't been normalized, it would be ok if
   // the insertion and deletion pairs are swapped.
   // If the order changes, tweak this test as required.
-  assertEquivalent([[DIFF_DELETE, 'c'], [DIFF_INSERT, 'm'], [DIFF_EQUAL, 'a'], [DIFF_DELETE, 't'], [DIFF_INSERT, 'p']], dmp.diff_bisect_(a, b, Number.MAX_VALUE));
+  assertEquivalent([[DIFF_DELETE, 'c'], [DIFF_INSERT, 'm'], [DIFF_EQUAL, 'a'], [DIFF_DELETE, 't'], [DIFF_INSERT, 'p']], dmp.diff_bisect_(u32(a), u32(b), Number.MAX_VALUE));
 
   // Timeout.
-  assertEquivalent([[DIFF_DELETE, 'cat'], [DIFF_INSERT, 'map']], dmp.diff_bisect_(a, b, 0));
+  assertEquivalent([[DIFF_DELETE, 'cat'], [DIFF_INSERT, 'map']], dmp.diff_bisect_(u32(a), u32(b), 0));
 }
 
 function testDiffMain() {
@@ -624,44 +648,44 @@ function testMatchBitap() {
   dmp.Match_Distance = 100;
   dmp.Match_Threshold = 0.5;
   // Exact matches.
-  assertEquals(5, dmp.match_bitap_('abcdefghijk', 'fgh', 5));
+  assertEquals(5, dmp.match_bitap_(u32('abcdefghijk'), u32('fgh'), 5));
 
-  assertEquals(5, dmp.match_bitap_('abcdefghijk', 'fgh', 0));
+  assertEquals(5, dmp.match_bitap_(u32('abcdefghijk'), u32('fgh'), 0));
 
   // Fuzzy matches.
-  assertEquals(4, dmp.match_bitap_('abcdefghijk', 'efxhi', 0));
+  assertEquals(4, dmp.match_bitap_(u32('abcdefghijk'), u32('efxhi'), 0));
 
-  assertEquals(2, dmp.match_bitap_('abcdefghijk', 'cdefxyhijk', 5));
+  assertEquals(2, dmp.match_bitap_(u32('abcdefghijk'), u32('cdefxyhijk'), 5));
 
-  assertEquals(-1, dmp.match_bitap_('abcdefghijk', 'bxy', 1));
+  assertEquals(-1, dmp.match_bitap_(u32('abcdefghijk'), u32('bxy'), 1));
 
   // Overflow.
-  assertEquals(2, dmp.match_bitap_('123456789xx0', '3456789x0', 2));
+  assertEquals(2, dmp.match_bitap_(u32('123456789xx0'), u32('3456789x0'), 2));
 
   // Threshold test.
   dmp.Match_Threshold = 0.4;
-  assertEquals(4, dmp.match_bitap_('abcdefghijk', 'efxyhi', 1));
+  assertEquals(4, dmp.match_bitap_(u32('abcdefghijk'), u32('efxyhi'), 1));
 
   dmp.Match_Threshold = 0.3;
-  assertEquals(-1, dmp.match_bitap_('abcdefghijk', 'efxyhi', 1));
+  assertEquals(-1, dmp.match_bitap_(u32('abcdefghijk'), u32('efxyhi'), 1));
 
   dmp.Match_Threshold = 0.0;
-  assertEquals(1, dmp.match_bitap_('abcdefghijk', 'bcdef', 1));
+  assertEquals(1, dmp.match_bitap_(u32('abcdefghijk'), u32('bcdef'), 1));
   dmp.Match_Threshold = 0.5;
 
   // Multiple select.
-  assertEquals(0, dmp.match_bitap_('abcdexyzabcde', 'abccde', 3));
+  assertEquals(0, dmp.match_bitap_(u32('abcdexyzabcde'), u32('abccde'), 3));
 
-  assertEquals(8, dmp.match_bitap_('abcdexyzabcde', 'abccde', 5));
+  assertEquals(8, dmp.match_bitap_(u32('abcdexyzabcde'), u32('abccde'), 5));
 
   // Distance test.
   dmp.Match_Distance = 10;  // Strict location.
-  assertEquals(-1, dmp.match_bitap_('abcdefghijklmnopqrstuvwxyz', 'abcdefg', 24));
+  assertEquals(-1, dmp.match_bitap_(u32('abcdefghijklmnopqrstuvwxyz'), u32('abcdefg'), 24));
 
-  assertEquals(0, dmp.match_bitap_('abcdefghijklmnopqrstuvwxyz', 'abcdxxefg', 1));
+  assertEquals(0, dmp.match_bitap_(u32('abcdefghijklmnopqrstuvwxyz'), u32('abcdxxefg'), 1));
 
   dmp.Match_Distance = 1000;  // Loose location.
-  assertEquals(0, dmp.match_bitap_('abcdefghijklmnopqrstuvwxyz', 'abcdefg', 24));
+  assertEquals(0, dmp.match_bitap_(u32('abcdefghijklmnopqrstuvwxyz'), u32('abcdefg'), 24));
 }
 
 function testMatchMain() {
@@ -743,22 +767,22 @@ function testPatchToText() {
 function testPatchAddContext() {
   dmp.Patch_Margin = 4;
   var p = dmp.patch_fromText('@@ -21,4 +21,10 @@\n-jump\n+somersault\n')[0];
-  dmp.patch_addContext_(p, 'The quick brown fox jumps over the lazy dog.');
+  dmp.patch_addContext_(p, u32('The quick brown fox jumps over the lazy dog.'));
   assertEquals('@@ -17,12 +17,18 @@\n fox \n-jump\n+somersault\n s ov\n', p.toString());
 
   // Same, but not enough trailing context.
   p = dmp.patch_fromText('@@ -21,4 +21,10 @@\n-jump\n+somersault\n')[0];
-  dmp.patch_addContext_(p, 'The quick brown fox jumps.');
+  dmp.patch_addContext_(p, u32('The quick brown fox jumps.'));
   assertEquals('@@ -17,10 +17,16 @@\n fox \n-jump\n+somersault\n s.\n', p.toString());
 
   // Same, but not enough leading context.
   p = dmp.patch_fromText('@@ -3 +3,2 @@\n-e\n+at\n')[0];
-  dmp.patch_addContext_(p, 'The quick brown fox jumps.');
+  dmp.patch_addContext_(p, u32('The quick brown fox jumps.'));
   assertEquals('@@ -1,7 +1,8 @@\n Th\n-e\n+at\n  qui\n', p.toString());
 
   // Same, but with ambiguity.
   p = dmp.patch_fromText('@@ -3 +3,2 @@\n-e\n+at\n')[0];
-  dmp.patch_addContext_(p, 'The quick brown fox jumps.  The quick brown fox crashes.');
+  dmp.patch_addContext_(p, u32('The quick brown fox jumps.  The quick brown fox crashes.'));
   assertEquals('@@ -1,27 +1,28 @@\n Th\n-e\n+at\n  quick brown fox jumps. \n', p.toString());
 }
 
@@ -935,3 +959,37 @@ function testPatchApply() {
   results = dmp.patch_apply(patches, 'x');
   assertEquivalent(['x123', [true]], results);
 }
+
+function testUnicode() {
+  var cp1 = '\uD800\uDDE4'; // U+101E4 as a surrogate pair; cannot put directly in source file
+  var cp2 = '\uD800\uDDE5'; // U+101E5 as a surrogate pair; shares its high surrogate with cp1
+
+  // Basic diff: the shared suffix is 5 UTF-16 units long but only 4 code points.
+  assertEquals(4, dmp.diff_commonSuffix('a4' + cp1 + '21', 'b4' + cp1 + '21'));
+
+  // Diff across surrogate boundary: the shared high surrogate must not count as common.
+  assertEquals(1, dmp.diff_commonPrefix('a' + cp1 + 'b', 'a' + cp2 + 'b'));
+
+  // Half-match
+  // Internal API: Do utf32_string conversion manually
+  dmp.Diff_Timeout = 1;
+  assertEquivalent(['ab', 'cd', '12', '3', cp1 + cp2 + cp1 + cp2], dmp.diff_halfMatch_(diff_match_patch.utf32_string.from('ab' + cp1 + cp2 + cp1 + cp2 + 'cd'), diff_match_patch.utf32_string.from('12' + cp1 + cp2 + cp1 + cp2 + '3')));
+
+  // Baseline: a plain ASCII patch, for comparison with the supplemental cases below.
+  var patches = dmp.patch_make('', 'ab');
+  assertEquals('@@ -0,0 +1,2 @@\n+ab\n', dmp.patch_toText(patches));
+
+  // Basic supplemental characters patch with padding.
+  patches = dmp.patch_make('', cp1 + cp1);
+  assertEquals('@@ -0,0 +1,2 @@\n+%F0%90%87%A4%F0%90%87%A4\n', dmp.patch_toText(patches));
+  dmp.patch_addPadding(patches);
+  assertEquals('@@ -1,8 +1,10 @@\n %01%02%03%04\n+%F0%90%87%A4%F0%90%87%A4\n %01%02%03%04\n', dmp.patch_toText(patches));
+
+  // Basic supplemental characters with diff.
+  patches = dmp.patch_make(cp1 + 'a', cp1 + 'ab');
+  assertEquals('@@ -1,2 +1,3 @@\n %F0%90%87%A4a\n+b\n', dmp.patch_toText(patches));
+
+  // Do not break supplemental characters in half.
+  patches = dmp.patch_make(cp1 + cp1 + cp1 + cp1 + cp1 + 'a', cp1 + cp1 + cp1 + cp1 + cp1 + 'ab');
+  assertEquals('@@ -1,6 +1,7 @@\n %F0%90%87%A4%F0%90%87%A4%F0%90%87%A4%F0%90%87%A4%F0%90%87%A4a\n+b\n', dmp.patch_toText(patches));
+}

From 33dad201ec71bed630e24376bca33c8a3f41b8bd Mon Sep 17 00:00:00 2001
From: "Shane F. Carr" <shane.carr@wustl.edu>
Date: Tue, 22 May 2018 07:15:12 -0700
Subject: [PATCH 2/2] Reset test success/failure counters for each run.

---
 javascript/tests/diff_match_patch_test.html | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/javascript/tests/diff_match_patch_test.html b/javascript/tests/diff_match_patch_test.html
index 35af1a51..03a01282 100644
--- a/javascript/tests/diff_match_patch_test.html
+++ b/javascript/tests/diff_match_patch_test.html
@@ -79,6 +79,8 @@
       }
 
       function runTests(force_utf32_string) {
+        test_good = 0;
+        test_bad = 0;
         diff_match_patch.force_utf32_string = force_utf32_string;
         if (force_utf32_string) {
           document.write('<H2>Forced UTF-32 Strings</H2>');