123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285 |
- /*
- ==============================================================================
- This file is part of the juce_core module of the JUCE library.
- Copyright (c) 2015 - ROLI Ltd.
- Permission to use, copy, modify, and/or distribute this software for any purpose with
- or without fee is hereby granted, provided that the above copyright notice and this
- permission notice appear in all copies.
- THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD
- TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN
- NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
- DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER
- IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
- CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
- ------------------------------------------------------------------------------
- NOTE! This permissive ISC license applies ONLY to files within the juce_core module!
- All other JUCE modules are covered by a dual GPL/commercial license, so if you are
- using any other modules, be sure to check that you also comply with their license.
- For more details, visit www.juce.com
- ==============================================================================
- */
- struct TextDiffHelpers
- {
- enum { minLengthToMatch = 3,
- maxComplexity = 16 * 1024 * 1024 };
- struct StringRegion
- {
- StringRegion (const String& s) noexcept
- : text (s.getCharPointer()), start (0), length (s.length()) {}
- StringRegion (const String::CharPointerType t, int s, int len) noexcept
- : text (t), start (s), length (len) {}
- void incrementStart() noexcept { ++text; ++start; --length; }
- String::CharPointerType text;
- int start, length;
- };
- static void addInsertion (TextDiff& td, const String::CharPointerType text, int index, int length)
- {
- TextDiff::Change c;
- c.insertedText = String (text, (size_t) length);
- c.start = index;
- c.length = 0;
- td.changes.add (c);
- }
- static void addDeletion (TextDiff& td, int index, int length)
- {
- TextDiff::Change c;
- c.start = index;
- c.length = length;
- td.changes.add (c);
- }
- static void diffSkippingCommonStart (TextDiff& td, StringRegion a, StringRegion b)
- {
- for (;;)
- {
- const juce_wchar ca = *a.text;
- const juce_wchar cb = *b.text;
- if (ca != cb || ca == 0)
- break;
- a.incrementStart();
- b.incrementStart();
- }
- diffRecursively (td, a, b);
- }
- static void diffRecursively (TextDiff& td, StringRegion a, StringRegion b)
- {
- int indexA = 0, indexB = 0;
- const int len = findLongestCommonSubstring (a.text, a.length, indexA,
- b.text, b.length, indexB);
- if (len >= minLengthToMatch)
- {
- if (indexA > 0 && indexB > 0)
- diffSkippingCommonStart (td, StringRegion (a.text, a.start, indexA),
- StringRegion (b.text, b.start, indexB));
- else if (indexA > 0)
- addDeletion (td, b.start, indexA);
- else if (indexB > 0)
- addInsertion (td, b.text, b.start, indexB);
- diffRecursively (td, StringRegion (a.text + (indexA + len), a.start + indexA + len, a.length - indexA - len),
- StringRegion (b.text + (indexB + len), b.start + indexB + len, b.length - indexB - len));
- }
- else
- {
- if (a.length > 0) addDeletion (td, b.start, a.length);
- if (b.length > 0) addInsertion (td, b.text, b.start, b.length);
- }
- }
- static int findLongestCommonSubstring (String::CharPointerType a, const int lenA, int& indexInA,
- String::CharPointerType b, const int lenB, int& indexInB) noexcept
- {
- if (lenA == 0 || lenB == 0)
- return 0;
- if (lenA * lenB > maxComplexity)
- return findCommonSuffix (a, lenA, indexInA,
- b, lenB, indexInB);
- const size_t scratchSpace = sizeof (int) * (2 + 2 * (size_t) lenB);
- if (scratchSpace < 4096)
- {
- int* scratch = (int*) alloca (scratchSpace);
- return findLongestCommonSubstring (a, lenA, indexInA, b, lenB, indexInB, scratchSpace, scratch);
- }
- HeapBlock<int> scratch (scratchSpace);
- return findLongestCommonSubstring (a, lenA, indexInA, b, lenB, indexInB, scratchSpace, scratch);
- }
- static int findLongestCommonSubstring (String::CharPointerType a, const int lenA, int& indexInA,
- String::CharPointerType b, const int lenB, int& indexInB,
- const size_t scratchSpace, int* const lines) noexcept
- {
- zeromem (lines, scratchSpace);
- int* l0 = lines;
- int* l1 = l0 + lenB + 1;
- int loopsWithoutImprovement = 0;
- int bestLength = 0;
- for (int i = 0; i < lenA; ++i)
- {
- const juce_wchar ca = a.getAndAdvance();
- String::CharPointerType b2 (b);
- for (int j = 0; j < lenB; ++j)
- {
- if (ca != b2.getAndAdvance())
- {
- l1[j + 1] = 0;
- }
- else
- {
- const int len = l0[j] + 1;
- l1[j + 1] = len;
- if (len > bestLength)
- {
- loopsWithoutImprovement = 0;
- bestLength = len;
- indexInA = i;
- indexInB = j;
- }
- }
- }
- if (++loopsWithoutImprovement > 100)
- break;
- std::swap (l0, l1);
- }
- indexInA -= bestLength - 1;
- indexInB -= bestLength - 1;
- return bestLength;
- }
- static int findCommonSuffix (String::CharPointerType a, const int lenA, int& indexInA,
- String::CharPointerType b, const int lenB, int& indexInB) noexcept
- {
- int length = 0;
- a += lenA - 1;
- b += lenB - 1;
- while (length < lenA && length < lenB && *a == *b)
- {
- --a;
- --b;
- ++length;
- }
- indexInA = lenA - length;
- indexInB = lenB - length;
- return length;
- }
- };
- TextDiff::TextDiff (const String& original, const String& target)
- {
- TextDiffHelpers::diffSkippingCommonStart (*this, original, target);
- }
- String TextDiff::appliedTo (String text) const
- {
- for (int i = 0; i < changes.size(); ++i)
- text = changes.getReference(i).appliedTo (text);
- return text;
- }
- bool TextDiff::Change::isDeletion() const noexcept
- {
- return insertedText.isEmpty();
- }
- String TextDiff::Change::appliedTo (const String& text) const noexcept
- {
- return text.replaceSection (start, length, insertedText);
- }
- //==============================================================================
- //==============================================================================
- #if JUCE_UNIT_TESTS
- class DiffTests : public UnitTest
- {
- public:
- DiffTests() : UnitTest ("TextDiff class") {}
- static String createString (Random& r)
- {
- juce_wchar buffer[500] = { 0 };
- for (int i = r.nextInt (numElementsInArray (buffer) - 1); --i >= 0;)
- {
- if (r.nextInt (10) == 0)
- {
- do
- {
- buffer[i] = (juce_wchar) (1 + r.nextInt (0x10ffff - 1));
- }
- while (! CharPointer_UTF16::canRepresent (buffer[i]));
- }
- else
- buffer[i] = (juce_wchar) ('a' + r.nextInt (3));
- }
- return CharPointer_UTF32 (buffer);
- }
- void testDiff (const String& a, const String& b)
- {
- TextDiff diff (a, b);
- const String result (diff.appliedTo (a));
- expectEquals (result, b);
- }
- void runTest() override
- {
- beginTest ("TextDiff");
- Random r = getRandom();
- testDiff (String::empty, String::empty);
- testDiff ("x", String::empty);
- testDiff (String::empty, "x");
- testDiff ("x", "x");
- testDiff ("x", "y");
- testDiff ("xxx", "x");
- testDiff ("x", "xxx");
- for (int i = 1000; --i >= 0;)
- {
- String s (createString (r));
- testDiff (s, createString (r));
- testDiff (s + createString (r), s + createString (r));
- }
- }
- };
- static DiffTests diffTests;
- #endif
|