/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
* This file is part of the LibreOffice project.
*
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*
* This file incorporates work covered by the following license notice:
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed
* with this work for additional information regarding copyright
* ownership. The ASF licenses this file to you under the Apache
* License, Version 2.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
*/
#include <sal/config.h>
#include <rtl/ustrbuf.hxx>
#include <o3tl/safeint.hxx>
#include <osl/diagnose.h>
#include <rtl/character.hxx>
#include <swmodule.hxx>
#include <doc.hxx>
#include <IDocumentUndoRedo.hxx>
#include <DocumentContentOperationsManager.hxx>
#include <IDocumentRedlineAccess.hxx>
#include <IDocumentState.hxx>
#include <docary.hxx>
#include <pam.hxx>
#include <ndtxt.hxx>
#include <redline.hxx>
#include <UndoRedline.hxx>
#include <section.hxx>
#include <tox.hxx>
#include <docsh.hxx>
#include <fmtcntnt.hxx>
#include <modcfg.hxx>
#include <frameformats.hxx>
#include <com/sun/star/document/XDocumentPropertiesSupplier.hpp>
#include <com/sun/star/document/XDocumentProperties.hpp>
#include <com/sun/star/frame/XModel.hpp>
#include <cstddef>
#include <memory>
#include <type_traits>
#include <vector>
using namespace ::com::sun::star;
using std::vector;
namespace {
class SwCompareLine final
{
const SwNode* m_pNode;
public:
explicit SwCompareLine( const SwNode& rNd ) : m_pNode( &rNd ) {}
SwCompareLine() : m_pNode( nullptr ) {}
sal_uLong GetHashValue() const;
bool Compare( const SwCompareLine& rLine ) const;
static sal_uLong GetTextNodeHashValue( const SwTextNode& rNd, sal_uLong nVal );
static bool CompareNode( const SwNode& rDstNd, const SwNode& rSrcNd );
static bool CompareTextNd( const SwTextNode& rDstNd,
const SwTextNode& rSrcNd );
bool ChangesInLine( const SwCompareLine& rLine,
std::unique_ptr<SwPaM>& rpInsRing, std::unique_ptr<SwPaM>& rpDelRing ) const;
const SwNode& GetNode() const { return *m_pNode; }
const SwNode& GetEndNode() const;
// for debugging
OUString GetText() const;
};
class CompareData
{
protected:
SwDoc& m_rDoc;
private:
std::unique_ptr<size_t[]> m_pIndex;
std::unique_ptr<bool[]> m_pChangedFlag;
std::unique_ptr<SwPaM> m_pInsertRing, m_pDelRing;
static SwNodeOffset PrevIdx( const SwNode* pNd );
static SwNodeOffset NextIdx( const SwNode* pNd );
vector<SwCompareLine> m_aLines;
bool m_bRecordDiff;
// Truncate beginning and end and add all others to the LinesArray
void CheckRanges( CompareData& );
virtual const SwNode& GetEndOfContent() = 0;
public:
CompareData(SwDoc& rD, bool bRecordDiff)
: m_rDoc( rD )
, m_bRecordDiff(bRecordDiff)
{
}
virtual ~CompareData();
// Are there differences?
bool HasDiffs( const CompareData& rData ) const;
// Triggers the comparison and creation of two documents
void CompareLines( CompareData& rData );
// Display the differences - calls the methods ShowInsert and ShowDelete.
// These are passed the start and end line number.
// Displaying the actually content is to be handled by the subclass!
sal_uLong ShowDiffs( const CompareData& rData );
void ShowInsert( sal_uLong nStt, sal_uLong nEnd );
void ShowDelete( const CompareData& rData, sal_uLong nStt,
sal_uLong nEnd, sal_uLong nInsPos );
void CheckForChangesInLine( const CompareData& rData,
sal_uLong nStt, sal_uLong nEnd,
sal_uLong nThisStt, sal_uLong nThisEnd );
// Set non-ambiguous index for a line. Same lines have the same index, even in the other CompareData!
void SetIndex( size_t nLine, size_t nIndex );
size_t GetIndex( size_t nLine ) const
{ return nLine < m_aLines.size() ? m_pIndex[ nLine ] : 0; }
// Set/get of a line has changed
void SetChanged( size_t nLine, bool bFlag = true );
bool GetChanged( size_t nLine ) const
{
return (m_pChangedFlag && nLine < m_aLines.size())
&& m_pChangedFlag[ nLine ];
}
size_t GetLineCount() const { return m_aLines.size(); }
const SwCompareLine& GetLine( size_t nLine ) const
{ return m_aLines[ nLine ]; }
void InsertLine( SwCompareLine aLine )
{ m_aLines.push_back( aLine ); }
void SetRedlinesToDoc( bool bUseDocInfo );
};
class CompareMainText : public CompareData
{
public:
CompareMainText(SwDoc &rD, bool bRecordDiff)
: CompareData(rD, bRecordDiff)
{
}
virtual const SwNode& GetEndOfContent() override
{
return m_rDoc.GetNodes().GetEndOfContent();
}
};
class CompareFrameFormatText : public CompareData
{
const SwNodeIndex &m_rIndex;
public:
CompareFrameFormatText(SwDoc &rD, const SwNodeIndex &rIndex)
: CompareData(rD, true/*bRecordDiff*/)
, m_rIndex(rIndex)
{
}
virtual const SwNode& GetEndOfContent() override
{
return *m_rIndex.GetNode().EndOfSectionNode();
}
};
class Hash
{
struct HashData
{
sal_uLong nNext, nHash;
SwCompareLine aLine;
HashData()
: nNext( 0 ), nHash( 0 ) {}
};
std::unique_ptr<sal_uLong[]> m_pHashArr;
std::unique_ptr<HashData[]> m_pDataArr;
sal_uLong m_nCount, m_nPrime;
public:
explicit Hash( sal_uLong nSize );
void CalcHashValue( CompareData& rData );
sal_uLong GetCount() const { return m_nCount; }
};
class Compare
{
public:
class MovedData
{
std::unique_ptr<sal_uLong[]> m_pIndex;
std::unique_ptr<sal_uLong[]> m_pLineNum;
sal_uLong m_nCount;
public:
MovedData( CompareData& rData, const char* pDiscard );
sal_uLong GetIndex( sal_uLong n ) const { return m_pIndex[ n ]; }
sal_uLong GetLineNum( sal_uLong n ) const { return m_pLineNum[ n ]; }
sal_uLong GetCount() const { return m_nCount; }
};
private:
/// Look for the moved lines
class CompareSequence
{
CompareData &m_rData1, &m_rData2;
const MovedData &m_rMoved1, &m_rMoved2;
std::unique_ptr<tools::Long[]> m_pMemory;
tools::Long *m_pFDiag, *m_pBDiag;
void Compare( sal_uLong nStt1, sal_uLong nEnd1, sal_uLong nStt2, sal_uLong nEnd2 );
sal_uLong CheckDiag( sal_uLong nStt1, sal_uLong nEnd1,
sal_uLong nStt2, sal_uLong nEnd2, sal_uLong* pCost );
public:
CompareSequence( CompareData& rD1, CompareData& rD2,
const MovedData& rMD1, const MovedData& rMD2 );
};
static void CountDifference( const CompareData& rData, sal_uLong* pCounts );
static void SetDiscard( const CompareData& rData,
char* pDiscard, const sal_uLong* pCounts );
static void CheckDiscard( size_t nLen, char* pDiscard );
static void ShiftBoundaries( CompareData& rData1, CompareData& rData2 );
public:
Compare( sal_uLong nDiff, CompareData& rData1, CompareData& rData2 );
};
class ArrayComparator
{
public:
virtual bool Compare( int nIdx1, int nIdx2 ) const = 0;
virtual int GetLen1() const = 0;
virtual int GetLen2() const = 0;
virtual ~ArrayComparator() {}
};
/// Consider two lines equal if similar enough (e.g. look like different
/// versions of the same paragraph)
class LineArrayComparator : public ArrayComparator
{
private:
int m_nLen1, m_nLen2;
const CompareData &m_rData1, &m_rData2;
int m_nFirst1, m_nFirst2;
public:
LineArrayComparator( const CompareData &rD1, const CompareData &rD2,
int nStt1, int nEnd1, int nStt2, int nEnd2 );
virtual bool Compare( int nIdx1, int nIdx2 ) const override;
virtual int GetLen1() const override { return m_nLen1; }
virtual int GetLen2() const override { return m_nLen2; }
};
class WordArrayComparator : public ArrayComparator
{
private:
const SwTextNode *m_pTextNode1, *m_pTextNode2;
std::unique_ptr<int[]> m_pPos1, m_pPos2;
int m_nCount1, m_nCount2; // number of words
static void CalcPositions( int *pPos, const SwTextNode *pTextNd, int &nCnt );
public:
WordArrayComparator( const SwTextNode *pNode1, const SwTextNode *pNode2 );
virtual bool Compare( int nIdx1, int nIdx2 ) const override;
virtual int GetLen1() const override { return m_nCount1; }
virtual int GetLen2() const override { return m_nCount2; }
int GetCharSequence( const int *pWordLcs1, const int *pWordLcs2,
int *pSubseq1, int *pSubseq2, int nLcsLen );
};
class CharArrayComparator : public ArrayComparator
{
private:
const SwTextNode *m_pTextNode1, *m_pTextNode2;
public:
CharArrayComparator( const SwTextNode *pNode1, const SwTextNode *pNode2 )
: m_pTextNode1( pNode1 ), m_pTextNode2( pNode2 )
{
}
virtual bool Compare( int nIdx1, int nIdx2 ) const override;
virtual int GetLen1() const override { return m_pTextNode1->GetText().getLength(); }
virtual int GetLen2() const override { return m_pTextNode2->GetText().getLength(); }
};
/// Options set in Tools->Options->Writer->Comparison
struct CmpOptionsContainer
{
SwCompareMode eCmpMode;
int nIgnoreLen;
bool bUseRsid;
};
}
static CmpOptionsContainer CmpOptions;
namespace {
class CommonSubseq
{
private:
std::unique_ptr<int[]> m_pData;
protected:
ArrayComparator &m_rComparator;
CommonSubseq( ArrayComparator &rComparator, int nMaxSize )
: m_rComparator( rComparator )
{
m_pData.reset( new int[ nMaxSize ] );
}
int FindLCS( int *pLcs1, int *pLcs2, int nStt1,
int nEnd1, int nStt2, int nEnd2 );
public:
static int IgnoreIsolatedPieces( int *pLcs1, int *pLcs2, int nLen1, int nLen2,
int nLcsLen, int nPieceLen );
};
/// Use Hirschberg's algorithm to find LCS in linear space
class LgstCommonSubseq: public CommonSubseq
{
private:
static const int CUTOFF = 1<<20; // Stop recursion at this value
std::unique_ptr<int[]> m_pL1, m_pL2;
std::unique_ptr<int[]> m_pBuff1, m_pBuff2;
void FindL( int *pL, int nStt1, int nEnd1, int nStt2, int nEnd2 );
int HirschbergLCS( int *pLcs1, int *pLcs2, int nStt1, int nEnd1,
int nStt2, int nEnd2 );
public:
explicit LgstCommonSubseq( ArrayComparator &rComparator );
int Find( int *pSubseq1, int *pSubseq2 );
};
/// Find a common subsequence in linear time
class FastCommonSubseq: private CommonSubseq
{
private:
static const int CUTOFF = 2056;
int FindFastCS( int *pSeq1, int *pSeq2, int nStt1, int nEnd1,
int nStt2, int nEnd2 );
public:
explicit FastCommonSubseq( ArrayComparator &rComparator )
: CommonSubseq( rComparator, CUTOFF )
{
}
int Find( int *pSubseq1, int *pSubseq2 )
{
return FindFastCS( pSubseq1, pSubseq2, 0, m_rComparator.GetLen1(),
0, m_rComparator.GetLen2() );
}
};
}
CompareData::~CompareData()
{
if( m_pDelRing )
{
while( m_pDelRing->GetNext() != m_pDelRing.get() )
delete m_pDelRing->GetNext();
m_pDelRing.reset();
}
if( m_pInsertRing )
{
while( m_pInsertRing->GetNext() != m_pInsertRing.get() )
delete m_pInsertRing->GetNext();
m_pInsertRing.reset();
}
}
void CompareData::SetIndex( size_t nLine, size_t nIndex )
{
if( !m_pIndex )
{
m_pIndex.reset( new size_t[ m_aLines.size() ] );
memset( m_pIndex.get(), 0, m_aLines.size() * sizeof( size_t ) );
}
if( nLine < m_aLines.size() )
m_pIndex[ nLine ] = nIndex;
}
void CompareData::SetChanged( size_t nLine, bool bFlag )
{
if( !m_pChangedFlag )
{
m_pChangedFlag.reset( new bool[ m_aLines.size() +1 ] );
memset( m_pChangedFlag.get(), 0, (m_aLines.size() +1) * sizeof( bool ) );
}
if( nLine < m_aLines.size() )
m_pChangedFlag[ nLine ] = bFlag;
}
void CompareData::CompareLines( CompareData& rData )
{
CheckRanges( rData );
sal_uLong nDifferent;
{
Hash aH( GetLineCount() + rData.GetLineCount() + 1 );
aH.CalcHashValue( *this );
aH.CalcHashValue( rData );
nDifferent = aH.GetCount();
}
{
Compare aComp( nDifferent, *this, rData );
}
}
sal_uLong CompareData::ShowDiffs( const CompareData& rData )
{
sal_uLong nLen1 = rData.GetLineCount(), nLen2 = GetLineCount();
sal_uLong nStt1 = 0, nStt2 = 0;
sal_uLong nCnt = 0;
while( nStt1 < nLen1 || nStt2 < nLen2 )
{
if( rData.GetChanged( nStt1 ) || GetChanged( nStt2 ) )
{
// Find a region of different lines between two pairs of identical
// lines.
sal_uLong nSav1 = nStt1, nSav2 = nStt2;
while( nStt1 < nLen1 && rData.GetChanged( nStt1 )) ++nStt1;
while( nStt2 < nLen2 && GetChanged( nStt2 )) ++nStt2;
if (m_bRecordDiff)
{
// Check if there are changed lines (only slightly different) and
// compare them in detail.
CheckForChangesInLine( rData, nSav1, nStt1, nSav2, nStt2 );
}
++nCnt;
}
++nStt1;
++nStt2;
}
return nCnt;
}
bool CompareData::HasDiffs( const CompareData& rData ) const
{
bool bRet = false;
sal_uLong nLen1 = rData.GetLineCount(), nLen2 = GetLineCount();
sal_uLong nStt1 = 0, nStt2 = 0;
while( nStt1 < nLen1 || nStt2 < nLen2 )
{
if( rData.GetChanged( nStt1 ) || GetChanged( nStt2 ) )
{
bRet = true;
break;
}
++nStt1;
++nStt2;
}
return bRet;
}
Hash::Hash( sal_uLong nSize )
: m_nCount(1)
{
static const sal_uLong primes[] =
{
509,
1021,
2039,
4093,
8191,
16381,
32749,
65521,
131071,
262139,
524287,
1048573,
2097143,
4194301,
8388593,
16777213,
33554393,
67108859, /* Preposterously large . . . */
134217689,
268435399,
536870909,
1073741789,
2147483647,
0
};
int i;
m_pDataArr.reset( new HashData[ nSize ] );
m_pDataArr[0].nNext = 0;
m_pDataArr[0].nHash = 0;
m_nPrime = primes[0];
for( i = 0; primes[i] < nSize / 3; i++)
if( !primes[i] )
{
m_pHashArr = nullptr;
return;
}
m_nPrime = primes[ i ];
m_pHashArr.reset( new sal_uLong[ m_nPrime ] );
memset( m_pHashArr.get(), 0, m_nPrime * sizeof( sal_uLong ) );
}
void Hash::CalcHashValue( CompareData& rData )
{
if( !m_pHashArr )
return;
for( size_t n = 0; n < rData.GetLineCount(); ++n )
{
const SwCompareLine aLine = rData.GetLine( n );
sal_uLong nH = aLine.GetHashValue();
sal_uLong* pFound = &m_pHashArr[ nH % m_nPrime ];
size_t i;
for( i = *pFound; ; i = m_pDataArr[i].nNext )
if( !i )
{
i = m_nCount++;
m_pDataArr[i].nNext = *pFound;
m_pDataArr[i].nHash = nH;
m_pDataArr[i].aLine = aLine;
*pFound = i;
break;
}
else if( m_pDataArr[i].nHash == nH &&
m_pDataArr[i].aLine.Compare( aLine ))
break;
rData.SetIndex( n, i );
}
}
Compare::Compare( sal_uLong nDiff, CompareData& rData1, CompareData& rData2 )
{
std::unique_ptr<MovedData> pMD1, pMD2;
// Look for the differing lines
{
std::unique_ptr<char[]> pDiscard1( new char[ rData1.GetLineCount() ] );
std::unique_ptr<char[]> pDiscard2( new char[ rData2.GetLineCount() ] );
std::unique_ptr<sal_uLong[]> pCount1(new sal_uLong[ nDiff ]);
std::unique_ptr<sal_uLong[]> pCount2(new sal_uLong[ nDiff ]);
memset( pCount1.get(), 0, nDiff * sizeof( sal_uLong ));
memset( pCount2.get(), 0, nDiff * sizeof( sal_uLong ));
// find indices in CompareData which have been assigned multiple times
CountDifference( rData1, pCount1.get() );
CountDifference( rData2, pCount2.get() );
// All which occur only once now have either been inserted or deleted.
// All which are also contained in the other one have been moved.
SetDiscard( rData1, pDiscard1.get(), pCount2.get() );
SetDiscard( rData2, pDiscard2.get(), pCount1.get() );
CheckDiscard( rData1.GetLineCount(), pDiscard1.get() );
CheckDiscard( rData2.GetLineCount(), pDiscard2.get() );
pMD1.reset(new MovedData( rData1, pDiscard1.get() ));
pMD2.reset(new MovedData( rData2, pDiscard2.get() ));
}
{
CompareSequence aTmp( rData1, rData2, *pMD1, *pMD2 );
}
ShiftBoundaries( rData1, rData2 );
}
void Compare::CountDifference( const CompareData& rData, sal_uLong* pCounts )
{
sal_uLong nLen = rData.GetLineCount();
for( sal_uLong n = 0; n < nLen; ++n )
{
sal_uLong nIdx = rData.GetIndex( n );
++pCounts[ nIdx ];
}
}
void Compare::SetDiscard( const CompareData& rData,
char* pDiscard, const sal_uLong* pCounts )
{
const sal_uLong nLen = rData.GetLineCount();
// calculate Max with respect to the line count
sal_uLong nMax = 5;
for( sal_uLong n = nLen / 64; ( n = n >> 2 ) > 0; )
nMax <<= 1;
for( sal_uLong n = 0; n < nLen; ++n )
{
sal_uLong nIdx = rData.GetIndex( n );
if( nIdx )
{
nIdx = pCounts[ nIdx ];
pDiscard[ n ] = !nIdx ? 1 : nIdx > nMax ? 2 : 0;
}
else
pDiscard[ n ] = 0;
}
}
void Compare::CheckDiscard( size_t nLen, char* pDiscard )
{
for( size_t n = 0; n < nLen; ++n )
{
if( 2 == pDiscard[ n ] )
pDiscard[n] = 0;
else if( pDiscard[ n ] )
{
size_t j;
size_t length;
size_t provisional = 0;
/* Find end of this run of discardable lines.
Count how many are provisionally discardable. */
for (j = n; j < nLen; j++)
{
if( !pDiscard[j] )
break;
if( 2 == pDiscard[j] )
++provisional;
}
/* Cancel provisional discards at end, and shrink the run. */
while( j > n && 2 == pDiscard[j - 1] )
{
pDiscard[ --j ] = 0;
--provisional;
}
/* Now we have the length of a run of discardable lines
whose first and last are not provisional. */
length = j - n;
/* If 1/4 of the lines in the run are provisional,
cancel discarding of all provisional lines in the run. */
if (provisional * 4 > length)
{
while (j > n)
if (pDiscard[--j] == 2)
pDiscard[j] = 0;
}
else
{
size_t consec;
size_t minimum = 1;
size_t tem = length / 4;
/* MINIMUM is approximate square root of LENGTH/4.
A subrun of two or more provisionals can stand
when LENGTH is at least 16.
A subrun of 4 or more can stand when LENGTH >= 64. */
while ((tem = tem >> 2) > 0)
minimum *= 2;
minimum++;
/* Cancel any subrun of MINIMUM or more provisionals
within the larger run. */
for (j = 0, consec = 0; j < length; j++)
if (pDiscard[n + j] != 2)
consec = 0;
else if (minimum == ++consec)
/* Back up to start of subrun, to cancel it all. */
j -= consec;
else if (minimum < consec)
pDiscard[n + j] = 0;
/* Scan from beginning of run
until we find 3 or more nonprovisionals in a row
or until the first nonprovisional at least 8 lines in.
Until that point, cancel any provisionals. */
for (j = 0, consec = 0; j < length; j++)
{
if (j >= 8 && pDiscard[n + j] == 1)
break;
if (pDiscard[n + j] == 2)
{
consec = 0;
pDiscard[n + j] = 0;
}
else if (pDiscard[n + j] == 0)
consec = 0;
else
consec++;
if (consec == 3)
break;
}
/* I advances to the last line of the run. */
n += length - 1;
/* Same thing, from end. */
for (j = 0, consec = 0; j < length; j++)
{
if (j >= 8 && pDiscard[n - j] == 1)
break;
if (pDiscard[n - j] == 2)
{
consec = 0;
pDiscard[n - j] = 0;
}
else if (pDiscard[n - j] == 0)
consec = 0;
else
consec++;
if (consec == 3)
break;
}
}
}
}
}
Compare::MovedData::MovedData( CompareData& rData, const char* pDiscard )
: m_nCount( 0 )
{
sal_uLong nLen = rData.GetLineCount();
sal_uLong n;
for( n = 0; n < nLen; ++n )
if( pDiscard[ n ] )
rData.SetChanged( n );
else
++m_nCount;
if( m_nCount )
{
m_pIndex.reset( new sal_uLong[ m_nCount ] );
m_pLineNum.reset( new sal_uLong[ m_nCount ] );
for( n = 0, m_nCount = 0; n < nLen; ++n )
if( !pDiscard[ n ] )
{
m_pIndex[ m_nCount ] = rData.GetIndex( n );
m_pLineNum[ m_nCount++ ] = n;
}
}
}
/// Find the differing lines
Compare::CompareSequence::CompareSequence(
CompareData& rD1, CompareData& rD2,
const MovedData& rMD1, const MovedData& rMD2 )
: m_rData1( rD1 ), m_rData2( rD2 ), m_rMoved1( rMD1 ), m_rMoved2( rMD2 )
{
sal_uLong nSize = rMD1.GetCount() + rMD2.GetCount() + 3;
m_pMemory.reset( new tools::Long[ nSize * 2 ] );
m_pFDiag = m_pMemory.get() + ( rMD2.GetCount() + 1 );
m_pBDiag = m_pMemory.get() + ( nSize + rMD2.GetCount() + 1 );
Compare( 0, rMD1.GetCount(), 0, rMD2.GetCount() );
}
void Compare::CompareSequence::Compare( sal_uLong nStt1, sal_uLong nEnd1,
sal_uLong nStt2, sal_uLong nEnd2 )
{
/* Slide down the bottom initial diagonal. */
while( nStt1 < nEnd1 && nStt2 < nEnd2 &&
m_rMoved1.GetIndex( nStt1 ) == m_rMoved2.GetIndex( nStt2 ))
{
++nStt1;
++nStt2;
}
/* Slide up the top initial diagonal. */
while( nEnd1 > nStt1 && nEnd2 > nStt2 &&
m_rMoved1.GetIndex( nEnd1 - 1 ) == m_rMoved2.GetIndex( nEnd2 - 1 ))
{
--nEnd1;
--nEnd2;
}
/* Handle simple cases. */
if( nStt1 == nEnd1 )
while( nStt2 < nEnd2 )
m_rData2.SetChanged( m_rMoved2.GetLineNum( nStt2++ ));
else if (nStt2 == nEnd2)
while (nStt1 < nEnd1)
m_rData1.SetChanged( m_rMoved1.GetLineNum( nStt1++ ));
else
{
sal_uLong c, d, b;
/* Find a point of correspondence in the middle of the files. */
d = CheckDiag( nStt1, nEnd1, nStt2, nEnd2, &c );
b = m_pBDiag[ std::make_signed_t<decltype(d)>(d) ];
if( 1 != c )
{
/* Use that point to split this problem into two subproblems. */
Compare( nStt1, b, nStt2, b - d );
/* This used to use f instead of b,
but that is incorrect!
It is not necessarily the case that diagonal d
has a snake from b to f. */
Compare( b, nEnd1, b - d, nEnd2 );
}
}
}
sal_uLong Compare::CompareSequence::CheckDiag( sal_uLong nStt1, sal_uLong nEnd1,
sal_uLong nStt2, sal_uLong nEnd2, sal_uLong* pCost )
{
const tools::Long dmin = nStt1 - nEnd2; /* Minimum valid diagonal. */
const tools::Long dmax = nEnd1 - nStt2; /* Maximum valid diagonal. */
const tools::Long fmid = nStt1 - nStt2; /* Center diagonal of top-down search. */
const tools::Long bmid = nEnd1 - nEnd2; /* Center diagonal of bottom-up search. */
tools::Long fmin = fmid, fmax = fmid; /* Limits of top-down search. */
tools::Long bmin = bmid, bmax = bmid; /* Limits of bottom-up search. */
tools::Long c; /* Cost. */
tools::Long odd = (fmid - bmid) & 1; /* True if southeast corner is on an odd
diagonal with respect to the northwest. */
m_pFDiag[fmid] = nStt1;
m_pBDiag[bmid] = nEnd1;
for (c = 1;; ++c)
{
tools::Long d; /* Active diagonal. */
/* Extend the top-down search by an edit step in each diagonal. */
if (fmin > dmin)
m_pFDiag[--fmin - 1] = -1;
else
++fmin;
if (fmax < dmax)
m_pFDiag[++fmax + 1] = -1;
else
--fmax;
for (d = fmax; d >= fmin; d -= 2)
{
tools::Long x, y, tlo = m_pFDiag[d - 1], thi = m_pFDiag[d + 1];
if (tlo >= thi)
x = tlo + 1;
else
x = thi;
y = x - d;
while( o3tl::make_unsigned(x) < nEnd1 && o3tl::make_unsigned(y) < nEnd2 &&
m_rMoved1.GetIndex( x ) == m_rMoved2.GetIndex( y ))
{
++x;
++y;
}
m_pFDiag[d] = x;
if( odd && bmin <= d && d <= bmax && m_pBDiag[d] <= m_pFDiag[d] )
{
*pCost = 2 * c - 1;
return d;
}
}
/* Similar extend the bottom-up search. */
if (bmin > dmin)
m_pBDiag[--bmin - 1] = INT_MAX;
else
++bmin;
if (bmax < dmax)
m_pBDiag[++bmax + 1] = INT_MAX;
else
--bmax;
for (d = bmax; d >= bmin; d -= 2)
{
tools::Long x, y, tlo = m_pBDiag[d - 1], thi = m_pBDiag[d + 1];
if (tlo < thi)
x = tlo;
else
x = thi - 1;
y = x - d;
while( o3tl::make_unsigned(x) > nStt1 && o3tl::make_unsigned(y) > nStt2 &&
m_rMoved1.GetIndex( x - 1 ) == m_rMoved2.GetIndex( y - 1 ))
{
--x;
--y;
}
m_pBDiag[d] = x;
if (!odd && fmin <= d && d <= fmax && m_pBDiag[d] <= m_pFDiag[d])
{
*pCost = 2 * c;
return d;
}
}
}
}
namespace
{
void lcl_ShiftBoundariesOneway( CompareData* const pData, CompareData const * const pOtherData)
{
sal_uLong i = 0;
sal_uLong j = 0;
sal_uLong i_end = pData->GetLineCount();
sal_uLong preceding = ULONG_MAX;
sal_uLong other_preceding = ULONG_MAX;
while (true)
{
sal_uLong start, other_start;
/* Scan forwards to find beginning of another run of changes.
Also keep track of the corresponding point in the other file. */
while( i < i_end && !pData->GetChanged( i ) )
{
while( pOtherData->GetChanged( j++ ))
/* Non-corresponding lines in the other file
will count as the preceding batch of changes. */
other_preceding = j;
i++;
}
if (i == i_end)
break;
start = i;
other_start = j;
while (true)
{
/* Now find the end of this run of changes. */
while( pData->GetChanged( ++i ))
;
/* If the first changed line matches the following unchanged one,
and this run does not follow right after a previous run,
and there are no lines deleted from the other file here,
then classify the first changed line as unchanged
and the following line as changed in its place. */
/* You might ask, how could this run follow right after another?
Only because the previous run was shifted here. */
if( i != i_end &&
pData->GetIndex( start ) == pData->GetIndex( i ) &&
!pOtherData->GetChanged( j ) &&
start != preceding && other_start != other_preceding )
{
pData->SetChanged( start++, false );
pData->SetChanged( i );
/* Since one line-that-matches is now before this run
instead of after, we must advance in the other file
to keep in sync. */
++j;
}
else
break;
}
preceding = i;
other_preceding = j;
}
}
}
void Compare::ShiftBoundaries( CompareData& rData1, CompareData& rData2 )
{
lcl_ShiftBoundariesOneway(&rData1, &rData2);
lcl_ShiftBoundariesOneway(&rData2, &rData1);
}
sal_uLong SwCompareLine::GetHashValue() const
{
sal_uLong nRet = 0;
switch( m_pNode->GetNodeType() )
{
case SwNodeType::Text:
nRet = GetTextNodeHashValue( *m_pNode->GetTextNode(), nRet );
break;
case SwNodeType::Table:
{
const SwNode* pEndNd = m_pNode->EndOfSectionNode();
SwNodeIndex aIdx( *m_pNode );
while( &aIdx.GetNode() != pEndNd )
{
if( aIdx.GetNode().IsTextNode() )
nRet = GetTextNodeHashValue( *aIdx.GetNode().GetTextNode(), nRet );
++aIdx;
}
}
break;
case SwNodeType::Section:
{
OUString sStr( GetText() );
for( sal_Int32 n = 0; n < sStr.getLength(); ++n )
nRet = (nRet << 1) + sStr[ n ];
}
break;
case SwNodeType::Grf:
case SwNodeType::Ole:
// Fixed ID? Should never occur ...
break;
default: break;
}
return nRet;
}
const SwNode& SwCompareLine::GetEndNode() const
{
const SwNode* pNd = m_pNode;
switch( m_pNode->GetNodeType() )
{
case SwNodeType::Table:
pNd = m_pNode->EndOfSectionNode();
break;
case SwNodeType::Section:
{
const SwSectionNode& rSNd = static_cast<const SwSectionNode&>(*m_pNode);
const SwSection& rSect = rSNd.GetSection();
if( SectionType::Content != rSect.GetType() || rSect.IsProtect() )
pNd = m_pNode->EndOfSectionNode();
}
break;
default: break;
}
return *pNd;
}
bool SwCompareLine::Compare( const SwCompareLine& rLine ) const
{
return CompareNode( *m_pNode, *rLine.m_pNode );
}
namespace
{
OUString SimpleTableToText(const SwNode &rNode)
{
OUStringBuffer sRet;
const SwNode* pEndNd = rNode.EndOfSectionNode();
SwNodeIndex aIdx( rNode );
while (&aIdx.GetNode() != pEndNd)
{
if (aIdx.GetNode().IsTextNode())
{
if (sRet.getLength())
{
sRet.append( '\n' );
}
sRet.append( aIdx.GetNode().GetTextNode()->GetExpandText(nullptr) );
}
++aIdx;
}
return sRet.makeStringAndClear();
}
}
bool SwCompareLine::CompareNode( const SwNode& rDstNd, const SwNode& rSrcNd )
{
if( rSrcNd.GetNodeType() != rDstNd.GetNodeType() )
return false;
bool bRet = false;
switch( rDstNd.GetNodeType() )
{
case SwNodeType::Text:
bRet = CompareTextNd( *rDstNd.GetTextNode(), *rSrcNd.GetTextNode() )
&& ( !CmpOptions.bUseRsid || rDstNd.GetTextNode()->CompareParRsid( *rSrcNd.GetTextNode() ) );
break;
case SwNodeType::Table:
{
const SwTableNode& rTSrcNd = static_cast<const SwTableNode&>(rSrcNd);
const SwTableNode& rTDstNd = static_cast<const SwTableNode&>(rDstNd);
bRet = ( rTSrcNd.EndOfSectionIndex() - rTSrcNd.GetIndex() ) ==
( rTDstNd.EndOfSectionIndex() - rTDstNd.GetIndex() );
// --> #i107826#: compare actual table content
if (bRet)
{
bRet = (SimpleTableToText(rSrcNd) == SimpleTableToText(rDstNd));
}
}
break;
case SwNodeType::Section:
{
const SwSectionNode& rSSrcNd = static_cast<const SwSectionNode&>(rSrcNd),
& rSDstNd = static_cast<const SwSectionNode&>(rDstNd);
const SwSection& rSrcSect = rSSrcNd.GetSection(),
& rDstSect = rSDstNd.GetSection();
SectionType eSrcSectType = rSrcSect.GetType(),
eDstSectType = rDstSect.GetType();
switch( eSrcSectType )
{
case SectionType::Content:
bRet = SectionType::Content == eDstSectType &&
rSrcSect.IsProtect() == rDstSect.IsProtect();
if( bRet && rSrcSect.IsProtect() )
{
// the only have they both the same size
bRet = ( rSSrcNd.EndOfSectionIndex() - rSSrcNd.GetIndex() ) ==
( rSDstNd.EndOfSectionIndex() - rSDstNd.GetIndex() );
}
break;
case SectionType::ToxHeader:
case SectionType::ToxContent:
if( SectionType::ToxHeader == eDstSectType ||
SectionType::ToxContent == eDstSectType )
{
// the same type of TOX?
const SwTOXBase* pSrcTOX = rSrcSect.GetTOXBase();
const SwTOXBase* pDstTOX = rDstSect.GetTOXBase();
bRet = pSrcTOX && pDstTOX
&& pSrcTOX->GetType() == pDstTOX->GetType()
&& pSrcTOX->GetTitle() == pDstTOX->GetTitle()
&& pSrcTOX->GetTypeName() == pDstTOX->GetTypeName()
;
}
break;
case SectionType::DdeLink:
case SectionType::FileLink:
bRet = eSrcSectType == eDstSectType &&
rSrcSect.GetLinkFileName() ==
rDstSect.GetLinkFileName();
break;
}
}
break;
case SwNodeType::End:
bRet = rSrcNd.StartOfSectionNode()->GetNodeType() ==
rDstNd.StartOfSectionNode()->GetNodeType();
// --> #i107826#: compare actual table content
if (bRet && rSrcNd.StartOfSectionNode()->GetNodeType() == SwNodeType::Table)
{
bRet = CompareNode(
*rSrcNd.StartOfSectionNode(), *rDstNd.StartOfSectionNode());
}
break;
default: break;
}
return bRet;
}
OUString SwCompareLine::GetText() const
{
OUString sRet;
switch( m_pNode->GetNodeType() )
{
case SwNodeType::Text:
sRet = m_pNode->GetTextNode()->GetExpandText(nullptr);
break;
case SwNodeType::Table:
{
sRet = "Tabelle: " + SimpleTableToText(*m_pNode);
}
break;
case SwNodeType::Section:
{
sRet = "Section - Node:";
const SwSectionNode& rSNd = static_cast<const SwSectionNode&>(*m_pNode);
const SwSection& rSect = rSNd.GetSection();
switch( rSect.GetType() )
{
case SectionType::Content:
if( rSect.IsProtect() )
sRet += OUString::number(
sal_Int32(rSNd.EndOfSectionIndex() - rSNd.GetIndex()) );
break;
case SectionType::ToxHeader:
case SectionType::ToxContent:
{
const SwTOXBase* pTOX = rSect.GetTOXBase();
if( pTOX )
sRet += pTOX->GetTitle() + pTOX->GetTypeName() +
OUString::number(pTOX->GetType());
}
break;
case SectionType::DdeLink:
case SectionType::FileLink:
sRet += rSect.GetLinkFileName();
break;
}
}
break;
case SwNodeType::Grf:
sRet = "Grafik - Node:";
break;
case SwNodeType::Ole:
sRet = "OLE - Node:";
break;
default: break;
}
return sRet;
}
sal_uLong SwCompareLine::GetTextNodeHashValue( const SwTextNode& rNd, sal_uLong nVal )
{
OUString sStr( rNd.GetExpandText(nullptr) );
for( sal_Int32 n = 0; n < sStr.getLength(); ++n )
nVal = (nVal << 1 ) + sStr[ n ];
return nVal;
}
bool SwCompareLine::CompareTextNd( const SwTextNode& rDstNd,
const SwTextNode& rSrcNd )
{
bool bRet = false;
// Very simple at first
if( rDstNd.GetText() == rSrcNd.GetText() )
{
// The text is the same, but are the "special attributes" (0xFF) also the same?
bRet = true;
}
return bRet;
}
bool SwCompareLine::ChangesInLine( const SwCompareLine& rLine,
std::unique_ptr<SwPaM>& rpInsRing, std::unique_ptr<SwPaM>& rpDelRing ) const
{
bool bRet = false;
// Only compare textnodes
if( SwNodeType::Text == m_pNode->GetNodeType() &&
SwNodeType::Text == rLine.GetNode().GetNodeType() )
{
SwTextNode& rDstNd = *const_cast<SwTextNode*>(m_pNode->GetTextNode());
const SwTextNode& rSrcNd = *rLine.GetNode().GetTextNode();
SwDoc& rDstDoc = rDstNd.GetDoc();
int nLcsLen = 0;
int nDstLen = rDstNd.GetText().getLength();
int nSrcLen = rSrcNd.GetText().getLength();
int nMinLen = std::min( nDstLen , nSrcLen );
int nAvgLen = ( nDstLen + nSrcLen )/2;
std::vector<int> aLcsDst( nMinLen + 1 );
std::vector<int> aLcsSrc( nMinLen + 1 );
if( CmpOptions.eCmpMode == SwCompareMode::ByWord )
{
std::vector<int> aTmpLcsDst( nMinLen + 1 );
std::vector<int> aTmpLcsSrc( nMinLen + 1 );
WordArrayComparator aCmp( &rDstNd, &rSrcNd );
LgstCommonSubseq aSeq( aCmp );
nLcsLen = aSeq.Find( aTmpLcsDst.data(), aTmpLcsSrc.data() );
if( CmpOptions.nIgnoreLen )
{
nLcsLen = CommonSubseq::IgnoreIsolatedPieces( aTmpLcsDst.data(), aTmpLcsSrc.data(),
aCmp.GetLen1(), aCmp.GetLen2(),
nLcsLen, CmpOptions.nIgnoreLen );
}
nLcsLen = aCmp.GetCharSequence( aTmpLcsDst.data(), aTmpLcsSrc.data(),
aLcsDst.data(), aLcsSrc.data(), nLcsLen );
}
else
{
CharArrayComparator aCmp( &rDstNd, &rSrcNd );
LgstCommonSubseq aSeq( aCmp );
nLcsLen = aSeq.Find( aLcsDst.data(), aLcsSrc.data() );
if( CmpOptions.nIgnoreLen )
{
nLcsLen = CommonSubseq::IgnoreIsolatedPieces( aLcsDst.data(), aLcsSrc.data(), nDstLen,
nSrcLen, nLcsLen,
CmpOptions.nIgnoreLen );
}
}
// find the sum of the squares of the continuous substrings
int nSqSum = 0;
int nCnt = 1;
for( int i = 0; i < nLcsLen; i++ )
{
if( i != nLcsLen - 1 && aLcsDst[i] + 1 == aLcsDst[i + 1]
&& aLcsSrc[i] + 1 == aLcsSrc[i + 1] )
{
nCnt++;
}
else
{
nSqSum += nCnt*nCnt;
nCnt = 1;
}
}
// Don't compare if there aren't enough similarities
if ( nAvgLen >= 8 && nSqSum*32 < nAvgLen*nAvgLen )
{
return false;
}
// Show the differences
int nSkip = 0;
for( int i = 0; i <= nLcsLen; i++ )
{
int nDstFrom = i ? (aLcsDst[i - 1] + 1) : 0;
int nDstTo = ( i == nLcsLen ) ? nDstLen : aLcsDst[i];
int nSrcFrom = i ? (aLcsSrc[i - 1] + 1) : 0;
int nSrcTo = ( i == nLcsLen ) ? nSrcLen : aLcsSrc[i];
SwPaM aPam( rDstNd, nDstTo + nSkip );
if ( nDstFrom < nDstTo )
{
SwPaM* pTmp = new SwPaM( *aPam.GetPoint(), rpInsRing.get() );
if( !rpInsRing )
rpInsRing.reset(pTmp);
pTmp->SetMark();
pTmp->GetMark()->SetContent(nDstFrom + nSkip);
}
if ( nSrcFrom < nSrcTo )
{
bool bUndo = rDstDoc.GetIDocumentUndoRedo().DoesUndo();
rDstDoc.GetIDocumentUndoRedo().DoUndo( false );
SwPaM aCpyPam( rSrcNd, nSrcFrom );
aCpyPam.SetMark();
aCpyPam.GetPoint()->SetContent(nSrcTo);
aCpyPam.GetDoc().getIDocumentContentOperations().CopyRange( aCpyPam, *aPam.GetPoint(),
SwCopyFlags::CheckPosInFly);
rDstDoc.GetIDocumentUndoRedo().DoUndo( bUndo );
SwPaM* pTmp = new SwPaM( *aPam.GetPoint(), rpDelRing.get() );
if( !rpDelRing )
rpDelRing.reset(pTmp);
pTmp->SetMark();
pTmp->GetMark()->SetContent(nDstTo + nSkip);
nSkip += nSrcTo - nSrcFrom;
if( rpInsRing )
{
SwPaM* pCorr = rpInsRing->GetPrev();
if( *pCorr->GetPoint() == *pTmp->GetPoint() )
*pCorr->GetPoint() = *pTmp->GetMark();
}
}
}
bRet = true;
}
return bRet;
}
SwNodeOffset CompareData::NextIdx( const SwNode* pNd )
{
if( pNd->IsStartNode() )
{
if( pNd->IsTableNode() )
pNd = pNd->EndOfSectionNode();
else
{
const SwSectionNode* pSNd = pNd->GetSectionNode();
if( pSNd &&
( SectionType::Content != pSNd->GetSection().GetType() ||
pSNd->GetSection().IsProtect() ) )
pNd = pNd->EndOfSectionNode();
}
}
return pNd->GetIndex() + 1;
}
SwNodeOffset CompareData::PrevIdx( const SwNode* pNd )
{
if( pNd->IsEndNode() )
{
if( pNd->StartOfSectionNode()->IsTableNode() )
pNd = pNd->StartOfSectionNode();
else
{
const SwSectionNode* pSNd = pNd->StartOfSectionNode()->GetSectionNode();
if( pSNd &&
( SectionType::Content != pSNd->GetSection().GetType() ||
pSNd->GetSection().IsProtect() ) )
pNd = pNd->StartOfSectionNode();
}
}
return pNd->GetIndex() - 1;
}
void CompareData::CheckRanges( CompareData& rData )
{
const SwNodes& rSrcNds = rData.m_rDoc.GetNodes();
const SwNodes& rDstNds = m_rDoc.GetNodes();
const SwNode& rSrcEndNd = rData.GetEndOfContent();
const SwNode& rDstEndNd = GetEndOfContent();
SwNodeOffset nSrcSttIdx = NextIdx( rSrcEndNd.StartOfSectionNode() );
SwNodeOffset nSrcEndIdx = rSrcEndNd.GetIndex();
SwNodeOffset nDstSttIdx = NextIdx( rDstEndNd.StartOfSectionNode() );
SwNodeOffset nDstEndIdx = rDstEndNd.GetIndex();
while( nSrcSttIdx < nSrcEndIdx && nDstSttIdx < nDstEndIdx )
{
const SwNode* pSrcNd = rSrcNds[ nSrcSttIdx ];
const SwNode* pDstNd = rDstNds[ nDstSttIdx ];
if( !SwCompareLine::CompareNode( *pSrcNd, *pDstNd ))
break;
nSrcSttIdx = NextIdx( pSrcNd );
nDstSttIdx = NextIdx( pDstNd );
}
nSrcEndIdx = PrevIdx( &rSrcEndNd );
nDstEndIdx = PrevIdx( &rDstEndNd );
while( nSrcSttIdx < nSrcEndIdx && nDstSttIdx < nDstEndIdx )
{
const SwNode* pSrcNd = rSrcNds[ nSrcEndIdx ];
const SwNode* pDstNd = rDstNds[ nDstEndIdx ];
if( !SwCompareLine::CompareNode( *pSrcNd, *pDstNd ))
break;
nSrcEndIdx = PrevIdx( pSrcNd );
nDstEndIdx = PrevIdx( pDstNd );
}
while( nSrcSttIdx <= nSrcEndIdx )
{
const SwNode* pNd = rSrcNds[ nSrcSttIdx ];
rData.InsertLine( SwCompareLine( *pNd ) );
nSrcSttIdx = NextIdx( pNd );
}
while( nDstSttIdx <= nDstEndIdx )
{
const SwNode* pNd = rDstNds[ nDstSttIdx ];
InsertLine( SwCompareLine( *pNd ) );
nDstSttIdx = NextIdx( pNd );
}
}
void CompareData::ShowInsert( sal_uLong nStt, sal_uLong nEnd )
{
SwPaM* pTmp = new SwPaM( GetLine( nStt ).GetNode(), 0,
GetLine( nEnd-1 ).GetEndNode(), 0,
m_pInsertRing.get() );
if( !m_pInsertRing )
m_pInsertRing.reset( pTmp );
// #i65201#: These SwPaMs are calculated smaller than needed, see comment below
}
void CompareData::ShowDelete(
const CompareData& rData,
sal_uLong nStt,
sal_uLong nEnd,
sal_uLong nInsPos )
{
SwNodeRange aRg(
rData.GetLine( nStt ).GetNode(), SwNodeOffset(0),
rData.GetLine( nEnd-1 ).GetEndNode(), SwNodeOffset(1) );
SwNodeOffset nOffset(0);
std::optional<SwCompareLine> xLine;
if( nInsPos >= 1 )
{
if( GetLineCount() == nInsPos )
{
xLine = GetLine( nInsPos-1 );
nOffset = SwNodeOffset(1);
}
else
xLine = GetLine( nInsPos );
}
const SwNode* pLineNd;
if( xLine )
{
if( nOffset )
pLineNd = &xLine->GetEndNode();
else
pLineNd = &xLine->GetNode();
}
else
{
pLineNd = &GetEndOfContent();
nOffset = SwNodeOffset(0);
}
SwNodeIndex aInsPos( *pLineNd, nOffset );
SwNodeIndex aSavePos( aInsPos, -1 );
rData.m_rDoc.GetDocumentContentOperationsManager().CopyWithFlyInFly(aRg, aInsPos.GetNode());
m_rDoc.getIDocumentState().SetModified();
++aSavePos;
// #i65201#: These SwPaMs are calculated when the (old) delete-redlines are hidden,
// they will be inserted when the delete-redlines are shown again.
// To avoid unwanted insertions of delete-redlines into these new redlines, what happens
// especially at the end of the document, I reduce the SwPaM by one node.
// Before the new redlines are inserted, they have to expand again.
SwPaM* pTmp = new SwPaM( aSavePos.GetNode(), aInsPos.GetNode(), SwNodeOffset(0), SwNodeOffset(-1), m_pDelRing.get() );
if( !m_pDelRing )
m_pDelRing.reset(pTmp);
if( m_pInsertRing )
{
SwPaM* pCorr = m_pInsertRing->GetPrev();
if( *pCorr->GetPoint() == *pTmp->GetPoint() )
{
SwNodeIndex aTmpPos( pTmp->GetMark()->GetNode(), -1 );
pCorr->GetPoint()->Assign( aTmpPos );
}
}
}
void CompareData::CheckForChangesInLine( const CompareData& rData,
sal_uLong nStt, sal_uLong nEnd,
sal_uLong nThisStt, sal_uLong nThisEnd )
{
LineArrayComparator aCmp( *this, rData, nThisStt, nThisEnd,
nStt, nEnd );
int nMinLen = std::min( aCmp.GetLen1(), aCmp.GetLen2() );
std::unique_ptr<int[]> pLcsDst(new int[ nMinLen ]);
std::unique_ptr<int[]> pLcsSrc(new int[ nMinLen ]);
FastCommonSubseq subseq( aCmp );
int nLcsLen = subseq.Find( pLcsDst.get(), pLcsSrc.get() );
for (int i = 0; i <= nLcsLen; i++)
{
// Beginning of inserted lines (inclusive)
int nDstFrom = i ? pLcsDst[i - 1] + 1 : 0;
// End of inserted lines (exclusive)
int nDstTo = ( i == nLcsLen ) ? aCmp.GetLen1() : pLcsDst[i];
// Beginning of deleted lines (inclusive)
int nSrcFrom = i ? pLcsSrc[i - 1] + 1 : 0;
// End of deleted lines (exclusive)
int nSrcTo = ( i == nLcsLen ) ? aCmp.GetLen2() : pLcsSrc[i];
if( i )
{
const SwCompareLine aDstLn = GetLine( nThisStt + nDstFrom - 1 );
const SwCompareLine aSrcLn = rData.GetLine( nStt + nSrcFrom - 1 );
// Show differences in detail for lines that
// were matched as only slightly different
if( !aDstLn.ChangesInLine( aSrcLn, m_pInsertRing, m_pDelRing ) )
{
ShowInsert( nThisStt + nDstFrom - 1, nThisStt + nDstFrom );
ShowDelete( rData, nStt + nSrcFrom - 1, nStt + nSrcFrom,
nThisStt + nDstFrom );
}
}
// Lines missing from source are inserted
if( nDstFrom != nDstTo )
{
ShowInsert( nThisStt + nDstFrom, nThisStt + nDstTo );
}
// Lines missing from destination are deleted
if( nSrcFrom != nSrcTo )
{
ShowDelete( rData, nStt + nSrcFrom, nStt + nSrcTo, nThisStt + nDstTo );
}
}
}
void CompareData::SetRedlinesToDoc( bool bUseDocInfo )
{
SwPaM* pTmp = m_pDelRing.get();
// get the Author / TimeStamp from the "other" document info
std::size_t nAuthor = m_rDoc.getIDocumentRedlineAccess().GetRedlineAuthor();
DateTime aTimeStamp( DateTime::SYSTEM );
SwDocShell *pDocShell(m_rDoc.GetDocShell());
OSL_ENSURE(pDocShell, "no SwDocShell");
if (pDocShell) {
uno::Reference<document::XDocumentPropertiesSupplier> xDPS(
pDocShell->GetModel(), uno::UNO_QUERY_THROW);
uno::Reference<document::XDocumentProperties> xDocProps(
xDPS->getDocumentProperties());
OSL_ENSURE(xDocProps.is(), "Doc has no DocumentProperties");
if( bUseDocInfo && xDocProps.is() ) {
OUString aTmp( 1 == xDocProps->getEditingCycles()
? xDocProps->getAuthor()
: xDocProps->getModifiedBy() );
util::DateTime uDT( 1 == xDocProps->getEditingCycles()
? xDocProps->getCreationDate()
: xDocProps->getModificationDate() );
if( !aTmp.isEmpty() )
{
nAuthor = m_rDoc.getIDocumentRedlineAccess().InsertRedlineAuthor( aTmp );
aTimeStamp = DateTime(uDT);
}
}
}
if( pTmp )
{
SwRedlineData aRedlnData( RedlineType::Delete, nAuthor, aTimeStamp, 0,
OUString(), nullptr );
do {
// #i65201#: Expand again, see comment above.
if( pTmp->GetPoint()->GetContentIndex() == 0 )
{
pTmp->GetPoint()->Adjust(SwNodeOffset(1));
}
// #i101009#
// prevent redlines that end on structural end node
if (& GetEndOfContent() ==
& pTmp->GetPoint()->GetNode())
{
pTmp->GetPoint()->Adjust(SwNodeOffset(-1));
SwContentNode *const pContentNode( pTmp->GetPointContentNode() );
if( pContentNode )
pTmp->GetPoint()->SetContent( pContentNode->Len() );
// tdf#106218 try to avoid losing a paragraph break here:
if (pTmp->GetMark()->GetContentIndex() == 0)
{
SwNodeIndex const prev(pTmp->GetMark()->GetNode(), -1);
if (prev.GetNode().IsTextNode())
{
pTmp->GetMark()->Assign(
*prev.GetNode().GetTextNode(),
prev.GetNode().GetTextNode()->Len());
}
}
}
m_rDoc.getIDocumentRedlineAccess().DeleteRedline( *pTmp, false, RedlineType::Any );
if (m_rDoc.GetIDocumentUndoRedo().DoesUndo())
{
m_rDoc.GetIDocumentUndoRedo().AppendUndo(
std::make_unique<SwUndoCompDoc>( *pTmp, false ));
}
m_rDoc.getIDocumentRedlineAccess().AppendRedline( new SwRangeRedline( aRedlnData, *pTmp ), true );
} while( m_pDelRing.get() != ( pTmp = pTmp->GetNext()) );
}
pTmp = m_pInsertRing.get();
if( !pTmp )
return;
do {
if( pTmp->GetPoint()->GetContentIndex() == 0 )
{
pTmp->GetPoint()->Adjust(SwNodeOffset(1));
}
// #i101009#
// prevent redlines that end on structural end node
if (& GetEndOfContent() ==
& pTmp->GetPoint()->GetNode())
{
pTmp->GetPoint()->Adjust(SwNodeOffset(-1));
SwContentNode *const pContentNode( pTmp->GetPointContentNode() );
if( pContentNode )
pTmp->GetPoint()->SetContent( pContentNode->Len() );
// tdf#106218 try to avoid losing a paragraph break here:
if (pTmp->GetMark()->GetContentIndex() == 0)
{
SwNodeIndex const prev(pTmp->GetMark()->GetNode(), -1);
if (prev.GetNode().IsTextNode())
{
pTmp->GetMark()->Assign(
*prev.GetNode().GetTextNode(),
prev.GetNode().GetTextNode()->Len());
}
}
}
} while( m_pInsertRing.get() != ( pTmp = pTmp->GetNext()) );
SwRedlineData aRedlnData( RedlineType::Insert, nAuthor, aTimeStamp, 0,
OUString(), nullptr );
// combine consecutive
if( pTmp->GetNext() != m_pInsertRing.get() )
{
do {
// coverity[deref_arg] - the SwPaM delete moves a new entry into GetNext()
SwPosition& rSttEnd = *pTmp->End(),
& rEndStt = *pTmp->GetNext()->Start();
const SwContentNode* pCNd;
if( rSttEnd == rEndStt ||
(!rEndStt.GetContentIndex() &&
rEndStt.GetNodeIndex() - 1 == rSttEnd.GetNodeIndex() &&
nullptr != ( pCNd = rSttEnd.GetNode().GetContentNode() ) &&
rSttEnd.GetContentIndex() == pCNd->Len()))
{
if( pTmp->GetNext() == m_pInsertRing.get() )
{
// are consecutive, so combine
rEndStt = *pTmp->Start();
delete pTmp;
pTmp = m_pInsertRing.get();
}
else
{
// are consecutive, so combine
rSttEnd = *pTmp->GetNext()->End();
delete pTmp->GetNext();
}
}
else
pTmp = pTmp->GetNext();
} while( m_pInsertRing.get() != pTmp );
}
do {
// coverity[deref_arg] - pTmp is valid here
if (IDocumentRedlineAccess::AppendResult::APPENDED ==
m_rDoc.getIDocumentRedlineAccess().AppendRedline(
new SwRangeRedline(aRedlnData, *pTmp), true) &&
m_rDoc.GetIDocumentUndoRedo().DoesUndo())
{
m_rDoc.GetIDocumentUndoRedo().AppendUndo(
std::make_unique<SwUndoCompDoc>( *pTmp, true ));
}
} while( m_pInsertRing.get() != ( pTmp = pTmp->GetNext()) );
}
typedef std::shared_ptr<CompareData> CompareDataPtr;
typedef std::pair<CompareDataPtr, CompareDataPtr> CompareDataPtrPair;
typedef std::vector<CompareDataPtrPair> Comparators;
namespace
{
Comparators buildComparators(SwDoc &rSrcDoc, SwDoc &rDestDoc)
{
Comparators aComparisons;
//compare main text
aComparisons.emplace_back(std::make_shared<CompareMainText>(rSrcDoc, true),
std::make_shared<CompareMainText>(rDestDoc, true));
//if we have the same number of frames then try to compare within them
const sw::SpzFrameFormats* pSrcFrameFormats = rSrcDoc.GetSpzFrameFormats();
const sw::SpzFrameFormats* pDestFrameFormats = rDestDoc.GetSpzFrameFormats();
if (pSrcFrameFormats->size() == pDestFrameFormats->size())
{
for(sw::FrameFormats<sw::SpzFrameFormat*>::size_type i = 0; i < pSrcFrameFormats->size(); ++i)
{
const sw::SpzFrameFormat& rSrcFormat = *(*pSrcFrameFormats)[i];
const sw::SpzFrameFormat& rDestFormat = *(*pDestFrameFormats)[i];
const SwNodeIndex* pSrcIdx = rSrcFormat.GetContent().GetContentIdx();
const SwNodeIndex* pDestIdx = rDestFormat.GetContent().GetContentIdx();
if (!pSrcIdx && !pDestIdx)
continue;
if (!pSrcIdx || !pDestIdx)
break;
const SwNode* pSrcNode = pSrcIdx->GetNode().EndOfSectionNode();
const SwNode* pDestNode = pDestIdx->GetNode().EndOfSectionNode();
if (!pSrcNode && !pDestNode)
continue;
if (!pSrcNode || !pDestNode)
break;
if (pSrcIdx->GetNodes()[pSrcIdx->GetIndex() + 1]->IsNoTextNode()
|| pDestIdx->GetNodes()[pDestIdx->GetIndex() + 1]->IsNoTextNode())
{
continue; // tdf#125660 don't redline GrfNode/OLENode
}
aComparisons.emplace_back(std::make_shared<CompareFrameFormatText>(rSrcDoc, *pSrcIdx),
std::make_shared<CompareFrameFormatText>(rDestDoc, *pDestIdx));
}
}
return aComparisons;
}
}
// Returns (the difference count?) if something is different
tools::Long SwDoc::CompareDoc( const SwDoc& rDoc )
{
if( &rDoc == this )
return 0;
tools::Long nRet = 0;
// Get comparison options
CmpOptions.eCmpMode = SW_MOD()->GetCompareMode();
if( CmpOptions.eCmpMode == SwCompareMode::Auto )
{
if( getRsidRoot() == rDoc.getRsidRoot() )
{
CmpOptions.eCmpMode = SwCompareMode::ByChar;
CmpOptions.bUseRsid = true;
CmpOptions.nIgnoreLen = 2;
}
else
{
CmpOptions.eCmpMode = SwCompareMode::ByWord;
CmpOptions.bUseRsid = false;
CmpOptions.nIgnoreLen = 3;
}
}
else
{
CmpOptions.bUseRsid = getRsidRoot() == rDoc.getRsidRoot() && SW_MOD()->IsUseRsid();
CmpOptions.nIgnoreLen = SW_MOD()->IsIgnorePieces() ? SW_MOD()->GetPieceLen() : 0;
}
GetIDocumentUndoRedo().StartUndo(SwUndoId::EMPTY, nullptr);
bool bDocWasModified = getIDocumentState().IsModified();
SwDoc& rSrcDoc = const_cast<SwDoc&>(rDoc);
bool bSrcModified = rSrcDoc.getIDocumentState().IsModified();
RedlineFlags eSrcRedlMode = rSrcDoc.getIDocumentRedlineAccess().GetRedlineFlags();
rSrcDoc.getIDocumentRedlineAccess().SetRedlineFlags( RedlineFlags::ShowInsert );
getIDocumentRedlineAccess().SetRedlineFlags(RedlineFlags::On | RedlineFlags::ShowInsert);
Comparators aComparisons(buildComparators(rSrcDoc, *this));
for (auto& a : aComparisons)
{
CompareData& rD0 = *a.first;
CompareData& rD1 = *a.second;
rD1.CompareLines( rD0 );
nRet |= rD1.ShowDiffs( rD0 );
}
if( nRet )
{
getIDocumentRedlineAccess().SetRedlineFlags(RedlineFlags::On |
RedlineFlags::ShowInsert | RedlineFlags::ShowDelete);
for (auto& a : aComparisons)
{
CompareData& rD1 = *a.second;
rD1.SetRedlinesToDoc( !bDocWasModified );
}
getIDocumentState().SetModified();
}
rSrcDoc.getIDocumentRedlineAccess().SetRedlineFlags( eSrcRedlMode );
getIDocumentRedlineAccess().SetRedlineFlags(RedlineFlags::ShowInsert | RedlineFlags::ShowDelete);
if( !bSrcModified )
rSrcDoc.getIDocumentState().ResetModified();
GetIDocumentUndoRedo().EndUndo(SwUndoId::EMPTY, nullptr);
return nRet;
}
namespace
{
struct SaveMergeRedline
{
const SwRangeRedline* pSrcRedl;
SwRangeRedline* pDestRedl;
SaveMergeRedline( const SwNode& rDstNd, const SwRangeRedline& rSrcRedl);
sal_uInt16 InsertRedline(SwPaM* pLastDestRedline);
};
}
SaveMergeRedline::SaveMergeRedline( const SwNode& rDstNd,
const SwRangeRedline& rSrcRedl)
: pSrcRedl( &rSrcRedl )
{
SwPosition aPos( rDstNd );
const SwPosition* pStt = rSrcRedl.Start();
if( rDstNd.IsContentNode() )
aPos.SetContent( pStt->GetContentIndex() );
pDestRedl = new SwRangeRedline( rSrcRedl.GetRedlineData(), aPos );
if( RedlineType::Delete != pDestRedl->GetType() )
return;
// mark the area as deleted
const SwPosition* pEnd = rSrcRedl.End();
pDestRedl->SetMark();
pDestRedl->GetPoint()->Adjust( pEnd->GetNodeIndex() -
pStt->GetNodeIndex() );
if( pDestRedl->GetPointContentNode() )
pDestRedl->GetPoint()->SetContent( pEnd->GetContentIndex() );
}
sal_uInt16 SaveMergeRedline::InsertRedline(SwPaM* pLastDestRedline)
{
sal_uInt16 nIns = 0;
SwDoc& rDoc = pDestRedl->GetDoc();
if( RedlineType::Insert == pDestRedl->GetType() )
{
// the part was inserted so copy it from the SourceDoc
::sw::UndoGuard const undoGuard(rDoc.GetIDocumentUndoRedo());
SwNodeIndex aSaveNd( pDestRedl->GetPoint()->GetNode(), -1 );
const sal_Int32 nSaveCnt = pDestRedl->GetPoint()->GetContentIndex();
RedlineFlags eOld = rDoc.getIDocumentRedlineAccess().GetRedlineFlags();
rDoc.getIDocumentRedlineAccess().SetRedlineFlags_intern(eOld | RedlineFlags::Ignore);
pSrcRedl->GetDoc().getIDocumentContentOperations().CopyRange(
*const_cast<SwPaM*>(static_cast<const SwPaM*>(pSrcRedl)),
*pDestRedl->GetPoint(), SwCopyFlags::CheckPosInFly);
rDoc.getIDocumentRedlineAccess().SetRedlineFlags_intern( eOld );
pDestRedl->SetMark();
++aSaveNd;
pDestRedl->GetMark()->Assign( aSaveNd, nSaveCnt );
if( pLastDestRedline && *pLastDestRedline->GetPoint() == *pDestRedl->GetPoint() )
*pLastDestRedline->GetPoint() = *pDestRedl->GetMark();
}
else
{
//JP 21.09.98: Bug 55909
// If there already is a deleted or inserted one at the same position, we have to split it!
SwPosition* pDStt = pDestRedl->GetMark(),
* pDEnd = pDestRedl->GetPoint();
SwRedlineTable::size_type n = 0;
// find the first redline for StartPos
if (!rDoc.getIDocumentRedlineAccess().GetRedline( *pDStt, &n ) && n > 0)
--n;
const SwRedlineTable& rRedlineTable = rDoc.getIDocumentRedlineAccess().GetRedlineTable();
for( ; n < rRedlineTable.size(); ++n )
{
SwRangeRedline* pRedl = rRedlineTable[ n ];
SwPosition* pRStt = pRedl->Start(),
* pREnd = pRedl->End();
if( RedlineType::Delete == pRedl->GetType() ||
RedlineType::Insert == pRedl->GetType() )
{
SwComparePosition eCmpPos = ComparePosition( *pDStt, *pDEnd, *pRStt, *pREnd );
switch( eCmpPos )
{
case SwComparePosition::CollideStart:
case SwComparePosition::Behind:
break;
case SwComparePosition::Inside:
case SwComparePosition::Equal:
delete pDestRedl;
pDestRedl = nullptr;
[[fallthrough]];
case SwComparePosition::CollideEnd:
case SwComparePosition::Before:
n = rRedlineTable.size();
break;
case SwComparePosition::Outside:
assert(pDestRedl && "is this actually impossible");
if (pDestRedl)
{
SwRangeRedline* pCpyRedl = new SwRangeRedline(
pDestRedl->GetRedlineData(), *pDStt );
pCpyRedl->SetMark();
*pCpyRedl->GetPoint() = *pRStt;
std::unique_ptr<SwUndoCompDoc> pUndo;
if (rDoc.GetIDocumentUndoRedo().DoesUndo())
pUndo.reset(new SwUndoCompDoc( *pCpyRedl ));
// now modify doc: append redline, undo (and count)
rDoc.getIDocumentRedlineAccess().AppendRedline( pCpyRedl, true );
if( pUndo )
{
rDoc.GetIDocumentUndoRedo().AppendUndo(std::move(pUndo));
}
++nIns;
*pDStt = *pREnd;
// we should start over now
n = SwRedlineTable::npos;
}
break;
case SwComparePosition::OverlapBefore:
*pDEnd = *pRStt;
break;
case SwComparePosition::OverlapBehind:
*pDStt = *pREnd;
break;
}
}
else if( *pDEnd <= *pRStt )
break;
}
}
if( pDestRedl )
{
std::unique_ptr<SwUndoCompDoc> pUndo;
if (rDoc.GetIDocumentUndoRedo().DoesUndo())
pUndo.reset(new SwUndoCompDoc( *pDestRedl ));
// now modify doc: append redline, undo (and count)
IDocumentRedlineAccess::AppendResult const result(
rDoc.getIDocumentRedlineAccess().AppendRedline(pDestRedl, true));
if( pUndo )
{
rDoc.GetIDocumentUndoRedo().AppendUndo( std::move(pUndo) );
}
++nIns;
// if AppendRedline has deleted our redline, we may not keep a
// reference to it
if (IDocumentRedlineAccess::AppendResult::APPENDED != result)
pDestRedl = nullptr;
}
return nIns;
}
/// Merge two documents
tools::Long SwDoc::MergeDoc( const SwDoc& rDoc )
{
if( &rDoc == this )
return 0;
tools::Long nRet = 0;
GetIDocumentUndoRedo().StartUndo(SwUndoId::EMPTY, nullptr);
SwDoc& rSrcDoc = const_cast<SwDoc&>(rDoc);
bool bSrcModified = rSrcDoc.getIDocumentState().IsModified();
RedlineFlags eSrcRedlMode = rSrcDoc.getIDocumentRedlineAccess().GetRedlineFlags();
rSrcDoc.getIDocumentRedlineAccess().SetRedlineFlags( RedlineFlags::ShowDelete );
getIDocumentRedlineAccess().SetRedlineFlags( RedlineFlags::ShowDelete );
CompareMainText aD0(rSrcDoc, false);
CompareMainText aD1(*this, false);
aD1.CompareLines( aD0 );
if( !aD1.HasDiffs( aD0 ) )
{
// we want to get all redlines from the SourceDoc
// look for all insert redlines from the SourceDoc and determine their position in the DestDoc
std::vector<SaveMergeRedline> vRedlines;
const SwRedlineTable& rSrcRedlTable = rSrcDoc.getIDocumentRedlineAccess().GetRedlineTable();
SwNodeOffset nEndOfExtra = rSrcDoc.GetNodes().GetEndOfExtras().GetIndex();
SwNodeOffset nMyEndOfExtra = GetNodes().GetEndOfExtras().GetIndex();
for(const SwRangeRedline* pRedl : rSrcRedlTable)
{
SwNodeOffset nNd = pRedl->GetPoint()->GetNodeIndex();
RedlineType eType = pRedl->GetType();
if( nEndOfExtra < nNd &&
( RedlineType::Insert == eType || RedlineType::Delete == eType ))
{
const SwNode* pDstNd = GetNodes()[
nMyEndOfExtra + nNd - nEndOfExtra ];
// Found the position.
// Then we also have to insert the redline to the line in the DestDoc.
vRedlines.emplace_back(*pDstNd, *pRedl);
}
}
if( !vRedlines.empty() )
{
// Carry over all into DestDoc
rSrcDoc.getIDocumentRedlineAccess().SetRedlineFlags(RedlineFlags::ShowInsert | RedlineFlags::ShowDelete);
getIDocumentRedlineAccess().SetRedlineFlags(
RedlineFlags::On |
RedlineFlags::ShowInsert |
RedlineFlags::ShowDelete);
SwPaM* pLastDestRedline(nullptr);
for(SaveMergeRedline& rRedline: vRedlines)
{
nRet += rRedline.InsertRedline(pLastDestRedline);
pLastDestRedline = rRedline.pDestRedl;
}
}
}
rSrcDoc.getIDocumentRedlineAccess().SetRedlineFlags( eSrcRedlMode );
if( !bSrcModified )
rSrcDoc.getIDocumentState().ResetModified();
getIDocumentRedlineAccess().SetRedlineFlags(RedlineFlags::ShowInsert | RedlineFlags::ShowDelete);
GetIDocumentUndoRedo().EndUndo(SwUndoId::EMPTY, nullptr);
return nRet;
}
LineArrayComparator::LineArrayComparator( const CompareData &rD1,
const CompareData &rD2, int nStt1,
int nEnd1, int nStt2, int nEnd2 )
: m_rData1( rD1 ), m_rData2( rD2 ), m_nFirst1( nStt1 ), m_nFirst2( nStt2 )
{
m_nLen1 = nEnd1 - nStt1;
m_nLen2 = nEnd2 - nStt2;
}
bool LineArrayComparator::Compare( int nIdx1, int nIdx2 ) const
{
if( nIdx1 < 0 || nIdx2 < 0 || nIdx1 >= m_nLen1 || nIdx2 >= m_nLen2 )
{
OSL_ENSURE( false, "Index out of range!" );
return false;
}
const SwTextNode *pTextNd1 = m_rData1.GetLine( m_nFirst1 + nIdx1 ).GetNode().GetTextNode();
const SwTextNode *pTextNd2 = m_rData2.GetLine( m_nFirst2 + nIdx2 ).GetNode().GetTextNode();
if( !pTextNd1 || !pTextNd2
|| ( CmpOptions.bUseRsid && !pTextNd1->CompareParRsid( *pTextNd2 ) ) )
{
return false;
}
const sal_Int32 nPar1Len = pTextNd1->Len();
const sal_Int32 nPar2Len = pTextNd2->Len();
if( std::min( nPar1Len, nPar2Len ) * 3 < std::max( nPar1Len, nPar2Len ) )
{
return false;
}
sal_Int32 nBorderLen = ( nPar1Len + nPar2Len )/16;
if( nBorderLen < 3 )
{
nBorderLen = std::min<sal_Int32>( 3, std::min( nPar1Len, nPar2Len ) );
}
std::set<unsigned> aHashes;
unsigned nHash = 0;
unsigned nMul = 251;
unsigned nPow = 1;
sal_Int32 i;
for( i = 0; i < nBorderLen - 1; i++ )
{
nPow *= nMul;
}
for( i = 0; i < nBorderLen; i++ )
{
nHash = nHash*nMul + pTextNd1->GetText()[i];
}
aHashes.insert( nHash );
for( ; i < nPar1Len; i++ )
{
nHash = nHash - nPow*pTextNd1->GetText()[ i - nBorderLen ];
nHash = nHash*nMul + pTextNd1->GetText()[ i ];
aHashes.insert( nHash );
}
nHash = 0;
for( i = 0; i < nBorderLen; i++ )
{
nHash = nHash*nMul + pTextNd2->GetText()[ i ];
}
if( aHashes.find( nHash ) != aHashes.end() )
{
return true;
}
for( ; i < nPar2Len; i++ )
{
nHash = nHash - nPow*pTextNd2->GetText()[ i - nBorderLen ];
nHash = nHash*nMul + pTextNd2->GetText()[ i ];
if( aHashes.find( nHash ) != aHashes.end() )
{
return true;
}
}
return false;
}
bool CharArrayComparator::Compare( int nIdx1, int nIdx2 ) const
{
if( nIdx1 < 0 || nIdx2 < 0 || nIdx1 >= GetLen1() || nIdx2 >= GetLen2() )
{
OSL_ENSURE( false, "Index out of range!" );
return false;
}
return ( !CmpOptions.bUseRsid
|| m_pTextNode1->CompareRsid( *m_pTextNode2, nIdx1 + 1, nIdx2 + 1 ) )
&& m_pTextNode1->GetText()[ nIdx1 ] == m_pTextNode2->GetText()[ nIdx2 ];
}
WordArrayComparator::WordArrayComparator( const SwTextNode *pNode1,
const SwTextNode *pNode2 )
: m_pTextNode1( pNode1 ), m_pTextNode2( pNode2 )
{
m_pPos1.reset( new int[ m_pTextNode1->GetText().getLength() + 1 ] );
m_pPos2.reset( new int[ m_pTextNode2->GetText().getLength() + 1 ] );
CalcPositions( m_pPos1.get(), m_pTextNode1, m_nCount1 );
CalcPositions( m_pPos2.get(), m_pTextNode2, m_nCount2 );
}
bool WordArrayComparator::Compare( int nIdx1, int nIdx2 ) const
{
int nLen = m_pPos1[ nIdx1 + 1 ] - m_pPos1[ nIdx1 ];
if( nLen != m_pPos2[ nIdx2 + 1 ] - m_pPos2[ nIdx2 ] )
{
return false;
}
for( int i = 0; i < nLen; i++)
{
if( m_pTextNode1->GetText()[ m_pPos1[ nIdx1 ] + i ]
!= m_pTextNode2->GetText()[ m_pPos2[ nIdx2 ] + i ]
|| ( CmpOptions.bUseRsid && !m_pTextNode1->CompareRsid( *m_pTextNode2,
m_pPos1[ nIdx1 ] + i, m_pPos2[ nIdx2 ] + i ) ) )
{
return false;
}
}
return true;
}
int WordArrayComparator::GetCharSequence( const int *pWordLcs1,
const int *pWordLcs2, int *pSubseq1, int *pSubseq2, int nLcsLen )
{
int nLen = 0;
for( int i = 0; i < nLcsLen; i++ )
{
// Check for hash collisions
if( m_pPos1[ pWordLcs1[i] + 1 ] - m_pPos1[ pWordLcs1[i] ]
!= m_pPos2[ pWordLcs2[i] + 1 ] - m_pPos2[ pWordLcs2[i] ] )
{
continue;
}
for( int j = 0; j < m_pPos1[pWordLcs1[i]+1] - m_pPos1[pWordLcs1[i]]; j++)
{
pSubseq1[ nLen ] = m_pPos1[ pWordLcs1[i] ] + j;
pSubseq2[ nLen ] = m_pPos2[ pWordLcs2[i] ] + j;
if( m_pTextNode1->GetText()[ m_pPos1[ pWordLcs1[i] ] + j ]
!= m_pTextNode2->GetText()[ m_pPos2[ pWordLcs2[i] ] + j ] )
{
nLen -= j;
break;
}
nLen++;
}
}
return nLen;
}
void WordArrayComparator::CalcPositions( int *pPos, const SwTextNode *pTextNd,
int &nCnt )
{
nCnt = -1;
for (int i = 0; i <= pTextNd->GetText().getLength(); ++i)
{
if (i == 0 || i == pTextNd->GetText().getLength()
|| !rtl::isAsciiAlphanumeric( pTextNd->GetText()[ i - 1 ])
|| !rtl::isAsciiAlphanumeric( pTextNd->GetText()[ i ]))
{ // Begin new word
nCnt++;
pPos[ nCnt ] = i;
}
}
}
int CommonSubseq::FindLCS( int *pLcs1, int *pLcs2, int nStt1, int nEnd1,
int nStt2, int nEnd2 )
{
int nLen1 = nEnd1 ? nEnd1 - nStt1 : m_rComparator.GetLen1();
int nLen2 = nEnd2 ? nEnd2 - nStt2 : m_rComparator.GetLen2();
assert( nLen1 >= 0 );
assert( nLen2 >= 0 );
std::unique_ptr<int*[]> pLcs( new int*[ nLen1 + 1 ] );
pLcs[ 0 ] = m_pData.get();
for( int i = 1; i < nLen1 + 1; i++ )
pLcs[ i ] = pLcs[ i - 1 ] + nLen2 + 1;
for( int i = 0; i <= nLen1; i++ )
pLcs[i][0] = 0;
for( int j = 0; j <= nLen2; j++ )
pLcs[0][j] = 0;
// Find lcs
for( int i = 1; i <= nLen1; i++ )
{
for( int j = 1; j <= nLen2; j++ )
{
if( m_rComparator.Compare( nStt1 + i - 1, nStt2 + j - 1 ) )
pLcs[i][j] = pLcs[i - 1][j - 1] + 1;
else
pLcs[i][j] = std::max( pLcs[i][j - 1], pLcs[i - 1][j] );
}
}
int nLcsLen = pLcs[ nLen1 ][ nLen2 ];
// Recover the lcs in the two sequences
if( pLcs1 && pLcs2 )
{
int nIdx1 = nLen1;
int nIdx2 = nLen2;
int nIdx = nLcsLen - 1;
while( nIdx1 > 0 && nIdx2 > 0 )
{
if( pLcs[ nIdx1 ][ nIdx2 ] == pLcs[ nIdx1 - 1 ][ nIdx2 ] )
nIdx1--;
else if( pLcs[ nIdx1 ][ nIdx2 ] == pLcs[ nIdx1 ][ nIdx2 - 1 ] )
nIdx2--;
else
{
nIdx1--;
nIdx2--;
pLcs1[ nIdx ] = nIdx1 + nStt1;
pLcs2[ nIdx ] = nIdx2 + nStt2;
nIdx--;
}
}
}
return nLcsLen;
}
int CommonSubseq::IgnoreIsolatedPieces( int *pLcs1, int *pLcs2, int nLen1,
int nLen2, int nLcsLen, int nPieceLen )
{
if( !nLcsLen )
{
return 0;
}
int nNext = 0;
// Don't ignore text at the beginning of the paragraphs
if( pLcs1[ 0 ] == 0 && pLcs2[ 0 ] == 0 )
{
while( nNext < nLcsLen - 1 && pLcs1[ nNext ] + 1 == pLcs1[ nNext + 1 ]
&& pLcs2[ nNext ] + 1 == pLcs2[ nNext + 1 ] )
{
nNext++;
}
nNext++;
}
int nCnt = 1;
for( int i = nNext; i < nLcsLen; i++ )
{
if( i != nLcsLen - 1 && pLcs1[ i ] + 1 == pLcs1[ i + 1 ]
&& pLcs2[ i ] + 1 == pLcs2[ i + 1 ] )
{
nCnt++;
}
else
{
if( nCnt > nPieceLen
// Don't ignore text at the end of the paragraphs
|| ( i == nLcsLen - 1
&& pLcs1[i] == nLen1 - 1 && pLcs2[i] == nLen2 - 1 ))
{
for( int j = i + 1 - nCnt; j <= i; j++ )
{
pLcs2[ nNext ] = pLcs2[ j ];
pLcs1[ nNext ] = pLcs1[ j ];
nNext++;
}
}
nCnt = 1;
}
}
return nNext;
}
LgstCommonSubseq::LgstCommonSubseq( ArrayComparator &rComparator )
: CommonSubseq( rComparator, CUTOFF )
{
m_pBuff1.reset( new int[ rComparator.GetLen2() + 1 ] );
m_pBuff2.reset( new int[ rComparator.GetLen2() + 1 ] );
m_pL1.reset( new int[ rComparator.GetLen2() + 1 ] );
m_pL2.reset( new int[ rComparator.GetLen2() + 1 ] );
}
void LgstCommonSubseq::FindL( int *pL, int nStt1, int nEnd1,
int nStt2, int nEnd2 )
{
int nLen1 = nEnd1 ? nEnd1 - nStt1 : m_rComparator.GetLen1();
int nLen2 = nEnd2 ? nEnd2 - nStt2 : m_rComparator.GetLen2();
int *currL = m_pBuff1.get();
int *prevL = m_pBuff2.get();
// Avoid memory corruption
if( nLen2 > m_rComparator.GetLen2() )
{
assert( false );
return;
}
memset( m_pBuff1.get(), 0, sizeof( m_pBuff1[0] ) * ( nLen2 + 1 ) );
memset( m_pBuff2.get(), 0, sizeof( m_pBuff2[0] ) * ( nLen2 + 1 ) );
// Find lcs
for( int i = 1; i <= nLen1; i++ )
{
for( int j = 1; j <= nLen2; j++ )
{
if( m_rComparator.Compare( nStt1 + i - 1, nStt2 + j - 1 ) )
currL[j] = prevL[j - 1] + 1;
else
currL[j] = std::max( currL[j - 1], prevL[j] );
}
std::swap( currL, prevL );
}
memcpy( pL, prevL, ( nLen2 + 1 ) * sizeof( *prevL ) );
}
int LgstCommonSubseq::HirschbergLCS( int *pLcs1, int *pLcs2, int nStt1,
int nEnd1, int nStt2, int nEnd2 )
{
static int nLen1;
static int nLen2;
nLen1 = nEnd1 - nStt1;
nLen2 = nEnd2 - nStt2;
if( ( nLen1 + 1 ) * ( nLen2 + 1 ) <= CUTOFF )
{
if( !nLen1 || !nLen2 )
{
return 0;
}
return FindLCS(pLcs1, pLcs2, nStt1, nEnd1, nStt2, nEnd2);
}
int nMid = nLen1/2;
FindL( m_pL1.get(), nStt1, nStt1 + nMid, nStt2, nEnd2 );
FindL( m_pL2.get(), nStt1 + nMid, nEnd1, nStt2, nEnd2 );
int nMaxPos = 0;
static int nMaxVal;
nMaxVal = -1;
static int i;
for( i = 0; i <= nLen2; i++ )
{
if( m_pL1[i] + ( m_pL2[nLen2] - m_pL2[i] ) > nMaxVal )
{
nMaxPos = i;
nMaxVal = m_pL1[i]+( m_pL2[nLen2] - m_pL2[i] );
}
}
int nRet = HirschbergLCS( pLcs1, pLcs2, nStt1, nStt1 + nMid,
nStt2, nStt2 + nMaxPos );
nRet += HirschbergLCS( pLcs1 + nRet, pLcs2 + nRet, nStt1 + nMid, nEnd1,
nStt2 + nMaxPos, nEnd2 );
return nRet;
}
int LgstCommonSubseq::Find( int *pSubseq1, int *pSubseq2 )
{
int nStt = 0;
int nCutEnd = 0;
int nEnd1 = m_rComparator.GetLen1();
int nEnd2 = m_rComparator.GetLen2();
// Check for corresponding lines in the beginning of the sequences
while( nStt < nEnd1 && nStt < nEnd2 && m_rComparator.Compare( nStt, nStt ) )
{
pSubseq1[ nStt ] = nStt;
pSubseq2[ nStt ] = nStt;
nStt++;
}
pSubseq1 += nStt;
pSubseq2 += nStt;
// Check for corresponding lines in the end of the sequences
while( nStt < nEnd1 && nStt < nEnd2
&& m_rComparator.Compare( nEnd1 - 1, nEnd2 - 1 ) )
{
nCutEnd++;
nEnd1--;
nEnd2--;
}
int nLen = HirschbergLCS( pSubseq1, pSubseq2, nStt, nEnd1, nStt, nEnd2 );
for( int i = 0; i < nCutEnd; i++ )
{
pSubseq1[ nLen + i ] = nEnd1 + i;
pSubseq2[ nLen + i ] = nEnd2 + i;
}
return nStt + nLen + nCutEnd;
}
int FastCommonSubseq::FindFastCS( int *pSeq1, int *pSeq2, int nStt1,
int nEnd1, int nStt2, int nEnd2 )
{
int nCutBeg = 0;
int nCutEnd = 0;
// Check for corresponding lines in the beginning of the sequences
while( nStt1 < nEnd1 && nStt2 < nEnd2 && m_rComparator.Compare( nStt1, nStt2 ) )
{
pSeq1[ nCutBeg ] = nStt1++;
pSeq2[ nCutBeg ] = nStt2++;
nCutBeg++;
}
pSeq1 += nCutBeg;
pSeq2 += nCutBeg;
// Check for corresponding lines in the end of the sequences
while( nStt1 < nEnd1 && nStt2 < nEnd2
&& m_rComparator.Compare( nEnd1 - 1, nEnd2 - 1 ) )
{
nCutEnd++;
nEnd1--;
nEnd2--;
}
int nLen1 = nEnd1 - nStt1;
int nLen2 = nEnd2 - nStt2;
// Return if a sequence is empty
if( nLen1 <= 0 || nLen2 <= 0 )
{
for( int i = 0; i < nCutEnd; i++ )
{
pSeq1[ i ] = nEnd1 + i;
pSeq2[ i ] = nEnd2 + i;
}
return nCutBeg + nCutEnd;
}
// Cut to LCS for small values
if( nLen1 < 3 || nLen2 < 3 || ( nLen1 + 1 ) * ( nLen2 + 1 ) <= CUTOFF )
{
int nLcsLen = FindLCS( pSeq1, pSeq2, nStt1, nEnd1, nStt2, nEnd2);
for( int i = 0; i < nCutEnd; i++ )
{
pSeq1[ nLcsLen + i ] = nEnd1 + i;
pSeq2[ nLcsLen + i ] = nEnd2 + i;
}
return nCutBeg + nLcsLen + nCutEnd;
}
int nMid1 = nLen1/2;
int nMid2 = nLen2/2;
int nRad;
int nPos1 = -1, nPos2 = -1;
// Find a point of correspondence in the middle of the sequences
for( nRad = 0; nRad*nRad < std::min( nMid1, nMid2 ); nRad++ )
{
// Search to the left and to the right of the middle of the first sequence
for( int i = nMid1 - nRad; i <= nMid1 + nRad; i++ )
{
if( m_rComparator.Compare( nStt1 + i, nStt2 + nMid2 - nRad ) )
{
nPos1 = nStt1 + i;
nPos2 = nStt2 + nMid2 - nRad;
break;
}
if( m_rComparator.Compare( nStt1 + i, nStt2 + nMid2 + nRad ) )
{
nPos1 = nStt1 + i;
nPos2 = nStt2 + nMid2 - nRad;
break;
}
}
// Search to the left and to the right of the middle of the second sequence
for( int i = nMid2 - nRad; i <= nMid2 + nRad; i++ )
{
if( m_rComparator.Compare( nStt2 + nMid2 - nRad, nStt2 + i ) )
{
nPos2 = nStt2 + i;
nPos1 = nStt1 + nMid1 - nRad;
break;
}
if( m_rComparator.Compare( nStt2 + nMid2 - nRad, nStt2 + i ) )
{
nPos2 = nStt2 + i;
nPos1 = nStt1 + nMid1 - nRad;
break;
}
}
}
// return if no point of correspondence found
if( nPos1 == -1 )
{
for( int i = 0; i < nCutEnd; i++ )
{
pSeq1[ i ] = nEnd1 + i;
pSeq2[ i ] = nEnd2 + i;
}
return nCutBeg + nCutEnd;
}
// Run the same on the sequences to the left of the correspondence point
int nLen = FindFastCS( pSeq1, pSeq2, nStt1, nPos1, nStt2, nPos2 );
pSeq1[ nLen ] = nPos1;
pSeq2[ nLen ] = nPos2;
// Run the same on the sequences to the right of the correspondence point
nLen += FindFastCS( pSeq1 + nLen + 1, pSeq2 + nLen + 1,
nPos1 + 1, nEnd1, nPos2 + 1, nEnd2 ) + 1;
for( int i = 0; i < nCutEnd; i++ )
{
pSeq1[ nLen + i ] = nEnd1 + i;
pSeq2[ nLen + i ] = nEnd2 + i;
}
return nLen + nCutBeg + nCutEnd;
}
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
↑ V530 The return value of function 'append' is required to be utilized.