mirror of
https://github.com/ONLYOFFICE/core.git
synced 2026-04-07 13:55:33 +08:00
325 lines
10 KiB
C++
325 lines
10 KiB
C++
/*
|
|
* (c) Copyright Ascensio System SIA 2010-2018
|
|
*
|
|
* This program is a free software product. You can redistribute it and/or
|
|
* modify it under the terms of the GNU Affero General Public License (AGPL)
|
|
* version 3 as published by the Free Software Foundation. In accordance with
|
|
* Section 7(a) of the GNU AGPL its Section 15 shall be amended to the effect
|
|
* that Ascensio System SIA expressly excludes the warranty of non-infringement
|
|
* of any third-party rights.
|
|
*
|
|
* This program is distributed WITHOUT ANY WARRANTY; without even the implied
|
|
* warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. For
|
|
* details, see the GNU AGPL at: http://www.gnu.org/licenses/agpl-3.0.html
|
|
*
|
|
* You can contact Ascensio System SIA at Lubanas st. 125a-25, Riga, Latvia,
|
|
* EU, LV-1021.
|
|
*
|
|
* The interactive user interfaces in modified source and object code versions
|
|
* of the Program must display Appropriate Legal Notices, as required under
|
|
* Section 5 of the GNU AGPL version 3.
|
|
*
|
|
* Pursuant to Section 7(b) of the License you must retain the original Product
|
|
* logo when distributing the program. Pursuant to Section 7(e) we decline to
|
|
* grant you any rights under trademark law for use of our trademarks.
|
|
*
|
|
* All the Product's GUI elements, including illustrations and icon sets, as
|
|
* well as technical writing content are licensed under the terms of the
|
|
* Creative Commons Attribution-ShareAlike 4.0 International. See the License
|
|
* terms at http://creativecommons.org/licenses/by-sa/4.0/legalcode
|
|
*
|
|
*/
|
|
|
|
#include "FormattedDiskPagePAPX.h"
|
|
|
|
namespace DocFileFormat
|
|
{
|
|
FormattedDiskPagePAPX::~FormattedDiskPagePAPX()
|
|
{
|
|
RELEASEARRAYOBJECTS( rgfc );
|
|
RELEASEARRAYOBJECTS( rgbx );
|
|
|
|
if ( grppapx != NULL )
|
|
{
|
|
for ( unsigned int i = 0; i < grppapxSize; i++ )
|
|
{
|
|
RELEASEOBJECT( grppapx[i] );
|
|
}
|
|
|
|
RELEASEARRAYOBJECTS( grppapx );
|
|
}
|
|
}
|
|
|
|
/*========================================================================================================*/
|
|
|
|
FormattedDiskPagePAPX::FormattedDiskPagePAPX( POLE::Stream* wordStream, int offset, POLE::Stream* dataStream, bool oldVersion, bool fComplex):
|
|
FormattedDiskPage(), rgbx(NULL), grppapxSize(0), grppapx(NULL)
|
|
{
|
|
Type = Paragraph;
|
|
WordStream = wordStream;
|
|
|
|
//read the 512 bytes (FKP)
|
|
unsigned char* bytes = NULL;
|
|
bytes = new unsigned char[512];
|
|
|
|
WordStream->seek( offset);
|
|
WordStream->read( bytes, 512);
|
|
|
|
//get the count
|
|
crun = bytes[511];
|
|
|
|
//create and fill the array with the adresses
|
|
rgfcSize = crun + 1;
|
|
rgfc = new int[rgfcSize];
|
|
|
|
int j = 0;
|
|
|
|
for ( unsigned int i = 0; i < rgfcSize; i++ )
|
|
{
|
|
rgfc[i] = FormatUtils::BytesToInt32( bytes, j, 512 );
|
|
j += 4;
|
|
}
|
|
|
|
//create arrays
|
|
rgbx = new BX[crun];
|
|
grppapxSize = crun;
|
|
grppapx = new ParagraphPropertyExceptions*[grppapxSize];
|
|
|
|
for ( unsigned int i = 0; i < grppapxSize; i++ )
|
|
{
|
|
grppapx[i] = NULL;
|
|
}
|
|
|
|
j = 4 * ( crun + 1 );
|
|
|
|
//read the 12 for PHE
|
|
unsigned char* phe = NULL;
|
|
phe = new unsigned char[12];
|
|
|
|
unsigned char* papx = NULL;
|
|
|
|
for ( int i = 0; i < crun; i++ )
|
|
{
|
|
BX bx;
|
|
bx.wordOffset = bytes[j];
|
|
j++;
|
|
|
|
if (fComplex || !oldVersion)
|
|
{
|
|
memcpy( phe, ( bytes + j), 12 );
|
|
|
|
//fill the rgbx array
|
|
bx.phe = ParagraphHeight( phe, 12, false );
|
|
|
|
j += 12;
|
|
}
|
|
else
|
|
{
|
|
memcpy( phe, ( bytes + j), 6);
|
|
|
|
//fill the rgbx array
|
|
bx.phe = ParagraphHeight( phe, 6, false );
|
|
|
|
j += 6;
|
|
}
|
|
rgbx[i] = bx;
|
|
|
|
if ( bx.wordOffset != 0 )
|
|
{
|
|
//read first unsigned char of PAPX
|
|
//PAPX is stored in a FKP; so the first unsigned char is a count of words
|
|
unsigned char padbyte = 0;
|
|
unsigned char cw = bytes[bx.wordOffset * 2];
|
|
|
|
//if that unsigned char is zero, it's a pad unsigned char, and the word count is the following unsigned char
|
|
if ( cw == 0 )
|
|
{
|
|
padbyte = 1;
|
|
cw = bytes[bx.wordOffset * 2 + 1];
|
|
}
|
|
|
|
if ( cw != 0 )
|
|
{
|
|
//read the bytes for papx
|
|
papx = new unsigned char[cw * 2];
|
|
memcpy( papx, ( bytes + (bx.wordOffset * 2) + padbyte + 1 ), ( cw * 2 ) );
|
|
|
|
//parse PAPX and fill grppapx
|
|
grppapx[i] = new ParagraphPropertyExceptions( papx, ( cw * 2 ), dataStream, oldVersion );
|
|
|
|
RELEASEARRAYOBJECTS( papx );
|
|
}
|
|
}
|
|
else
|
|
{
|
|
//create a PAPX which doesn't modify anything
|
|
grppapx[i] = new ParagraphPropertyExceptions();
|
|
}
|
|
}
|
|
|
|
RELEASEARRAYOBJECTS( phe );
|
|
RELEASEARRAYOBJECTS( bytes );
|
|
}
|
|
|
|
/*========================================================================================================*/
|
|
|
|
/// Parses the 0Table (or 1Table) for FKP _entries containing PAPX
|
|
std::list<FormattedDiskPagePAPX*>* FormattedDiskPagePAPX::GetAllPAPXFKPs( FileInformationBlock* fib, POLE::Stream* wordStream, POLE::Stream* tableStream, POLE::Stream* dataStream)
|
|
{
|
|
std::list<FormattedDiskPagePAPX*>* PAPXlist = new std::list<FormattedDiskPagePAPX*>();
|
|
|
|
//get bintable for PAPX
|
|
unsigned char* binTablePapx = new unsigned char[fib->m_FibWord97.lcbPlcfBtePapx];
|
|
|
|
if (tableStream)
|
|
{
|
|
tableStream->seek( fib->m_FibWord97.fcPlcfBtePapx);
|
|
tableStream->read( binTablePapx, fib->m_FibWord97.lcbPlcfBtePapx);
|
|
}
|
|
|
|
//there are n offsets and n-1 fkp's in the bin table
|
|
|
|
if (fib->m_bOlderVersion && fib->m_FibBase.fComplex == false)
|
|
{
|
|
int n = ( ( (int)fib->m_FibWord97.lcbPlcfBtePapx - 8 ) / 6 ) + 1;
|
|
|
|
unsigned int first = FormatUtils::BytesToInt32(binTablePapx, 0, fib->m_FibWord97.lcbPlcfBtePapx );
|
|
unsigned int last = FormatUtils::BytesToInt32(binTablePapx, 4, fib->m_FibWord97.lcbPlcfBtePapx );
|
|
|
|
int start_papx = 8;
|
|
if (fib->m_FibWord97.lcbPlcfBtePapx - 8 > (n - 1) * 4)
|
|
{
|
|
start_papx+= ((n-1) * 4); //дублирование crun
|
|
}
|
|
|
|
int offset = 0;
|
|
for ( unsigned int i = start_papx; i < fib->m_FibWord97.lcbPlcfBtePapx; i += 2 )
|
|
{
|
|
//indexed FKP is the xth 512byte page
|
|
int fkpnr = FormatUtils::BytesToInt16( binTablePapx, i, fib->m_FibWord97.lcbPlcfBtePapx );
|
|
|
|
//so starts at:
|
|
int offset = fkpnr * 512;
|
|
|
|
//parse the FKP and add it to the list
|
|
PAPXlist->push_back( new FormattedDiskPagePAPX( wordStream, offset, dataStream, fib->m_bOlderVersion, fib->m_FibBase.fComplex) );
|
|
}
|
|
|
|
//if (PAPXlist->back()->rgfc[PAPXlist->back()->rgfcSize-1] < last)
|
|
//{
|
|
// PAPXlist->back()->rgfc[PAPXlist->back()->rgfcSize-1] = last;
|
|
// //tableStream->read( binTablePapx, fib->m_FibWord97.lcbPlcfBtePapx);
|
|
// //offset+=512;
|
|
// //PAPXlist->push_back( new FormattedDiskPagePAPX( wordStream, offset, dataStream ) );
|
|
//}
|
|
}
|
|
else
|
|
{
|
|
int n = ( ( (int)fib->m_FibWord97.lcbPlcfBtePapx - 4 ) / 8 ) + 1;
|
|
//Get the indexed PAPX FKPs
|
|
for ( unsigned int i = ( n * 4 ); i < fib->m_FibWord97.lcbPlcfBtePapx; i += 4 )
|
|
{
|
|
//indexed FKP is the xth 512byte page
|
|
int fkpnr = FormatUtils::BytesToInt32( binTablePapx, i, fib->m_FibWord97.lcbPlcfBtePapx );
|
|
|
|
//so starts at:
|
|
int offset = fkpnr * 512;
|
|
|
|
//parse the FKP and add it to the list
|
|
PAPXlist->push_back( new FormattedDiskPagePAPX( wordStream, offset, dataStream, fib->m_bOlderVersion, fib->m_FibBase.fComplex) );
|
|
}
|
|
|
|
}
|
|
|
|
RELEASEARRAYOBJECTS( binTablePapx );
|
|
|
|
return PAPXlist;
|
|
}
|
|
|
|
/*========================================================================================================*/
|
|
|
|
/// Returns a list of all PAPX FCs between they given boundaries.
|
|
std::list<int>* FormattedDiskPagePAPX::GetFileCharacterPositions
|
|
(
|
|
int fcMin,
|
|
int fcMax,
|
|
FileInformationBlock* fib,
|
|
POLE::Stream* wordStream,
|
|
POLE::Stream* tableStream,
|
|
POLE::Stream* dataStream
|
|
)
|
|
{
|
|
std::list<int>* cpList = new std::list<int>();
|
|
std::list<FormattedDiskPagePAPX*> *fkps = FormattedDiskPagePAPX::GetAllPAPXFKPs( fib, wordStream, tableStream, dataStream );
|
|
unsigned int i = 0;
|
|
FormattedDiskPagePAPX* fkp = NULL;
|
|
|
|
for ( std::list<FormattedDiskPagePAPX*>::iterator iter = fkps->begin(); iter != fkps->end(); iter++ )
|
|
{
|
|
fkp = (*iter);
|
|
|
|
//the last entry of each is always the same as the first entry of the next FKP
|
|
//so, ignore all last _entries except for the last FKP.
|
|
int max = fkp->rgfcSize;
|
|
|
|
if ( i++ < fkps->size() - 1 )
|
|
{
|
|
max--;
|
|
}
|
|
|
|
for ( int j = 0; j < max; j++ )
|
|
{
|
|
if( ( fkp->rgfc[j] >= fcMin ) && ( fkp->rgfc[j] < fcMax ) )
|
|
{
|
|
cpList->push_back( fkp->rgfc[j] );
|
|
}
|
|
}
|
|
|
|
RELEASEOBJECT( fkp );
|
|
}
|
|
|
|
fkps->clear();
|
|
RELEASEOBJECT( fkps );
|
|
|
|
return cpList;
|
|
}
|
|
|
|
/*========================================================================================================*/
|
|
|
|
/// Returnes a list of all ParagraphPropertyExceptions which correspond to text
|
|
/// between the given offsets.
|
|
std::list<ParagraphPropertyExceptions*>* FormattedDiskPagePAPX::GetParagraphPropertyExceptions
|
|
(
|
|
int fcMin,
|
|
int fcMax,
|
|
FileInformationBlock* fib,
|
|
POLE::Stream* wordStream,
|
|
POLE::Stream* tableStream,
|
|
POLE::Stream* dataStream
|
|
)
|
|
{
|
|
std::list<ParagraphPropertyExceptions*>* ppxList = new std::list<ParagraphPropertyExceptions*>();
|
|
std::list<FormattedDiskPagePAPX*>* fkps = FormattedDiskPagePAPX::GetAllPAPXFKPs( fib, wordStream, tableStream, dataStream );
|
|
FormattedDiskPagePAPX *fkp = NULL;
|
|
|
|
for ( std::list<FormattedDiskPagePAPX*>::iterator iter = fkps->begin(); iter != fkps->end(); iter++ )
|
|
{
|
|
fkp = (*iter);
|
|
|
|
for ( unsigned int j = 0; j < fkp->grppapxSize; j++ )
|
|
{
|
|
if ( ( fkp->rgfc[j] >= fcMin ) && ( fkp->rgfc[j] < fcMax ) )
|
|
{
|
|
ppxList->push_back( fkp->grppapx[j] );
|
|
}
|
|
}
|
|
|
|
RELEASEOBJECT( fkp );
|
|
|
|
fkps->clear();
|
|
RELEASEOBJECT( fkps );
|
|
}
|
|
|
|
return ppxList;
|
|
}
|
|
} |