mirror of
https://github.com/ONLYOFFICE/core.git
synced 2026-02-10 18:05:41 +08:00
696 lines
24 KiB
C++
696 lines
24 KiB
C++
/*
|
||
* (c) Copyright Ascensio System SIA 2010-2019
|
||
*
|
||
* This program is a free software product. You can redistribute it and/or
|
||
* modify it under the terms of the GNU Affero General Public License (AGPL)
|
||
* version 3 as published by the Free Software Foundation. In accordance with
|
||
* Section 7(a) of the GNU AGPL its Section 15 shall be amended to the effect
|
||
* that Ascensio System SIA expressly excludes the warranty of non-infringement
|
||
* of any third-party rights.
|
||
*
|
||
* This program is distributed WITHOUT ANY WARRANTY; without even the implied
|
||
* warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. For
|
||
* details, see the GNU AGPL at: http://www.gnu.org/licenses/agpl-3.0.html
|
||
*
|
||
* You can contact Ascensio System SIA at 20A-12 Ernesta Birznieka-Upisha
|
||
* street, Riga, Latvia, EU, LV-1050.
|
||
*
|
||
* The interactive user interfaces in modified source and object code versions
|
||
* of the Program must display Appropriate Legal Notices, as required under
|
||
* Section 5 of the GNU AGPL version 3.
|
||
*
|
||
* Pursuant to Section 7(b) of the License you must retain the original Product
|
||
* logo when distributing the program. Pursuant to Section 7(e) we decline to
|
||
* grant you any rights under trademark law for use of our trademarks.
|
||
*
|
||
* All the Product's GUI elements, including illustrations and icon sets, as
|
||
* well as technical writing content are licensed under the terms of the
|
||
* Creative Commons Attribution-ShareAlike 4.0 International. See the License
|
||
* terms at http://creativecommons.org/licenses/by-sa/4.0/legalcode
|
||
*
|
||
*/
|
||
|
||
#define errMemory 12
|
||
|
||
#include "../DesktopEditor/graphics/pro/Graphics.h"
|
||
#include "PdfReader.h"
|
||
|
||
#include "Src/Adaptors.h"
|
||
#include "lib/xpdf/ErrorCodes.h"
|
||
|
||
#include "../Common/OfficeDefines.h"
|
||
#include "../DesktopEditor/raster/BgraFrame.h"
|
||
#include "../DesktopEditor/graphics/IRenderer.h"
|
||
#include "../DesktopEditor/common/Directory.h"
|
||
|
||
#include "lib/xpdf/PDFDoc.h"
|
||
#include "lib/xpdf/GlobalParams.h"
|
||
#include "lib/xpdf/ErrorCodes.h"
|
||
#include "lib/xpdf/ImageOutputDev.h"
|
||
#include "Src/RendererOutputDev.h"
|
||
|
||
#ifdef BUILDING_WASM_MODULE
|
||
#include "../DesktopEditor/graphics/pro/js/wasm/src/serialize.h"
|
||
#include "lib/xpdf/Outline.h"
|
||
#include "lib/xpdf/Link.h"
|
||
#include "lib/xpdf/TextOutputDev.h"
|
||
#include "lib/goo/GList.h"
|
||
#include "../DesktopEditor/common/StringExt.h"
|
||
#include <vector>
|
||
//#include <fstream>
|
||
#endif
|
||
|
||
namespace PdfReader
|
||
{
|
||
class CPdfReader_Private
|
||
{
|
||
public:
|
||
PDFDoc* m_pPDFDocument;
|
||
std::wstring m_wsTempFolder;
|
||
std::wstring m_wsCMapFolder;
|
||
NSFonts::IApplicationFonts* m_pAppFonts;
|
||
NSFonts::IFontManager* m_pFontManager;
|
||
CFontList* m_pFontList;
|
||
};
|
||
|
||
CPdfReader::CPdfReader(NSFonts::IApplicationFonts* pAppFonts)
|
||
{
|
||
m_pInternal = new CPdfReader_Private();
|
||
|
||
m_pInternal->m_wsTempFolder = L"";
|
||
m_pInternal->m_wsCMapFolder = L"";
|
||
|
||
m_pInternal->m_pPDFDocument = NULL;
|
||
m_pInternal->m_pFontManager = NULL;
|
||
|
||
globalParams = new GlobalParamsAdaptor(NULL);
|
||
#ifndef _DEBUG
|
||
globalParams->setErrQuiet(gTrue);
|
||
#endif
|
||
|
||
m_pInternal->m_pFontList = new CFontList();
|
||
|
||
m_pInternal->m_pAppFonts = pAppFonts;
|
||
|
||
// Создаем менеджер шрифтов с собственным кэшем
|
||
m_pInternal->m_pFontManager = pAppFonts->GenerateFontManager();
|
||
NSFonts::IFontsCache* pMeasurerCache = NSFonts::NSFontCache::Create();
|
||
pMeasurerCache->SetStreams(pAppFonts->GetStreams());
|
||
m_pInternal->m_pFontManager->SetOwnerCache(pMeasurerCache);
|
||
pMeasurerCache->SetCacheSize(1);
|
||
((GlobalParamsAdaptor*)globalParams)->SetFontManager(m_pInternal->m_pFontManager);
|
||
#ifndef BUILDING_WASM_MODULE
|
||
globalParams->setupBaseFonts(NULL);
|
||
#endif
|
||
|
||
m_eError = errNone;
|
||
}
|
||
CPdfReader::~CPdfReader()
|
||
{
|
||
if (m_pInternal->m_pFontList)
|
||
{
|
||
m_pInternal->m_pFontList->Clear();
|
||
delete m_pInternal->m_pFontList;
|
||
}
|
||
|
||
m_pInternal->m_wsCMapFolder = L"";
|
||
|
||
if (!m_pInternal->m_wsTempFolder.empty())
|
||
{
|
||
NSDirectory::DeleteDirectory(m_pInternal->m_wsTempFolder);
|
||
m_pInternal->m_wsTempFolder = L"";
|
||
}
|
||
|
||
RELEASEOBJECT((m_pInternal->m_pPDFDocument));
|
||
RELEASEOBJECT((globalParams));
|
||
RELEASEINTERFACE((m_pInternal->m_pFontManager));
|
||
}
|
||
bool CPdfReader::LoadFromFile(const std::wstring& wsSrcPath, const std::wstring& wsOptions,
|
||
const std::wstring& wsOwnerPassword, const std::wstring& wsUserPassword)
|
||
{
|
||
// TODO: Сейчас при загрузке каждой новой картинки мы пересоздаем
|
||
// FontManager, потому что сейчас в нем кэш без ограничения.
|
||
//------------------------------------------------------
|
||
RELEASEINTERFACE((m_pInternal->m_pFontManager));
|
||
m_pInternal->m_pFontManager = m_pInternal->m_pAppFonts->GenerateFontManager();
|
||
NSFonts::IFontsCache* pMeasurerCache = NSFonts::NSFontCache::Create();
|
||
pMeasurerCache->SetStreams(m_pInternal->m_pAppFonts->GetStreams());
|
||
m_pInternal->m_pFontManager->SetOwnerCache(pMeasurerCache);
|
||
pMeasurerCache->SetCacheSize(1);
|
||
((GlobalParamsAdaptor*)globalParams)->SetFontManager(m_pInternal->m_pFontManager);
|
||
//------------------------------------------------------
|
||
|
||
if (m_pInternal->m_pPDFDocument)
|
||
delete m_pInternal->m_pPDFDocument;
|
||
|
||
if (GetTempDirectory() == L"")
|
||
{
|
||
SetTempDirectory(NSDirectory::GetTempPath());
|
||
}
|
||
|
||
m_eError = errNone;
|
||
GString* owner_pswd = NSStrings::CreateString(wsOwnerPassword);
|
||
GString* user_pswd = NSStrings::CreateString(wsUserPassword);
|
||
|
||
// конвертим путь в utf8 - под виндой они сконвертят в юникод, а на остальных - так и надо
|
||
std::string sPathUtf8 = U_TO_UTF8(wsSrcPath);
|
||
m_pInternal->m_pPDFDocument = new PDFDoc((char*)sPathUtf8.c_str(), owner_pswd, user_pswd);
|
||
|
||
delete owner_pswd;
|
||
delete user_pswd;
|
||
|
||
if (m_pInternal->m_pPDFDocument)
|
||
m_eError = m_pInternal->m_pPDFDocument->getErrorCode();
|
||
else
|
||
m_eError = errMemory;
|
||
|
||
if (!m_pInternal->m_pPDFDocument || !m_pInternal->m_pPDFDocument->isOk())
|
||
{
|
||
RELEASEOBJECT(m_pInternal->m_pPDFDocument);
|
||
return false;
|
||
}
|
||
|
||
m_pInternal->m_pFontList->Clear();
|
||
|
||
return (errNone == m_eError);
|
||
}
|
||
bool CPdfReader::LoadFromMemory(BYTE* data, DWORD length, const std::wstring& options,
|
||
const std::wstring& owner_password, const std::wstring& user_password)
|
||
{
|
||
// TODO: Сейчас при загрузке каждой новой картинки мы пересоздаем
|
||
// FontManager, потому что сейчас в нем кэш без ограничения.
|
||
//------------------------------------------------------
|
||
RELEASEINTERFACE((m_pInternal->m_pFontManager));
|
||
m_pInternal->m_pFontManager = m_pInternal->m_pAppFonts->GenerateFontManager();
|
||
NSFonts::IFontsCache* pMeasurerCache = NSFonts::NSFontCache::Create();
|
||
pMeasurerCache->SetStreams(m_pInternal->m_pAppFonts->GetStreams());
|
||
m_pInternal->m_pFontManager->SetOwnerCache(pMeasurerCache);
|
||
pMeasurerCache->SetCacheSize(1);
|
||
((GlobalParamsAdaptor*)globalParams)->SetFontManager(m_pInternal->m_pFontManager);
|
||
//------------------------------------------------------
|
||
|
||
RELEASEOBJECT(m_pInternal->m_pPDFDocument);
|
||
m_eError = errNone;
|
||
GString* owner_pswd = NSStrings::CreateString(owner_password);
|
||
GString* user_pswd = NSStrings::CreateString(user_password);
|
||
|
||
Object obj;
|
||
obj.initNull();
|
||
// будет освобожден в деструкторе PDFDoc
|
||
BaseStream *str = new MemStream((char*)data, 0, length, &obj);
|
||
m_pInternal->m_pPDFDocument = new PDFDoc(str, owner_pswd, user_pswd);
|
||
|
||
delete owner_pswd;
|
||
delete user_pswd;
|
||
|
||
m_eError = m_pInternal->m_pPDFDocument ? m_pInternal->m_pPDFDocument->getErrorCode() : errMemory;
|
||
|
||
if (!m_pInternal->m_pPDFDocument || !m_pInternal->m_pPDFDocument->isOk())
|
||
{
|
||
RELEASEOBJECT(m_pInternal->m_pPDFDocument);
|
||
return false;
|
||
}
|
||
|
||
m_pInternal->m_pFontList->Clear();
|
||
|
||
return (errNone == m_eError);
|
||
}
|
||
void CPdfReader::Close()
|
||
{
|
||
RELEASEOBJECT((m_pInternal->m_pPDFDocument));
|
||
}
|
||
NSFonts::IApplicationFonts* CPdfReader::GetFonts()
|
||
{
|
||
return m_pInternal->m_pAppFonts;
|
||
}
|
||
|
||
OfficeDrawingFileType CPdfReader::GetType()
|
||
{
|
||
return odftPDF;
|
||
}
|
||
int CPdfReader::GetError()
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return m_eError;
|
||
|
||
if (m_pInternal->m_pPDFDocument->isOk())
|
||
return 0;
|
||
|
||
return m_pInternal->m_pPDFDocument->getErrorCode();
|
||
}
|
||
int CPdfReader::GetPagesCount()
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return 0;
|
||
|
||
return m_pInternal->m_pPDFDocument->getNumPages();
|
||
}
|
||
double CPdfReader::GetVersion()
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return 0;
|
||
|
||
return m_pInternal->m_pPDFDocument->getPDFVersion();
|
||
}
|
||
int CPdfReader::GetPermissions()
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return 0;
|
||
|
||
int nPermissions = 0;
|
||
|
||
if (m_pInternal->m_pPDFDocument->okToPrint())
|
||
nPermissions += PERMISSION_PRINT;
|
||
if (m_pInternal->m_pPDFDocument->okToCopy())
|
||
nPermissions += PERMISSION_COPY;
|
||
if (m_pInternal->m_pPDFDocument->okToChange())
|
||
nPermissions += PERMISSION_CHANGE;
|
||
|
||
return nPermissions;
|
||
}
|
||
std::wstring CPdfReader::GetPageLabel(int nPageIndex)
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return std::wstring();
|
||
// todo label
|
||
// StringExt* seLabel = m_pInternal->m_pPDFDocument->GetPageLabels()->GetLabel(nPageIndex);
|
||
// if (seLabel)
|
||
// {
|
||
// std::wstring wsResult(seLabel->GetWString());
|
||
// delete seLabel;
|
||
// return wsResult;
|
||
// }
|
||
|
||
return std::wstring();
|
||
}
|
||
bool CPdfReader::ExtractAllImages(const wchar_t* wsDstPath, const wchar_t* wsPrefix)
|
||
{
|
||
std::wstring sDstPath(wsDstPath);
|
||
if (sDstPath.empty())
|
||
return false;
|
||
|
||
// check last symbol (directory)
|
||
wchar_t nLastSymbol = sDstPath[sDstPath.length() - 1];
|
||
if ('\\' != nLastSymbol && '/' != nLastSymbol)
|
||
sDstPath += '/';
|
||
// prefix for each file
|
||
if (NULL != wsPrefix)
|
||
sDstPath += std::wstring(wsPrefix);
|
||
|
||
std::string sDstPathA = U_TO_UTF8(sDstPath);
|
||
ImageOutputDev *pOutputDev = new ImageOutputDev((char*)sDstPathA.c_str(), true, false, false);
|
||
if (!pOutputDev)
|
||
return false;
|
||
|
||
int nPagesCount = GetPagesCount();
|
||
for (int nIndex = 1; nIndex <= nPagesCount; nIndex++)
|
||
{
|
||
m_pInternal->m_pPDFDocument->displayPage(pOutputDev, nIndex, 72, 72, 0, false, false, false);
|
||
}
|
||
|
||
delete pOutputDev;
|
||
|
||
return true;
|
||
}
|
||
void CPdfReader::GetPageInfo(int _nPageIndex, double* pdWidth, double* pdHeight, double* pdDpiX, double* pdDpiY)
|
||
{
|
||
int nPageIndex = _nPageIndex + 1;
|
||
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return;
|
||
|
||
const double c_dInch = 25.399; // Миллиметров в дюйме
|
||
const double c_dXResolution = 154.0;
|
||
const double c_dYResolution = 154.0;
|
||
|
||
double dKoefX = c_dInch / c_dXResolution;
|
||
double dKoefY = c_dInch / c_dYResolution;
|
||
|
||
int nRotate = m_pInternal->m_pPDFDocument->getPageRotate(nPageIndex);
|
||
|
||
while (nRotate >= 360)
|
||
nRotate -= 360;
|
||
|
||
while (nRotate < 0)
|
||
nRotate += 360;
|
||
|
||
if (0 != nRotate && 180 != nRotate)
|
||
{
|
||
*pdHeight = m_pInternal->m_pPDFDocument->getPageCropWidth(nPageIndex);
|
||
*pdWidth = m_pInternal->m_pPDFDocument->getPageCropHeight(nPageIndex);
|
||
}
|
||
else
|
||
{
|
||
*pdWidth = m_pInternal->m_pPDFDocument->getPageCropWidth(nPageIndex);
|
||
*pdHeight = m_pInternal->m_pPDFDocument->getPageCropHeight(nPageIndex);
|
||
}
|
||
|
||
*pdDpiX = 72;
|
||
*pdDpiY = 72;
|
||
}
|
||
void CPdfReader::DrawPageOnRenderer(IRenderer* pRenderer, int _nPageIndex, bool* pbBreak)
|
||
{
|
||
int nPageIndex = _nPageIndex + 1;
|
||
|
||
if (m_pInternal->m_pPDFDocument && pRenderer)
|
||
{
|
||
RendererOutputDev oRendererOut(pRenderer, m_pInternal->m_pFontManager, m_pInternal->m_pFontList);
|
||
oRendererOut.NewPDF(m_pInternal->m_pPDFDocument->getXRef());
|
||
oRendererOut.SetBreak(pbBreak);
|
||
m_pInternal->m_pPDFDocument->displayPage(&oRendererOut, nPageIndex, 72.0, 72.0, 0, false, true, false);
|
||
}
|
||
}
|
||
int CPdfReader::GetImagesCount()
|
||
{
|
||
// ImageOutputDev *pOutputDev = new ImageOutputDev(NULL, true, true, false);
|
||
// if (!pOutputDev)
|
||
// return 0;
|
||
//
|
||
// for (int nIndex = 1; nIndex <= m_pInternal->m_pPDFDocument->GetPagesCount(); nIndex++)
|
||
// {
|
||
// m_pInternal->m_pPDFDocument->displayPage(pOutputDev, nIndex, 72, 72, 0, false, false, false);
|
||
// }
|
||
//
|
||
// return pOutputDev->
|
||
return 0;
|
||
}
|
||
void CPdfReader::SetTempDirectory(const std::wstring& wsTempFolder)
|
||
{
|
||
if (!m_pInternal->m_wsTempFolder.empty())
|
||
{
|
||
NSDirectory::DeleteDirectory(m_pInternal->m_wsTempFolder);
|
||
m_pInternal->m_wsTempFolder = wsTempFolder;
|
||
}
|
||
|
||
if (!wsTempFolder.empty())
|
||
{
|
||
std::wstring wsFolderName = std::wstring(wsTempFolder) + L"//pdftemp";
|
||
std::wstring wsFolder = wsFolderName;
|
||
int nCounter = 0;
|
||
while (NSDirectory::Exists(wsFolder))
|
||
{
|
||
nCounter++;
|
||
wsFolder = wsFolderName + L"_" + std::to_wstring(nCounter);
|
||
}
|
||
NSDirectory::CreateDirectory(wsFolder);
|
||
m_pInternal->m_wsTempFolder = wsFolder;
|
||
}
|
||
else
|
||
m_pInternal->m_wsTempFolder = L"";
|
||
|
||
if (globalParams)
|
||
((GlobalParamsAdaptor*)globalParams)->SetTempFolder(m_pInternal->m_wsTempFolder.c_str());
|
||
}
|
||
std::wstring CPdfReader::GetTempDirectory()
|
||
{
|
||
return m_pInternal->m_wsTempFolder;
|
||
}
|
||
|
||
void CPdfReader::SetCMapFolder(const wchar_t* wsCMapFolder)
|
||
{
|
||
m_pInternal->m_wsCMapFolder = std::wstring(wsCMapFolder);
|
||
|
||
if (globalParams)
|
||
((GlobalParamsAdaptor*)globalParams)->SetCMapFolder(m_pInternal->m_wsCMapFolder.c_str());
|
||
}
|
||
NSFonts::IFontManager* CPdfReader::GetFontManager()
|
||
{
|
||
return m_pInternal->m_pFontManager;
|
||
}
|
||
std::wstring CPdfReader::ToXml(const std::wstring& wsFilePath)
|
||
{
|
||
//todo
|
||
// std::wstring wsXml = m_pInternal->m_pPDFDocument->ToXml();
|
||
//
|
||
// if (wsFilePath != L"")
|
||
// {
|
||
// NSFile::CFileBinary oFile;
|
||
// if (!oFile.CreateFileW(wsFilePath))
|
||
// return wsXml;
|
||
//
|
||
// oFile.WriteStringUTF8(wsXml);
|
||
// oFile.CloseFile();
|
||
// }
|
||
//
|
||
// return wsXml;
|
||
return L"";
|
||
}
|
||
#define DICT_LOOKUP(info, obj1, name) \
|
||
if (info.dictLookup(name, &obj1)->isString())\
|
||
{\
|
||
char* str = obj1.getString()->getCString();\
|
||
int length = obj1.getString()->getLength();\
|
||
if (str && length > 0)\
|
||
{\
|
||
sRes += "\"";\
|
||
sRes += name;\
|
||
sRes += "\":\"";\
|
||
sRes += std::string(str, length);\
|
||
sRes += "\",";\
|
||
}\
|
||
}\
|
||
|
||
#define DICT_LOOKUP_DATE(info, obj1, name) \
|
||
if (info.dictLookup(name, &obj1)->isString())\
|
||
{\
|
||
char* str = obj1.getString()->getCString();\
|
||
int length = obj1.getString()->getLength();\
|
||
if (str && length > 21)\
|
||
{\
|
||
std::string sNoDate = std::string(str, length);\
|
||
std::string sDate = sNoDate.substr(2, 4) + '-' + sNoDate.substr(6, 2) + '-' + sNoDate.substr(8, 2) + 'T' +\
|
||
sNoDate.substr(10, 2) + ':' + sNoDate.substr(12, 2) + ':' + sNoDate.substr(14, 2) + ".000+" +\
|
||
sNoDate.substr(17, 2) + ':' + sNoDate.substr(20, 2);\
|
||
sRes += "\"";\
|
||
sRes += name;\
|
||
sRes += "\":\"";\
|
||
sRes += sDate;\
|
||
sRes += "\",";\
|
||
}\
|
||
}\
|
||
|
||
BYTE* CPdfReader::GetInfo()
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return NULL;
|
||
|
||
std::string sRes = "{";
|
||
|
||
Object info, obj1;
|
||
m_pInternal->m_pPDFDocument->getDocInfo(&info);
|
||
if (info.isDict())
|
||
{
|
||
DICT_LOOKUP(info, obj1, "Title");
|
||
DICT_LOOKUP(info, obj1, "Author");
|
||
DICT_LOOKUP(info, obj1, "Subject");
|
||
DICT_LOOKUP(info, obj1, "Keywords");
|
||
DICT_LOOKUP(info, obj1, "Creator");
|
||
DICT_LOOKUP(info, obj1, "Producer");
|
||
|
||
DICT_LOOKUP_DATE(info, obj1, "CreationDate");
|
||
DICT_LOOKUP_DATE(info, obj1, "ModDate");
|
||
}
|
||
|
||
info.free();
|
||
obj1.free();
|
||
|
||
std::string version = std::to_string(GetVersion());
|
||
sRes += "\"Version\":";
|
||
sRes += version.substr(0, version.length() - 5);
|
||
double nW = 0;
|
||
double nH = 0;
|
||
double nDpi = 0;
|
||
GetPageInfo(0, &nW, &nH, &nDpi, &nDpi);
|
||
sRes += ",\"PageSize\":\"";
|
||
version = std::to_string(nW);
|
||
sRes += version.substr(0, version.length() - 4);
|
||
sRes += "x";
|
||
version = std::to_string(nH);
|
||
sRes += version.substr(0, version.length() - 4);
|
||
sRes += "\",\"NumberOfPages\":";
|
||
sRes += std::to_string(GetPagesCount());
|
||
sRes += ",\"FastWebView\":";
|
||
sRes += m_pInternal->m_pPDFDocument->isLinearized() ? "true" : "false";
|
||
sRes += ",\"Tagged\":";
|
||
sRes += m_pInternal->m_pPDFDocument->getStructTreeRoot()->isDict() ? "true" : "false";
|
||
sRes += "}";
|
||
|
||
NSWasm::CData oRes;
|
||
oRes.SkipLen();
|
||
oRes.WriteString((BYTE*)sRes.c_str(), sRes.length());
|
||
oRes.WriteLen();
|
||
|
||
BYTE* bRes = oRes.GetBuffer();
|
||
oRes.ClearWithoutAttack();
|
||
return bRes;
|
||
}
|
||
#ifdef BUILDING_WASM_MODULE
|
||
void getBookmars(PDFDoc* pdfDoc, OutlineItem* pOutlineItem, NSWasm::CData& out, int level)
|
||
{
|
||
int nLengthTitle = pOutlineItem->getTitleLength();
|
||
Unicode* pTitle = pOutlineItem->getTitle();
|
||
std::string sTitle = NSStringExt::CConverter::GetUtf8FromUTF32(pTitle, nLengthTitle);
|
||
|
||
LinkAction* pLinkAction = pOutlineItem->getAction();
|
||
if (!pLinkAction)
|
||
return;
|
||
LinkActionKind kind = pLinkAction->getKind();
|
||
if (kind != actionGoTo)
|
||
return;
|
||
|
||
GString* str = ((LinkGoTo*)pLinkAction)->getNamedDest();
|
||
LinkDest* pLinkDest = str ? pdfDoc->findDest(str) : ((LinkGoTo*)pLinkAction)->getDest();
|
||
if (!pLinkDest)
|
||
return;
|
||
int pg;
|
||
if (pLinkDest->isPageRef())
|
||
{
|
||
Ref pageRef = pLinkDest->getPageRef();
|
||
pg = pdfDoc->findPage(pageRef.num, pageRef.gen);
|
||
}
|
||
else
|
||
pg = pLinkDest->getPageNum();
|
||
double dy = pdfDoc->getPageCropHeight(pg) - pLinkDest->getTop();
|
||
if (str)
|
||
RELEASEOBJECT(pLinkDest);
|
||
|
||
out.AddInt(pg - 1);
|
||
out.AddInt(level);
|
||
out.AddDouble(dy);
|
||
out.WriteString((BYTE*)sTitle.c_str(), sTitle.length());
|
||
|
||
pOutlineItem->open();
|
||
GList* pList = pOutlineItem->getKids();
|
||
if (!pList)
|
||
return;
|
||
int num = pList->getLength();
|
||
for (int i = 0; i < num; i++)
|
||
{
|
||
OutlineItem* pOutlineItemKid = (OutlineItem*)pList->get(i);
|
||
if (!pOutlineItemKid)
|
||
continue;
|
||
getBookmars(pdfDoc, pOutlineItemKid, out, level + 1);
|
||
}
|
||
pOutlineItem->close();
|
||
}
|
||
BYTE* CPdfReader::GetStructure()
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return NULL;
|
||
Outline* pOutline = m_pInternal->m_pPDFDocument->getOutline();
|
||
if (!pOutline)
|
||
return NULL;
|
||
GList* pList = pOutline->getItems();
|
||
if (!pList)
|
||
return NULL;
|
||
|
||
NSWasm::CData oRes;
|
||
oRes.SkipLen();
|
||
int num = pList->getLength();
|
||
for (int i = 0; i < num; i++)
|
||
{
|
||
OutlineItem* pOutlineItem = (OutlineItem*)pList->get(i);
|
||
if (pOutlineItem)
|
||
getBookmars(m_pInternal->m_pPDFDocument, pOutlineItem, oRes, 1);
|
||
}
|
||
oRes.WriteLen();
|
||
|
||
BYTE* bRes = oRes.GetBuffer();
|
||
oRes.ClearWithoutAttack();
|
||
return bRes;
|
||
}
|
||
BYTE* CPdfReader::GetLinks(int nPageIndex)
|
||
{
|
||
if (!m_pInternal->m_pPDFDocument)
|
||
return NULL;
|
||
|
||
nPageIndex++;
|
||
|
||
NSWasm::CPageLink oLinks;
|
||
double height = m_pInternal->m_pPDFDocument->getPageCropHeight(nPageIndex);
|
||
|
||
// Текст-ссылка
|
||
TextOutputControl textOutControl;
|
||
textOutControl.mode = textOutReadingOrder;
|
||
TextOutputDev* pTextOut = new TextOutputDev(NULL, &textOutControl, gFalse);
|
||
m_pInternal->m_pPDFDocument->displayPage(pTextOut, nPageIndex, 72, 72, 0, gFalse, gTrue, gFalse);
|
||
m_pInternal->m_pPDFDocument->processLinks(pTextOut, nPageIndex);
|
||
TextWordList* pWordList = pTextOut->makeWordList();
|
||
for (int i = 0; i < pWordList->getLength(); i++)
|
||
{
|
||
TextWord* pWord = pWordList->get(i);
|
||
if (!pWord)
|
||
continue;
|
||
GString* sLink = pWord->getText();
|
||
if (!sLink)
|
||
continue;
|
||
std::string link(sLink->getCString(), sLink->getLength());
|
||
size_t find = link.find("http://");
|
||
if (find == std::string::npos)
|
||
find = link.find("https://");
|
||
if (find == std::string::npos)
|
||
find = link.find("www.");
|
||
if (find != std::string::npos)
|
||
{
|
||
link.erase(0, find);
|
||
double x1, y1, x2, y2;
|
||
pWord->getBBox(&x1, &y1, &x2, &y2);
|
||
oLinks.m_arLinks.push_back({link, 0, x1, y1, x2 - x1, y2 - y1});
|
||
}
|
||
}
|
||
RELEASEOBJECT(pTextOut);
|
||
|
||
// Гиперссылка
|
||
Links* pLinks = m_pInternal->m_pPDFDocument->getLinks(nPageIndex);
|
||
if (!pLinks)
|
||
return NULL;
|
||
|
||
int num = pLinks->getNumLinks();
|
||
for (int i = 0; i < num; i++)
|
||
{
|
||
Link* pLink = pLinks->getLink(i);
|
||
if (!pLink)
|
||
continue;
|
||
|
||
GString* str = NULL;
|
||
double x1 = 0.0, y1 = 0.0, x2 = 0.0, y2 = 0.0, dy = 0.0;
|
||
pLink->getRect(&x1, &y1, &x2, &y2);
|
||
y1 = height - y1;
|
||
y2 = height - y2;
|
||
|
||
LinkAction* pLinkAction = pLink->getAction();
|
||
if (!pLinkAction)
|
||
continue;
|
||
LinkActionKind kind = pLinkAction->getKind();
|
||
if (kind == actionGoTo)
|
||
{
|
||
str = ((LinkGoTo*)pLinkAction)->getNamedDest();
|
||
LinkDest* pLinkDest = m_pInternal->m_pPDFDocument->findDest(str);
|
||
if (pLinkDest)
|
||
{
|
||
int pg;
|
||
if (pLinkDest->isPageRef())
|
||
{
|
||
Ref pageRef = pLinkDest->getPageRef();
|
||
pg = m_pInternal->m_pPDFDocument->findPage(pageRef.num, pageRef.gen);
|
||
}
|
||
else
|
||
pg = pLinkDest->getPageNum();
|
||
std::string sLink = "#" + std::to_string(pg - 1);
|
||
str = new GString(sLink.c_str());
|
||
dy = m_pInternal->m_pPDFDocument->getPageCropHeight(pg) - pLinkDest->getTop();
|
||
}
|
||
RELEASEOBJECT(pLinkDest);
|
||
}
|
||
else if (kind == actionURI)
|
||
str = ((LinkURI*)pLinkAction)->getURI()->copy();
|
||
|
||
oLinks.m_arLinks.push_back({str ? std::string(str->getCString(), str->getLength()) : "", dy, x1, y2, x2 - x1, y1 - y2});
|
||
RELEASEOBJECT(str);
|
||
}
|
||
RELEASEOBJECT(pLinks);
|
||
return oLinks.Serialize();
|
||
}
|
||
#endif
|
||
}
|