// Copyright 2014 PDFium Authors. All rights reserved.
|
// Use of this source code is governed by a BSD-style license that can be
|
// found in the LICENSE file.
|
|
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
|
|
#include "public/fpdf_flatten.h"
|
|
#include <algorithm>
|
|
#include "core/fpdfapi/fpdf_page/include/cpdf_page.h"
|
#include "core/fpdfapi/fpdf_page/include/cpdf_pageobject.h"
|
#include "core/fpdfapi/fpdf_parser/include/cpdf_array.h"
|
#include "core/fpdfapi/fpdf_parser/include/cpdf_document.h"
|
#include "core/fpdfapi/fpdf_parser/include/cpdf_number.h"
|
#include "core/fpdfapi/fpdf_parser/include/cpdf_stream.h"
|
#include "core/fpdfapi/fpdf_parser/include/cpdf_stream_acc.h"
|
#include "fpdfsdk/include/fsdk_define.h"
|
|
// Array of dictionaries; used in this file to collect the annotation
// dictionaries selected for flattening.
using CPDF_ObjectArray = CFX_ArrayTemplate<CPDF_Dictionary*>;

// Array of rectangles; used in this file to collect the bounds of page
// objects and annotations.
using CPDF_RectArray = CFX_ArrayTemplate<CFX_FloatRect>;
|
|
// Selects which extreme GetMinMaxValue() searches for.
enum FPDF_TYPE {
  MAX = 0,
  MIN = 1,
};

// Selects which rectangle edge GetMinMaxValue() inspects.
enum FPDF_VALUE {
  TOP = 0,
  LEFT = 1,
  RIGHT = 2,
  BOTTOM = 3,
};
|
|
// Decides whether |rect| is usable as a bounding rectangle.
//
// Returns FALSE when:
//  - left exceeds right, or bottom exceeds top, by more than a tiny epsilon;
//  - all four coordinates are exactly zero;
//  - |rcPage| is non-empty and any edge of |rect| lies more than roughly ten
//    units outside the corresponding edge of |rcPage|.
// Returns TRUE otherwise.
FX_BOOL IsValiableRect(CFX_FloatRect rect, CFX_FloatRect rcPage) {
  const FX_FLOAT kEpsilon = 0.000001f;
  const FX_FLOAT kPageSlack = 10.000001f;

  const bool bInverted = rect.left - rect.right > kEpsilon ||
                         rect.bottom - rect.top > kEpsilon;
  if (bInverted)
    return FALSE;

  const bool bAllZero = rect.left == 0.0f && rect.top == 0.0f &&
                        rect.right == 0.0f && rect.bottom == 0.0f;
  if (bAllZero)
    return FALSE;

  // Without a page rectangle there is nothing further to compare against.
  if (rcPage.IsEmpty())
    return TRUE;

  const bool bOutsidePage = rect.left - rcPage.left < -kPageSlack ||
                            rect.right - rcPage.right > kPageSlack ||
                            rect.top - rcPage.top > kPageSlack ||
                            rect.bottom - rcPage.bottom < -kPageSlack;
  return bOutsidePage ? FALSE : TRUE;
}
|
|
// Parses the content of the page described by |pDict| and appends the
// bounding rectangle of every page object that passes IsValiableRect()
// (checked against the page's "MediaBox") to |pRectArray|.
//
// pDoc       - document the page dictionary belongs to.
// pDict      - page dictionary to parse.
// pRectArray - output array; accepted rectangles are appended.
void GetContentsRect(CPDF_Document* pDoc,
                     CPDF_Dictionary* pDict,
                     CPDF_RectArray* pRectArray) {
  std::unique_ptr<CPDF_Page> pPDFPage(new CPDF_Page(pDoc, pDict, false));
  pPDFPage->ParseContent();

  // The media box does not change while iterating, so read it only once
  // instead of once per page object.
  const CFX_FloatRect rcMediaBox = pDict->GetRectBy("MediaBox");

  for (const auto& pPageObject : *pPDFPage->GetPageObjectList()) {
    CFX_FloatRect rc;
    rc.left = pPageObject->m_Left;
    rc.right = pPageObject->m_Right;
    rc.bottom = pPageObject->m_Bottom;
    rc.top = pPageObject->m_Top;
    if (IsValiableRect(rc, rcMediaBox))
      pRectArray->Add(rc);
  }
}
|
|
// Records one annotation dictionary for flattening.
//
// Reads the dictionary's "Rect" entry, or "BBox" when "Rect" is absent, and
// appends it to |pRectArray| if IsValiableRect() accepts it against the
// page's "MediaBox". The dictionary itself is always appended to
// |pObjectArray|. Does nothing when |pStream| is null.
void ParserStream(CPDF_Dictionary* pPageDic,
                  CPDF_Dictionary* pStream,
                  CPDF_RectArray* pRectArray,
                  CPDF_ObjectArray* pObjectArray) {
  if (!pStream)
    return;

  // Stays default-constructed when neither key is present.
  CFX_FloatRect rcBounds;
  const bool bHasRect = pStream->KeyExist("Rect");
  if (bHasRect) {
    rcBounds = pStream->GetRectBy("Rect");
  } else if (pStream->KeyExist("BBox")) {
    rcBounds = pStream->GetRectBy("BBox");
  }

  const CFX_FloatRect rcMediaBox = pPageDic->GetRectBy("MediaBox");
  if (IsValiableRect(rcBounds, rcMediaBox))
    pRectArray->Add(rcBounds);

  pObjectArray->Add(pStream);
}
|
|
// Collects the page-content rectangles and the annotations to be flattened.
//
// Returns FLATTEN_FAIL when |pSourceDoc| or |pPageDic| is null,
// FLATTEN_NOTHINGTODO when the page has no "Annots" array, and
// FLATTEN_SUCCESS otherwise.
//
// Annotations are skipped when they are not dictionaries, have subtype
// "Popup", or carry ANNOTFLAG_HIDDEN. For FLAT_NORMALDISPLAY usage,
// annotations with ANNOTFLAG_INVISIBLE are skipped as well; for any other
// usage only annotations with ANNOTFLAG_PRINT are kept.
int ParserAnnots(CPDF_Document* pSourceDoc,
                 CPDF_Dictionary* pPageDic,
                 CPDF_RectArray* pRectArray,
                 CPDF_ObjectArray* pObjectArray,
                 int nUsage) {
  if (!pSourceDoc || !pPageDic)
    return FLATTEN_FAIL;

  // Page content rectangles are gathered even if there are no annotations.
  GetContentsRect(pSourceDoc, pPageDic, pRectArray);

  CPDF_Array* pAnnotArray = pPageDic->GetArrayBy("Annots");
  if (!pAnnotArray)
    return FLATTEN_NOTHINGTODO;

  const uint32_t dwCount = pAnnotArray->GetCount();
  const int nAnnots = (int)dwCount;
  for (int idx = 0; idx < nAnnots; ++idx) {
    CPDF_Dictionary* pAnnot =
        ToDictionary(pAnnotArray->GetDirectObjectAt(idx));
    if (!pAnnot)
      continue;

    CFX_ByteString sSubtype = pAnnot->GetStringBy("Subtype");
    if (sSubtype == "Popup")
      continue;

    const int nFlags = pAnnot->GetIntegerBy("F");
    if (nFlags & ANNOTFLAG_HIDDEN)
      continue;

    const bool bInclude = (nUsage == FLAT_NORMALDISPLAY)
                              ? !(nFlags & ANNOTFLAG_INVISIBLE)
                              : ((nFlags & ANNOTFLAG_PRINT) != 0);
    if (bInclude)
      ParserStream(pPageDic, pAnnot, pRectArray, pObjectArray);
  }
  return FLATTEN_SUCCESS;
}
|
|
// Returns the minimum or maximum of one edge coordinate over all rectangles
// in |array|.
//
// array - rectangles to scan.
// type  - MAX to find the largest value, any other value to find the
//         smallest.
// value - which edge (TOP, LEFT, RIGHT, BOTTOM) to read from each rectangle.
//
// Returns 0.0f when |array| is empty or |value| is not a known edge.
//
// The scan is done in a single pass without a temporary heap buffer, so no
// exit path can leak memory.
FX_FLOAT GetMinMaxValue(CPDF_RectArray& array,
                        FPDF_TYPE type,
                        FPDF_VALUE value) {
  const int nRects = array.GetSize();
  if (nRects <= 0)
    return 0.0f;

  // Reads the requested edge from a rectangle; an unknown |value| yields 0,
  // which makes the overall result 0.0f as well.
  auto edge_of = [value](const CFX_FloatRect& rc) -> FX_FLOAT {
    switch (value) {
      case LEFT:
        return rc.left;
      case TOP:
        return rc.top;
      case RIGHT:
        return rc.right;
      case BOTTOM:
        return rc.bottom;
    }
    return 0.0f;
  };

  FX_FLOAT fRet = edge_of(array.GetAt(0));
  for (int i = 1; i < nRects; i++) {
    const FX_FLOAT fEdge = edge_of(array.GetAt(i));
    // Inclusive comparisons: on ties the later element wins.
    const bool bReplace = (type == MAX) ? (fRet <= fEdge) : (fRet >= fEdge);
    if (bReplace)
      fRet = fEdge;
  }
  return fRet;
}
|
|
// Builds the rectangle enclosing every rectangle in |pRectArray|: smallest
// left and bottom, largest top and right, each obtained through
// GetMinMaxValue().
CFX_FloatRect CalculateRect(CPDF_RectArray* pRectArray) {
  CPDF_RectArray& rects = *pRectArray;

  CFX_FloatRect rcBounds;
  rcBounds.left = GetMinMaxValue(rects, MIN, LEFT);
  rcBounds.top = GetMinMaxValue(rects, MAX, TOP);
  rcBounds.right = GetMinMaxValue(rects, MAX, RIGHT);
  rcBounds.bottom = GetMinMaxValue(rects, MIN, BOTTOM);
  return rcBounds;
}
|
|
// Rewrites the "Contents" entry of |pPage| so that, when |key| is non-empty,
// it ends with a stream that draws the XObject named |key|.
//
//  - No existing contents: a new stream "q 1 0 0 1 0 0 cm /<key> Do Q" is
//    created and referenced from "Contents" (only when |key| is non-empty).
//  - Existing single stream: its data is wrapped in "q\n" ... "\nQ" and it is
//    placed in a new array.
//  - Existing array: used as is.
// In the latter two cases the array is registered as an indirect object,
// referenced from "Contents", and, when |key| is non-empty, a new stream
// invoking the XObject is appended to it.
void SetPageContents(CFX_ByteString key,
                     CPDF_Dictionary* pPage,
                     CPDF_Document* pDocument) {
  CPDF_Object* pContentsObj = pPage->GetStreamBy("Contents");
  if (!pContentsObj)
    pContentsObj = pPage->GetArrayBy("Contents");

  const bool bHasKey = !key.IsEmpty();

  if (!pContentsObj) {
    if (bHasKey) {
      // The page has no contents yet: the invoking stream becomes the whole
      // contents.
      CPDF_Stream* pInvokeStream =
          new CPDF_Stream(nullptr, 0, new CPDF_Dictionary);
      pPage->SetAtReference("Contents", pDocument,
                            pDocument->AddIndirectObject(pInvokeStream));

      CFX_ByteString sInvoke;
      sInvoke.Format("q 1 0 0 1 0 0 cm /%s Do Q", key.c_str());
      pInvokeStream->SetData(sInvoke.raw_str(), sInvoke.GetLength(), FALSE,
                             FALSE);
    }
    return;
  }

  CPDF_Array* pContentsArray = nullptr;
  const auto eType = pContentsObj->GetType();
  if (eType == CPDF_Object::STREAM) {
    pContentsArray = new CPDF_Array;
    CPDF_Stream* pOldStream = pContentsObj->AsStream();
    uint32_t dwOldObjNum = pDocument->AddIndirectObject(pOldStream);

    // Isolate the existing content's graphics state with q ... Q.
    CPDF_StreamAcc oldData;
    oldData.LoadAllData(pOldStream);
    CFX_ByteString sPrefix = "q\n";
    CFX_ByteString sBody =
        CFX_ByteString((const FX_CHAR*)oldData.GetData(), oldData.GetSize());
    CFX_ByteString sWrapped = sPrefix + sBody + "\nQ";
    pOldStream->SetData(sWrapped.raw_str(), sWrapped.GetLength(), FALSE,
                        FALSE);
    pContentsArray->AddReference(pDocument, dwOldObjNum);
  } else if (eType == CPDF_Object::ARRAY) {
    pContentsArray = pContentsObj->AsArray();
  }

  if (!pContentsArray)
    return;

  uint32_t dwArrayObjNum = pDocument->AddIndirectObject(pContentsArray);
  pPage->SetAtReference("Contents", pDocument, dwArrayObjNum);

  if (!bHasKey)
    return;

  CPDF_Stream* pInvokeStream =
      new CPDF_Stream(nullptr, 0, new CPDF_Dictionary);
  uint32_t dwInvokeObjNum = pDocument->AddIndirectObject(pInvokeStream);
  pContentsArray->AddReference(pDocument, dwInvokeObjNum);

  CFX_ByteString sInvoke;
  sInvoke.Format("q 1 0 0 1 0 0 cm /%s Do Q", key.c_str());
  pInvokeStream->SetData(sInvoke.raw_str(), sInvoke.GetLength(), FALSE, FALSE);
}
|
|
// Computes a scale-and-translate matrix that maps |rcStream|, after it has
// been transformed by |matrix| and normalized, onto |rcAnnot|.
//
// Returns a default-constructed CFX_Matrix when |rcStream| is empty.
CFX_Matrix GetMatrix(CFX_FloatRect rcAnnot,
                     CFX_FloatRect rcStream,
                     const CFX_Matrix& matrix) {
  if (rcStream.IsEmpty())
    return CFX_Matrix();

  matrix.TransformRect(rcStream);
  rcStream.Normalize();

  // Scale factors that stretch the transformed stream box to the annotation.
  const FX_FLOAT fScaleX = rcAnnot.Width() / rcStream.Width();
  const FX_FLOAT fScaleY = rcAnnot.Height() / rcStream.Height();

  // Translation that aligns the lower-left corners after scaling.
  const FX_FLOAT fShiftX = rcAnnot.left - rcStream.left * fScaleX;
  const FX_FLOAT fShiftY = rcAnnot.bottom - rcStream.bottom * fScaleY;

  return CFX_Matrix(fScaleX, 0, 0, fScaleY, fShiftX, fShiftY);
}
|
|
// Computes scale factors (|fa|, |fd|) and offsets (|fe|, |ff|) that fit
// |rcStream|, as positioned by |matrix|, into |rcAnnot|.
//
// The four corners of |rcStream| are transformed by |matrix|; the smallest
// resulting x and y are used as the transformed lower-left corner. When
// either matrix.a or matrix.d is zero, the stream's width and height are
// swapped before the scale factors are computed (presumably to account for
// a 90-degree rotation -- TODO confirm).
void GetOffset(FX_FLOAT& fa,
               FX_FLOAT& fd,
               FX_FLOAT& fe,
               FX_FLOAT& ff,
               CFX_FloatRect rcAnnot,
               CFX_FloatRect rcStream,
               const CFX_Matrix& matrix) {
  const FX_FLOAT fRectWidth = rcStream.right - rcStream.left;
  const FX_FLOAT fRectHeight = rcStream.top - rcStream.bottom;
  const bool bKeepAxes = matrix.a != 0 && matrix.d != 0;
  const FX_FLOAT fStreamWidth = bKeepAxes ? fRectWidth : fRectHeight;
  const FX_FLOAT fStreamHeight = bKeepAxes ? fRectHeight : fRectWidth;

  // Apply |matrix| to a single point.
  auto map_x = [&matrix](FX_FLOAT x, FX_FLOAT y) -> FX_FLOAT {
    return matrix.a * x + matrix.c * y + matrix.e;
  };
  auto map_y = [&matrix](FX_FLOAT x, FX_FLOAT y) -> FX_FLOAT {
    return matrix.b * x + matrix.d * y + matrix.f;
  };

  const FX_FLOAT xLeftBottom = map_x(rcStream.left, rcStream.bottom);
  const FX_FLOAT yLeftBottom = map_y(rcStream.left, rcStream.bottom);
  const FX_FLOAT xLeftTop = map_x(rcStream.left, rcStream.top);
  const FX_FLOAT yLeftTop = map_y(rcStream.left, rcStream.top);
  const FX_FLOAT xRightBottom = map_x(rcStream.right, rcStream.bottom);
  const FX_FLOAT yRightBottom = map_y(rcStream.right, rcStream.bottom);
  const FX_FLOAT xRightTop = map_x(rcStream.right, rcStream.top);
  const FX_FLOAT yRightTop = map_y(rcStream.right, rcStream.top);

  const FX_FLOAT fMinX = std::min(std::min(xLeftBottom, xLeftTop),
                                  std::min(xRightBottom, xRightTop));
  const FX_FLOAT fMinY = std::min(std::min(yLeftBottom, yLeftTop),
                                  std::min(yRightBottom, yRightTop));

  fa = (rcAnnot.right - rcAnnot.left) / fStreamWidth;
  fd = (rcAnnot.top - rcAnnot.bottom) / fStreamHeight;
  fe = rcAnnot.left - fMinX * fa;
  ff = rcAnnot.bottom - fMinY * fd;
}
|
|
DLLEXPORT int STDCALL FPDFPage_Flatten(FPDF_PAGE page, int nFlag) {
|
CPDF_Page* pPage = CPDFPageFromFPDFPage(page);
|
if (!page) {
|
return FLATTEN_FAIL;
|
}
|
|
CPDF_Document* pDocument = pPage->m_pDocument;
|
CPDF_Dictionary* pPageDict = pPage->m_pFormDict;
|
|
if (!pDocument || !pPageDict) {
|
return FLATTEN_FAIL;
|
}
|
|
CPDF_ObjectArray ObjectArray;
|
CPDF_RectArray RectArray;
|
|
int iRet = FLATTEN_FAIL;
|
iRet = ParserAnnots(pDocument, pPageDict, &RectArray, &ObjectArray, nFlag);
|
if (iRet == FLATTEN_NOTHINGTODO || iRet == FLATTEN_FAIL)
|
return iRet;
|
|
CFX_FloatRect rcOriginalCB;
|
CFX_FloatRect rcMerger = CalculateRect(&RectArray);
|
CFX_FloatRect rcOriginalMB = pPageDict->GetRectBy("MediaBox");
|
|
if (pPageDict->KeyExist("CropBox"))
|
rcOriginalMB = pPageDict->GetRectBy("CropBox");
|
|
if (rcOriginalMB.IsEmpty()) {
|
rcOriginalMB = CFX_FloatRect(0.0f, 0.0f, 612.0f, 792.0f);
|
}
|
|
rcMerger.left =
|
rcMerger.left < rcOriginalMB.left ? rcOriginalMB.left : rcMerger.left;
|
rcMerger.right =
|
rcMerger.right > rcOriginalMB.right ? rcOriginalMB.right : rcMerger.right;
|
rcMerger.top =
|
rcMerger.top > rcOriginalMB.top ? rcOriginalMB.top : rcMerger.top;
|
rcMerger.bottom = rcMerger.bottom < rcOriginalMB.bottom ? rcOriginalMB.bottom
|
: rcMerger.bottom;
|
|
if (pPageDict->KeyExist("ArtBox"))
|
rcOriginalCB = pPageDict->GetRectBy("ArtBox");
|
else
|
rcOriginalCB = rcOriginalMB;
|
|
if (!rcOriginalMB.IsEmpty()) {
|
CPDF_Array* pMediaBox = new CPDF_Array();
|
pMediaBox->Add(new CPDF_Number(rcOriginalMB.left));
|
pMediaBox->Add(new CPDF_Number(rcOriginalMB.bottom));
|
pMediaBox->Add(new CPDF_Number(rcOriginalMB.right));
|
pMediaBox->Add(new CPDF_Number(rcOriginalMB.top));
|
pPageDict->SetAt("MediaBox", pMediaBox);
|
}
|
|
if (!rcOriginalCB.IsEmpty()) {
|
CPDF_Array* pCropBox = new CPDF_Array();
|
pCropBox->Add(new CPDF_Number(rcOriginalCB.left));
|
pCropBox->Add(new CPDF_Number(rcOriginalCB.bottom));
|
pCropBox->Add(new CPDF_Number(rcOriginalCB.right));
|
pCropBox->Add(new CPDF_Number(rcOriginalCB.top));
|
pPageDict->SetAt("ArtBox", pCropBox);
|
}
|
|
CPDF_Dictionary* pRes = pPageDict->GetDictBy("Resources");
|
if (!pRes) {
|
pRes = new CPDF_Dictionary;
|
pPageDict->SetAt("Resources", pRes);
|
}
|
|
CPDF_Stream* pNewXObject = new CPDF_Stream(nullptr, 0, new CPDF_Dictionary);
|
uint32_t dwObjNum = pDocument->AddIndirectObject(pNewXObject);
|
CPDF_Dictionary* pPageXObject = pRes->GetDictBy("XObject");
|
if (!pPageXObject) {
|
pPageXObject = new CPDF_Dictionary;
|
pRes->SetAt("XObject", pPageXObject);
|
}
|
|
CFX_ByteString key = "";
|
int nStreams = ObjectArray.GetSize();
|
|
if (nStreams > 0) {
|
for (int iKey = 0; /*iKey < 100*/; iKey++) {
|
char sExtend[5] = {};
|
FXSYS_itoa(iKey, sExtend, 10);
|
key = CFX_ByteString("FFT") + CFX_ByteString(sExtend);
|
if (!pPageXObject->KeyExist(key))
|
break;
|
}
|
}
|
|
SetPageContents(key, pPageDict, pDocument);
|
|
CPDF_Dictionary* pNewXORes = nullptr;
|
|
if (!key.IsEmpty()) {
|
pPageXObject->SetAtReference(key, pDocument, dwObjNum);
|
CPDF_Dictionary* pNewOXbjectDic = pNewXObject->GetDict();
|
pNewXORes = new CPDF_Dictionary;
|
pNewOXbjectDic->SetAt("Resources", pNewXORes);
|
pNewOXbjectDic->SetAtName("Type", "XObject");
|
pNewOXbjectDic->SetAtName("Subtype", "Form");
|
pNewOXbjectDic->SetAtInteger("FormType", 1);
|
pNewOXbjectDic->SetAtName("Name", "FRM");
|
CFX_FloatRect rcBBox = pPageDict->GetRectBy("ArtBox");
|
pNewOXbjectDic->SetAtRect("BBox", rcBBox);
|
}
|
|
for (int i = 0; i < nStreams; i++) {
|
CPDF_Dictionary* pAnnotDic = ObjectArray.GetAt(i);
|
if (!pAnnotDic)
|
continue;
|
|
CFX_FloatRect rcAnnot = pAnnotDic->GetRectBy("Rect");
|
rcAnnot.Normalize();
|
|
CFX_ByteString sAnnotState = pAnnotDic->GetStringBy("AS");
|
CPDF_Dictionary* pAnnotAP = pAnnotDic->GetDictBy("AP");
|
if (!pAnnotAP)
|
continue;
|
|
CPDF_Stream* pAPStream = pAnnotAP->GetStreamBy("N");
|
if (!pAPStream) {
|
CPDF_Dictionary* pAPDic = pAnnotAP->GetDictBy("N");
|
if (!pAPDic)
|
continue;
|
|
if (!sAnnotState.IsEmpty()) {
|
pAPStream = pAPDic->GetStreamBy(sAnnotState);
|
} else {
|
auto it = pAPDic->begin();
|
if (it != pAPDic->end()) {
|
CPDF_Object* pFirstObj = it->second;
|
if (pFirstObj) {
|
if (pFirstObj->IsReference())
|
pFirstObj = pFirstObj->GetDirect();
|
if (!pFirstObj->IsStream())
|
continue;
|
pAPStream = pFirstObj->AsStream();
|
}
|
}
|
}
|
}
|
if (!pAPStream)
|
continue;
|
|
CPDF_Dictionary* pAPDic = pAPStream->GetDict();
|
CFX_Matrix matrix = pAPDic->GetMatrixBy("Matrix");
|
|
CFX_FloatRect rcStream;
|
if (pAPDic->KeyExist("Rect"))
|
rcStream = pAPDic->GetRectBy("Rect");
|
else if (pAPDic->KeyExist("BBox"))
|
rcStream = pAPDic->GetRectBy("BBox");
|
|
if (rcStream.IsEmpty())
|
continue;
|
|
CPDF_Object* pObj = pAPStream;
|
|
if (pObj) {
|
CPDF_Dictionary* pObjDic = pObj->GetDict();
|
if (pObjDic) {
|
pObjDic->SetAtName("Type", "XObject");
|
pObjDic->SetAtName("Subtype", "Form");
|
}
|
}
|
|
CPDF_Dictionary* pXObject = pNewXORes->GetDictBy("XObject");
|
if (!pXObject) {
|
pXObject = new CPDF_Dictionary;
|
pNewXORes->SetAt("XObject", pXObject);
|
}
|
|
CFX_ByteString sFormName;
|
sFormName.Format("F%d", i);
|
uint32_t dwStreamObjNum = pDocument->AddIndirectObject(pObj);
|
pXObject->SetAtReference(sFormName, pDocument, dwStreamObjNum);
|
|
CPDF_StreamAcc acc;
|
acc.LoadAllData(pNewXObject);
|
|
const uint8_t* pData = acc.GetData();
|
CFX_ByteString sStream(pData, acc.GetSize());
|
CFX_ByteString sTemp;
|
|
if (matrix.IsIdentity()) {
|
matrix.a = 1.0f;
|
matrix.b = 0.0f;
|
matrix.c = 0.0f;
|
matrix.d = 1.0f;
|
matrix.e = 0.0f;
|
matrix.f = 0.0f;
|
}
|
|
CFX_Matrix m = GetMatrix(rcAnnot, rcStream, matrix);
|
sTemp.Format("q %f 0 0 %f %f %f cm /%s Do Q\n", m.a, m.d, m.e, m.f,
|
sFormName.c_str());
|
sStream += sTemp;
|
pNewXObject->SetData(sStream.raw_str(), sStream.GetLength(), FALSE, FALSE);
|
}
|
pPageDict->RemoveAt("Annots");
|
|
ObjectArray.RemoveAll();
|
RectArray.RemoveAll();
|
|
return FLATTEN_SUCCESS;
|
}
|