1

我们有大量的 pdf 文档,每个文档都有打开其他 pdf 文档的链接。单击链接时,它将打开同一文件系统中的另一个 pdf 文档。问题是我们需要更改某些目录的名称,这将需要更改指向该目录中 pdf 文档的所有链接。我们会手动执行此操作,但实际上有数千个链接需要更改。

我们尝试使用 iTextSharp 和 PdfSharp 来更改链接,但很难找到正确的对象。下面显示了带有两个链接的示例 pdf 文件的内容。您可以看到对象 12 是一个引用对象 21 的链接,对象 21 使用对象 20 中的引用打开一个新窗口。对象 20,类型为 Filespec 包含链接的 pdf 的路径,Folder-Name/A.pdf。第二个链接遵循相同的模式,但使用对象 16、23 和 22。

12 0 obj<</Type/Annot/P 5 0 R/F 4/C[1 0 0]/Subtype/Link/A 21 0 R/M(D:20130710103035-07'00')/Border[0 0 0]/Rect[144 612 216 630]/NM(QVDTKWKAZGVAAGHJ)/BS 13 0 R>>
endobj
13 0 obj<</W 0/S/S/Type/Border>>
endobj
16 0 obj<</Type/Annot/P 5 0 R/F 4/C[1 0 0]/Subtype/Link/A 23 0 R/M(D:20130710103040-07'00')/Border[0 0 0]/Rect[126 594 216 612]/NM(WFAYQFGTTIESQOKW)/BS 17 0 R>>
endobj
17 0 obj<</W 0/S/S/Type/Border>>
endobj
20 0 obj<</Type/Filespec/F(Folder-Name/A.pdf)/UF(Folder-Name/A.pdf)/Desc()>>
endobj
21 0 obj<</S/GoToR/D[0/Fit]/NewWindow true/F 20 0 R>>
endobj
22 0 obj<</Type/Filespec/F(Folder-Name-2/B.pdf)/UF(Folder-Name-2/B.pdf)/Desc()>>
endobj
23 0 obj<</S/GoToR/D[0/Fit]/NewWindow true/F 22 0 R>>
endobj

我们如何使用 iTextSharp 或 PdfSharp 将“Folder-Name”和“Folder-Name-2”更改为其他任意文件夹路径?

4

1 回答 1

2

万一有人关心,我可以在上面的第一条评论中使用 Chris Haas 链接的代码,但对其进行了如下修改:

foreach (FileInfo file in files)
{                    

    PdfReader reader = default(PdfReader);

    bool linkReplaced = false;

    //Setup some variables to be used later
    reader = new PdfReader(file.FullName);

    int pageCount = reader.NumberOfPages;
    PdfDictionary pageDictionary = default(PdfDictionary);
    PdfArray annots = default(PdfArray);

    //Loop through each page
    for (int i = 1; i <= pageCount; i++)
    {
        //Get the current page
        pageDictionary = reader.GetPageN(i);

        //Get all of the annotations for the current page
        annots = pageDictionary.GetAsArray(PdfName.ANNOTS);

        //Make sure we have something
        if ((annots == null) || (annots.Length == 0))
            continue;

        foreach (PdfObject A in annots.ArrayList)
        {
            //Convert the itext-specific object as a generic PDF object
            PdfDictionary AnnotationDictionary = (PdfDictionary)PdfReader.GetPdfObject(A);

            //Make sure this annotation has a link
            if (!AnnotationDictionary.Get(PdfName.SUBTYPE).Equals(PdfName.LINK))
                continue;

            //Make sure this annotation has an ACTION
            if (AnnotationDictionary.Get(PdfName.A) == null)
                continue;

            string fValue = string.Empty;
            string ufValue = string.Empty;
            string uriValue = string.Empty;

            PdfObject a = AnnotationDictionary.Get(PdfName.A);
            if (a.IsDictionary())
            {
                //Get the ACTION for the current annotation
                PdfDictionary AnnotationAction = (PdfDictionary)a;

                //Test if it is a URI action
                if (AnnotationAction.Get(PdfName.S).Equals(PdfName.URI))
                {
                    uriValue = AnnotationAction.Get(PdfName.URI).ToString();

                    if ((uriValue.IndexOf(findValue, StringComparison.OrdinalIgnoreCase) > -1))
                    {
                        string uriValueReplace = Replace(uriValue, findValue, replaceValue, StringComparison.OrdinalIgnoreCase);

                        //Change the URI to something else
                        AnnotationAction.Put(PdfName.URI, new PdfString(uriValueReplace));                                          
                        linkReplaced = true;
                    }
                }                                               
            }
            else if (a.IsIndirect())
            {
                // Get the indirect reference
                PdfIndirectReference indirectRef = (PdfIndirectReference)a;

                // Get the GoToR type object which is at the document level
                PdfDictionary goToR = (PdfDictionary)reader.GetPdfObject(indirectRef.Number);

                // Get the FileSpec object whic his at the document lelvel
                PdfObject f = goToR.Get(PdfName.F);

                if (f == null || !f.IsIndirect())
                    continue;

                PdfObject fileSpecObject = reader.GetPdfObject(((PdfIndirectReference)goToR.Get(PdfName.F)).Number);

                if (!fileSpecObject.IsDictionary())
                    continue;

                PdfDictionary fileSpec = (PdfDictionary)fileSpecObject;

                fValue = fileSpec.Get(PdfName.F).ToString();
                ufValue = fileSpec.Get(PdfName.UF).ToString();

                if ((fValue.IndexOf(findValue, StringComparison.OrdinalIgnoreCase) > -1) || (ufValue.IndexOf(findValue, StringComparison.OrdinalIgnoreCase) > -1))
                {
                    string fValueReplace = Replace(fValue, findValue, replaceValue, StringComparison.OrdinalIgnoreCase);// fValue.Replace(findValue, replaceValue);
                    string ufValueReplace = Replace(fValue, findValue, replaceValue, StringComparison.OrdinalIgnoreCase);// ufValue.Replace(findValue, replaceValue);

                    // Update the references to the file
                    fileSpec.Put(PdfName.F, new PdfString(fValueReplace));
                    fileSpec.Put(PdfName.UF, new PdfString(ufValueReplace));                                    

                    linkReplaced = true;
                }
            }                                
        }
    }
}   
于 2013-07-23T13:56:11.837 回答