我在使用 PDF Clown 时经常遇到问题:有少数 PDF 文件不是英文的,其中的字体无法识别,处理时会抛出异常。请查看 PDF 路径和代码路径。CompositeFont.java 和 SimpleFont.java 中的 loadEncoding 方法都会失败。是否需要使用某个特定版本的 jar 才能解决此问题?请提供您的建议,以便支持此类 PDF 文件。
java.lang.NullPointerException
at org.pdfclown.documents.contents.fonts.CompositeFont.loadEncoding(CompositeFont.java:178)
at org.pdfclown.documents.contents.fonts.CompositeFont.onLoad(CompositeFont.java:202)
at org.pdfclown.documents.contents.fonts.Font.load(Font.java:878)
at org.pdfclown.documents.contents.fonts.Font.<init>(Font.java:368)
at org.pdfclown.documents.contents.fonts.CompositeFont.<init>(CompositeFont.java:114)
at org.pdfclown.documents.contents.fonts.Type0Font.<init>(Type0Font.java:62)
at org.pdfclown.documents.contents.fonts.Font.wrap(Font.java:268)
at org.pdfclown.documents.contents.FontResources.wrap(FontResources.java:72)
at org.pdfclown.documents.contents.FontResources.wrap(FontResources.java:1)
at org.pdfclown.documents.contents.ResourceItems.get(ResourceItems.java:119)
at org.pdfclown.documents.contents.objects.SetFont.getResource(SetFont.java:119)
at org.pdfclown.documents.contents.objects.SetFont.getFont(SetFont.java:83)
at org.pdfclown.documents.contents.objects.SetFont.scan(SetFont.java:97)
at org.pdfclown.documents.contents.ContentScanner.moveNext(ContentScanner.java:1360)
at org.pdfclown.documents.contents.ContentScanner$TextWrapper.extract(ContentScanner.java:819)
at org.pdfclown.documents.contents.ContentScanner$TextWrapper.<init>(ContentScanner.java:771)
at org.pdfclown.documents.contents.ContentScanner$TextWrapper.<init>(ContentScanner.java:764)
at org.pdfclown.documents.contents.ContentScanner$GraphicsObjectWrapper.get(ContentScanner.java:684)
at org.pdfclown.documents.contents.ContentScanner$GraphicsObjectWrapper.access$0(ContentScanner.java:676)
at org.pdfclown.documents.contents.ContentScanner.getCurrentWrapper(ContentScanner.java:1184)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:636)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:299)
at pdfclown2.highlight(pdfclown2.java:89)
at pdfclown2.main(pdfclown2.java:48)
*****************************其他pdf问题****************** ******************************
java.lang.NullPointerException
at org.pdfclown.documents.contents.fonts.SimpleFont.loadEncoding(SimpleFont.java:150)
at org.pdfclown.documents.contents.fonts.SimpleFont.onLoad(SimpleFont.java:170)
at org.pdfclown.documents.contents.fonts.Font.load(Font.java:878)
at org.pdfclown.documents.contents.fonts.Font.<init>(Font.java:368)
at org.pdfclown.documents.contents.fonts.SimpleFont.<init>(SimpleFont.java:65)
at org.pdfclown.documents.contents.fonts.TrueTypeFont.<init>(TrueTypeFont.java:47)
at org.pdfclown.documents.contents.fonts.Font.wrap(Font.java:262)
at org.pdfclown.documents.contents.FontResources.wrap(FontResources.java:72)
at org.pdfclown.documents.contents.FontResources.wrap(FontResources.java:1)
at org.pdfclown.documents.contents.ResourceItems.get(ResourceItems.java:119)
at org.pdfclown.documents.contents.objects.SetFont.getResource(SetFont.java:119)
at org.pdfclown.documents.contents.objects.SetFont.getFont(SetFont.java:83)
at org.pdfclown.documents.contents.objects.SetFont.scan(SetFont.java:97)
at org.pdfclown.documents.contents.ContentScanner.moveNext(ContentScanner.java:1360)
at org.pdfclown.documents.contents.ContentScanner$TextWrapper.extract(ContentScanner.java:819)
at org.pdfclown.documents.contents.ContentScanner$TextWrapper.<init>(ContentScanner.java:771)
at org.pdfclown.documents.contents.ContentScanner$TextWrapper.<init>(ContentScanner.java:764)
at org.pdfclown.documents.contents.ContentScanner$GraphicsObjectWrapper.get(ContentScanner.java:684)
at org.pdfclown.documents.contents.ContentScanner$GraphicsObjectWrapper.access$0(ContentScanner.java:676)
at org.pdfclown.documents.contents.ContentScanner.getCurrentWrapper(ContentScanner.java:1184)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:636)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:645)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:653)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:299)
at pdfclown2.highlight(pdfclown2.java:89)
at pdfclown2.main(pdfclown2.java:48)
************************************另一个问题****************** ***********************
java.lang.RuntimeException: Odd number of characters.
at org.pdfclown.util.ConvertUtils.hexToByteArray(ConvertUtils.java:106)
at org.pdfclown.objects.PdfString.setValue(PdfString.java:287)
at org.pdfclown.objects.PdfString.<init>(PdfString.java:126)
at org.pdfclown.objects.PdfByteString.<init>(PdfByteString.java:58)
at org.pdfclown.documents.contents.tokens.ContentParser.parsePdfObject(ContentParser.java:182)
at org.pdfclown.documents.contents.tokens.ContentParser.parseOperation(ContentParser.java:164)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObject(ContentParser.java:98)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObjects(ContentParser.java:134)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObject(ContentParser.java:112)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObjects(ContentParser.java:134)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObject(ContentParser.java:112)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObjects(ContentParser.java:134)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObject(ContentParser.java:112)
at org.pdfclown.documents.contents.tokens.ContentParser.parseContentObjects(ContentParser.java:134)
at org.pdfclown.documents.contents.Contents.load(Contents.java:598)
at org.pdfclown.documents.contents.Contents.<init>(Contents.java:372)
at org.pdfclown.documents.contents.Contents.wrap(Contents.java:351)
at org.pdfclown.documents.Page.getContents(Page.java:585)
at org.pdfclown.documents.contents.ContentScanner.<init>(ContentScanner.java:1056)
at org.pdfclown.tools.TextExtractor.extract(TextExtractor.java:300)
at pdfclown2.highlight(pdfclown2.java:3124)
at pdfclown2.main(pdfclown2.java:50)