我使用 Apache PDFBox 1.5 从 PDF 中提取文本。这是我正在使用的代码。它对某些 PDF 似乎可以正常工作,但在处理其中一个 PDF 时失败,并抛出以下错误。如果有人遇到过这样的问题,请告诉我解决方法。
java.lang.IndexOutOfBoundsException: Index: 2, Size: 2
at java.util.SubList.rangeCheck(AbstractList.java:864)
at java.util.SubList.get(AbstractList.java:737)
at org.apache.fontbox.cff.CharStringConverter.drawCurve(CharStringConverter.java:415)
at org.apache.fontbox.cff.CharStringConverter.handleType2Command(CharStringConverter.java:277)
at org.apache.fontbox.cff.CharStringConverter.handleCommand(CharStringConverter.java:81)
at org.apache.fontbox.cff.CharStringHandler.handleSequence(CharStringHandler.java:53)
at org.apache.fontbox.cff.CharStringConverter.handleType2Command(CharStringConverter.java:307)
at org.apache.fontbox.cff.CharStringConverter.handleCommand(CharStringConverter.java:81)
at org.apache.fontbox.cff.CharStringHandler.handleSequence(CharStringHandler.java:53)
at org.apache.fontbox.cff.CharStringConverter.convert(CharStringConverter.java:64)
at org.apache.fontbox.cff.CFFFont$Mapping.toType1Sequence(CFFFont.java:374)
at org.apache.fontbox.cff.AFMFormatter.renderFont(AFMFormatter.java:126)
at org.apache.fontbox.cff.AFMFormatter.printFontMetrics(AFMFormatter.java:64)
at org.apache.fontbox.cff.AFMFormatter.printFont(AFMFormatter.java:57)
at org.apache.fontbox.cff.AFMFormatter.format(AFMFormatter.java:50)