Beruflich Dokumente
Kultur Dokumente
public class ConvertPDFToTEXT { public static void main(String[] args) throws IOException { try { Document document = new Document(); document.open(); PdfReader reader = new PdfReader("C:\\resume.pdf"); PdfDictionary dictionary = reader.getPageN(1); PRIndirectReference reference = (PRIndirectReference) dictionary.get(PdfName.CONTENTS); PRStream stream = (PRStream) PdfReader.getPdfObject(reference); byte[] bytes = PdfReader.getStreamBytes(stream); PRTokeniser tokenizer = new PRTokeniser(bytes); FileOutputStream fos=new FileOutputStream("pdf.txt"); StringBuffer buffer = new StringBuffer(); while (tokenizer.nextToken()) { if (tokenizer.getTokenType() == PRTokeniser.TK_STRING) { buffer.append(tokenizer.getStringValue()); }
} String test=buffer.toString(); StringReader stReader = new StringReader(test); int t; while((t=stReader.read())>0) fos.write(t); document.add(new Paragraph("..")); document.close(); } catch (Exception e) {} } }