Guest User

Untitled

a guest
Feb 20th, 2018
76
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.59 KB | None | 0 0
  1. String text = new PDFTextStripper().getText(PDDocument.load(content));
  2.  
  3. import ammonite.ops._
  4. import org.apache.pdfbox.pdmodel.PDDocument
  5. import org.apache.pdfbox.text.PDFTextStripper
  6.  
  // One PDFTextStripper per worker thread of the parallel collection.
  // The ThreadLocal must live OUTSIDE the loop body: when it is created inside
  // the closure, every iteration gets its own fresh ThreadLocal, so
  // `initialValue` runs once per file and no stripper is ever reused.
  // NOTE(review): this relies on a PDFTextStripper being reusable across
  // documents as long as it is confined to a single thread — confirm against
  // the PDFBox version in use.
  val pdfTextStripper = new java.lang.ThreadLocal[PDFTextStripper] {
    override def initialValue: PDFTextStripper = {
      // The loop index is not in scope here any more; log the thread instead,
      // which is what actually identifies a stripper instance.
      println(s"new PDFTextStripper. thread=${Thread.currentThread.getName}")
      new PDFTextStripper
    }
  }

  // Reads /data/file_0.pdf .. /data/file_99.pdf in parallel and prints the
  // extracted text of each one. Output order across files is not deterministic.
  (0 until 100).par.foreach { i =>
    println(s"#$i. START.")
    val content = read.bytes! Path(FilePath(s"/data/file_$i.pdf"), pwd)
    val doc = PDDocument.load(content)
    // PDDocument is Closeable; close it even if text extraction throws so that
    // 100 documents' worth of buffers are not left for the GC/finalizers.
    try println(pdfTextStripper.get.getText(doc))
    finally doc.close()
  }
Add Comment
Please, Sign In to add comment