Advertisement
Guest User

Untitled

a guest
Oct 1st, 2016
219
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Groovy 0.48 KB | None | 0 0
  // Scrapes every entry page linked from the letter index pages under URL_PREFIX
  // and evaluates to a list of [term, definition] pairs (the script's result).
  //
  // Requires GPars (groovyx.gpars) on the classpath.

  // Base URL under which the index page, the letter pages and the entry pages live.
  URL_PREFIX='http://poprzednia.univ.gda.pl/slang/hasla'
  // Size of the GPars pool used to download entry pages concurrently.
  NTHREADS=10

  // Names of the per-letter index pages ("a.html", "b.html", ...) referenced by litery.html.
  def letterPages = "$URL_PREFIX/litery.html".toURL().text.findAll(/[a-z]\.html/)

  // Relative links to the individual entry pages: every href whose anchor targets
  // the "znaczenie" frame on a letter page.
  // collectMany flattens the per-page lists and yields an empty list when there are
  // no letter pages; summing the lists would yield null in that case and break the
  // parallel step below.
  // NOTE(review): the index pages are decoded with the platform default charset while
  // the entry pages below are read as ISO-8859-2 -- confirm whether the index pages
  // need the same explicit encoding.
  def definitionLinks = letterPages.collectMany { letterPage ->
      ("$URL_PREFIX/$letterPage".toURL().text =~ /<a href="([^"]+)" target="znaczenie".*/)*.getAt(1)
  }

  groovyx.gpars.GParsPool.withPool(NTHREADS) {
      // Download the entry pages in parallel; each result is a two-element list:
      //   [0] the text immediately following the first <dt> tag,
      //   [1] the text preceding the first </dd> on its line.
      // Either element is null when the page does not contain the expected markup.
      definitionLinks.collectParallel { link ->
          def page = "$URL_PREFIX/$link".toURL().getText('iso-8859-2')
          [page.find(/(?<=<dt>)[^<]+/), page.find(/.+(?=<\/dd>)/)]
      }
  }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement