Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
// Scrapes the dictionary pages under URL_PREFIX in three steps:
//   1. read the letter index (litery.html) and pick out the per-letter pages,
//   2. collect every definition link found on those letter pages,
//   3. download the linked pages in parallel and extract a pair of strings
//      from each one.
// The value of the script is the list of [<dt> text, <dd> text] pairs
// (presumably [term, definition] -- inferred from the dt/dd markup).

// Script-binding variables, deliberately left undeclared as in the original.
URL_PREFIX = 'http://poprzednia.univ.gda.pl/slang/hasla'
NTHREADS = 10
// Charset used for every download. The original decoded only the definition
// pages with it and read the index pages with the platform default, which made
// the extracted links depend on the machine running the script.
// NOTE(review): assumes the index pages share the encoding of the definition
// pages -- confirm against the site.
PAGE_CHARSET = 'iso-8859-2'

// Names of the per-letter pages referenced by the index ("a.html", "b.html", ...).
// unique() prevents fetching a letter page twice when the index links to it
// more than once.
def indexHtml = "$URL_PREFIX/litery.html".toURL().getText(PAGE_CHARSET)
def letterPages = indexHtml.findAll(/[a-z]\.html/).unique()

// Flatten the links of all letter pages into a single list. collectMany yields
// an empty list when there are no letter pages, whereas sum {} would yield null
// and make the parallel step below fail with a NullPointerException.
def definitionLinks = letterPages.collectMany { letterPage ->
    def letterHtml = "$URL_PREFIX/$letterPage".toURL().getText(PAGE_CHARSET)
    // Each match is [whole match, href]; keep only the captured href.
    (letterHtml =~ /<a href="([^"]+)" target="znaczenie".*/)*.getAt(1)
}

// Download the linked pages on a pool of NTHREADS workers.
groovyx.gpars.GParsPool.withPool(NTHREADS) {
    definitionLinks.collectParallel { link ->
        def text = "$URL_PREFIX/$link".toURL().getText(PAGE_CHARSET)
        // First element: the text directly after the first <dt>, up to the next tag.
        // Second element: the text preceding </dd> on the same line ('.' does not
        // cross line breaks). Either element is null when its pattern is absent.
        return [text.find(/(?<=<dt>)[^<]+/), text.find(/.+(?=<\/dd>)/)]
    }
}
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement