Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
/** Command-line tool that downloads a web page and reports the `href` targets found in it.
  *
  * The program asks for a URL on standard input, fetches the page, prints every
  * extracted link target on its own line and finally prints how many were found.
  */
object htmlLinkCounter {
  import scala.io.Source
  import scala.io.Codec
  import java.nio.charset.MalformedInputException
  import scala.util.matching.Regex

  /** Matches an opening tag that carries a quoted `href` attribute.
    *
    * Group 1 is the opening quote character (re-used as a back-reference so the
    * value ends at the same kind of quote); group 2 is the attribute value.
    * `[^>]*?` keeps the match inside a single tag, and the `\s` before `href`
    * prevents attributes such as `data-href` from being picked up.
    */
  private val LinkPattern: Regex = """(?i)<[^>]*?\shref\s*=\s*(["'])(.*?)\1""".r

  /** Downloads the document at `url` and returns its body as a string.
    *
    * The body is decoded as UTF-8 first; if that raises a
    * `MalformedInputException` the download is repeated with ISO-8859-1.
    * The underlying `Source` is closed in both cases.
    *
    * @param url address of the document to download
    * @return the complete document text
    */
  def readFromURL(url: String): String = {
    def fetch(codec: Codec): String = {
      val source = Source.fromURL(url)(codec)
      try source.mkString
      finally source.close()
    }

    try fetch(Codec.UTF8)
    catch {
      case _: MalformedInputException => fetch(Codec.ISO8859)
    }
  }

  /** Extracts the values of all quoted `href` attributes in `content`.
    *
    * @param content HTML text to scan
    * @return the `href` values in document order; empty when none are present
    */
  def extractLinks(content: String): List[String] =
    LinkPattern.findAllMatchIn(content).map(_.group(2)).toList

  /** Entry point: prompts for a URL, then prints each link and the total count. */
  def main(args: Array[String]): Unit = {
    // readLine yields null at end of input, so wrap it before use.
    val input = Option(scala.io.StdIn.readLine("Enter your URL(e.g. http://orf.at):"))
      .map(_.trim)
      .filter(_.nonEmpty)

    input match {
      case Some(url) =>
        val links = extractLinks(readFromURL(url))
        links.foreach(println)
        println(s"There are ${links.size} links on $url!")
      case None =>
        println("No URL entered.")
    }
  }
}
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement