Advertisement
Guest User

2chproxy-readcgi7-2.patch

a guest
May 3rd, 2017
503
0
Never
Not a member of Pastebin yet? Sign up — it unlocks many cool features!
Diff 1.74 KB | None | 0 0
  1. --- 2chproxy.pl.org 2017-04-23 18:41:00.093118359 +0900
  2. +++ 2chproxy.pl 2017-05-04 03:08:15.969105825 +0900
  3. @@ -102,7 +102,7 @@
  4.    RESPONSE_REGEX => '<dt>(\d+)\s[^<]*<(?:a href="mailto:([^"]+)"|font[^>]*)><b>(.*?)</b></(?:a|font)>.((?:[^<]+?)(?:\s*<a href="?http[^">]*"?[^>]*>[^<]*</a>)?(?:\s*(?:[^<]+?(?:(?:<\d+>)+[^<]*)?))?)?\s*(?:<a\s[^>]*be\(([^)]*)\)[^>]*>\?([^<]+)</a>)?<dd>([^\n]+)',
  5.    RESPONSE_REGEX2 => '<div class="number">(\d+)[^>]*</div><div class="name"><b>(?:<a href="mailto:([^"]+)">(.*?)</a>|(.*?))</b></div><div class="date">([^<]+)</div>(?:<div class="be\s[^"]+"><a href="http://be.2ch.net/user/(\d+)"[^>]*>\?([^<]+)</a></div>)?<div class="message">(.*?)</div>',
  6.    RESPONSE_REGEX3 => '<span class="number">(\d+)[^>]*</span><span class="name"><b>(?:<a href="mailto:([^"]+)">(.*?)</a>|(.*?))</b></span><span class="date">([^<]+)</span>(?:<span class="be\s[^"]+"><a href="http://be.2ch.net/user/(\d+)"[^>]*>\?([^<]+)</a></span>)?</dt><dd class="thread_in">(.*?)</dd>',
  7. -  RESPONSE_REGEX4 => '<span class="number">(\d+)[^>]*</span><span class="name"><b>(?:<a href="mailto:([^"]+)">(.*?)</a>|(.*?))</b></span><span class="date">([^<]+)</span>(?:<span class="be\s[^"]+"><a href="http://be.2ch.net/user/(\d+)"[^>]*>\?([^<]+)</a></span>)?</div><div class="message"><span class="escaped">(.*?)</span></div>',
  8. +  RESPONSE_REGEX4 => '<span class="number">(\d+)[^>]*</span><span class="name"><b>(?:<a href="mailto:([^"]+)">(.*?)</a>|(.*?))</b></span><span class="date">([^<]+)</span>(?:<span class="uid">[^<]*</span>)?(?:<span class="be\s[^"]+"><a href="http://be.2ch.net/user/(\d+)"[^>]*>\?([^<]+)</a></span>)?</div><div class="message"><span class="escaped">(.*?)</span></div>',
  9.    #WEBスクレイピングの細かい部分の正規表現は下の方
  10.  };
Advertisement
Add Comment
Please sign in to add a comment.
Advertisement