Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Count how often each series name occurs in an HTML list.
#
# Usage: main [INPUT_HTML [CLEANED_OUTPUT]]
#   INPUT_HTML      HTML fragment to read       (default: Desktop/list.txt)
#   CLEANED_OUTPUT  intermediate cleaned titles (default: Desktop/templijst.txt)
#
# Steps:
#   1. keep only list-item lines, strip the markup, normalise conjunctions
#      and accented vowels, lower-case everything -> CLEANED_OUTPUT
#   2. collapse every line that mentions a known series to one canonical
#      name, then print "count name" pairs on stdout.

# Reads HTML on stdin; writes one cleaned, lower-cased title per line.
extract_titles() {
  local awk_cmd=awk
  # The original pipeline used gawk; keep using it when installed and fall
  # back to the system awk otherwise.
  if command -v gawk >/dev/null 2>&1; then
    awk_cmd=gawk
  fi

  # Tag patterns are written literally: in GNU sed "\<" and "\>" are
  # word-boundary anchors, so 's/\<strong\>//' would delete the *word*
  # "strong" instead of the tag.
  #
  # Accented vowels are mapped with alternations instead of 'y/.../.../'
  # because 'y' with multibyte characters aborts in a C/POSIX locale.
  # Upper-case variants map straight to lower case, as the text is
  # lower-cased immediately afterwards anyway.
  grep -e '<li>' -e '</li>' \
    | grep -v -e '</div>' -e 'href=' \
    | sed -E \
      -e 's#<li>##g' \
      -e 's#</li>##g' \
      -e 's#<strong>##g' \
      -e 's#</strong>##g' \
      -e 's#<p>##g' \
      -e 's#</p>##g' \
      -e 's#<br>##g' \
      -e 's#<em>##g' \
      -e 's#</em>##g' \
      -e 's/ en / \& /' \
      -e 's/ and / \& /' \
      -e 's/ et / \& /' \
      -e 's/&amp;/\&/g' \
      -e 's/&;/\&/' \
      -e 's/[[:space:]]*$//' \
      -e 's/ā|á|ǎ|à|Ā|Á|Ǎ|À/a/g' \
      -e 's/ē|é|ë|ě|è|Ē|É|Ě|È/e/g' \
      -e 's/ī|í|ǐ|ì|Ī|Í|Ǐ|Ì/i/g' \
      -e 's/ō|ó|ǒ|ò|Ō|Ó|Ǒ|Ò/o/g' \
      -e 's/ū|ú|ǔ|ù|Ū|Ú|Ǔ|Ù/u/g' \
      -e 's/ǖ|ǘ|ǚ|ǜ|Ǖ|Ǘ|Ǚ|Ǜ/ü/g' \
    | "$awk_cmd" '{ print tolower($0) }'
  # NOTE(review): the 's/&amp;/&/' rule is an addition. The original only had
  # 's/&;/&/', which looks like '&amp;' after the paste was HTML-decoded;
  # both are kept. Confirm against the real input.
}

# Reads cleaned titles on stdin; replaces every line that mentions a known
# series (in any spelling/translation listed here) by its canonical name.
# Rules are applied top to bottom, so order matters.
canonicalize_series() {
  sed \
    -e 's/.*suske.*/suske \& wiske/' \
    -e 's/.*asterix.*/asterix \& obelix/' \
    -e 's/.*michel va.*/michel vaillant/' \
    -e 's/.*robin ho.*/robin hood/' \
    -e 's/.*robbe.*/spirou/' \
    -e 's/.*spirou.*/spirou/' \
    -e 's/.*vrouwen in.*/vrouwen in het wit/' \
    -e 's/.*tintin.*/tintin/' \
    -e 's/.*kuifje.*/tintin/' \
    -e 's/.*johan &.*/johan \& pierewiet/' \
    -e 's/.*jommeke.*/jommeke/' \
    -e 's/.*guus.*/guust flater/' \
    -e 's/.*gaston.*/guust flater/' \
    -e 's/.*tuniques.*/blauwbloezen/' \
    -e 's/.*blauwbloezen.*/blauwbloezen/' \
    -e 's/.*kampioenen.*/f.c. de kampioenen/' \
    -e 's/.*schtroumpf.*/smurfen/' \
    -e 's/.*mensjes.*/mini-mensjes/' \
    -e 's/.*raf zerk.*/g.raf zerk/' \
    -e 's/.*boule.*/bollie \& billie/' \
    -e 's/.*bollie.*/bollie \& billie/' \
    -e 's/.*bakeland.*/bakelandt/' \
    -e 's/.*astrix.*/asterix \& obelix/' \
    -e 's/.*212.*/agent 212/' \
    -e 's/.*kiekeboe.*/kiekeboe/' \
    -e 's/.*ping.*/pol, pel \& pingo/'
  # The "astrix" misspelling maps to the same canonical name as "asterix"
  # above; otherwise one series would be counted under two names.
}

# Entry point: runs both stages and prints the per-name counts.
# Returns non-zero when the input is unreadable or the cleaned file cannot
# be written.
main() {
  local input=${1:-Desktop/list.txt}
  local cleaned=${2:-Desktop/templijst.txt}

  if [[ ! -r "$input" ]]; then
    printf 'error: cannot read input file: %s\n' "$input" >&2
    return 1
  fi

  extract_titles <"$input" >"$cleaned" || return

  # 'sort -n' is kept from the original: lines that compare equal numerically
  # are ordered by a whole-line comparison, so identical names still end up
  # adjacent for 'uniq -c'.
  canonicalize_series <"$cleaned" \
    | sort -n \
    | uniq -c
}

main "$@"
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement