Advertisement
Guest User

Untitled

a guest
Jul 23rd, 2016
68
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 9.51 KB | None | 0 0
  1. <pre style='color:#000000;background:#ffffff;'><span style='color:#800000; font-weight:bold; '>def</span> separateParaghraps<span style='color:#808030; '>(</span>txt<span style='color:#808030; '>,</span> forbidden<span style='color:#808030; '>)</span><span style='color:#808030; '>:</span>
  2. sizeof_chars <span style='color:#808030; '>=</span> <span style='color:#400000; '>len</span><span style='color:#808030; '>(</span>forbidden<span style='color:#808030; '>)</span> <span style='color:#44aadd; '>-</span> <span style='color:#008c00; '>1</span>
  3. <span style='color:#800000; font-weight:bold; '>for</span> e <span style='color:#800000; font-weight:bold; '>in</span> <span style='color:#400000; '>range</span><span style='color:#808030; '>(</span><span style='color:#008c00; '>0</span><span style='color:#808030; '>,</span> sizeof_chars<span style='color:#808030; '>)</span><span style='color:#808030; '>:</span>
  4. txt <span style='color:#808030; '>=</span> txt<span style='color:#808030; '>.</span>replace<span style='color:#808030; '>(</span>forbidden<span style='color:#808030; '>[</span>e<span style='color:#808030; '>]</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" &lt;/s></span><span style='color:#0f69ff; '>\n</span><span style='color:#0000e6; '>&lt;s> "</span><span style='color:#808030; '>)</span> <span style='color:#696969; '># Replaces given set of char with end of sentence punctuations,</span>
  5. <span style='color:#800000; font-weight:bold; '>return</span> txt <span style='color:#696969; '># puts a &lt;/s> , skips a line then puts a &lt;s></span>
  6.  
  7.  
  8. <span style='color:#800000; font-weight:bold; '>def</span> replaceNumbers<span style='color:#808030; '>(</span>txt<span style='color:#808030; '>,</span> forbidden<span style='color:#808030; '>,</span> allowed<span style='color:#808030; '>)</span><span style='color:#808030; '>:</span>
  9. sizeof_chars <span style='color:#808030; '>=</span> <span style='color:#400000; '>len</span><span style='color:#808030; '>(</span>forbidden<span style='color:#808030; '>)</span> <span style='color:#44aadd; '>-</span> <span style='color:#008c00; '>1</span>
  10. <span style='color:#800000; font-weight:bold; '>for</span> e <span style='color:#800000; font-weight:bold; '>in</span> <span style='color:#400000; '>range</span><span style='color:#808030; '>(</span><span style='color:#008c00; '>0</span><span style='color:#808030; '>,</span> sizeof_chars<span style='color:#808030; '>)</span><span style='color:#808030; '>:</span>
  11. txt <span style='color:#808030; '>=</span> txt<span style='color:#808030; '>.</span>replace<span style='color:#808030; '>(</span>forbidden<span style='color:#808030; '>[</span>e<span style='color:#808030; '>]</span><span style='color:#808030; '>,</span> allowed<span style='color:#808030; '>[</span>e<span style='color:#808030; '>]</span><span style='color:#808030; '>)</span> <span style='color:#696969; '># Replaces the numerical formatted numbers into the letters</span>
  12. <span style='color:#800000; font-weight:bold; '>return</span> txt
  13.  
  14.  
  15. <span style='color:#800000; font-weight:bold; '>def</span> replacePunctuation<span style='color:#808030; '>(</span>txt<span style='color:#808030; '>,</span> forbidden<span style='color:#808030; '>)</span><span style='color:#808030; '>:</span>
  16. sizeof_chars <span style='color:#808030; '>=</span> <span style='color:#400000; '>len</span><span style='color:#808030; '>(</span>forbidden<span style='color:#808030; '>)</span> <span style='color:#44aadd; '>-</span> <span style='color:#008c00; '>1</span>
  17. <span style='color:#800000; font-weight:bold; '>for</span> e <span style='color:#800000; font-weight:bold; '>in</span> <span style='color:#400000; '>range</span><span style='color:#808030; '>(</span><span style='color:#008c00; '>0</span><span style='color:#808030; '>,</span> sizeof_chars<span style='color:#808030; '>)</span><span style='color:#808030; '>:</span>
  18. txt <span style='color:#808030; '>=</span> txt<span style='color:#808030; '>.</span>replace<span style='color:#808030; '>(</span>forbidden<span style='color:#808030; '>[</span>e<span style='color:#808030; '>]</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>""</span><span style='color:#808030; '>)</span> <span style='color:#696969; '># Deletes given set of char then puts a ""</span>
  19. <span style='color:#800000; font-weight:bold; '>return</span> txt
  20.  
  21.  
  22. <span style='color:#400000; '>file</span> <span style='color:#808030; '>=</span> <span style='color:#400000; '>open</span><span style='color:#808030; '>(</span><span style='color:#0000e6; '>"/Users/ugurcem/PycharmProjects/untitled1/text"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"r+"</span><span style='color:#808030; '>)</span> <span style='color:#696969; '># Text file without modification</span>
  23. text <span style='color:#808030; '>=</span> <span style='color:#400000; '>file</span><span style='color:#808030; '>.</span>read<span style='color:#808030; '>(</span><span style='color:#808030; '>)</span>
  24. text <span style='color:#808030; '>=</span> <span style='color:#0000e6; '>"&lt;s> "</span> <span style='color:#44aadd; '>+</span> text <span style='color:#696969; '># Writes a sentence starting point tag</span>
  25.  
  26. endpoint <span style='color:#808030; '>=</span> <span style='color:#808030; '>[</span><span style='color:#0000e6; '>"."</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"!"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"?"</span><span style='color:#808030; '>]</span> <span style='color:#696969; '># List of chars that stands for end of sentence.</span>
  27. nums <span style='color:#808030; '>=</span> <span style='color:#808030; '>[</span><span style='color:#0000e6; '>"0"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"1"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"2"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"3"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"4"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"5"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"6"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"7"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"8"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"9"</span><span style='color:#808030; '>]</span> <span style='color:#696969; '># Numbers that will convert into letters</span>
  28. nums_normalized <span style='color:#808030; '>=</span> <span style='color:#808030; '>[</span><span style='color:#0000e6; '>" sıfır "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" bir "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" iki "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" üç "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" dört "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" beş "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" altı "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" yedi "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" sekiz "</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>" dokuz "</span><span style='color:#808030; '>]</span>
  29. punctuation <span style='color:#808030; '>=</span> <span style='color:#808030; '>[</span><span style='color:#0000e6; '>","</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>";"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>":"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"'"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"("</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>")"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"-"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"_"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"="</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"+"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"&amp;"</span><span style='color:#808030; '>,</span> <span style='color:#0000e6; '>"*"</span><span style='color:#808030; '>]</span> <span style='color:#696969; '># Chars that will deleted ( writes a "" )</span>
  30.  
  31.  
  32. text <span style='color:#808030; '>=</span> separateParaghraps<span style='color:#808030; '>(</span>text<span style='color:#808030; '>,</span> endpoint<span style='color:#808030; '>)</span>
  33. text <span style='color:#808030; '>=</span> replaceNumbers<span style='color:#808030; '>(</span>text<span style='color:#808030; '>,</span> nums<span style='color:#808030; '>,</span> nums_normalized<span style='color:#808030; '>)</span>
  34. text <span style='color:#808030; '>=</span> replacePunctuation<span style='color:#808030; '>(</span>text<span style='color:#808030; '>,</span> punctuation<span style='color:#808030; '>)</span>
  35. <span style='color:#800000; font-weight:bold; '>print</span><span style='color:#808030; '>(</span>text<span style='color:#808030; '>)</span>
  36. </pre>
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement