Advertisement
Guest User

Untitled

a guest
Jun 22nd, 2017
62
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.82 KB | None | 0 0
  # Reproduction script: tokenizes a string containing a combining character
  # with Hailo::Tokenizer::Words and dumps both the input and the token list.
  1. use utf8;  # the source itself contains a non-ASCII string literal
  2. use strict;
  3. use warnings;
  4. use open qw<:encoding(utf8) :std>;  # utf8 layer on STDIN/STDOUT/STDERR and on handles opened later
  5. use Data::Dumper;
  6. use Hailo::Tokenizer::Words;
  7.  
  8. my $self = bless {} => __PACKAGE__;  # NOTE(review): $self is never used in this script
  9. my $text = 'STARGΛ̊TE';  # Λ (U+039B) followed by a combining mark (U+030A)
  10. print Dumper($text);  # show the raw input string first
  11.  
  12. my $toke = Hailo::Tokenizer::Words->new();
  13. my $parsed = $toke->make_tokens($text);  # yields an array ref of [number, string] pairs; meaning of the number presumably a spacing code -- confirm in Hailo docs
  14. print Dumper($parsed);  # show how the input was split into tokens
  15.  
  16.  
  17. #################
  18.  
  19.  
  20. $ perlbrew switch perl-5.10.1
  21. $ perl utf8-text.t
  22. $VAR1 = "STARG\x{39b}\x{30a}TE";
  23. $VAR1 = [
  24. [
  25. 0,
  26. "STARG\x{39b}\x{30a}TE"
  27. ]
  28. ];
  29.  
  30. $ perlbrew switch perl-5.13.5
  31. $ perl utf8-text.t
  32. $VAR1 = "STARG\x{39b}\x{30a}TE";
  33. $VAR1 = [
  34. [
  35. 0,
  36. "STARG\x{39b}"
  37. ],
  38. [
  39. 3,
  40. "\x{30a}"
  41. ],
  42. [
  43. 0,
  44. 'TE'
  45. ]
  46. ];
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement