File: basic_greek_test.rb

package info (click to toggle)
ruby-stringex 2.8.6-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 1,220 kB
  • sloc: ruby: 3,749; makefile: 5
file content (113 lines) | stat: -rw-r--r-- 3,285 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
# encoding: UTF-8

require "test/unit"
require "stringex"
require File.join(File.expand_path(File.dirname(__FILE__)), "codepoint_test_helper.rb")
include CodepointTestHelper

class BasicGreekTest < Test::Unit::TestCase
  # This test suite is just regression test and debugging
  # to better transliterate the Basic Latin Unicode codepoints
  #
  # http://unicode.org/charts/
  # http://unicode.org/charts/PDF/U0000.pdf

  # NOTE: I can't figure out how to test control characters.
  # Get weird results trying to pack them to unicode.

  def test_greek_letters
    {
      "Α" => "A",
      "Ά" => "A",
      "Β" => "B",
      "Γ" => "G",
      "Δ" => "D",
      "Ε" => "E",
      "Έ" => "E",
      "Ζ" => "Z",
      "Η" => "H",
      "Θ" => "Th",
      "Ι" => "I",
      "Ί" => "I",
      "Ϊ" => "I",
      "Κ" => "K",
      "Λ" => "L",
      "Μ" => "M",
      "Ν" => "N",
      "Ξ" => "Ks",
      "Ο" => "O",
      "Ό" => "O",
      "Π" => "P",
      "Ρ" => "R",
      "Σ" => "S",
      "Τ" => "T",
      "Υ" => "Y",
      "Ϋ" => "Y",
      "Ύ" => "Y",
      "Φ" => "Ph",
      "Χ" => "X",
      "Ψ" => "Ps",
      "Ω" => "O",
      "Ώ" => "O",
      "α" => "a",
      "ά" => "a",
      "β" => "b",
      "γ" => "g",
      "δ" => "d",
      "ε" => "e",
      "έ" => "e",
      "ζ" => "z",
      "η" => "i",
      "ή" => "i",
      "θ" => "th",
      "ι" => "i",
      "ί" => "i",
      "ϊ" => "i",
      "ΐ" => "i",
      "κ" => "k",
      "λ" => "l",
      "μ" => "m",
      "ν" => "n",
      "ξ" => "ks",
      "ο" => "o",
      "ό" => "o",
      "π" => "p",
      "ρ" => "r",
      "σ" => "s",
      "ς" => "s",
      "τ" => "t",
      "υ" => "u",
      "ύ" => "u",
      "ϋ" => "u",
      "ΰ" => "u",
      "φ" => "ph",
      "χ" => "x",
      "ψ" => "ps",
      "ω" => "o",
      "ώ" => "o"
    }.each do |letter, ascii|
      assert_equal letter.to_ascii, ascii
    end
  end


  def test_greek_words
    {
      "Καλημέρα" => "Kalimera",
      "Προϊόν" => "Proion",
      "Θαλασσογραφία" => "Thalassographia",
      "Να μας πάρεις μακριά" => "Na mas pareis makria",
      "να μας πας στα πέρα μέρη" => "na mas pas sta pera meri",
      "φύσα θάλασσα πλατιά" => "phusa thalassa platia",
      "φύσα αγέρι φύσα αγέρι" => "phusa ageri phusa ageri",
      "Αν θέλεις να λέγεσαι άνθρωπος" => "An theleis na legesai anthropos",
      "δεν θα πάψεις ούτε στιγμή ν΄αγωνίζεσαι για την ειρήνη και" => "den tha papseis oute stigmi nagonizesai gia tin eirini kai",
      "για το δίκαιο." => "gia to dikaio.",
      "Θα βγείς στους δρόμους, θα φωνάξεις, τα χείλια σου θα" => "Tha bgeis stous dromous, tha phonakseis, ta xeilia sou tha",
      "ματώσουν απ΄τις φωνές" => "matosoun aptis phones",
      "το πρόσωπό σου θα ματώσει από τις σφαίρες – μα ούτε βήμα πίσω." => "to prosopo sou tha matosei apo tis sphaires -- ma oute bima piso.",
    }.each do |letter, ascii|
      assert_equal letter.to_ascii, ascii
    end
  end
end