File: characters_strategy.rb

package info (click to toggle)
ruby-string-direction 1.2.2-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 212 kB
  • sloc: ruby: 657; makefile: 7; sh: 3
file content (48 lines) | stat: -rw-r--r-- 1,335 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
module StringDirection
  # Strategy to detect direction from the scripts to which string characters belong
  class CharactersStrategy < Strategy
    # Ignored characters: unicode marks, punctuations, symbols, separator and other general categories
    IGNORED_CHARS = '\p{M}\p{P}\p{S}\p{Z}\p{C}'.freeze

    # Inspect to wich scripts characters belongs and  infer from them the string direction. right-to-left scripts are those in {Configuration#rtl_scripts}
    #
    # params [String] The string to inspect
    # @return [String, nil]
    def run(string)
      string = string.to_s
      if ltr_characters?(string) && rtl_characters?(string)
        bidi
      elsif ltr_characters?(string)
        ltr
      elsif rtl_characters?(string)
        rtl
      end
    end

    private

    def rtl_regex
      @rtl_regex ||= /[#{rtl_script_character_classes}]/
    end

    def ltr_regex
      @ltr_regex ||= /[^#{rtl_script_character_classes}#{IGNORED_CHARS}]/
    end

    def rtl_characters?(string)
      string.match(rtl_regex)
    end

    def ltr_characters?(string)
      string.match(ltr_regex)
    end

    def rtl_script_character_classes
      @rtl_script_character_classes ||= rtl_scripts.map { |script| "\\p{#{script}}" }.join
    end

    def rtl_scripts
      StringDirection.configuration.rtl_scripts
    end
  end
end