summaryrefslogtreecommitdiffstats
path: root/util/bin/ukrepl
blob: 9b084027311a8d9c42fd42b996546598b62be418 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
#!/usr/bin/python2
# -*- coding: utf-8 -*-
import sys

# Characters that fixed-width mode deliberately leaves alone.  The values are
# unicode literals so that every result of the mapping is a unicode string.
wont_change = {
    ' ': u' ',
    '\n': u'\n',
}

# unichr() only exists on Python 2; chr() is the Python 3 equivalent.
try:
    _unichr = unichr
except NameError:
    _unichr = chr


def fixed_width_replace(char): #f
    """Return the fullwidth form of a printable ASCII character (mode ``f``).

    The characters ``'!'`` (0x21) through ``'~'`` (0x7E) are shifted into the
    range U+FF01..U+FF5E.  Space and newline are returned unchanged (as
    unicode strings).  Any other input, including a string that is not exactly
    one character long, is returned as-is.
    """
    if char in wont_change:
        return wont_change[char]
    try:
        code = ord(char)
    except TypeError:
        # Not a single character (e.g. a multi-byte string produced by an
        # earlier mode): there is nothing sensible to shift.
        return char
    # The upper bound is inclusive so that '~' maps to U+FF5E as well.
    if 0x21 <= code <= 0x7E:
        return _unichr(0xFF00 + code - 0x20)
    return char

# Latin letters mapped to Cyrillic letters that look the same.
# Every value is a unicode literal, and the non-ASCII keys are unicode
# literals too: on Python 2 a byte-string key such as 'Ä' is two bytes long
# and can never be equal to a single character.
cyrillic_dict = {
    'A' : u'А', 'a' : u'а', u'Ä' : u'Ӓ', u'ä' : u'ӓ',
    'B' : u'В',
    'c' : u'с',
    'E' : u'Е',
    'e' : u'е',
    'H' : u'Н',
    'I' : u'І', 'i' : u'і',
    'j' : u'ј', 'J' : u'Ј',
    'K' : u'К',
    'M' : u'М',
    'O' : u'О', 'o' : u'о', u'Ö' : u'Ӧ', u'ö' : u'ӧ',
    'P' : u'Р', 'p' : u'р',
    'S' : u'Ѕ',
    # CYRILLIC CAPITAL LETTER TE, written as an escape because it is
    # indistinguishable from Latin 'T'.  The table used to hold U+0433
    # (small letter ghe) here, which does not resemble 'T'.
    'T' : u'\u0422',
    }


def cyrillic_replace(char): #c
    """Return the Cyrillic look-alike for ``char`` (mode ``c``).

    Characters without an entry in ``cyrillic_dict`` are returned unchanged.
    """
    return cyrillic_dict.get(char, char)
# Latin letters and digits mapped to extended-Latin characters.
# All values are unicode literals; without the ``u`` prefix they are
# multi-byte byte strings on Python 2, unlike the results of the other tables.
historic_latin_dict = {
    'B' : u'Ɓ',
    'b' : u'ƅ',
    'u' : u'ư',
    'U' : u'Ư',
    # NOTE(review): an empty-string key can never match a character, so this
    # entry is effectively dead.  The key was presumably a non-ASCII letter
    # (perhaps 'Ä') that got lost -- confirm and restore it.
    ''  : u'Ǟ',
    # alternative, lowercase-looking replacement for '5':
    #'5' : u'ƽ',
    'o' : u'ơ',
    'O' : u'Ơ',
    '5' : u'Ƽ',
    }


def historic_latin(char): #H
    """Return the extended-Latin replacement for ``char`` (mode ``H``).

    Characters without an entry in ``historic_latin_dict`` are returned
    unchanged.
    """
    return historic_latin_dict.get(char, char)
# Lookup table used by punctuation(): ASCII punctuation characters mapped to
# non-ASCII replacement characters.  Commented-out entries are alternative
# replacements for the same key; only one entry per key can be active.
punctuation_dict = {
    '!' : u'ǃ',
    '\'': u'’',
    '\"': u'ˮ',
    '(' : u'⟨',
    ')' : u'⟩',
    ':' : u'ː',
    # NOTE(review): the replacement below is presumably a non-ASCII space
    # variant; it cannot be told apart visually, so check the exact code
    # point before editing this line.
    ' ' : u' ',
    # all different spaces, made for perfect trolling
    #' ' : u' ',
    #' ' : u' ',
    #' ' : u'⁠',
    # alternative dash replacements for '-'
    #'-' : u'‒',
    #'-' : u'—',
    #'-' : u'―',
    #'-' : u'‐',
    #'-' : u'⁃',
    '-' : u'–',
    '_' : u'−',
    '~' : u'⁓',
    # alternative tilde replacements for '~'
    #'~' : u'∼',
    #'~' : u'〜',

    }
def punctuation(char): #p
    """Return the replacement for ``char`` from ``punctuation_dict`` (mode ``p``).

    A character that has no entry in the table is handed back unchanged.
    """
    if char in punctuation_dict:
        return punctuation_dict[char]
    return char
def helpme():
    """Write the usage text to stdout and terminate with exit status 0."""
    usage_lines = (
        "usage %s [modes]" % sys.argv[0],
        "modes:",
        "  c -- cyrillic replace",
        "  f -- fixed width",
        "  p -- replace punctuation",
        "  H -- replace with historic latin chars",
        "  h -- this message",
    )
    # One write for the whole text; every line ends with a newline.
    sys.stdout.write("\n".join(usage_lines) + "\n")
    sys.exit(0)

# Dispatch table: mode letter -> per-character replacement function.
mode_handlers = {
    'c': cyrillic_replace,
    'f': fixed_width_replace,
    'H': historic_latin,
    'p': punctuation,
}

# Every command-line argument is a run of mode letters; all arguments are
# concatenated and the modes are applied left to right.
modes = ''.join(sys.argv[1:])
# sane defaults if no mode given
if not modes:
    modes = "f"

if 'h' in modes:
    helpme()

# Reject unknown modes once, before any input is read, instead of
# re-checking them for every character of the input.
for mode in modes:
    if mode not in mode_handlers:
        sys.stdout.write("unknown mode %c\n" % mode)
        helpme()

# Resolve the handlers once; the loop below only has to call them.
replacers = [mode_handlers[mode] for mode in modes]

# NOTE: on Python 2, sys.stdin yields byte strings, so a multi-byte UTF-8
# character reaches the handlers one byte at a time and passes through
# unchanged.
for line in sys.stdin:
    for char in line:
        for replace in replacers:
            char = replace(char)
        try:
            sys.stdout.write(char)
        except UnicodeEncodeError:
            # stdout's own encoding cannot represent this character
            # (e.g. ASCII when piped on Python 2): emit UTF-8 bytes instead.
            sys.stdout.write(char.encode("utf-8"))