X-Git-Url: http://git.veekun.com/zzz-pokedex.git/blobdiff_plain/e50aca7ae94c04b5cec1baacef6e0a115a0305e0..152e16ebb4e70b5f5cf8986e4ce76cf804d0c4d3:/pokedex/roomaji.py

diff --git a/pokedex/roomaji.py b/pokedex/roomaji.py
index 9db6b07..e91c960 100644
--- a/pokedex/roomaji.py
+++ b/pokedex/roomaji.py
@@ -60,7 +60,7 @@ _roomaji_small_kana_combos = {
     # particularly weird, but it seems to be what GF intends
 
     # Simple vowel replacement
-                    u'ã¦ã£': 'wi',  u'ã¦ã¥': 'wu',  u'ã¦ã§': 'we',
+                    u'ã¦ã£': 'wi',  u'ã¦ã¥': 'wu',  u'ã¦ã§': 'we',  u'ã¦ã©': 'wo',
     u'ã´ã¡': 'va',  u'ã´ã£': 'vi',                  u'ã´ã§': 've',  u'ã´ã©': 'vo',
                                                     u'ãã§': 'che',
                                                     u'ã·ã§': 'she',
@@ -71,6 +71,7 @@ _roomaji_small_kana_combos = {
 
     # Not so much
     u'ã·ã£': 'sy',
+    u'ãã£': 'my',
     u'ãã£': 'by',
     u'ãã£': 'py',
 }
@@ -85,11 +86,12 @@ def romanize(string):
     last_char = None  # Used for small kana combos
     for char in string:
         # Full-width Latin
-        if ord(char) >= 0xff11 and ord(char) <= 0xff5e:
+        if 0xff01 <= ord(char) <= 0xff5e:
             if last_kana == 'sokuon':
                 raise ValueError("Sokuon cannot precede Latin characters.")
 
-            char = chr(ord(char) - 0xff11 + 0x31)
+            # XXX Real Unicode decomposition would be nicer
+            char = chr(ord(char) - 0xff01 + 0x21)
             characters.append(char)
 
             last_kana = None