summaryrefslogtreecommitdiffstatshomepage
path: root/tests/phpunit/data/formatting/windows1252.py
blob: bca7499b9ca38cf3082fe9a6a2918f5f43753937 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# Generates test data for functions converting between
# dodgy windows-1252-only values and their unicode counterparts

unichars = ["201A", "0192", "201E", "2026", "2020", "2021", 
            "02C6", "2030", "0160", "2039", "0152", "2018", 
            "2019", "201C", "201D", "2022", "2013", "2014", 
            "02DC", "2122", "0161", "203A", "0153", "0178"];

winpoints = []
unipoints = []

for char in unichars:
    char = unichr(int(char, 16))
    dec = ord(char)
    win = ord(char.encode("windows-1252"))
    
    unipoints.append(dec)
    winpoints.append(win)

def entitize(s):
    return "&#%s;" % s

winpoints = map(entitize, winpoints)
unipoints = map(entitize, unipoints)

print "".join(winpoints), "".join(unipoints)