summaryrefslogtreecommitdiff
path: root/script/unicodify.sed
blob: d0df04b02c40f11a86050429cbcaf1b1fa019659 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
# Collapse a spaced double hyphen ("word -- word") into an em-dash entity.
# One whitespace character on each side is consumed together with the
# hyphens, so the dash ends up set tight against its neighbours; a "--"
# without whitespace on both sides is left untouched.
# "\&" keeps the ampersand literal (a bare "&" would re-insert the match).
# "#" is written unescaped: POSIX leaves "\#" in a replacement unspecified.
s,[[:space:]]--[[:space:]],\&#8212;,g

# Turn quote-plus-backtick pairs into curly-quote character references:
#   "`  ->  &#8220;  (left double)      `"  ->  &#8221;  (right double)
#   '`  ->  &#8216;  (left single)      `'  ->  &#8217;  (right single)
# Double-quotes are explicitly handled before single-quotes.
# NOTE(review): presumably this targets Asciidoc's "`...`" / '`...`'
# curved-quote markup -- confirm against the documents being processed.
# "#" is written unescaped: POSIX leaves "\#" in a replacement unspecified.
s,"`,\&#8220;,g
s,`",\&#8221;,g
s,'`,\&#8216;,g
s,`',\&#8217;,g

# Diacritics: replace accented letters with numeric character references.
# The letters are matched literally.  No backslash is placed before them,
# because POSIX leaves a backslash before an ordinary character undefined in
# a basic regular expression; likewise "#" is unescaped in the replacement.
# "\&" keeps the ampersand literal (a bare "&" would re-insert the match).
s,ï,\&#239;,g
s,è,\&#232;,g
s,é,\&#233;,g

# Remove Asciidoc comments now, for the sake of getting more accurate
# wordcounts.
# Only lines that begin with "//" are blanked.  A "//" further along a line
# (for example inside "http://example.com") is not a comment and is left
# alone, so the rest of that line is no longer thrown away.
# The line is emptied rather than deleted, so the number of output lines
# stays the same.  No "g" flag: an anchored match can occur once per line.
s,^//.*,,