ref: 0fcba1a2f0ec907683c005f7e9bef09e15163459
dir: /sys/src/cmd/tcs/charsets.awk/
#!/bin/awk -f
# makes a table of character sets from http://www.iana.org/assignments/character-sets/character-sets.xml
# and tcs.txt
/<name>/, /<\/name>/ {
gsub(/[<>\/]+/, " ")
i = 0
name = tolower($2)
names[name] = name
alias[name i] = name
nalias[name] = ++i
next
}
/<alias>/, /<\/alias>/ {
gsub(/[<>\/]+/, " ")
a = tolower($2)
names[a] = name
alias[name i] = a
nalias[name] = ++i
next
}
END {
while(getline <ARGV[2]){
tcs = $1
if(tcs in names){
name = names[tcs]
for(n = 0; n < nalias[name]; n++)
print "\"" alias[name n] "\", \"" $2 "\","
}
}
}