# blob: 5f9281c07d9076d2ba709bba0d17fad4b17eb4c4 [file] [log] [blame]
# Blank out non-zero weights.
# Helper script for manual review of UCA DUCET and CLDR root collation data files.
# Most of the collation element weights change with every new version.
# "Blanking out" the weights makes files comparable,
# for finding changes in sort order and changes in lengths of weights.
#
# Usage (the rules use extended regular expressions, hence -r):
#   sed -r -f blankweights.sed FractionalUCA.txt > frac-7.0.txt
# --- Step 1: shield zero weights -------------------------------------------
# Every literal 0000 on the line is swapped for a placeholder. The placeholder
# contains no two adjacent hex digits, so none of the rules below can match
# inside it; the final rule swaps it back.
s/0000/@@4ZEROES@@/g

# --- Step 2: fractional weights, written as "[pp.., ss.., tt]" -------------
# Primary: one, two, or three two-digit bytes right after the opening bracket.
s/\[[0-9A-F][0-9A-F],/[pp,/g
s/\[[0-9A-F][0-9A-F] [0-9A-F][0-9A-F],/[pp pp,/g
s/\[([0-9A-F][0-9A-F] ){2}[0-9A-F][0-9A-F],/[pp pp pp,/g
# Secondary: one or two bytes enclosed between ", " and ",".
s/, [0-9A-F][0-9A-F],/, ss,/g
s/, [0-9A-F][0-9A-F] [0-9A-F][0-9A-F],/, ss ss,/g
# Tertiary: a single byte between ", " and the closing bracket.
s/, [0-9A-F][0-9A-F]\]/, tt]/g

# --- Step 3: allkeys weights, written as "[.pppp.ssss.tttt]" ---------------
# Primary: four hex digits after "[", with an optional "." or "*" marker in
# between; the marker (if any) is captured and put back unchanged.
s/\[([.*]?)[0-9A-F]{4}/[\1pppp/g
# Secondary: four hex digits with a dot on each side.
s/[.][0-9A-F]{4}[.]/.ssss./g
# Tertiary: deliberately left as-is (these weights are fixed). The rule that
# would blank them is kept here, disabled, for reference:
# s/\.[0-9A-F]{4}\]/.tttt]/g

# --- Step 4: bring the shielded zero weights back --------------------------
s/@@4ZEROES@@/0000/g