forked from jasder/antlr
22 lines
716 B
Python
22 lines
716 B
Python
|
from __future__ import print_function
|
||
|
import codecs
|
||
|
import re
|
||
|
import sys
|
||
|
|
||
|
def main(input, output):
|
||
|
code_point_re = re.compile(r'^U\+([0-9a-fA-F]+)\s*;\s*ExtendedPictographic.*$')
|
||
|
code_point_range_re = re.compile(r'^U\+([0-9a-fA-F]+)\.\.U\+([0-9a-fA-F]+)\s*;\s*ExtendedPictographic.*$')
|
||
|
|
||
|
for line in input:
|
||
|
m = code_point_re.match(line)
|
||
|
if m:
|
||
|
print('set.add(0x' + m.group(1) + ');', file=output)
|
||
|
else:
|
||
|
m = code_point_range_re.match(line)
|
||
|
if m:
|
||
|
print('set.add(0x' + m.group(1) + ', 0x' + m.group(2) + ');', file=output)
|
||
|
|
||
|
if __name__ == '__main__':
|
||
|
with codecs.open(sys.argv[1], 'r', 'utf-8') as f:
|
||
|
main(f, sys.stdout)
|