Blame view
egs/wsj/s5/utils/lang/bpe/reverse.py
492 Bytes
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 |
#!/usr/bin/env python3 # -*- coding: utf-8 -*- # This script, reverse all latin and digits sequences # (including words like MP3) to put them in the right order in the images. import re, os, sys, io in_stream = io.TextIOWrapper(sys.stdin.buffer, encoding='utf-8') out_stream = io.TextIOWrapper(sys.stdout.buffer, encoding='utf-8') for line in in_stream: out_stream.write(re.sub(r'[a-zA-Z0-9][a-zA-Z0-9\s\.\:]*[a-zA-Z0-9]', lambda m:m.group(0)[::-1], line)) |