filt.py
353 Bytes
#!/usr/bin/env python
# Apache 2.0
from __future__ import print_function
import sys
def _load_vocab(path):
    """Return the set of whitespace-stripped lines read from *path*.

    Every line of the file is taken as one vocabulary entry.
    """
    with open(path) as vocabfile:
        return {line.strip() for line in vocabfile}


def _filter_line(line, vocab):
    """Return *line* with each token that is not in *vocab* replaced by '<UNK>'.

    Tokens are produced by whitespace splitting, so the result is joined
    with single spaces and has no leading or trailing whitespace.
    """
    # split() with no argument already discards leading/trailing whitespace,
    # so no separate strip() is needed.
    return " ".join(
        word if word in vocab else '<UNK>' for word in line.split()
    )


def main(argv=None):
    """Print the text file with out-of-vocabulary words mapped to '<UNK>'.

    Args:
        argv: Argument list shaped like ``sys.argv``: ``argv[1]`` is the
            vocabulary file (one entry per line) and ``argv[2]`` is the text
            file to filter. Defaults to ``sys.argv``. Extra arguments are
            ignored.

    Returns:
        0 on success, 2 when fewer than two file arguments were supplied.
    """
    if argv is None:
        argv = sys.argv
    if len(argv) < 3:
        prog = argv[0] if argv else "filt.py"
        print("Usage: {0} <vocab-file> <text-file>".format(prog),
              file=sys.stderr)
        return 2

    vocab = _load_vocab(argv[1])
    with open(argv[2]) as textfile:
        # Stream line by line so large text files are never held in memory.
        for line in textfile:
            print(_filter_line(line, vocab))
    return 0


if __name__ == "__main__":
    sys.exit(main())