__author__  = "Hugo Liu <hugo@media.mit.edu>"
__version__ = "1.3"
import MontyTagger
import string,sys,time
def split_paragraphs(lines):
    """Group an iterable of text lines into paragraphs.

    A paragraph is a run of consecutive non-blank lines; lines that are
    empty or whitespace-only act as separators and are dropped.  Each kept
    line is prefixed with a single space and retains its own line ending,
    so a paragraph looks like ``' line1\\n line2\\n'``.

    Leading, trailing and repeated blank lines never produce empty or
    whitespace-only paragraphs.

    Args:
        lines: iterable of strings (for example an open text file).

    Returns:
        A list of paragraph strings, in input order.
    """
    paragraphs = []
    current = []
    for line in lines:
        if line.strip():
            current.append(' ' + line)
        elif current:
            # A blank line closes the paragraph being built; blank lines
            # seen while nothing is pending are simply skipped.
            paragraphs.append(''.join(current))
            current = []
    if current:
        # The input did not end with a blank line: flush the last paragraph.
        paragraphs.append(''.join(current))
    return paragraphs


def main(argv):
    """Tag the paragraphs of an input file and write them to an output file.

    The input path is taken from ``argv[-2]`` and the output path from
    ``argv[-1]``, so any extra leading arguments are ignored.

    Args:
        argv: the full argument vector, including the program name.

    Returns:
        Process exit status: 0 on success or when help was requested,
        2 when too few arguments were supplied.

    Raises:
        IOError/OSError: if the input cannot be read or the output cannot
            be written.
    """
    usage = 'USAGE: python MontyTagFile.py "input.txt" "output.txt"\n'
    if '/?' in argv or '-?' in argv:
        print(usage)
        return 0
    if len(argv) < 3:
        # Without this guard argv[-2] would be the script itself and
        # argv[-1] the user's input file, which would then be overwritten.
        print(usage)
        return 2
    input_path = argv[-2]
    output_path = argv[-1]

    print('Loading Corpus...')
    with open(input_path, 'r') as infile:
        paragraphs = split_paragraphs(infile)

    print('Loading Monty...')
    # NOTE(review): the meaning of the 0 argument is defined by MontyTagger
    # and is not visible from this file; it is passed through unchanged.
    m = MontyTagger.MontyTagger(0)

    print('Tagging...')
    starttime = time.time()
    tagged = [m.tag_tokenized(p) for p in paragraphs]
    stoptime = time.time()
    print('Tagging took %s seconds...' % (stoptime - starttime))

    print('Saving...')
    # Tagged paragraphs are written as one space-separated string.
    output = ' '.join(tagged)
    with open(output_path, 'w') as outfile:
        outfile.write(output)
    print('Done!')
    return 0


if __name__ == "__main__":
    sys.exit(main(sys.argv))