26 lines
640 B
Python
26 lines
640 B
Python
|
#!/usr/bin/env python3
|
||
|
import csv
|
||
|
import sys
|
||
|
import re
|
||
|
|
||
|
|
||
|
def preprocess(prefix, hour, suffix):
|
||
|
sentence = prefix + hour + suffix
|
||
|
sentence = re.sub(r'\\n', r' \\n ', sentence)
|
||
|
sentence = re.sub(' +', ' ', sentence)
|
||
|
return sentence
|
||
|
|
||
|
|
||
|
def main():
|
||
|
# csv.reader(sys.stdin, delimiter='\t')
|
||
|
next(sys.stdin)
|
||
|
for line in sys.stdin:
|
||
|
prefix, hour, suffix, is_mass, yes_count, no_count, url, button_text, depth, filepath, line_no = line.rstrip(
|
||
|
'\n').rsplit('\t')
|
||
|
sentence = preprocess(prefix, hour, suffix)
|
||
|
print(f'__label__{is_mass} {sentence}')
|
||
|
|
||
|
|
||
|
if __name__ == '__main__':
|
||
|
main()
|