import random

# Baseline predictor: for every row of the input file, emit one randomly
# chosen, pre-built prediction line.
#
# Format of each prediction line:
#   word:probability word:probability :probability-of-all-remaining-words
# Format example:
#   "the:0.2 at:0.3 :0.1"
# The trailing entry with an empty word (":0.2") carries the probability
# assigned to every word that is not listed explicitly.
most_popular_words = [
    "be:0.5 and:0.2 of:0.1 :0.2",
    "a:0.5 in:0.2 to:0.1 :0.2",
    "have:0.5 too:0.2 it:0.1 :0.2",
    "I:0.5 that:0.2 for:0.1 :0.2",
    "you:0.5 he:0.2 with:0.1 :0.2",
    "on:0.5 do:0.2 say:0.1 :0.2",
    "this:0.5 they:0.2 at:0.1 :0.2",
    "but:0.5 we:0.2 his:0.1 :0.2"
]

# Directory that holds the input file and receives the output file.
folder = "dev-0"

# Only the number of input rows matters, so count them while streaming the
# file instead of loading every line into memory. The input is read to the
# end and closed before the output file is opened.
with open(folder + "/in.tsv", "r", encoding='utf-8') as in_file:
    line_count = sum(1 for _ in in_file)

# Write exactly one randomly selected prediction line per input row.
with open(folder + "/out.tsv", "w", encoding='utf-8') as out_file:
    for _ in range(line_count):
        out_file.write(random.choice(most_popular_words) + "\n")