Python2018/labs02/task03.py

#!/usr/bin/env python
# -*- coding: utf-8 -*-

"""
Zad 4. Napisz funkcje oov(text, vocab), która zwraca listę wyrazów
(bez duplikatów), które występują w tekście text i nie występują w liście
znanych wyrazów vocab. Argumenty funkcji text i vocab to odpowiednio łańcuch
znakowy i lista łańuchów znakowych. Wszystkie wyrazy należy zmienić na małe
litery. (OOV = out of vocabulary) (W pythonie istnieje struktura danych tak
jak 'set', która przechowuje elementy bez powtórzeń.)
"""

def oov(text, vocab):
    text_lower = ''
    vocab_lower = []
    for i in text:
        if i.islower():
            text_lower += i
        else:
            text_lower += i.lower()
    for i in vocab:
        if i.islower():
            vocab_lower.append(i)
        else:
            vocab_lower.append(i.lower())
    return sorted(set(text_lower.split()) - set(vocab_lower))

def tests(f):
    inputs = [("this is a string , which i will use for string testing",
               [',', 'this', 'is', 'a', 'which', 'for', 'will', 'i'])]
    outputs = [['string', 'testing', 'use']]

    for input, output in zip(inputs, outputs):
        if set(f(*input)) != set(output):
            return "ERROR: {}!={}".format(f(*input), output)
            break
    return "TESTS PASSED"

if __name__ == "__main__":
    print(tests(oov))
Add labs 02 2018-05-12 11:37:19 +02:00			`#!/usr/bin/env python`
			`# -- coding: utf-8 --`

			`"""`
			`Zad 4. Napisz funkcje oov(text, vocab), która zwraca listę wyrazów`
			`(bez duplikatów), które występują w tekście text i nie występują w liście`
			`znanych wyrazów vocab. Argumenty funkcji text i vocab to odpowiednio łańcuch`
			`znakowy i lista łańuchów znakowych. Wszystkie wyrazy należy zmienić na małe`
			`litery. (OOV = out of vocabulary) (W pythonie istnieje struktura danych tak`
			`jak 'set', która przechowuje elementy bez powtórzeń.)`
			`"""`

			`def oov(text, vocab):`
modified codes for labs02 2018-06-02 20:20:33 +02:00			`text_lower = ''`
			`vocab_lower = []`
			`for i in text:`
			`if i.islower():`
			`text_lower += i`
			`else:`
			`text_lower += i.lower()`
			`for i in vocab:`
			`if i.islower():`
			`vocab_lower.append(i)`
			`else:`
			`vocab_lower.append(i.lower())`
			`return sorted(set(text_lower.split()) - set(vocab_lower))`
Add labs 02 2018-05-12 11:37:19 +02:00
			`def tests(f):`
			`inputs = [("this is a string , which i will use for string testing",`
			`[',', 'this', 'is', 'a', 'which', 'for', 'will', 'i'])]`
			`outputs = [['string', 'testing', 'use']]`

			`for input, output in zip(inputs, outputs):`
			`if set(f(*input)) != set(output):`
			`return "ERROR: {}!={}".format(f(*input), output)`
			`break`
			`return "TESTS PASSED"`

			`if __name__ == "__main__":`
			`print(tests(oov))`