Compare commits
No commits in common. "6b3df7cf2b9e0562461a693c61b7995bc39796d7" and "5c8fc0ab48b138826e61d4c1ea7f1f764e1a4b2e" have entirely different histories.
6b3df7cf2b
...
5c8fc0ab48
@ -1,6 +0,0 @@
|
|||||||
<?xml version="1.0" encoding="UTF-8"?>
|
|
||||||
<project version="4">
|
|
||||||
<component name="VcsDirectoryMappings">
|
|
||||||
<mapping directory="" vcs="Git" />
|
|
||||||
</component>
|
|
||||||
</project>
|
|
187
README.md
187
README.md
@ -52,190 +52,3 @@ B05 - jedno dla wszystkich
|
|||||||
|
|
||||||
C00 - zadanie wykonywane wspólnie na zajęciach
|
C00 - zadanie wykonywane wspólnie na zajęciach
|
||||||
C01-C03, C04-C06 - po jedno dla każdego
|
C01-C03, C04-C06 - po jedno dla każdego
|
||||||
|
|
||||||
## Zajęcia 3 13.11.2023 Wyrażenia regularne
|
|
||||||
|
|
||||||
D01 - D04 - do wykonania przez każdego
|
|
||||||
|
|
||||||
Dokumentacja wyrażeń regularnych w python3: https://docs.python.org/3/library/re.html
|
|
||||||
|
|
||||||
### Podstawowe funkcje
|
|
||||||
|
|
||||||
search - zwraca pierwsze dopasowanie w napisie
|
|
||||||
|
|
||||||
findall - zwraca listę wszystkich dopasowań (nienakładających się na siebie)
|
|
||||||
|
|
||||||
match - zwraca dopasowanie od początku string
|
|
||||||
|
|
||||||
To tylko podstawowe funkcje, z których będziemy korzystać. W dokumentacji opisane są wszystkie.
|
|
||||||
|
|
||||||
### Obiekt match
|
|
||||||
|
|
||||||
```
|
|
||||||
import re
|
|
||||||
answer = re.search('na','banan')
|
|
||||||
print(answer)
|
|
||||||
print(type(answer))
|
|
||||||
print(answer.start())
|
|
||||||
print(answer.end())
|
|
||||||
print(answer.group())
|
|
||||||
|
|
||||||
answer = re.search('na','kabanos')
|
|
||||||
print(answer)
|
|
||||||
|
|
||||||
if answer:
|
|
||||||
print(answer.group())
|
|
||||||
else:
|
|
||||||
pass
|
|
||||||
```
|
|
||||||
|
|
||||||
### Metaznaki
|
|
||||||
|
|
||||||
|
|
||||||
- [] - zbiór znaków
|
|
||||||
- . - jakikolwiek znak
|
|
||||||
|
|
||||||
- ^ - początek napisu
|
|
||||||
- $ - koniec napisu
|
|
||||||
|
|
||||||
- ? - znak występuje lub nie występuje
|
|
||||||
- \* - zero albo więcej pojawień się
|
|
||||||
- \+ - jeden albo więcej pojawień się
|
|
||||||
- {} - dokładnie tyle pojawień się
|
|
||||||
|
|
||||||
- | - lub
|
|
||||||
- () - grupa
|
|
||||||
- \ -znak ucieczki
|
|
||||||
|
|
||||||
- \d digit
|
|
||||||
- \D nie digit
|
|
||||||
- \s whitespace
|
|
||||||
- \S niewhitespace
|
|
||||||
|
|
||||||
|
|
||||||
### Flagi
|
|
||||||
|
|
||||||
Można użyć specjalnych flag, np:
|
|
||||||
`re.search('ma', 'AlA Ma KoTa', re.IGNORECASE)`.
|
|
||||||
|
|
||||||
### Przykłady (objaśnienia na laboratoriach)
|
|
||||||
|
|
||||||
```
|
|
||||||
import re
|
|
||||||
|
|
||||||
text = 'Ala ma kota i hamak, oraz 150 bananów.'
|
|
||||||
|
|
||||||
re.search('ma',text)
|
|
||||||
re.match('ma',text)
|
|
||||||
re.match('Ala ma',text)
|
|
||||||
re.findall('ma',text)
|
|
||||||
|
|
||||||
re.findall('[mn]a',text)
|
|
||||||
re.findall('[0-9]',text)
|
|
||||||
re.findall('[0-9abc]',text)
|
|
||||||
re.findall('[a-z][a-z]ma[a-z]',text)
|
|
||||||
re.findall('[a-zA-Z][a-zA-Z]ma[a-zA-z0-9]',text)
|
|
||||||
re.findall('\d',text)
|
|
||||||
|
|
||||||
re.search('[0-9][0-9][0-9]',text)
|
|
||||||
re.search('[\d][\d][\d]',text)
|
|
||||||
|
|
||||||
re.search('\d{2}',text)
|
|
||||||
re.search('\d{3}',text)
|
|
||||||
|
|
||||||
re.search('\d+',text)
|
|
||||||
|
|
||||||
re.search('\d+ bananów',text)
|
|
||||||
re.search('\d* bananów','Ala ma dużo bananów')
|
|
||||||
re.search('\d* bananów',text)
|
|
||||||
re.search('ma \d? bananów','Ala ma 5 bananów')
|
|
||||||
re.search('ma ?\d? bananów','Ala ma bananów')
|
|
||||||
re.search('ma( \d)? bananów','Ala ma bananów')
|
|
||||||
|
|
||||||
re.search('\d+ bananów','Ala ma 10 bananów albo 20 bananów')
|
|
||||||
re.search('\d+ bananów$','Ala ma 10 bananów albo 20 bananów')
|
|
||||||
|
|
||||||
text = 'Ala ma kota i hamak, oraz 150 bananów.'
|
|
||||||
|
|
||||||
re.search('\d+ bananów',text)
|
|
||||||
|
|
||||||
re.search('\d+\sbananów',text)
|
|
||||||
|
|
||||||
re.search('kota . hamak',text)
|
|
||||||
|
|
||||||
re.search('kota . hamak','Ala ma kota z hamakiem')
|
|
||||||
|
|
||||||
re.search('kota .* hamak','Ala ma kota lub hamak')
|
|
||||||
|
|
||||||
re.search('\.',text)
|
|
||||||
|
|
||||||
re.search('kota|psa','Ala ma kota lub hamak')
|
|
||||||
|
|
||||||
re.findall('kota|psa','Ala ma kota lub psa')
|
|
||||||
|
|
||||||
re.search('kota (i|lub) psa','Ala ma kota lub psa')
|
|
||||||
|
|
||||||
re.search('mam (kota).*(kota|psa)','Ja mam kota. Ala ma psa.').group(0)
|
|
||||||
|
|
||||||
re.search('mam (kota).*(kota|psa)','Ja mam kota. Ala ma psa.').group(1)
|
|
||||||
|
|
||||||
re.search('mam (kota).*(kota|psa)','Ja mam kota. Ala ma psa.').group(2)
|
|
||||||
```
|
|
||||||
|
|
||||||
### Przykłady wyrażenia regularne 2 (objaśnienia na laboratoriach)
|
|
||||||
|
|
||||||
#### ^
|
|
||||||
```
|
|
||||||
re.search('[0-9]+', '123-456-789')
|
|
||||||
re.search('[^0-9][0-9]+[^0-9]', '123-456-789')
|
|
||||||
```
|
|
||||||
|
|
||||||
#### cudzysłów
|
|
||||||
'' oraz "" - oznaczają to samo w pythonie
|
|
||||||
|
|
||||||
' ala ma psa o imieniu "Burek"'
|
|
||||||
|
|
||||||
" ala ma psa o imieniu 'Burek' "
|
|
||||||
|
|
||||||
' ala ma psa o imieniu \'Burek\' '
|
|
||||||
|
|
||||||
" ala ma psa o imieniu \"Burek\" "
|
|
||||||
|
|
||||||
#### multiline string
|
|
||||||
|
|
||||||
#### raw string
|
|
||||||
|
|
||||||
przy raw string znaki \ traktowane są jako zwykłe znaki \
|
|
||||||
|
|
||||||
chociaż nawet w raw string nadal są escapowane (ale wtedy \ pozostają również w stringu bez zmian)
|
|
||||||
|
|
||||||
https://docs.python.org/3/reference/lexical_analysis.html
|
|
||||||
|
|
||||||
dobra praktyka - wszędzie escapować
|
|
||||||
|
|
||||||
```
|
|
||||||
'\\'
|
|
||||||
print('\\')
|
|
||||||
|
|
||||||
r'\\'
|
|
||||||
print(r'\\')
|
|
||||||
|
|
||||||
|
|
||||||
print("abcd")
|
|
||||||
print("ab\cd")
|
|
||||||
print(r"ab\cd")
|
|
||||||
|
|
||||||
print("ab\nd")
|
|
||||||
print(r"ab\nd")
|
|
||||||
|
|
||||||
|
|
||||||
print("\"")
|
|
||||||
print(r"\"")
|
|
||||||
|
|
||||||
print("\")
|
|
||||||
print(r"\")
|
|
||||||
|
|
||||||
re.search('\\', r'a\bc')
|
|
||||||
re.search(r'\\', r'a\bc')
|
|
||||||
re.search('\\\\', r'a\bc')
|
|
||||||
```
|
|
@ -4,8 +4,8 @@ Deterministic automaton III
|
|||||||
Read a description of a finite-state automaton in the AT&T format
|
Read a description of a finite-state automaton in the AT&T format
|
||||||
(without weights) from the file in the first argument. Then, read strings from the
|
(without weights) from the file in the first argument. Then, read strings from the
|
||||||
standard input. If a string is
|
standard input. If a string is
|
||||||
accepted by the automaton, write TRUE, a space and the string on the
|
accepted by the automated, write YES, a space and the string on the
|
||||||
standard output, otherwise — write FALSE, a space and the string.
|
standard output, otherwise — write NO, a space and the string.
|
||||||
|
|
||||||
If there is a non-determinism in the automaton, the first transition should be chosen.
|
If there is a non-determinism in the automaton, the first transition should be chosen.
|
||||||
|
|
||||||
@ -17,11 +17,8 @@ is at most one epsilon transition from a given state and that there
|
|||||||
are no cycles with epsilon transition.
|
are no cycles with epsilon transition.
|
||||||
|
|
||||||
Your program does not have to check whether the description is correct
|
Your program does not have to check whether the description is correct
|
||||||
and whether the automaton is deterministic.
|
and whether the automaton is deterministic. You can assume that the
|
||||||
|
automaton does not contain epsilon transitions.
|
||||||
long.arg - this automaton accepts two texts - "aaaa" and "a" replicated 4038 times.
|
|
||||||
simple1.arg - simple automaton accepting only text "abc"
|
|
||||||
simple2.arg - automaton accepting text "ab*c" (b replicated any number of times) and "kot"
|
|
||||||
|
|
||||||
POINTS: 3
|
POINTS: 3
|
||||||
DEADLINE: 2023-11-12 23:59:59
|
DEADLINE: 2023-11-12 23:59:59
|
||||||
|
@ -1,3 +1,4 @@
|
|||||||
|
# automat akceptuje dwa napisy - "aaaa" i "a" powielone 4038 razy
|
||||||
0 1 a
|
0 1 a
|
||||||
1 2 a
|
1 2 a
|
||||||
2 3 a
|
2 3 a
|
||||||
|
@ -1,3 +1,4 @@
|
|||||||
|
# prosty automat akceptujący tylko napis "abc"
|
||||||
0 1 a
|
0 1 a
|
||||||
1 2 b
|
1 2 b
|
||||||
2 3 c
|
2 3 c
|
||||||
|
@ -1,3 +1,4 @@
|
|||||||
|
# automat akceptujący napis "ab*c" (b powielony dowolną liczbę razy) i "kot"
|
||||||
0 1 a
|
0 1 a
|
||||||
1 1 b
|
1 1 b
|
||||||
1 2 c
|
1 2 c
|
||||||
|
1
TaskC06/medium2.exp
Normal file
1
TaskC06/medium2.exp
Normal file
@ -0,0 +1 @@
|
|||||||
|
a
|
13989
TaskC06/medium2.in
Normal file
13989
TaskC06/medium2.in
Normal file
File diff suppressed because it is too large
Load Diff
0
TaskC06/medium2.out
Normal file
0
TaskC06/medium2.out
Normal file
@ -1,5 +0,0 @@
|
|||||||
Write a program to find lines containing the word "Hamlet".
|
|
||||||
Do use regular expressions.
|
|
||||||
|
|
||||||
POINTS: 1
|
|
||||||
DEADLINE: 2023-11-26 23:59:59
|
|
@ -1,7 +0,0 @@
|
|||||||
import re
|
|
||||||
import sys
|
|
||||||
|
|
||||||
for line in sys.stdin:
|
|
||||||
stripped_line = line.strip()
|
|
||||||
if re.search("Hamlet", stripped_line):
|
|
||||||
print(stripped_line)
|
|
@ -1,2 +0,0 @@
|
|||||||
Here comes Hamlet
|
|
||||||
Hamlet Hamlet again
|
|
@ -1,3 +0,0 @@
|
|||||||
Here comes Hamlet
|
|
||||||
ABC
|
|
||||||
Hamlet Hamlet again
|
|
@ -1,2 +0,0 @@
|
|||||||
Here comes Hamlet
|
|
||||||
Hamlet Hamlet again
|
|
@ -1,7 +0,0 @@
|
|||||||
Write a program to find lines containing the word "pies" separated by spaces.
|
|
||||||
The word does not need to have space on the left if it is the line beginning or space on the right if it is line ending.
|
|
||||||
Return line no matter of word "pies" casing.
|
|
||||||
Do use regular expressions.
|
|
||||||
|
|
||||||
POINTS: 1
|
|
||||||
DEADLINE: 2023-11-26 23:59:59
|
|
@ -1,7 +0,0 @@
|
|||||||
import re
|
|
||||||
import sys
|
|
||||||
|
|
||||||
for line in sys.stdin:
|
|
||||||
stripped_line = line.strip()
|
|
||||||
if re.search(r"\bpies\b", stripped_line, re.IGNORECASE):
|
|
||||||
print(stripped_line)
|
|
@ -1,3 +0,0 @@
|
|||||||
Pies ma Alę
|
|
||||||
Kot i pies to zwierzęta
|
|
||||||
pies
|
|
@ -1,5 +0,0 @@
|
|||||||
Pies ma Alę
|
|
||||||
Ala ma psa
|
|
||||||
tu nic nie ma
|
|
||||||
Kot i pies to zwierzęta
|
|
||||||
pies
|
|
@ -1,3 +0,0 @@
|
|||||||
Pies ma Alę
|
|
||||||
Kot i pies to zwierzęta
|
|
||||||
pies
|
|
@ -1,6 +0,0 @@
|
|||||||
Write a program to find lines containing date from 1900 to 1999 in format '19XX r.' no matter what on the left or right of the expression.
|
|
||||||
Note that part ' r.' is obligatory.
|
|
||||||
Do use regular expressions.
|
|
||||||
|
|
||||||
POINTS: 1
|
|
||||||
DEADLINE: 2023-11-26 23:59:59
|
|
@ -1,7 +0,0 @@
|
|||||||
import re
|
|
||||||
import sys
|
|
||||||
|
|
||||||
for line in sys.stdin:
|
|
||||||
stripped_line = line.strip()
|
|
||||||
if re.search("19[0-9][0-9] r\.", stripped_line, re.IGNORECASE):
|
|
||||||
print(stripped_line)
|
|
@ -1,3 +0,0 @@
|
|||||||
Kiedyś był 1934 r.
|
|
||||||
Kiedyś był 1934 r.fsdfsdfsdf
|
|
||||||
1934 r. to jakaś data
|
|
@ -1,5 +0,0 @@
|
|||||||
Kiedyś był 1934 r.
|
|
||||||
Kiedyś był 1934 r.fsdfsdfsdf
|
|
||||||
Kiedyś był 1935 rok
|
|
||||||
1934 r. to jakaś data
|
|
||||||
1934 to też jakaś data
|
|
@ -1,3 +0,0 @@
|
|||||||
Kiedyś był 1934 r.
|
|
||||||
Kiedyś był 1934 r.fsdfsdfsdf
|
|
||||||
1934 r. to jakaś data
|
|
@ -1,6 +0,0 @@
|
|||||||
Write a program to find all maximum substrings of digits.
|
|
||||||
Return only these substrings separated by spaces in their order.
|
|
||||||
Do use regular expressions.
|
|
||||||
|
|
||||||
POINTS: 2
|
|
||||||
DEADLINE: 2023-11-26 23:59:59
|
|
@ -1,10 +0,0 @@
|
|||||||
import re
|
|
||||||
import sys
|
|
||||||
|
|
||||||
for line in sys.stdin:
|
|
||||||
stripped_line = line.strip()
|
|
||||||
if re.search("\d+", stripped_line):
|
|
||||||
sub = re.findall("\d+", stripped_line)
|
|
||||||
print(' '.join(sub))
|
|
||||||
|
|
||||||
|
|
@ -1,4 +0,0 @@
|
|||||||
34234 34 5
|
|
||||||
34535
|
|
||||||
34
|
|
||||||
1992 1999
|
|
@ -1,5 +0,0 @@
|
|||||||
34234 34 dfd gfd 5
|
|
||||||
34535
|
|
||||||
fsdflskfjsdflk
|
|
||||||
fsdkfj sdf34fdfd
|
|
||||||
Firma powstała w 1992 r., z połączenia Authorware, Inc. (twórców pakietu Authorware) i MacroMind-Paracomp (producenta Macromind Director). W 1999 r. Macromedia zakupiła firmę Allaire i jej bi
|
|
@ -1,4 +0,0 @@
|
|||||||
34234 34 5
|
|
||||||
34535
|
|
||||||
34
|
|
||||||
1992 1999
|
|
@ -1,6 +0,0 @@
|
|||||||
import sys
|
|
||||||
|
|
||||||
count = 0
|
|
||||||
for line in sys.stdin:
|
|
||||||
count += 1
|
|
||||||
print(count)
|
|
@ -11,9 +11,7 @@ def execute_task(dir):
|
|||||||
for task_set in task_sets:
|
for task_set in task_sets:
|
||||||
try:
|
try:
|
||||||
with open(Path(dir, f'{task_set}.in')) as f_in, open(Path(dir, f'{task_set}.out'), 'w') as f_out:
|
with open(Path(dir, f'{task_set}.in')) as f_in, open(Path(dir, f'{task_set}.out'), 'w') as f_out:
|
||||||
arg = [x for x in dir.iterdir() if str(x).endswith(f'{task_set}.arg')] # arg = [x for x in dir.iterdir() if str(x).endswith(f'{task_set}.arg')]
|
arg = [x for x in dir.iterdir() if str(x).endswith('.arg')] # arg = [x for x in dir.iterdir() if str(x).endswith(f'{task_set}.arg')]
|
||||||
if not arg:
|
|
||||||
arg = [x for x in dir.iterdir() if str(x).endswith('fsa_description.arg')] # arg = Path(dir, 'fsa_description.arg') #
|
|
||||||
if str(dir).startswith('TaskH'):
|
if str(dir).startswith('TaskH'):
|
||||||
compilation_command = ['thraxcompiler', f'--input_grammar={Path(dir, "grammar.grm")}',
|
compilation_command = ['thraxcompiler', f'--input_grammar={Path(dir, "grammar.grm")}',
|
||||||
f'--output_far={Path(dir, "grammar.far")}']
|
f'--output_far={Path(dir, "grammar.far")}']
|
||||||
@ -41,7 +39,7 @@ def get_index():
|
|||||||
|
|
||||||
def is_task_set_correct(dir, task_set):
|
def is_task_set_correct(dir, task_set):
|
||||||
try:
|
try:
|
||||||
with open(Path(dir, f'{task_set}.out')) as f_out, open(Path(dir, f'{task_set}.exp')) as f_exp:
|
with open(Path(dir, f'{task_set}.out')) as f_exp, open(Path(dir, f'{task_set}.exp')) as f_out:
|
||||||
f_out_lines = ''.join(f_out.readlines())
|
f_out_lines = ''.join(f_out.readlines())
|
||||||
f_exp_lines = ''.join(f_exp.readlines())
|
f_exp_lines = ''.join(f_exp.readlines())
|
||||||
return f_out_lines == f_exp_lines
|
return f_out_lines == f_exp_lines
|
||||||
|
Loading…
Reference in New Issue
Block a user