2022-05-19 18:15:11 +02:00
|
|
|
from typing import Generator, Any
|
2022-05-17 22:16:45 +02:00
|
|
|
from random import randint
|
|
|
|
|
|
|
|
import pandas as pd
|
|
|
|
|
|
|
|
from .exceptions import InvalidNameOrTypeHeaderException
|
|
|
|
from ..students.models import Student
|
|
|
|
|
|
|
|
|
2022-05-19 18:15:11 +02:00
|
|
|
def check_columns(df: pd.DataFrame) -> bool:
    """Return whether *df* has exactly the expected columns with expected dtypes.

    The frame must contain the columns NAZWISKO, IMIE, INDEKS, PESEL and
    EMAIL -- no more, no fewer -- and the string form of each column's dtype
    must start with the prefix listed for it below.

    Args:
        df: The DataFrame to validate.

    Returns:
        True when the header set and every column dtype match, else False.
        A missing required column yields False rather than a KeyError.
    """
    # Column name -> required prefix of str(dtype); 'int' matches int32/int64.
    expected_types = {
        'NAZWISKO': 'object',
        'IMIE': 'object',
        'INDEKS': 'int',
        'PESEL': 'float64',
        'EMAIL': 'object',
    }

    # Require an exact match: checking only for *extra* headers would let a
    # frame with a missing column through and fail later on the dtype lookup.
    if set(df.columns) != set(expected_types):
        return False

    dtypes = df.dtypes
    return all(
        str(dtypes[name]).startswith(prefix)
        for name, prefix in expected_types.items()
    )
|
|
|
|
|
|
|
|
|
2022-06-12 19:01:16 +02:00
|
|
|
def parse_csv(file, mode) -> Generator[Student, Any, None]:
    """Read a CSV of students and lazily build a Student for each row.

    The CSV is loaded eagerly with ``pd.read_csv``; the Student objects are
    created lazily as the returned generator is consumed.

    Args:
        file: Anything accepted by ``pd.read_csv`` (path or file-like object).
            The data must provide the columns NAZWISKO, IMIE, INDEKS, PESEL
            and EMAIL.
        mode: Passed unchanged to every ``Student`` as its ``mode`` argument.

    Returns:
        A generator yielding one ``Student`` per CSV row, in file order.
    """
    df = pd.read_csv(file)

    # Header/dtype validation is currently disabled, as it was before:
    # if not check_columns(df):
    #     raise InvalidNameOrTypeHeaderException

    return (
        Student(
            last_name=row['NAZWISKO'],
            # Previously read from 'NAZWISKO', which duplicated the last name.
            first_name=row['IMIE'],
            index=row['INDEKS'],
            # A missing PESEL becomes ''; otherwise the value is passed through
            # int() so that a float such as 123.0 is stored as '123'.
            pesel='' if pd.isna(row['PESEL']) else str(int(row['PESEL'])),
            email=row['EMAIL'],
            mode=mode,
        )
        for _, row in df.iterrows()
    )
|