Anpassungen und Verbesserungen
This commit is contained in:
10
src/step2.py
10
src/step2.py
@@ -3,7 +3,7 @@ import pandas as pd
|
||||
from Levenshtein import distance
|
||||
|
||||
|
||||
def compare_data(new, sys, count_test, path):
|
||||
def compare_data(new, sys, count_test, path, school):
|
||||
print(f"\nEinträge in System Liste: {len(sys)}")
|
||||
print(f"Einträge in Import Liste: {len(new)}")
|
||||
|
||||
@@ -12,8 +12,8 @@ def compare_data(new, sys, count_test, path):
|
||||
if bool_class:
|
||||
if 'index' in new.columns:
|
||||
new = new.drop('index', axis=1)
|
||||
unique_classes(new)
|
||||
unique_classes(sys)
|
||||
unique_classes(new, school)
|
||||
unique_classes(sys, school)
|
||||
sys = sys.drop(columns=['klasse'])
|
||||
merged_df = pd.merge(new[['name', 'vorname', 'klasse']], sys, on=['name', 'vorname'], how='outer', indicator=True)
|
||||
matches = pd.merge(new, sys, on=['name', 'vorname'])
|
||||
@@ -47,11 +47,11 @@ def search_typos(new, sys):
|
||||
print('Mögliche Tippfehler: keine Fehler gefunden!')
|
||||
|
||||
|
||||
def unique_classes(df):
|
||||
def unique_classes(df, school):
|
||||
df['klasse'] = df['klasse'].str.split(',')
|
||||
df = df.explode('klasse')
|
||||
eindeutige_klassen = df['klasse'].unique()
|
||||
with open('./output/klassen.txt', 'a') as file:
|
||||
with open(f'./Data/{school}/gen_klassen.txt', 'a') as file:
|
||||
file.write(np.array_str(eindeutige_klassen))
|
||||
# print(eindeutige_klassen)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user