123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869 |
- import pandas as pd
- # import numpy as np
- from pathlib import Path
class skr51_validation():
    """Validate booking rows against SKR51 filter lists and a plausibility matrix.

    On construction two semicolon-separated CSV files are read from
    ``current_dir``:

    * ``SKR51_Kostenrechnungsmerkmale.csv`` becomes ``self.filter``, a dict
      that maps every value of the ``Block`` column to the expanded whitelist
      of its ``Filter`` cell (see :meth:`create_list`).
    * ``Plausibilitaetsmatrix.csv`` becomes ``self.matrix``, a DataFrame with
      all columns read as text, a constant ``valid`` column set to ``True``
      and the columns ``Kostenstelle``, ``Absatzkanal`` and ``Kostenträger``
      expanded to lists of codes.

    The lower-case class name is kept as is so existing callers keep working.
    """

    # Default directory holding the input CSV files; also used by callers to
    # build output paths.
    current_dir = Path('C:/Projekte/Python/SKR51')

    def __init__(self, base_dir=None):
        """Load the filter lists and the plausibility matrix.

        Args:
            base_dir: Optional directory containing the CSV files. When given
                it replaces the class-level ``current_dir`` for this instance.
        """
        if base_dir is not None:
            self.current_dir = Path(base_dir)

        filter_csv = pd.read_csv(
            self.current_dir.joinpath('SKR51_Kostenrechnungsmerkmale.csv'),
            sep=';',
            quotechar='"',
        )
        filter_csv['Filter'] = filter_csv['Filter'].apply(self.create_list)
        self.filter = filter_csv.set_index('Block')['Filter'].to_dict()

        explode_cols = ['Kostenstelle', 'Absatzkanal', 'Kostenträger']
        matrix_csv = pd.read_csv(
            self.current_dir.joinpath('Plausibilitaetsmatrix.csv'),
            sep=';',
            # Pass the columns at positions 0-199 through ``str`` so every
            # value stays text exactly as written in the file.
            converters={i: str for i in range(0, 200)},
        )
        matrix_csv['valid'] = True
        for col in explode_cols:
            matrix_csv[col] = matrix_csv[col].apply(self.create_list)
        self.matrix = matrix_csv

    def create_list(self, whitelist):
        """Expand a comma-separated whitelist expression into a list of codes.

        Args:
            whitelist: Text such as ``'01,03-05'``. An empty or blank string,
                ``None`` or NaN (what pandas yields for an empty CSV cell)
                means "no restriction".

        Returns:
            A list of strings. Without a restriction this is ``'00'`` to
            ``'99'``. A token ``'a-b'`` is expanded to every integer from
            ``a`` to ``b`` inclusive, zero-padded to two digits. Any other
            token is kept as written, minus surrounding whitespace.

        Raises:
            ValueError: If a token contains ``'-'`` but its bounds are not
                integers.
        """
        if not isinstance(whitelist, str):
            if pd.isna(whitelist):
                whitelist = ''
            else:
                whitelist = str(whitelist)
        if whitelist.strip() == '':
            return [str(i).zfill(2) for i in range(0, 100)]

        result = []
        for token in whitelist.split(','):
            token = token.strip()
            if '-' in token:
                bounds = token.split('-')
                first, last = int(bounds[0]), int(bounds[1])
                result.extend(str(i).zfill(2) for i in range(first, last + 1))
            else:
                result.append(token)
        return result

    def check_bookings(self, bookings_file, encoding='ansi'):
        """Validate every row of a bookings CSV file.

        Args:
            bookings_file: File name relative to ``current_dir``. The file is
                semicolon-separated and read entirely as text.
            encoding: Text encoding of the file. The default ``'ansi'`` is a
                codec alias that Python only provides on Windows; pass e.g.
                ``'cp1252'`` or ``'utf-8'`` on other platforms.

        Returns:
            The bookings as a DataFrame with ``Konto_Nr_Händler`` moved to the
            first column and these boolean columns added:

            * ``Konto_Nr_valid``: the account number occurs in the matrix.
            * ``Marke_valid``, ``Standort_valid``: the value is contained in
              the matching filter list.
            * ``Kostenstelle_valid``, ``Absatzkanal_valid``,
              ``Kostenträger_valid``: the value is contained in the filter
              list and is listed for this ``Konto_Nr`` in the matrix.
            * ``valid``: logical AND of all checks above.
        """
        export_csv = pd.read_csv(
            self.current_dir.joinpath(bookings_file),
            sep=';',
            converters={i: str for i in range(0, 200)},
            decimal=',',
            encoding=encoding,
        )

        # De-duplicate the lookup so an account listed more than once in the
        # matrix cannot multiply booking rows in the left merge.
        known_accounts = self.matrix[['Konto_Nr', 'valid']].drop_duplicates()
        export_csv = export_csv.merge(
            known_accounts, how='left', on='Konto_Nr', suffixes=(None, '_matrix')
        )
        # Rows without a match carry NaN in 'valid'; the comparison turns the
        # column into a real boolean before it is combined with other checks.
        export_csv['Konto_Nr_valid'] = export_csv['valid'] == True
        export_csv['valid'] = export_csv['Konto_Nr_valid']

        # Move the dealer account number to the first column.
        temp = export_csv['Konto_Nr_Händler']
        export_csv.drop(['Konto_Nr_Händler'], axis=1, inplace=True)
        export_csv.insert(0, 'Konto_Nr_Händler', temp)

        for col in ['Marke', 'Standort']:
            export_csv[col + '_valid'] = export_csv[col].isin(self.filter[col])
            export_csv['valid'] = export_csv['valid'] & export_csv[col + '_valid']

        for col in ['Kostenstelle', 'Absatzkanal', 'Kostenträger']:
            # One row per allowed (Konto_Nr, code) pair; duplicates (e.g. from
            # overlapping whitelist entries) would duplicate booking rows.
            allowed = self.matrix[['Konto_Nr', col, 'valid']].explode(col).drop_duplicates()
            export_csv = export_csv.merge(
                allowed, how='left', on=['Konto_Nr', col], suffixes=(None, '_' + col)
            )
            # Parentheses are required: '&' binds tighter than '=='.
            in_matrix = export_csv['valid_' + col] == True
            export_csv[col + '_valid'] = export_csv[col].isin(self.filter[col]) & in_matrix
            export_csv.drop(['valid_' + col], axis=1, inplace=True)
            export_csv['valid'] = export_csv['valid'] & export_csv[col + '_valid']
        return export_csv

    @staticmethod
    def format_konto(konto):
        """Join the six account components of ``konto`` with ``'-'``.

        Args:
            konto: Mapping-like object indexable by the keys ``Kontonummer``,
                ``Marke``, ``Standort``, ``Kostenstelle``, ``Absatzkanal`` and
                ``Kostentraeger``.

        Returns:
            The formatted account string.
        """
        return f"{konto['Kontonummer']}-{konto['Marke']}-{konto['Standort']}-{konto['Kostenstelle']}-{konto['Absatzkanal']}-{konto['Kostentraeger']}"

    @staticmethod
    def format_konto_neu(konto):
        """Join the six ``*_neu`` account components of ``konto`` with ``'-'``.

        Args:
            konto: Mapping-like object indexable by the keys
                ``Kontonummer_neu``, ``Marke_neu``, ``Standort_neu``,
                ``Kostenstelle_neu``, ``Absatzkanal_neu`` and
                ``Kostentraeger_neu``.

        Returns:
            The formatted account string.
        """
        return f"{konto['Kontonummer_neu']}-{konto['Marke_neu']}-{konto['Standort_neu']}-{konto['Kostenstelle_neu']}-{konto['Absatzkanal_neu']}-{konto['Kostentraeger_neu']}"
if __name__ == '__main__':
    # Script entry point: validate the combined chart-of-accounts export and
    # write the selected columns to a semicolon-separated report file.
    validator = skr51_validation()
    checked = validator.check_bookings('Kontenrahmen_kombiniert.csv')

    # Columns written to the report, in output order. 'Kostenträger_Ebene' is
    # not created by check_bookings -- presumably it comes from the input
    # file; verify against the export.
    report_columns = [
        'Konto_Nr_Händler',
        'Marke', 'Marke_valid',
        'Standort', 'Standort_valid',
        'Konto_Nr', 'Konto_Nr_valid',
        'Kostenstelle', 'Kostenstelle_valid',
        'Absatzkanal', 'Absatzkanal_valid',
        'Kostenträger', 'Kostenträger_valid',
        'Kostenträger_Ebene',
        'valid',
    ]
    report_path = validator.current_dir.joinpath('SKR51_Validierung.csv')
    checked[report_columns].to_csv(report_path, sep=';', encoding='ansi', index=False)
|