# gchr_error.py (1.2 KB)
from pathlib import Path

import pandas as pd

  2. base_dir = '/home/robert/projekte/python/gcstruct/Siebrecht/'
  3. def read_csv():
  4. header = ['Kontonummer', 'Wert', 'Fehler', 'Beschreibung']
  5. df_log = pd.read_csv(base_dir + 'Siebrecht_12_2021.txt', decimal=',', sep='\t', encoding='latin-1',
  6. converters={0: str, 1: str, 2: str, 3: str}, header=None, names=header) # , skiprows=3)
  7. df_log['Marke_HBV'] = df_log['Kontonummer'].str.slice(4, 8)
  8. df_log['Site'] = df_log['Kontonummer'].str.slice(8, 10)
  9. df_log['Account'] = df_log['Kontonummer'].str.slice(0, 4)
  10. df_log['Origin'] = df_log['Kontonummer'].str.slice(10, 12)
  11. df_log['SalesChannel'] = df_log['Kontonummer'].str.slice(12, 14)
  12. df_log['CostCarrier'] = df_log['Kontonummer'].str.slice(14, 16)
  13. df_export = pd.read_csv(base_dir + 'export_2021-12.csv', sep=';', encoding='latin-1',
  14. converters={i: str for i in range(0, 200)})
  15. df = df_export.merge(df_log, how='left', on=['Marke_HBV', 'Site', 'Account', 'Origin', 'SalesChannel', 'CostCarrier'])
  16. df.to_csv(base_dir + 'export_error_2021-12.csv', decimal=',', sep=';', encoding='latin-1', index=False)
  17. if __name__ == '__main__':
  18. read_csv()