export_extf.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370
  1. import calendar
  2. import csv
  3. import hashlib
  4. import os
  5. import re
  6. import shutil
  7. from datetime import datetime, timedelta
  8. from pathlib import Path
  9. from typing import Any, Generator, Literal
  10. import pyodbc
  11. DSN = "dsn=GC_OPTIMA_64;uid=gaps;pwd=Gcbs12ma"
  12. class DatevConfig:
  13. base_dir: str = str(Path(__file__).resolve().parent)
  14. data_path: str = base_dir + "/data"
  15. export_path: str = base_dir + "/export/temp"
  16. translation_file: str = data_path + "/uebersetzungstabelle.csv"
  17. csv_date: datetime = datetime.now() # datetime(2023, 11, 20, 19, 2, 28, 714000)
  18. geschaeftsjahr_monat: int = 1
  19. periode: str = "202301"
  20. berater: int = 30612
  21. mandant: int = 10139
  22. konto_laenge: int = 5
  23. @property
  24. def datum_von(self) -> datetime:
  25. return datetime(int(self.periode[:4]), int(self.periode[4:]), 1)
  26. @property
  27. def datum_bis(self) -> datetime:
  28. year = int(self.periode[:4])
  29. month = int(self.periode[4:])
  30. end_of_month = calendar.monthrange(year, month)[1]
  31. return datetime(year, month, end_of_month)
  32. @property
  33. def geschaeftsjahr_beginn(self) -> datetime:
  34. year = int(self.periode[:4])
  35. if self.geschaeftsjahr_monat > datetime.now().month:
  36. year -= 1
  37. return datetime(year, self.geschaeftsjahr_monat, 1)
  38. @property
  39. def header2(self) -> str:
  40. res = [
  41. "Umsatz (ohne Soll/Haben-Kz)",
  42. "Soll/Haben-Kennzeichen",
  43. "WKZ Umsatz",
  44. "Kurs",
  45. "Basis-Umsatz",
  46. "WKZ Basis-Umsatz",
  47. "Konto",
  48. "Gegenkonto (ohne BU-Schlüssel)",
  49. "BU-Schlüssel",
  50. "Belegdatum",
  51. "Belegfeld 1",
  52. "Belegfeld 2",
  53. "Skonto",
  54. "Buchungstext",
  55. "Postensperre",
  56. "Diverse Adressnummer",
  57. "Geschäftspartnerbank",
  58. "Sachverhalt",
  59. "Zinssperre",
  60. "Beleglink",
  61. "Beleginfo - Art 1",
  62. "Beleginfo - Inhalt 1",
  63. "Beleginfo - Art 2",
  64. "Beleginfo - Inhalt 2",
  65. "Beleginfo - Art 3",
  66. "Beleginfo - Inhalt 3",
  67. "Beleginfo - Art 4",
  68. "Beleginfo - Inhalt 4",
  69. "Beleginfo - Art 5",
  70. "Beleginfo - Inhalt 5",
  71. "Beleginfo - Art 6",
  72. "Beleginfo - Inhalt 6",
  73. "Beleginfo - Art 7",
  74. "Beleginfo - Inhalt 7",
  75. "Beleginfo - Art 8",
  76. "Beleginfo - Inhalt 8",
  77. "KOST1 - Kostenstelle",
  78. "KOST2 - Kostenstelle",
  79. "Kost-Menge",
  80. "EU-Land u. UStID",
  81. "EU-Steuersatz",
  82. "Abw. Versteuerungsart",
  83. "Sachverhalt L+L",
  84. "Funktionsergänzung L+L",
  85. "BU 49 Hauptfunktionstyp",
  86. "BU 49 Hauptfunktionsnummer",
  87. "BU 49 Funktionsergänzung",
  88. "Zusatzinformation - Art 1",
  89. "Zusatzinformation- Inhalt 1",
  90. "Zusatzinformation - Art 2",
  91. "Zusatzinformation- Inhalt 2",
  92. "Zusatzinformation - Art 3",
  93. "Zusatzinformation- Inhalt 3",
  94. "Zusatzinformation - Art 4",
  95. "Zusatzinformation- Inhalt 4",
  96. "Zusatzinformation - Art 5",
  97. "Zusatzinformation- Inhalt 5",
  98. "Zusatzinformation - Art 6",
  99. "Zusatzinformation- Inhalt 6",
  100. "Zusatzinformation - Art 7",
  101. "Zusatzinformation- Inhalt 7",
  102. "Zusatzinformation - Art 8",
  103. "Zusatzinformation- Inhalt 8",
  104. "Zusatzinformation - Art 9",
  105. "Zusatzinformation- Inhalt 9",
  106. "Zusatzinformation - Art 10",
  107. "Zusatzinformation- Inhalt 10",
  108. "Zusatzinformation - Art 11",
  109. "Zusatzinformation- Inhalt 11",
  110. "Zusatzinformation - Art 12",
  111. "Zusatzinformation- Inhalt 12",
  112. "Zusatzinformation - Art 13",
  113. "Zusatzinformation- Inhalt 13",
  114. "Zusatzinformation - Art 14",
  115. "Zusatzinformation- Inhalt 14",
  116. "Zusatzinformation - Art 15",
  117. "Zusatzinformation- Inhalt 15",
  118. "Zusatzinformation - Art 16",
  119. "Zusatzinformation- Inhalt 16",
  120. "Zusatzinformation - Art 17",
  121. "Zusatzinformation- Inhalt 17",
  122. "Zusatzinformation - Art 18",
  123. "Zusatzinformation- Inhalt 18",
  124. "Zusatzinformation - Art 19",
  125. "Zusatzinformation- Inhalt 19",
  126. "Zusatzinformation - Art 20",
  127. "Zusatzinformation- Inhalt 20",
  128. "Stück",
  129. "Gewicht",
  130. "Zahlweise",
  131. "Forderungsart",
  132. "Veranlagungsjahr",
  133. "Zugeordnete Fälligkeit",
  134. "Skontotyp",
  135. "Auftragsnummer",
  136. "Buchungstyp",
  137. "Ust-Schlüssel (Anzahlungen)",
  138. "EU-Land (Anzahlungen)",
  139. "Sachverhalt L+L (Anzahlungen)",
  140. "EU-Steuersatz (Anzahlungen)",
  141. "Erlöskonto (Anzahlungen)",
  142. "Herkunft-Kz",
  143. "Leerfeld",
  144. "KOST-Datum",
  145. "Mandatsreferenz",
  146. "Skontosperre",
  147. "Gesellschaftername",
  148. "Beteiligtennummer",
  149. "Identifikationsnummer",
  150. "Zeichnernummer",
  151. "Postensperre bis",
  152. "Bezeichnung SoBil-Sachverhalt",
  153. "Kennzeichen SoBil-Buchung",
  154. "Festschreibung",
  155. "Leistungsdatum",
  156. "Datum Zuord.Steuerperiode",
  157. ]
  158. return ";".join(res)
  159. row_template = (
  160. '{0};"{1}";"{2}";;;"";"{9}";"{4}";"";{5};"{6}";"";;"{7}";;"";;;;"";"";'
  161. + '"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"{10}";"";;"";;"";;;;;;"";"";"";"";"";"";"";"";"";"";"";"";"";'
  162. + '"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";"";;;;"";;;;"";"";;"";;'
  163. + ';;"";"";;"";;"";;"";"";;"";;0;;'
  164. )
  165. # '592.80;H;EUR;"15800";90900;0101;6288;Opel Bank VoST 12/22 Lagerwag;1'
  166. @property
  167. def export_file(self) -> str:
  168. timestamp = self.csv_date.strftime("%Y%m%d_%H%M%S")
  169. period = self.datum_von.strftime("%Y%m")
  170. return f"{self.export_path}/EXTF_Buchungsstapel_30612_10139_{period}_{timestamp}.csv"
  171. @property
  172. def header(self) -> str:
  173. datev_header = {
  174. "Datev-Format-KZ": "EXTF",
  175. "Versionsnummer": 510,
  176. "Datenkategorie": 21,
  177. "Formatname": "Buchungsstapel",
  178. "Formatversion": 7,
  179. "Erzeugt_am": self.csv_date.strftime("%Y%m%d%H%M%S%f")[:-3],
  180. "Importiert_am": "",
  181. "Herkunftskennzeichen": "SV",
  182. "Exportiert_von": "dracar",
  183. "Importiert_von": "",
  184. "Berater": self.berater,
  185. "Mandant": self.mandant,
  186. "WJ-Beginn": self.geschaeftsjahr_beginn.strftime("%Y%m%d"),
  187. "Sachkontenlänge": self.konto_laenge,
  188. "Datum_von": self.datum_von.strftime("%Y%m%d"),
  189. "Datum_bis": self.datum_bis.strftime("%Y%m%d"),
  190. "Bezeichnung": "",
  191. "Diktatkürzel": "HE",
  192. "Buchungstyp": 1,
  193. "Rechnungslegungszweck": "",
  194. "Festschreibeinformation": 1,
  195. "WKZ": "",
  196. "reserviert_1": "",
  197. "Derivatskennzeichen": "",
  198. "reserviert_2": "",
  199. "reserviert_3": "",
  200. "SKR": "",
  201. "Branchenlösung-Id": "",
  202. "reserviert_4": "",
  203. "reserviert_5": "",
  204. "Anwendungsinformation": "",
  205. }
  206. template = (
  207. '"EXTF";{Versionsnummer};{Datenkategorie};"Buchungsstapel";{Formatversion};{Erzeugt_am};'
  208. + ';"SV";"dracar";"";{Berater};{Mandant};{WJ-Beginn};{Sachkontenlänge};{Datum_von};{Datum_bis};"";"HE";1;;1;"";;"";;;"";;;"";""'
  209. )
  210. return template.format(**datev_header)
  211. def get_translation(cfg: DatevConfig) -> dict[str, str]:
  212. translation = {}
  213. with Path(cfg.translation_file).open("r", encoding="latin-1") as frh:
  214. for line in csv.reader(frh, delimiter=";"):
  215. acct_no = line[0][:4] + "0"
  216. acct_details = "11" + line[0][11:].replace("-", "")
  217. translation[line[2]] = (acct_no, acct_details)
  218. return translation
  219. def from_database(period) -> Generator[list[str], Any, None]:
  220. with pyodbc.connect(DSN) as conn:
  221. cursor = conn.cursor()
  222. query = (
  223. "SELECT * FROM [import].[DATEV_Buchungsstapel] "
  224. + f"WHERE [BOOKKEEP_PERIOD] = '{period}' ORDER BY [BOOKKEEP_DATE], [UNIQUE_IDENT]"
  225. )
  226. cursor.execute(query)
  227. for row in cursor.fetchall():
  228. yield list(map(str, row[:9]))
  229. def from_csv(import_file) -> Generator[list[str], Any, None]:
  230. with import_file.open("r", encoding="latin-1") as frh:
  231. csv_reader = csv.reader(frh, delimiter=";")
  232. next(csv_reader) # ignore header
  233. for row in csv_reader:
  234. yield row
  235. def export_extf(period: str, import_method: Literal["csv", "db"] = "csv") -> None:
  236. cfg = DatevConfig()
  237. cfg.periode = period
  238. translation = get_translation(cfg)
  239. if import_method == "csv":
  240. import_file = Path(f"datev/data/{period}.csv")
  241. cfg.csv_date = datetime.fromtimestamp(import_file.stat().st_mtime)
  242. get_row = from_csv(import_file)
  243. else:
  244. get_row = from_database(cfg.periode)
  245. missing = []
  246. with Path(cfg.export_file).open("w", encoding="latin-1", newline="") as fwh:
  247. fwh.write(cfg.header + "\r\n")
  248. fwh.write(cfg.header2 + "\r\n")
  249. for row in get_row:
  250. row[0] = row[0].replace(".", ",")
  251. row.extend(translation.get(row[3], (row[3], "11000000")))
  252. if row[9] == row[3]:
  253. missing.append(row[3])
  254. fwh.write(cfg.row_template.format(*row) + "\r\n")
  255. # print(set(missing))
  256. def export_all_periods() -> None:
  257. dt = datetime.now()
  258. prev = str(dt.year - 1)
  259. periods = [f"{prev}{x:02}" for x in range(1, 13)] + [f"{dt.year}{x:02}" for x in range(1, dt.month + 1)]
  260. for p in periods:
  261. export_extf(p, "db")
  262. def extf_get_hash(filename):
  263. with open(filename, "r", encoding="latin-1") as frh1:
  264. frh1.readline() # ignore header
  265. data = frh1.read()
  266. return calculate_sha256(data)
  267. def extf_files_equal_content(file1, file2):
  268. with open(file1, "r", encoding="latin-1") as frh1:
  269. frh1.readline() # ignore header
  270. data1 = frh1.read()
  271. with open(file2, "r", encoding="latin-1") as frh2:
  272. frh2.readline() # ignore header
  273. data2 = frh2.read()
  274. print(calculate_sha256(data1))
  275. print(calculate_sha256(data2))
  276. return calculate_sha256(data1) == calculate_sha256(data2)
  277. def calculate_sha256(data) -> str:
  278. return hashlib.sha256(data.encode()).hexdigest()
  279. def test_content():
  280. print(
  281. extf_files_equal_content(
  282. "datev/export/EXTF_Buchungsstapel_30612_10139_202312_20240514_112734.csv",
  283. "datev/export/EXTF_Buchungsstapel_30612_10139_202312_20240514_112734.csv",
  284. )
  285. )
  286. print(
  287. extf_files_equal_content(
  288. "datev/export/EXTF_Buchungsstapel_30612_10139_202312_20240222_155629.csv",
  289. "datev/export/EXTF_Buchungsstapel_30612_10139_202312_20240514_112734.csv",
  290. )
  291. )
  292. print(
  293. extf_files_equal_content(
  294. "datev/export/EXTF_Buchungsstapel_30612_10139_202312_20240514_112734.csv",
  295. "datev/export/EXTF_Buchungsstapel_30612_10139_202312_20240515_104021.csv",
  296. )
  297. )
  298. def archive_files():
  299. last_week = (datetime.now() - timedelta(days=6)).timestamp()
  300. for file in Path("datev/export").glob("*.csv"):
  301. if file.stat().st_ctime < last_week:
  302. file.unlink()
  303. archive_path = Path("datev/export/Archiv")
  304. for file in Path("datev/export/temp").glob("*.csv"):
  305. p = re.search(r"_(\d{6})_", file.name)
  306. if not p:
  307. continue
  308. period = p[1]
  309. target = archive_path / period[:4] / period
  310. os.makedirs(target, exist_ok=True)
  311. file_hash = extf_get_hash(file)
  312. if has_identical_file(target, file_hash):
  313. file.unlink()
  314. continue
  315. shutil.copy(file, archive_path.parent / file.name)
  316. file.rename(target / file.name)
  317. def has_identical_file(target: Path, file_hash: str) -> bool:
  318. for archived_file in Path(target).glob("*.csv"):
  319. if extf_get_hash(archived_file) == file_hash:
  320. return True
  321. return False
  322. if __name__ == "__main__":
  323. export_all_periods()
  324. archive_files()
  325. # os.makedirs(Path(filename).parent.joinpath("info"), exist_ok=True)