# c11_admin.py (14 KB)
import base64
import itertools
import json
import os
import re
import time

import jinja2
import requests
from bs4 import BeautifulSoup
from requests_toolbelt.multipart import decoder

from xml_prettify import prettify_xml
  11. class ca_webscraper:
  12. webservice = "http://localhost:9300/bi/"
  13. templates_dir = "tools/cognos11/templates"
  14. # templates_dir = "C:/GlobalCube/Tasks/gctools/templates"
  15. export_dir = "C:/GlobalCube/ReportOutput"
  16. log_dir = "C:/GlobalCube/Tasks/gctools/logs"
  17. credentials = '{"parameters":[{"name":"CAMNamespace","value":"CognosEx"},{"name":"h_CAM_action","value":"logonAs"},{"name":"CAMUsername","value":"Global1"},{"name":"CAMPassword","value":"Cognos#11"}]}'
  18. headers = {}
  19. caf = ""
  20. cam = ""
  21. auth_token = ""
  22. def __init__(self):
  23. self._env = jinja2.Environment(
  24. loader=jinja2.FileSystemLoader(self.templates_dir),
  25. autoescape=jinja2.select_autoescape(['html', 'xml'])
  26. )
  27. self.template = self._env.get_template('get_report.xml')
  28. @staticmethod
  29. def generate_token(message_base64):
  30. version = "V1".encode("utf-8")
  31. header_len = 4
  32. msg = base64.b64decode(message_base64)[1:]
  33. chunks = []
  34. while len(msg) >= header_len:
  35. chunk_len = int.from_bytes(msg[:header_len], byteorder="little")
  36. msg = msg[header_len:]
  37. chunks.append(msg[:chunk_len])
  38. msg = msg[chunk_len:]
  39. return base64.b64encode(version + chunks[-1]).decode("utf-8")
  40. def login(self):
  41. self.session = requests.Session()
  42. r = self.session.get(self.webservice)
  43. self.headers = {'Content-Type': "application/json; charset=UTF-8", 'X-XSRF-TOKEN': self.session.cookies.get('XSRF-TOKEN')}
  44. r = self.session.post(self.webservice + "v1/login", data=self.credentials, headers=self.headers)
  45. self.caf = r.json()['cafContextId']
  46. self.cam = self.generate_token(r.cookies["usersessionid"])
  47. return r.status_code
  48. def report_list(self):
  49. # "v1/objects/_dot_public_folders/items"
  50. filter = "type|analysis|interactiveReport|powerPlayReport|powerPlay8Report|powerPlay8ReportView|query|report|reportTemplate"
  51. res = self.session.get(
  52. self.webservice + "v1/search/cm?fields=defaultName|id|ancestors&results=1000&query=.&hide_internal=all&filter=" + filter,
  53. headers=self.headers
  54. )
  55. # print(res.content)
  56. filename = self.log_dir + '/reports_error.log'
  57. os.makedirs(os.path.dirname(filename), exist_ok=True)
  58. with open(filename, "wb") as f:
  59. f.write(res.content)
  60. self.reports = res.json()['results']
  61. for r in self.reports:
  62. r['path'] = "/".join([a['defaultName'].replace('/', '_') for a in r['ancestors']])
  63. r['name'] = r['defaultName']
  64. del(r['ancestors'])
  65. del(r['defaultName'])
  66. filename = self.log_dir + '/config/reports.json'
  67. os.makedirs(os.path.dirname(filename), exist_ok=True)
  68. json.dump(self.reports, open(filename, 'w'), indent=2)
  69. return self.reports
  70. def export_folder(self, folder, format='PDF'):
  71. reports = [r for r in self.reports if r['path'].startswith(folder)]
  72. for r in reports:
  73. print(r['name'])
  74. # continue
  75. path = r['path'].replace(folder, '')
  76. r['filename'] = f"{path}/{r['name']}.pdf"
  77. r['params'] = list(re.findall(r'\[([^\]]+)\]', r['filename']))
  78. for i, p in enumerate(r['params']):
  79. r['filename'] = r['filename'].replace('[' + p + ']', '{' + str(i) + '}')
  80. self.export(r, format)
  81. def export(self, report, format='XML'):
  82. headers = {
  83. 'Content-Type': 'text/xml; charset=UTF-8',
  84. 'X-XSRF-TOKEN': self.headers['X-XSRF-TOKEN'],
  85. 'X-RsCMStoreID': report['id'],
  86. 'X-UseRsConsumerMode': 'true',
  87. 'SOAPAction': 'http://www.ibm.com/xmlns/prod/cognos/reportService/202004/'
  88. }
  89. soap = self.template.render({"caf": self.caf, "cam": self.cam,
  90. "report": report, "format": 'XHTML',
  91. "prompt": 'true', "tracking": "", "params": {}})
  92. r = None
  93. while r is None or r.status_code == 500:
  94. r = self.session.post(self.webservice + 'v1/reports', data=soap, headers=headers)
  95. time.sleep(2)
  96. parts = decoder.MultipartDecoder.from_response(r).parts
  97. self.auth_token = re.findall(
  98. r'<bus:authenticityToken xsi:type="xs:base64Binary">(.*)</bus:authenticityToken>',
  99. parts[0].text)[0]
  100. # for i, p in enumerate(parts):
  101. # with open(f"export/{report['report']}_{i}.xml", "w") as f:
  102. # f.write(p.text.replace('\x81', ''))
  103. meta = {'required': {}, 'optional': {}}
  104. bs = BeautifulSoup(parts[1].content, 'lxml')
  105. # print(bs.prettify())
  106. for sv in bs.find_all('selectvalue'):
  107. k = sv['parameter']
  108. req = 'required' if sv['required'] == 'true' else 'optional'
  109. v = dict([(opt['usevalue'], opt['displayvalue']) for opt in sv.find_all('selectoption')])
  110. meta[req][k] = v
  111. for sv in bs.find_all('selectdate'):
  112. k = sv['parameter']
  113. req = 'required' if sv['required'] == 'true' else 'optional'
  114. v = dict([(opt['usevalue'], opt['displayvalue']) for opt in sv.find_all('selectoption')])
  115. meta[req][k] = v
  116. filename = self.log_dir + f"/config/{report['path']}/{report['name']}.json"
  117. os.makedirs(os.path.dirname(filename), exist_ok=True)
  118. json.dump(meta, open(filename, 'w'), indent=2)
  119. spec = parts[2].text
  120. if format == 'PDF':
  121. return self.export_pdf(report, meta)
  122. return self.export_unstubbed(report, spec)
  123. def export_unstubbed(self, report, spec):
  124. payload = json.dumps({'reportspec_stubbed': spec, 'storeid': report['id']})
  125. headers = {
  126. 'Content-Type': 'application/json; charset=UTF-8',
  127. 'X-XSRF-TOKEN': self.session.cookies.get('XSRF-TOKEN'),
  128. 'authenticityToken': self.auth_token,
  129. 'X-UseRsConsumerMode': 'true',
  130. 'cafContextId': self.caf
  131. }
  132. r = self.session.post(self.webservice + 'v1/reports/unstubreport', data=payload, headers=headers)
  133. unstubbed = json.loads(r.text)['reportspec_full']
  134. unstubbed = re.sub(r' iid="[^"]*"', '', unstubbed)
  135. bs = BeautifulSoup(unstubbed, 'xml')
  136. for xa in bs.find_all('XMLAttributes'):
  137. if (
  138. xa.find_all('XMLAttribute', {'name': 'RS_dataType'}) or
  139. xa.find_all('XMLAttribute', {'name': 'RS_CreateExtendedDataItems'}) or
  140. xa.find_all('XMLAttribute', {'name': 'RS_legacyDrillDown'})
  141. ):
  142. continue
  143. if xa.find_all('XMLAttribute', {'name': 'supportsDefaultDataFormatting'}):
  144. for xa2 in xa.find_all('XMLAttribute'):
  145. if xa2.attrs['name'] != 'supportsDefaultDataFormatting':
  146. xa2.decompose()
  147. continue
  148. xa.decompose()
  149. for cti in bs.find_all('crosstabIntersection'):
  150. if len(list(cti.children)) == 0:
  151. cti.decompose()
  152. unstubbed_report = str(bs).replace("'", '&apos;')
  153. unstubbed_report = prettify_xml(unstubbed_report)
  154. filename = self.log_dir + f"/config/{report['path']}/{report['name']}.xml"
  155. os.makedirs(os.path.dirname(filename), exist_ok=True)
  156. with open(filename, "w") as f:
  157. f.write(unstubbed_report)
  158. return unstubbed_report
  159. def export_pdf(self, report, meta):
  160. headers = {
  161. 'Content-Type': 'text/xml; charset=UTF-8',
  162. 'X-XSRF-TOKEN': self.headers['X-XSRF-TOKEN'],
  163. 'X-RsCMStoreID': report['id'],
  164. 'X-UseRsConsumerMode': 'true',
  165. 'SOAPAction': 'http://www.ibm.com/xmlns/prod/cognos/reportService/202004/'
  166. }
  167. if len(report['params']) == 0:
  168. params = {}
  169. filename = report['filename']
  170. self.request_file(report, headers, params, filename)
  171. return True
  172. if len(report['params']) == 1:
  173. params = {}
  174. filename = report['filename'].format('1')
  175. self.request_file(report, headers, params, filename)
  176. key1 = report['params'][0]
  177. for k1, v1 in meta['optional'][key1].items():
  178. filename = report['filename'].format(v1)
  179. params = {key1: {k1: v1}}
  180. self.request_file(report, headers, params, filename)
  181. return True
  182. if len(report['params']) == 2:
  183. key1, key2 = report['params']
  184. for k1, v1 in meta['optional'][key1].items():
  185. for k2, v2 in meta['optional'][key2].items():
  186. filename = report['filename'].format(v1, v2)
  187. params = {key1: {k1: v1}, key2: {k2: v2}}
  188. self.request_file(report, headers, params, filename)
  189. return True
  190. def request_file(self, report, headers, params, filename):
  191. soap = self.template.render({"caf": self.caf, "cam": self.cam,
  192. "report": report, "format": 'PDF',
  193. "prompt": 'false', "tracking": "", "params": params}).encode("utf-8")
  194. try:
  195. r = self.session.post(self.webservice + 'v1/reports', data=soap, headers=headers)
  196. except UnicodeEncodeError:
  197. filename = self.log_dir + '/' + os.path.basename(filename) + '.log'
  198. os.makedirs(os.path.dirname(filename), exist_ok=True)
  199. with open(filename, "w") as f:
  200. f.write(soap)
  201. return False
  202. if r.status_code == 200:
  203. parts = decoder.MultipartDecoder.from_response(r).parts
  204. filename = self.export_dir + filename
  205. os.makedirs(os.path.dirname(filename), exist_ok=True)
  206. with open(filename, "wb") as f:
  207. f.write(parts[1].content)
  208. else:
  209. filename = self.log_dir + '/' + os.path.basename(filename) + '.log'
  210. os.makedirs(os.path.dirname(filename), exist_ok=True)
  211. with open(filename, "wb") as f:
  212. f.write(r.content)
  213. return True
  214. def admin(self):
  215. r = self.session.get(self.webservice + "v1/disp?m_p_owner=&changed_m_p_owner=0&changed_genprop=0&so.select=&so.return.m=portal%2Fproperties_general.xts&so.defaultLocation=&so.defaultObject=&ro_name=false&origDefLang=de&m_email=&m_defaultName=&m_t_default_name_de=CARLO_F_Belege&m_t_default_description_de=&m_t_default_screenTip_de=&ifrmcmd=save&m_p_disabled=false&m_p_hidden=false&icon_radio=standard&m_transloc=de&pty_activeLang=de&pty_deactivLang=&pty_del=&pty_add=&pty_name=CARLO_F_Belege&pty_scrt=&pty_desc=&m_new_class=&b_action=xts.run&sharedPagesChanged=&from_tool=true&backURL=%2Fbi%2Fv1%2Fdisp%3Fb_action%3Dxts.run%26m%3Dportal%2Flegacy_tools%2Ftools_directory.xts%26m_pathID%3Di339AF66BADEC411E943590402582B75B%26m_path%3DCAMID%28%2522%253a%2522%29%252fdataSource%255b%2540name%253d%2527CARLO_F_Belege%2527%255d%26tool_tab%3Dd&m_selectedPage=&m_classSubtype=&m_obj=CAMID%28%22%3A%22%29%2FdataSource%5B%40name%3D%27CARLO_F_Belege%27%5D%2FdataSourceConnection%5B%40name%3D%27CARLO_F_Belege%27%5D&b_report_type=&encoding=UTF-8&m=portal%2Fproperties_connection.xts&m_class=dataSourceConnection&m_name=CARLO_F_Belege&ui.cafcontextid=CAFW000000a0Q0FGQTYwMDAwMDAwMDlBaFFBQUFERWpZV1g4bEExbmlJd29ualF1cEgwWVVTeGtnY0FBQUJUU0VFdE1qVTJJQUFBQUxha3gqeHQ5TXN3Ukw2dGhjMTJVRzN1NVhaMWVzNU5FLXRvWXI1VzlwYTE0NDI0NzN8cHM_&m_path=CAMID%28%22%3A%22%29%2FdataSource%5B%40name%3D%27CARLO_F_Belege%27%5D&cmd=&m_location=&reportLocation=&ps_nav_op=maintain&ps_nav_stack=&ps_nav_source=portal%2Fproperties_general.xts")
  216. print(r.cookies.keys())
  217. # CRN=http%3A%2F%2Fdeveloper.cognos.com%2Fceba%2Fconstants%2FbiDirectionalOptionEnum%23biDirectionalFeaturesEnabled%3Dfalse%26http%3A%2F%2Fdeveloper.cognos.com%2Fceba%2Fconstants%2FsystemOptionEnum%23accessibilityFeatures%3Dfalse%26skin%3Dcorporate%26contentLocale%3Dde-de%26showHiddenObjects%3Dfalse%26showWelcomePage%3Dtrue%26backgroundSessionLogging%3D1970-01-01%2B00%253A00%253A00%26showOptionSummary%3Dtrue%26productLocale%3Dde%26listViewSeparator%3Dnone%26showHints%3DhideAll%26timeZoneID%3DEurope%252FBerlin%26linesPerPage%3D15%26displayMode%3Dlist%26automaticPageRefresh%3D30%26format%3DHTML%26columnsPerPage%3D3%26;
  218. # cea-ssa=false;
  219. # userCapabilities=f%3Bfdbffc6d%3Bf07c1faf%3Bff27defa%26AwcAAABTSEEtMjU2FAAAAMSNhZfyUDWeIjCieNC6kfRhRLGSDPui1gb2UKZPMWVW5x3QHrHM%2BIVk5gFTzsNq1oOMioU%3D;
  220. # userCapabilitiesEx=603%3Bf%3Bfdbffc6d%3Bf07c1faf%3Bff27defa%26AhQAAADEjYWX8lA1niIwonjQupH0YUSxkgcAAABTSEEtMjU2IAAAAMI%2BRz7opwjhYGXonwHJpD3Ya1agg0lFOa1JK%2FkZiDTS;
  221. # caf=CAFW000000e0Q0FGQTYwMDAwMDAwM2FBaFFBQUFERWpZV1g4bEExbmlJd29ualF1cEgwWVVTeGtnY0FBQUJUU0VFdE1qVTJJQUFBQUY3d3JJLW1zREhXcnQtT0VWLUhhKjF0c01TZFVrWlB0aXNYdEVJOUcqZm40NDI0NzN8MTAxOjc5ZTJiNDdhLTIyNjgtZDcxYS1jMGIxLWYwMDYyY2QxYWQwZTozNDAxNTQ5MzI1;
  222. # cc_session=s_cc:|s_conf:na|s_sch:td|s_hd:sa|s_serv:na|s_disp:na|s_set:|s_dep:na|s_dir:na|s_sms:dd|s_ct:sa|s_cs:sa|s_so:sa|e_hp:CAMID(*22CognosEx*3au*3auid*3dglobal1*22)|e_proot:Team*20Content|prootid:i1F610DE4196544319A27C5709282EF95|e_mroot:Eigene*20Ordner|mrootid:iBAA3C16EC2D743B7B221BBFCDBC625D7|e_mrootpath:CAMID(*22CognosEx*3au*3auid*3dglobal1*22)*2ffolder*5b*40name*3d*27Eigene*20Ordner*27*5d|e_user:Global*20Cube|e_tenantID:|e_tenantDisplayName:|e_showTenantInfo:false|e_isSysAdmin:true|e_isTenantAdmin:false|e_isImpersonating:false|cl:de-de|dcid:i1F610DE4196544319A27C5709282EF95|show_logon:false|uig:|ui:|rsuiprofile:all|lch:f|lca:f|ci:f|write:true|eom:0|pp:3401549325;
  223. # up=H4sIAAAAAAAAAFWQ204CMRCGX4X0GuIuF5rlDgXEBBQUgxIT0sOwW2k7mx4UNL67sxgRk0ma+Tr5+nc+WdQWVujgZsB6bJg81vBydgneaMfaLGzp6LFHF8E7qCw0cIPe8kh4vJhOqBdcbkuPyakHCEGjm2BZalfSRF5cZJ0sp2plWe9QjbXC97F2MdBEpRX0jSGaAvhbboHgtUHBTU4w7usGcCnJHwlUaGHGywZSR7x5Umij434EPCYPZN1wE6DNdOg7dHuL6Y/VHlWScYKSm0ai4BhIKXB34hVkPFEomtnNu4UTtvi4fyrP1aLO+XJerLq7t2c7CtP5ek0Kae0MfeTmJ5jQA+3JRNvg5jfY0HFhQB3lCjY8mfjv062rJJpIEmnn7jRn5xBV8AAL2MWjnu76KSL7+gaz/bFgzAEAAA==;
  224. # MRUStorage=%7B%22xQ29nbm9zRXg6dTp1aWQ9Z2xvYmFsMQ__%22%3Atrue%7D;
  225. # usersessionid=AggAAADOAvteAAAAAAoAAAAPMXuCsi7eLj2GFAAAAMSNhZfyUDWeIjCieNC6kfRhRLGSBwAAAFNIQS0yNTYgAAAAxhTjzCpYnRF3ryJ/z/gpU9G5UeFYyp1vKc/PjuCT/r4=;
  226. # cam_passport=MTsxMDE6NzllMmI0N2EtMjI2OC1kNzFhLWMwYjEtZjAwNjJjZDFhZDBlOjM0MDE1NDkzMjU7MDszOzA7
  227. if __name__ == '__main__':
  228. caws = ca_webscraper()
  229. caws.login()
  230. caws.report_list()
  231. caws.export_folder('Team Content/Verkauf/1. Gesamtverkauf', 'XML')