#****************************************************************
# Licensed Materials - Property of IBM
# IBM Cognos Products: Flint
#
# (C) Copyright IBM Corp. 2018, 2018
#
# US Government Users Restricted Rights -
# Use, duplication or disclosure restricted by GSA ADP Schedule
# Contract with IBM Corp.
#*****************************************************************
# Configuration for the JMX Prometheus Exporter Java Agent
#
# How the entries below are read (per the jmx_exporter rule format):
#   - `pattern` is a regex tested against each MBean attribute, rendered as
#     domain<key=value, ...><>attribute: value
#   - `$N` in `name` and in `labels` values is replaced by the pattern's
#     Nth capture group.
#   - Rules are tried top to bottom and processing stops at the first
#     match, so the order of the entries matters.
rules:
  # System CPU load reported by JVM.
  - pattern: "java\\.lang<type=OperatingSystem><>SystemCpuLoad:"
    name: jvm_cpu_system_load
  # Process CPU load reported by JVM.
  - pattern: "java\\.lang<type=OperatingSystem><>ProcessCpuLoad:"
    name: jvm_cpu_process_load
  # These come from the master
  # Example: master.aliveWorkers
  - pattern: "metrics<name=master\\.(.*)><>(.*):"
    name: spark_master_$1_$2
  # These come from the worker
  # Example: worker.coresFree
  - pattern: "metrics<name=worker\\.(.*)><>(.*):"
    name: spark_worker_$1_$2
  # These come from the application driver
  # Example: app-20160809000059-0000.driver.DAGScheduler.stage.failedStages
  - pattern: "metrics<name=(.*)\\.driver\\.(DAGScheduler|BlockManager)\\.(.*)><>(.*):"
    name: spark_driver_$2_$3_$4
    labels:
      app_id: "$1"
  # These come from the FlintServer running in application driver
  # Example: app-20160809000059-0000.driver.FlintServer.UserMetrics.request.TOUCH_DATASET.duration_millis
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.request\\.(.*)\\.(.*)><>(.*):"
    name: spark_driver_FlintServer_request_$3_$4
    labels:
      app_id: "$1"
      request_type: "$2"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.transport\\.(.*)><>(.*):"
    name: spark_driver_FlintServer_transport_$2_$3
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.dataset\\.(.*)><>(.*):"
    name: spark_driver_FlintServer_dataset_$2_$3
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.query\\.(.*)><>(.*):"
    name: spark_driver_FlintServer_query_$2_$3
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.wlm\\.under_pressure><>(.*):"
    name: spark_driver_FlintServer_wlm_under_pressure_$2
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.wlm\\.pool\\.(.*)\\.(.*)><>(.*):"
    name: spark_driver_FlintServer_wlm_pool_$3_$4
    labels:
      app_id: "$1"
      permit_pool: "$2"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.memory\\.max_off_heap_bytes><>(.*):"
    name: spark_driver_FlintServer_memory_max_off_heap_bytes_$2
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.memory\\.max_off_heap_storage_bytes><>(.*):"
    name: spark_driver_FlintServer_memory_max_off_heap_storage_bytes_$2
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.memory\\.max_on_heap_storage_bytes><>(.*):"
    name: spark_driver_FlintServer_memory_max_on_heap_storage_bytes_$2
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.memory\\.used_storage_bytes><>(.*):"
    name: spark_driver_FlintServer_memory_used_storage_bytes_$2
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.memory\\.used_execution_bytes><>(.*):"
    name: spark_driver_FlintServer_memory_used_execution_bytes_$2
    labels:
      app_id: "$1"
  - pattern: "metrics<name=(.*)\\.driver\\.FlintServer\\.UserMetrics\\.memory\\.pool\\.(.*)\\.(.*)><>(.*):"
    name: spark_driver_FlintServer_memory_pool_$3_$4
    labels:
      app_id: "$1"
      mem_pool: "$2"
  # These come from the application driver if it's a streaming application
  # Example: app-20160809000059-0000.driver.com.example.ClassName.StreamingMetrics.streaming.lastCompletedBatch_schedulingDelay
  - pattern: "metrics<name=(.*)\\.driver\\.(.*)\\.StreamingMetrics\\.streaming\\.(.*)><>(.*):"
    name: spark_streaming_driver_$3_$4
    labels:
      app_id: "$1"
      app_name: "$2"
  # These come from the application driver if it's a structured streaming application
  # Example: app-20160809000059-0000.driver.spark.streaming.QueryName.inputRate-total
  - pattern: "metrics<name=(.*)\\.driver\\.spark\\.streaming\\.(.*)\\.(.*)><>(.*):"
    name: spark_structured_streaming_driver_$3_$4
    labels:
      app_id: "$1"
      query_name: "$2"
  # These come from the application executors
  # Example: app-20160809000059-0000.0.executor.threadpool.activeTasks
  - pattern: "metrics<name=(.*)\\.(.*)\\.executor\\.(.*)><>(.*):"
    name: spark_executor_$3_$4
    labels:
      app_id: "$1"
      executor_id: "$2"
  # These come from the master
  # Example: application.com.example.ClassName.1470700859054.cores
  - pattern: "metrics<name=application\\.(.*)\\.([0-9]+)\\.(.*)><>(.*):"
    name: spark_application_$3_$4
    labels:
      app_name: "$1"
      app_start_epoch: "$2"