Skip to content

Commit 2ee9f70

Browse files
authored
[GCP] Add ingest pipeline for dataproc (#4344)
1 parent 6adb710 commit 2ee9f70

3 files changed

Lines changed: 106 additions & 1 deletion

File tree

packages/gcp/changelog.yml

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,9 @@
11
# newer versions go on top
2+
- version: "2.11.10-beta.6"
3+
changes:
4+
- description: Add ingest pipeline for Dataproc metrics.
5+
type: enhancement
6+
link: https://github.com/elastic/integrations/pull/4344
27
- version: "2.11.10-beta.5"
38
changes:
49
- description: Add GCP loadbalancing ingest pipeline
Lines changed: 100 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,100 @@
---
# Ingest pipeline for GCP Dataproc metrics.
#
# Each `rename` below moves one metric from the `gcp.metrics.*` namespace to
# the matching path under `gcp.dataproc.*`. Every rename sets
# `ignore_missing: true`, so a document that lacks a given metric passes
# through that processor unchanged. The final `remove` drops `gcp.metrics`.
description: Pipeline for parsing GCP Dataproc metrics.
processors:
  # --- Batch: Spark executors ---
  - rename:
      field: gcp.metrics.batch.spark.executors.count
      target_field: gcp.dataproc.batch.spark.executors.count
      ignore_missing: true

  # --- Cluster: HDFS ---
  - rename:
      field: gcp.metrics.cluster.hdfs.datanodes.count
      target_field: gcp.dataproc.cluster.hdfs.datanodes.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.hdfs.storage_capacity.value
      target_field: gcp.dataproc.cluster.hdfs.storage_capacity.value
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.hdfs.storage_utilization.value
      target_field: gcp.dataproc.cluster.hdfs.storage_utilization.value
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.hdfs.unhealthy_blocks.count
      target_field: gcp.dataproc.cluster.hdfs.unhealthy_blocks.count
      ignore_missing: true

  # --- Cluster: job counters ---
  - rename:
      field: gcp.metrics.cluster.job.failed.count
      target_field: gcp.dataproc.cluster.job.failed.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.job.running.count
      target_field: gcp.dataproc.cluster.job.running.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.job.submitted.count
      target_field: gcp.dataproc.cluster.job.submitted.count
      ignore_missing: true

  # --- Cluster: operation counters ---
  - rename:
      field: gcp.metrics.cluster.operation.failed.count
      target_field: gcp.dataproc.cluster.operation.failed.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.operation.running.count
      target_field: gcp.dataproc.cluster.operation.running.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.operation.submitted.count
      target_field: gcp.dataproc.cluster.operation.submitted.count
      ignore_missing: true

  # --- Cluster: YARN ---
  - rename:
      field: gcp.metrics.cluster.yarn.allocated_memory_percentage.value
      target_field: gcp.dataproc.cluster.yarn.allocated_memory_percentage.value
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.yarn.apps.count
      target_field: gcp.dataproc.cluster.yarn.apps.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.yarn.containers.count
      target_field: gcp.dataproc.cluster.yarn.containers.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.yarn.memory_size.value
      target_field: gcp.dataproc.cluster.yarn.memory_size.value
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.yarn.nodemanagers.count
      target_field: gcp.dataproc.cluster.yarn.nodemanagers.count
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.yarn.pending_memory_size.value
      target_field: gcp.dataproc.cluster.yarn.pending_memory_size.value
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.yarn.virtual_cores.count
      target_field: gcp.dataproc.cluster.yarn.virtual_cores.count
      ignore_missing: true

  # --- Cluster: job timings ---
  - rename:
      field: gcp.metrics.cluster.job.completion_time.value
      target_field: gcp.dataproc.cluster.job.completion_time.value
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.job.duration.value
      target_field: gcp.dataproc.cluster.job.duration.value
      ignore_missing: true

  # --- Cluster: operation timings ---
  - rename:
      field: gcp.metrics.cluster.operation.completion_time.value
      target_field: gcp.dataproc.cluster.operation.completion_time.value
      ignore_missing: true
  - rename:
      field: gcp.metrics.cluster.operation.duration.value
      target_field: gcp.dataproc.cluster.operation.duration.value
      ignore_missing: true

  # Runs after all renames: discard the `gcp.metrics` object and anything
  # still left under it. `ignore_missing` keeps this a no-op when the field
  # is absent.
  - remove:
      ignore_missing: true
      field:
        - gcp.metrics

# Pipeline-level failure handler: copy the failure message reported by the
# ingest node into `error.message` on the document.
on_failure:
  - set:
      field: error.message
      value: '{{ _ingest.on_failure_message }}'

packages/gcp/manifest.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
name: gcp
22
title: Google Cloud Platform
3-
version: "2.11.10-beta.5"
3+
version: "2.11.10-beta.6"
44
release: ga
55
description: Collect logs from Google Cloud Platform with Elastic Agent.
66
type: integration

0 commit comments

Comments
 (0)