Skip to content

Commit ceb6139

Browse files
Felix Muellermohabusama
Felix Mueller
authored andcommitted
Allow sampling and redaction rules for Scalyr (zalando-incubator#62)
* Allow sampling and redaction rules for Scalyr This feature enables using sampling and redaction rules for Scalyr. More details about sampling_rules and redaction_rules can be found here: https://eu.scalyr.com/help/scalyr-agent * Updating requirements.txt * fixing flake8 errors * Updating readme * Updated README
1 parent ef0a769 commit ceb6139

File tree

6 files changed

+164
-7
lines changed

6 files changed

+164
-7
lines changed

README.rst

+23
Original file line numberDiff line numberDiff line change
@@ -321,6 +321,29 @@ The default parser for container logs is ``json`` parser. In some cases however
321321
322322
The value of ``kubernetes-log-watcher/scalyr-parser`` annotation should be a json serialized list. If ``container`` value did not match, then default parser is used (i.e. ``json``).
323323

324+
Scalyr sampling rules
325+
....................
326+
327+
Sampling rules enable to only ship a certain pattern that matches a regular expression and specified amount of log percentage to Scalyr. The example shows an expression that matches ``app-1`` and a match expression ``my-expression``. If it's met, only 10% of it will be shipped to Scalyr using a ``sampling_rate`` of ``0.1``.
328+
329+
.. code-block:: yaml
330+
331+
annotations:
332+
kubernetes-log-watcher/scalyr-sampling-rules: '[{"container": "app-1", "sampling-rules":[{ "match_expression": "my-expression", "sampling_rate": "0.1" }]}]'
333+
334+
335+
Scalyr log redaction
336+
....................
337+
338+
Redaction rules enable to avoid shipping sensitive data that shouldn't get transferred to Scalyr either getting fully removed from log files or to replace them with specific strings. The first example below shows how matches will be fully removed and the second shows how matches will be replaced with a different string.
339+
340+
.. code-block:: yaml
341+
342+
annotations:
343+
kubernetes-log-watcher/scalyr-redaction-rules: '[{"container": "app-1", "redaction-rules":[{ "match_expression": "my-expression" }]}]'
344+
kubernetes-log-watcher/scalyr-redaction-rules: '[{"container": "app-1", "redaction-rules":[{ "match_expression": "my-expression", "replacement": "replacement-expression" }]}]'
345+
346+
324347
AppDynamics configuration agent
325348
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
326349

kube_log_watcher/agents/scalyr.py

+61
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,12 @@
1515

1616
# If exists! we expect serialized json str: '[{"container": "my-container", "parser": "my-custom-parser"}]'
1717
SCALYR_ANNOTATION_PARSER = 'kubernetes-log-watcher/scalyr-parser'
18+
# If exists! we expect serialized json str:
19+
# '[{"container": "my-container", "sampling-rules":[{ "match_expression": "<expression here>",
20+
# "sampling_rate": "0" }]}]'
21+
SCALYR_ANNOTATION_SAMPLING_RULES = 'kubernetes-log-watcher/scalyr-sampling-rules'
22+
# '[{"container": "my-container", "redaction-rules":[{ "match_expression": "<expression here>" }]}]'
23+
SCALYR_ANNOTATION_REDACTION_RULES = 'kubernetes-log-watcher/scalyr-redaction-rules'
1824
SCALYR_DEFAULT_PARSER = 'json'
1925
SCALYR_DEFAULT_WRITE_RATE = 10000
2026
SCALYR_DEFAULT_WRITE_BURST = 200000
@@ -89,6 +95,8 @@ def add_log_target(self, target: dict):
8995
return
9096

9197
parser = SCALYR_DEFAULT_PARSER
98+
sampling_rules = None
99+
redaction_rules = None
92100

93101
annotations = target['kwargs'].get('pod_annotations', {})
94102
if annotations and SCALYR_ANNOTATION_PARSER in annotations:
@@ -105,11 +113,64 @@ def add_log_target(self, target: dict):
105113
parser = p.get('parser', SCALYR_DEFAULT_PARSER)
106114
logger.debug('Scalyr watcher agent loaded parser: {} for container: {}'.format(
107115
parser, target['kwargs']['container_name']))
116+
break
108117
except Exception:
109118
logger.error('Scalyr watcher agent failed to load annotation {}'.format(SCALYR_ANNOTATION_PARSER))
110119

120+
if annotations and SCALYR_ANNOTATION_SAMPLING_RULES in annotations:
121+
try:
122+
containers_sampling_rules = json.loads(annotations[SCALYR_ANNOTATION_SAMPLING_RULES])
123+
if type(containers_sampling_rules) is not list:
124+
logger.warning(
125+
('Scalyr watcher agent found invalid {} annotation in pod: {}. '
126+
'Expected `list` found: `{}`').format(
127+
SCALYR_ANNOTATION_SAMPLING_RULES,
128+
target['kwargs']['pod_name'], type(containers_sampling_rules)))
129+
else:
130+
for p in containers_sampling_rules:
131+
if p.get('container') == target['kwargs']['container_name']:
132+
sampling_rules = p.get('sampling-rules')
133+
if not sampling_rules:
134+
logger.warning(
135+
('Scalyr watcher agent did not find sampling rules for {}').format(
136+
target['kwargs']['container_name']))
137+
else:
138+
logger.debug('Scalyr watcher agent loaded sampling-rule: {} for container: {}'.format(
139+
sampling_rules, target['kwargs']['container_name']))
140+
break
141+
except Exception:
142+
logger.error('Scalyr watcher agent failed to load annotation {}'.format
143+
(SCALYR_ANNOTATION_SAMPLING_RULES))
144+
145+
if annotations and SCALYR_ANNOTATION_REDACTION_RULES in annotations:
146+
try:
147+
containers_redaction_rules = json.loads(annotations[SCALYR_ANNOTATION_REDACTION_RULES])
148+
if type(containers_redaction_rules) is not list:
149+
logger.warning(
150+
('Scalyr watcher agent found invalid {} annotation in pod: {}. '
151+
'Expected `list` found: `{}`').format(
152+
SCALYR_ANNOTATION_REDACTION_RULES,
153+
target['kwargs']['pod_name'], type(containers_redaction_rules)))
154+
else:
155+
for p in containers_redaction_rules:
156+
if p.get('container') == target['kwargs']['container_name']:
157+
redaction_rules = p.get('redaction-rules')
158+
if not redaction_rules:
159+
logger.warning(
160+
('Scalyr watcher agent did not find redaction rules for {}').format(
161+
target['kwargs']['container_name']))
162+
else:
163+
logger.debug('Scalyr watcher agent loaded redaction-rule: {} for container: {}'.format(
164+
redaction_rules, target['kwargs']['container_name']))
165+
break
166+
except Exception:
167+
logger.error('Scalyr watcher agent failed to load annotation {}'.format
168+
(SCALYR_ANNOTATION_REDACTION_RULES))
169+
111170
log = {
112171
'path': log_path,
172+
'sampling_rules': sampling_rules,
173+
'redaction_rules': redaction_rules,
113174
'attributes': {
114175
'application': target['kwargs']['application_id'],
115176
'version': target['kwargs']['application_version'],

kube_log_watcher/templates/scalyr.json.jinja2

+9-5
Original file line numberDiff line numberDiff line change
@@ -17,13 +17,17 @@
1717
{
1818
"path": "{{ log.path }}",
1919

20+
{% if log.sampling_rules %}
21+
"sampling_rules": {{ log.sampling_rules | tojson }},
22+
{% endif %}
23+
24+
{% if log.redaction_rules %}
25+
"redaction_rules": {{ log.redaction_rules | tojson }},
26+
{% endif %}
27+
2028
"copy_from_start": true,
2129

22-
"attributes": {
23-
{% for k, v in log.attributes.items() %}
24-
"{{ k }}": "{{ v }}"{% if not loop.last %},{% endif %}
25-
{% endfor %}
26-
}
30+
"attributes": {{ log.attributes | tojson }}
2731
}{% if not loop.last %},{% endif %}
2832
{% endfor %}
2933
],

requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
1-
Jinja2==2.8
1+
Jinja2
22
pykube>=0.15.0

tests/conftest.py

+10-1
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,8 @@
1515
'write_burst': 200000
1616
}
1717
SCALYR_ANNOTATION_PARSER = 'kubernetes-log-watcher/scalyr-parser'
18+
SCALYR_ANNOTATION_SAMPLING_RULES = 'kubernetes-log-watcher/scalyr-sampling-rules'
19+
SCALYR_ANNOTATION_REDACTION_RULES = 'kubernetes-log-watcher/scalyr-redaction-rules'
1820

1921
TARGET = {
2022
'id': 'container-1',
@@ -31,7 +33,14 @@
3133
'container_id': 'container-1',
3234
'container_path': '/mnt/containers/container-1',
3335
'log_file_name': 'container-1-json.log',
34-
'pod_annotations': {SCALYR_ANNOTATION_PARSER: '[{"container": "app-1-container-1", "parser": "custom-parser"}]'}
36+
'pod_annotations': {
37+
SCALYR_ANNOTATION_PARSER: '[{"container": "app-1-container-1", "parser": "custom-parser"}]',
38+
SCALYR_ANNOTATION_SAMPLING_RULES:
39+
'[{"container": "app-1-container-1", "sampling-rules":[{ "match_expression": "<expression here>", '
40+
'"sampling_rate": "0" }]}]',
41+
SCALYR_ANNOTATION_REDACTION_RULES:
42+
'[{"container": "app-1-container-1", "redaction-rules":[{ "match_expression": "<expression here>" }]}]'
43+
}
3544

3645
},
3746
'pod_labels': {}

tests/test_scalyr.py

+60
Original file line numberDiff line numberDiff line change
@@ -429,6 +429,66 @@ def test_remove_log_target(monkeypatch, env, exc):
429429
]
430430
},
431431
),
432+
(
433+
{
434+
'scalyr_key': SCALYR_KEY,
435+
'cluster_id': CLUSTER_ID,
436+
'monitor_journald': None,
437+
'logs': [
438+
{
439+
'path': '/p1',
440+
'attributes': {'a1': 'v1', 'parser': 'c-parser'},
441+
'copy_from_start': True,
442+
'sampling_rules': {"match_expression": "match-expression"}
443+
}
444+
]
445+
},
446+
{
447+
'api_key': 'scalyr-key-123',
448+
'implicit_metric_monitor': False,
449+
'implicit_agent_process_metrics_monitor': False,
450+
'server_attributes': {'serverHost': 'kube-cluster'},
451+
'monitors': [],
452+
'logs': [
453+
{
454+
'path': '/p1',
455+
'attributes': {'a1': 'v1', 'parser': 'c-parser'},
456+
'copy_from_start': True,
457+
'sampling_rules': {'match_expression': 'match-expression'}
458+
}
459+
],
460+
},
461+
),
462+
(
463+
{
464+
'scalyr_key': SCALYR_KEY,
465+
'cluster_id': CLUSTER_ID,
466+
'monitor_journald': None,
467+
'logs': [
468+
{
469+
'path': '/p1',
470+
'attributes': {'a1': 'v1', 'parser': 'c-parser'},
471+
'copy_from_start': True,
472+
'redaction_rules': {'match_expression': 'match-expression'}
473+
}
474+
]
475+
},
476+
{
477+
'api_key': 'scalyr-key-123',
478+
'implicit_metric_monitor': False,
479+
'implicit_agent_process_metrics_monitor': False,
480+
'server_attributes': {'serverHost': 'kube-cluster'},
481+
'monitors': [],
482+
'logs': [
483+
{
484+
'attributes': {'a1': 'v1', 'parser': 'c-parser'},
485+
'path': '/p1',
486+
'copy_from_start': True,
487+
'redaction_rules': {'match_expression': 'match-expression'}
488+
}
489+
],
490+
},
491+
),
432492
)
433493
)
434494
def test_tpl_render(monkeypatch, kwargs, expected):

0 commit comments

Comments
 (0)