feat(internal): span sampling file config envar (backport #4042) (#4073)

mergify[bot] · web-flow · commit d0a3adc3196a · 2022-08-16T20:20:36.000Z
This is an automatic backport of pull request #4042 done by [Mergify](https://mergify.com). Cherry-pick of c0e9a9b has failed: ``` On branch mergify/bp/1.4/pr-4042 Your branch is up to date with 'origin/1.4'. You are currently cherry-picking commit c0e9a9b. (fix conflicts and run "git cherry-pick --continue") (use "git cherry-pick --skip" to skip this patch) (use "git cherry-pick --abort" to cancel the cherry-pick operation) Changes to be committed: modified: ddtrace/constants.py Unmerged paths: (use "git add/rm <file>..." as appropriate to mark resolution) both modified: ddtrace/internal/sampling.py deleted by us: tests/tracer/test_single_span_sampling_rules.py ``` To fix up this pull request, you can check it out locally. See documentation: https://docs.github.com/en/github/collaborating-with-pull-requests/reviewing-changes-in-pull-requests/checking-out-pull-requests-locally --- <details> <summary>Mergify commands and options</summary> <br /> More conditions and actions can be found in the [documentation](https://docs.mergify.com/). You can also trigger Mergify actions by commenting on this pull request: - `@Mergifyio refresh` will re-evaluate the rules - `@Mergifyio rebase` will rebase this PR on its base branch - `@Mergifyio update` will merge the base branch into this PR - `@Mergifyio backport <destination>` will backport this PR on `<destination>` branch Additionally, on Mergify [dashboard](https://dashboard.mergify.com/) you can: - look at your merge queues - generate the Mergify configuration with the config editor. Finally, you can contact us on https://mergify.com </details>
diff --git a/ddtrace/constants.py b/ddtrace/constants.py
@@ -7,6 +7,7 @@
 _SINGLE_SPAN_SAMPLING_MECHANISM = "_dd.span_sampling.mechanism"
 _SINGLE_SPAN_SAMPLING_RATE = "_dd.span_sampling.rule_rate"
 _SINGLE_SPAN_SAMPLING_MAX_PER_SEC = "_dd.span_sampling.max_per_second"
+_SINGLE_SPAN_SAMPLING_MAX_PER_SEC_NO_LIMIT = -1
 
 ORIGIN_KEY = "_dd.origin"
 HOSTNAME_KEY = "_dd.hostname"
diff --git a/ddtrace/internal/sampling.py b/ddtrace/internal/sampling.py
@@ -4,6 +4,8 @@
 from typing import Optional
 from typing import TYPE_CHECKING
 
+from six import string_types
+
 
 # TypedDict was added to typing in python 3.8
 try:
@@ -12,6 +14,7 @@
     from typing_extensions import TypedDict
 
 from ddtrace.constants import _SINGLE_SPAN_SAMPLING_MAX_PER_SEC
+from ddtrace.constants import _SINGLE_SPAN_SAMPLING_MAX_PER_SEC_NO_LIMIT
 from ddtrace.constants import _SINGLE_SPAN_SAMPLING_MECHANISM
 from ddtrace.constants import _SINGLE_SPAN_SAMPLING_RATE
 from ddtrace.internal.glob_matching import GlobMatcher
@@ -29,6 +32,7 @@
     JSONDecodeError = ValueError  # type: ignore
 
 if TYPE_CHECKING:
+    from typing import Any
     from typing import Dict
     from typing import List
     from typing import Text
@@ -208,44 +212,82 @@ def apply_span_sampling_tags(self, span):
 
 def get_span_sampling_rules():
     # type: () -> List[SpanSamplingRule]
-    json_rules_raw = os.getenv("DD_SPAN_SAMPLING_RULES")
-    if json_rules_raw is None:
-        return []
-    else:
-        sampling_rules = []
+    json_rules = _get_span_sampling_json()
+    sampling_rules = []
+    for rule in json_rules:
+        if not isinstance(rule, dict):
+            raise TypeError("rule specified via DD_SPAN_SAMPLING_RULES is not a dictionary:%r" % rule)
+        # If sample_rate not specified default to 100%
+        sample_rate = float(rule.get("sample_rate", 1.0))
+        service = rule.get("service")
+        name = rule.get("name")
+        # If max_per_second not specified default to no limit
+        max_per_second = int(rule.get("max_per_second", _SINGLE_SPAN_SAMPLING_MAX_PER_SEC_NO_LIMIT))
+        if service is not None and not isinstance(service, string_types):
+            raise ValueError("The service value is not a string or None:%r" % service)
+        if name is not None and not isinstance(name, string_types):
+            raise ValueError("The name value is not a string or None:%r" % name)
+
+        if service is None and name is None:
+            raise ValueError("Neither service or name specified for single span sampling rule:%r" % rule)
+        if service:
+            _check_unsupported_pattern(service)
+        if name:
+            _check_unsupported_pattern(name)
+
         try:
-            json_rules = json.loads(json_rules_raw)  # type: List[SpanSamplingRules]
-            if not isinstance(json_rules, list):
-                raise TypeError("DD_SPAN_SAMPLING_RULES is not list, got %r" % json_rules)
-        except JSONDecodeError:
-            raise ValueError("Unable to parse DD_SPAN_SAMPLING_RULES=%r" % json_rules_raw)
-        for rule in json_rules:
-            if not isinstance(rule, dict):
-                raise TypeError("rule specified via DD_SPAN_SAMPLING_RULES is not a dictionary:%r" % rule)
-            # If sample_rate not specified default to 100%
-            sample_rate = float(rule.get("sample_rate", 1.0))
-            service = rule.get("service")
-            name = rule.get("name")
-            # If max_per_second not specified default to no limit
-            max_per_second = int(rule.get("max_per_second", -1))
-            if service is None and name is None:
-                raise ValueError(
-                    "Neither service or name specified for single span sampling rule:%r,"
-                    "at least one of these must be specified" % rule
-                )
-            if service:
-                _check_unsupported_pattern(service)
-            if name:
-                _check_unsupported_pattern(name)
-
-            try:
-                sampling_rule = SpanSamplingRule(
-                    sample_rate=sample_rate, service=service, name=name, max_per_second=max_per_second
-                )
-            except Exception as e:
-                raise ValueError("Error creating single span sampling rule {}: {}".format(json.dumps(rule), e))
-            sampling_rules.append(sampling_rule)
-        return sampling_rules
+            sampling_rule = SpanSamplingRule(
+                sample_rate=sample_rate, service=service, name=name, max_per_second=max_per_second
+            )
+        except Exception as e:
+            raise ValueError("Error creating single span sampling rule {}: {}".format(json.dumps(rule), e))
+        sampling_rules.append(sampling_rule)
+    return sampling_rules
+
+
+def _get_span_sampling_json():
+    # type: () -> List[Dict[str, Any]]
+    env_json_rules = _get_env_json()
+    file_json_rules = _get_file_json()
+
+    if env_json_rules and file_json_rules:
+        log.warning(
+            (
+                "DD_SPAN_SAMPLING_RULES and DD_SPAN_SAMPLING_RULES_FILE detected. "
+                "Defaulting to DD_SPAN_SAMPLING_RULES value."
+            )
+        )
+        return env_json_rules
+    return env_json_rules or file_json_rules or []
+
+
+def _get_file_json():
+    # type: () -> Optional[List[Dict[str, Any]]]
+    file_json_raw = os.getenv("DD_SPAN_SAMPLING_RULES_FILE")
+    if file_json_raw:
+        with open(file_json_raw) as f:
+            return _load_span_sampling_json(f.read())
+    return None
+
+
+def _get_env_json():
+    # type: () -> Optional[List[Dict[str, Any]]]
+    env_json_raw = os.getenv("DD_SPAN_SAMPLING_RULES")
+    if env_json_raw:
+        return _load_span_sampling_json(env_json_raw)
+    return None
+
+
+def _load_span_sampling_json(raw_json_rules):
+    # type: (str) -> List[Dict[str, Any]]
+    try:
+        json_rules = json.loads(raw_json_rules)
+        if not isinstance(json_rules, list):
+            raise TypeError("DD_SPAN_SAMPLING_RULES is not list, got %r" % json_rules)
+    except JSONDecodeError:
+        raise ValueError("Unable to parse DD_SPAN_SAMPLING_RULES=%r" % raw_json_rules)
+
+    return json_rules
 
 
 def _check_unsupported_pattern(string):
diff --git a/tests/tracer/test_single_span_sampling_rules.py b/tests/tracer/test_single_span_sampling_rules.py
@@ -1,3 +1,5 @@
+import sys
+
 import pytest
 
 from ddtrace import Tracer
@@ -6,6 +8,7 @@
 from ddtrace.constants import _SINGLE_SPAN_SAMPLING_MECHANISM
 from ddtrace.constants import _SINGLE_SPAN_SAMPLING_RATE
 from ddtrace.internal.sampling import SamplingMechanism
+from ddtrace.internal.sampling import _get_file_json
 from ddtrace.internal.sampling import get_span_sampling_rules
 from tests.utils import DummyWriter
 
@@ -75,7 +78,23 @@ def test_sampling_rule_init_via_env():
             sampling_rules = get_span_sampling_rules()
 
 
-def test_rules_sample_span():
+def test_json_not_list_error():
+    with override_env(
+        dict(DD_SPAN_SAMPLING_RULES='{"sample_rate":0.5,"service":"xyz","name":"abc","max_per_second":100}')
+    ):
+        with pytest.raises(TypeError):
+            get_span_sampling_rules()
+
+
+def test_json_decode_error_throws_ValueError():
+    with override_env(
+        dict(DD_SPAN_SAMPLING_RULES='{"sample_rate":0.5,"service":"xyz","name":"abc","max_per_second":100')
+    ):
+        with pytest.raises(ValueError):
+            get_span_sampling_rules()
+
+
+def test_rules_sample_span_via_env():
     """Test that single span sampling tags are applied to spans that should get sampled when envars set"""
     with override_env(dict(DD_SPAN_SAMPLING_RULES='[{"service":"test_service","name":"test_name"}]')):
         sampling_rules = get_span_sampling_rules()
@@ -89,7 +108,7 @@ def test_rules_sample_span():
         assert_sampling_decision_tags(span)
 
 
-def test_rules_do_not_sample_wrong_span():
+def test_rules_do_not_sample_wrong_span_via_env():
     """Test that single span sampling tags are not applied to spans that do not match rules"""
     with override_env(dict(DD_SPAN_SAMPLING_RULES='[{"service":"test_ser","name":"test_na"}]')):
         sampling_rules = get_span_sampling_rules()
@@ -103,7 +122,7 @@ def test_rules_do_not_sample_wrong_span():
         assert_sampling_decision_tags(span, sample_rate=None, mechanism=None, limit=None)
 
 
-def test_single_span_rules_do_not_tag_if_tracer_samples():
+def test_single_span_rules_do_not_tag_if_tracer_samples_via_env():
     """Test that single span sampling rules aren't applied if a span is already going to be sampled by trace sampler"""
     with override_env(dict(DD_SPAN_SAMPLING_RULES='[{"service":"test_service","name":"test_name"}]')):
         sampling_rules = get_span_sampling_rules()
@@ -119,6 +138,55 @@ def test_single_span_rules_do_not_tag_if_tracer_samples():
         assert_sampling_decision_tags(span, sample_rate=None, mechanism=None, limit=None, trace_sampling=True)
 
 
+def test_sampling_rule_init_config_multiple_sampling_rule_json_via_file(tmpdir):
+    file = tmpdir.join("rules.json")
+    file.write(
+        '[{"service":"xy?","name":"a*c"}, \
+            {"sample_rate":0.5,"service":"my-service","name":"my-name", "max_per_second":"20"}]'
+    )
+
+    with override_env(dict(DD_SPAN_SAMPLING_RULES_FILE=str(file))):
+        sampling_rules = _get_file_json()
+        assert sampling_rules == [
+            {"service": "xy?", "name": "a*c"},
+            {"sample_rate": 0.5, "service": "my-service", "name": "my-name", "max_per_second": "20"},
+        ]
+
+
+def test_wrong_file_path(tmpdir):
+    """Test that single span sampling tags are not applied to spans that do not match rules via file"""
+    with override_env(dict(DD_SPAN_SAMPLING_RULES_FILE="data/this_doesnt_exist.json")):
+        exception = FileNotFoundError if sys.version_info.major > 3 else IOError
+        with pytest.raises(exception):
+            get_span_sampling_rules()
+
+
+def test_default_to_env_if_both_env_and_file_config(tmpdir, caplog):
+    file = tmpdir.join("rules.json")
+    file.write('[{"sample_rate":1.0,"service":"x","name":"ab","max_per_second":1000}]')
+
+    with override_env(
+        dict(
+            DD_SPAN_SAMPLING_RULES_FILE=str(file),
+            DD_SPAN_SAMPLING_RULES='[{"sample_rate":0.5,"service":"xyz","name":"abc","max_per_second":100}]',
+        )
+    ):
+        sampling_rules = get_span_sampling_rules()
+        assert caplog.record_tuples == [
+            (
+                "ddtrace.internal.sampling",
+                30,
+                "DD_SPAN_SAMPLING_RULES and DD_SPAN_SAMPLING_RULES_FILE detected. "
+                "Defaulting to DD_SPAN_SAMPLING_RULES value.",
+            )
+        ]
+        assert sampling_rules[0]._sample_rate == 0.5
+        assert sampling_rules[0]._service_matcher.pattern == "xyz"
+        assert sampling_rules[0]._name_matcher.pattern == "abc"
+        assert sampling_rules[0]._max_per_second == 100
+        assert len(sampling_rules) == 1
+
+
 def traced_function(tracer, name="test_name", service="test_service", trace_sampling=False):
     with tracer.trace(name) as span:
         # If the trace sampler samples the trace, then we shouldn't add the span sampling tags
@@ -139,4 +207,4 @@ def assert_sampling_decision_tags(
     assert span.get_metric(_SINGLE_SPAN_SAMPLING_MAX_PER_SEC) == limit
 
     if trace_sampling:
-        assert span.get_metric(SAMPLING_PRIORITY_KEY) >= 0
+        assert span.get_metric(SAMPLING_PRIORITY_KEY) > 0