Skip to content

Commit 4beaa01

Browse files
authored
chore(profiling): more tests for libdd and stack_v2 (#11679)
First copied files from tests/profiling folder, and then modified them as needed. Tests checking for agent export urls are dropped. libdd exporter is created with agent url passed from tracer state whenever we try to upload, see [feat(profiling): support dynamic agent url](#11319) These tests will be run under libdd_enabled and some of them had been edited to also run under stack_v2 enabled ## Checklist - [x] PR author has checked that all the criteria below are met - The PR description includes an overview of the change - The PR description articulates the motivation for the change - The change includes tests OR the PR description describes a testing strategy - The PR description notes risks associated with the change, if any - Newly-added code is easy to change - The change follows the [library release note guidelines](https://ddtrace.readthedocs.io/en/stable/releasenotes.html) - The change includes or references documentation updates if necessary - Backport labels are set (if [applicable](https://ddtrace.readthedocs.io/en/latest/contributing.html#backporting)) ## Reviewer Checklist - [x] Reviewer has checked that all the criteria below are met - Title is accurate - All changes are related to the pull request's stated goal - Avoids breaking [API](https://ddtrace.readthedocs.io/en/stable/versioning.html#interfaces) changes - Testing strategy adequately addresses listed risks - Newly-added code is easy to change - Release note makes sense to a user of the library - If necessary, author has acknowledged and discussed the performance implications of this PR as reported in the benchmarks PR comment - Backport labels are set in a manner that is consistent with the [release branch maintenance policy](https://ddtrace.readthedocs.io/en/latest/contributing.html#backporting)
1 parent 42f69dc commit 4beaa01

10 files changed

+850
-47
lines changed

tests/profiling/collector/test_stack.py

+15-22
Original file line numberDiff line numberDiff line change
@@ -254,13 +254,12 @@ def test_ignore_profiler_single():
254254

255255

256256
@pytest.mark.skipif(not TESTING_GEVENT, reason="Not testing gevent")
257-
@pytest.mark.subprocess(ddtrace_run=True)
257+
@pytest.mark.subprocess(ddtrace_run=True, env=dict(DD_PROFILING_IGNORE_PROFILER="1", DD_PROFILING_API_TIMEOUT="0.1"))
258258
def test_ignore_profiler_gevent_task():
259259
import gevent.monkey
260260

261261
gevent.monkey.patch_all()
262262

263-
import os
264263
import time
265264

266265
from ddtrace.profiling import collector # noqa:F401
@@ -282,28 +281,22 @@ def collect(self):
282281
_fib(22)
283282
return []
284283

285-
for ignore in (True, False):
286-
os.environ["DD_PROFILING_API_TIMEOUT"] = "0.1"
287-
os.environ["DD_PROFILING_IGNORE_PROFILER"] = str(ignore)
288-
p = profiler.Profiler()
289-
p.start()
290-
# This test is particularly useful with gevent enabled: create a test collector that run often and for long
291-
# we're sure to catch it with the StackProfiler and that it's not ignored.
292-
c = CollectorTest(p._profiler._recorder, interval=0.00001)
293-
c.start()
284+
p = profiler.Profiler()
285+
p.start()
286+
# This test is particularly useful with gevent enabled: create a test collector that run often and for long
287+
# we're sure to catch it with the StackProfiler and that it's not ignored.
288+
c = CollectorTest(p._profiler._recorder, interval=0.00001)
289+
c.start()
294290

295-
for _ in range(100):
296-
events = p._profiler._recorder.reset()
297-
ids = {e.task_id for e in events[stack_event.StackSampleEvent]}
298-
if (c._worker.ident in ids) != str(ignore):
299-
break
300-
# Give some time for gevent to switch greenlets
301-
time.sleep(0.1)
302-
else:
303-
raise AssertionError("ignore == " + ignore)
291+
for _ in range(100):
292+
events = p._profiler._recorder.reset()
293+
ids = {e.task_id for e in events[stack_event.StackSampleEvent]}
294+
if c._worker.ident in ids:
295+
raise AssertionError("Collector thread found")
296+
time.sleep(0.1)
304297

305-
c.stop()
306-
p.stop(flush=False)
298+
c.stop()
299+
p.stop(flush=False)
307300

308301

309302
def test_collect():

tests/profiling/test_accuracy.py

+21-24
Original file line numberDiff line numberDiff line change
@@ -31,16 +31,16 @@ def spend_16():
3131

3232

3333
def spend_cpu_2():
34-
now = time.monotonic_ns()
34+
now = time.process_time_ns()
3535
# Active wait for 2 seconds
36-
while time.monotonic_ns() - now < 2e9:
36+
while time.process_time_ns() - now < 2e9:
3737
pass
3838

3939

4040
def spend_cpu_3():
4141
# Active wait for 3 seconds
42-
now = time.monotonic_ns()
43-
while time.monotonic_ns() - now < 3e9:
42+
now = time.process_time_ns()
43+
while time.process_time_ns() - now < 3e9:
4444
pass
4545

4646

@@ -51,8 +51,12 @@ def spend_cpu_3():
5151
CPU_TOLERANCE = 0.05
5252

5353

54-
def almost_equal(value, target, tolerance=TOLERANCE):
55-
return abs(value - target) / target <= tolerance
54+
def assert_almost_equal(value, target, tolerance=TOLERANCE):
55+
if abs(value - target) / target > tolerance:
56+
raise AssertionError(
57+
f"Assertion failed: {value} is not approximately equal to {target} "
58+
f"within tolerance={tolerance}, actual error={abs(value - target) / target}"
59+
)
5660

5761

5862
def total_time(time_data, funcname):
@@ -66,7 +70,7 @@ def test_accuracy():
6670
from ddtrace.profiling import profiler
6771
from ddtrace.profiling.collector import stack_event
6872
from tests.profiling.test_accuracy import CPU_TOLERANCE
69-
from tests.profiling.test_accuracy import almost_equal
73+
from tests.profiling.test_accuracy import assert_almost_equal
7074
from tests.profiling.test_accuracy import spend_16
7175
from tests.profiling.test_accuracy import total_time
7276

@@ -85,20 +89,13 @@ def test_accuracy():
8589
time_spent_ns[idx][frame[2]] += event.wall_time_ns
8690
cpu_spent_ns[idx][frame[2]] += event.cpu_time_ns
8791

88-
assert almost_equal(total_time(time_spent_ns, "spend_3"), 9e9)
89-
assert almost_equal(total_time(time_spent_ns, "spend_1"), 2e9)
90-
assert almost_equal(total_time(time_spent_ns, "spend_4"), 4e9)
91-
assert almost_equal(total_time(time_spent_ns, "spend_16"), 16e9)
92-
assert almost_equal(total_time(time_spent_ns, "spend_7"), 7e9)
93-
94-
try:
95-
from time import monotonic_ns # noqa:F401
96-
except ImportError:
97-
# If we don't have access to high resolution clocks, we can't really test accurately things as it's spread in
98-
# various Python implementation of monotonic, etc.
99-
pass
100-
else:
101-
assert almost_equal(total_time(time_spent_ns, "spend_cpu_2"), 2e9)
102-
assert almost_equal(total_time(time_spent_ns, "spend_cpu_3"), 3e9)
103-
assert almost_equal(total_time(time_spent_ns, "spend_cpu_2"), 2e9, CPU_TOLERANCE)
104-
assert almost_equal(total_time(time_spent_ns, "spend_cpu_3"), 3e9, CPU_TOLERANCE)
92+
assert_almost_equal(total_time(time_spent_ns, "spend_3"), 9e9)
93+
assert_almost_equal(total_time(time_spent_ns, "spend_1"), 2e9)
94+
assert_almost_equal(total_time(time_spent_ns, "spend_4"), 4e9)
95+
assert_almost_equal(total_time(time_spent_ns, "spend_16"), 16e9)
96+
assert_almost_equal(total_time(time_spent_ns, "spend_7"), 7e9)
97+
98+
assert_almost_equal(total_time(time_spent_ns, "spend_cpu_2"), 2e9)
99+
assert_almost_equal(total_time(time_spent_ns, "spend_cpu_3"), 3e9)
100+
assert_almost_equal(total_time(cpu_spent_ns, "spend_cpu_2"), 2e9, CPU_TOLERANCE)
101+
assert_almost_equal(total_time(cpu_spent_ns, "spend_cpu_3"), 3e9, CPU_TOLERANCE)

tests/profiling_v2/collector/test_stack.py

+130-1
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@
1313
from ddtrace.profiling.collector import stack
1414
from ddtrace.settings.profiling import config
1515
from tests.profiling.collector import pprof_utils
16+
from tests.profiling.collector import test_collector
1617

1718

1819
# Python 3.11.9 is not compatible with gevent, https://github.com/gevent/gevent/issues/2040
@@ -24,6 +25,43 @@
2425
)
2526

2627

28+
# Use subprocess as ddup config persists across tests.
29+
@pytest.mark.subprocess(
30+
env=dict(
31+
DD_PROFILING_MAX_FRAMES="5",
32+
DD_PROFILING_OUTPUT_PPROF="/tmp/test_collect_truncate",
33+
DD_PROFILING_STACK_V2_ENABLED="1",
34+
)
35+
)
36+
@pytest.mark.skipif(sys.version_info[:2] == (3, 7), reason="stack_v2 is not supported on Python 3.7")
37+
def test_collect_truncate():
38+
import os
39+
40+
from ddtrace.profiling import profiler
41+
from tests.profiling.collector import pprof_utils
42+
from tests.profiling.collector.test_stack import func1
43+
44+
pprof_prefix = os.environ["DD_PROFILING_OUTPUT_PPROF"]
45+
output_filename = pprof_prefix + "." + str(os.getpid())
46+
47+
max_nframes = int(os.environ["DD_PROFILING_MAX_FRAMES"])
48+
49+
p = profiler.Profiler()
50+
p.start()
51+
52+
func1()
53+
54+
p.stop()
55+
56+
profile = pprof_utils.parse_profile(output_filename)
57+
samples = pprof_utils.get_samples_with_value_type(profile, "wall-time")
58+
assert len(samples) > 0
59+
for sample in samples:
60+
# stack v2 adds one extra frame for "%d frames omitted" message
61+
# Also, it allows max_nframes + 1 frames, so we add 2 here.
62+
assert len(sample.location_id) <= max_nframes + 2, len(sample.location_id)
63+
64+
2765
@pytest.mark.parametrize("stack_v2_enabled", [True, False])
2866
def test_stack_locations(stack_v2_enabled, tmp_path):
2967
if sys.version_info[:2] == (3, 7) and stack_v2_enabled:
@@ -651,8 +689,23 @@ def _dofib():
651689
assert checked_thread, "No samples found for the expected threads"
652690

653691

692+
def test_max_time_usage():
693+
with pytest.raises(ValueError):
694+
stack.StackCollector(None, max_time_usage_pct=0)
695+
696+
697+
def test_max_time_usage_over():
698+
with pytest.raises(ValueError):
699+
stack.StackCollector(None, max_time_usage_pct=200)
700+
701+
654702
@pytest.mark.parametrize(
655-
("stack_v2_enabled", "ignore_profiler"), [(True, True), (True, False), (False, True), (False, False)]
703+
"stack_v2_enabled",
704+
[True, False],
705+
)
706+
@pytest.mark.parametrize(
707+
"ignore_profiler",
708+
[True, False],
656709
)
657710
def test_ignore_profiler(stack_v2_enabled, ignore_profiler, tmp_path):
658711
if sys.version_info[:2] == (3, 7) and stack_v2_enabled:
@@ -691,3 +744,79 @@ def test_ignore_profiler(stack_v2_enabled, ignore_profiler, tmp_path):
691744
assert collector_worker_thread_id in thread_ids
692745
else:
693746
assert collector_worker_thread_id not in thread_ids
747+
748+
749+
# TODO: support ignore profiler with stack_v2 and update this test
750+
@pytest.mark.skipif(not TESTING_GEVENT, reason="Not testing gevent")
751+
@pytest.mark.subprocess(
752+
ddtrace_run=True,
753+
env=dict(DD_PROFILING_IGNORE_PROFILER="1", DD_PROFILING_OUTPUT_PPROF="/tmp/test_ignore_profiler_gevent_task"),
754+
)
755+
def test_ignore_profiler_gevent_task():
756+
import gevent.monkey
757+
758+
gevent.monkey.patch_all()
759+
760+
import os
761+
import time
762+
import typing
763+
764+
from ddtrace.profiling import collector
765+
from ddtrace.profiling import event as event_mod
766+
from ddtrace.profiling import profiler
767+
from ddtrace.profiling.collector import stack
768+
from tests.profiling.collector import pprof_utils
769+
770+
def _fib(n):
771+
if n == 1:
772+
return 1
773+
elif n == 0:
774+
return 0
775+
else:
776+
return _fib(n - 1) + _fib(n - 2)
777+
778+
class CollectorTest(collector.PeriodicCollector):
779+
def collect(self) -> typing.Iterable[typing.Iterable[event_mod.Event]]:
780+
_fib(22)
781+
return []
782+
783+
output_filename = os.environ["DD_PROFILING_OUTPUT_PPROF"]
784+
785+
p = profiler.Profiler()
786+
787+
p.start()
788+
789+
for c in p._profiler._collectors:
790+
if isinstance(c, stack.StackCollector):
791+
c.ignore_profiler
792+
793+
c = CollectorTest(None, interval=0.00001)
794+
c.start()
795+
796+
time.sleep(3)
797+
798+
worker_ident = c._worker.ident
799+
800+
c.stop()
801+
p.stop()
802+
803+
profile = pprof_utils.parse_profile(output_filename + "." + str(os.getpid()))
804+
805+
samples = pprof_utils.get_samples_with_value_type(profile, "cpu-time")
806+
807+
thread_ids = set()
808+
for sample in samples:
809+
thread_id_label = pprof_utils.get_label_with_key(profile.string_table, sample, "thread id")
810+
thread_id = int(thread_id_label.num)
811+
thread_ids.add(thread_id)
812+
813+
assert worker_ident not in thread_ids
814+
815+
816+
def test_repr():
817+
test_collector._test_repr(
818+
stack.StackCollector,
819+
"StackCollector(status=<ServiceStatus.STOPPED: 'stopped'>, "
820+
"recorder=Recorder(default_max_events=16384, max_events={}), min_interval_time=0.01, max_time_usage_pct=1.0, "
821+
"nframes=64, ignore_profiler=False, endpoint_collection_enabled=None, tracer=None)",
822+
)

tests/profiling_v2/simple_program.py

+32
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,32 @@
1+
#!/usr/bin/env python
2+
import os
3+
import sys
4+
import time
5+
6+
from ddtrace.internal import service
7+
from ddtrace.profiling import bootstrap
8+
from ddtrace.profiling.collector import stack
9+
10+
11+
for running_collector in bootstrap.profiler._profiler._collectors:
12+
if isinstance(running_collector, stack.StackCollector):
13+
break
14+
else:
15+
raise AssertionError("Unable to find stack collector")
16+
17+
18+
print("hello world")
19+
assert running_collector.status == service.ServiceStatus.RUNNING
20+
print(running_collector.interval)
21+
22+
t0 = time.time()
23+
while time.time() - t0 < (running_collector.interval * 10):
24+
pass
25+
26+
# Do some serious memory allocations!
27+
for _ in range(5000000):
28+
object()
29+
30+
print(os.getpid())
31+
print(bootstrap.profiler._profiler._stack_v2_enabled)
32+
sys.exit(42)
+32
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,32 @@
1+
import os
2+
import sys
3+
import threading
4+
5+
from ddtrace.internal import service
6+
import ddtrace.profiling.auto
7+
import ddtrace.profiling.bootstrap
8+
import ddtrace.profiling.profiler
9+
10+
11+
lock = threading.Lock()
12+
lock.acquire()
13+
14+
15+
assert ddtrace.profiling.bootstrap.profiler.status == service.ServiceStatus.RUNNING
16+
17+
18+
child_pid = os.fork()
19+
if child_pid == 0:
20+
# Release it
21+
lock.release()
22+
23+
# We track this one though
24+
lock = threading.Lock()
25+
lock.acquire()
26+
lock.release()
27+
else:
28+
lock.release()
29+
assert ddtrace.profiling.bootstrap.profiler.status == service.ServiceStatus.RUNNING
30+
print(child_pid)
31+
pid, status = os.waitpid(child_pid, 0)
32+
sys.exit(os.WEXITSTATUS(status))
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
# Import from ddtrace before monkey patching to ensure that we grab all the
2+
# necessary references to the unpatched modules.
3+
import ddtrace.auto # noqa: F401, I001
4+
import ddtrace.profiling.auto # noqa:F401
5+
6+
7+
import gevent.monkey # noqa:F402
8+
9+
gevent.monkey.patch_all()
10+
11+
import threading # noqa: E402, F402, I001
12+
import time # noqa: E402, F402
13+
14+
15+
def fibonacci(n):
16+
if n == 0:
17+
return 0
18+
elif n == 1:
19+
return 1
20+
else:
21+
return fibonacci(n - 1) + fibonacci(n - 2)
22+
23+
24+
i = 1
25+
for _ in range(20):
26+
threads = []
27+
for _ in range(10):
28+
t = threading.Thread(target=fibonacci, args=(i,))
29+
t.start()
30+
threads.append(t)
31+
i += 1
32+
for t in threads:
33+
t.join()
34+
time.sleep(0.1)

0 commit comments

Comments
 (0)