mirror of
https://github.com/azaion/detections.git
synced 2026-04-22 10:16:31 +00:00
5a968edcba
- Added Cython generated files to .gitignore to prevent unnecessary tracking. - Updated paths in `inference.c` and `coreml_engine.c` to reflect the correct virtual environment. - Revised the execution environment documentation to clarify hardware dependency checks and local execution instructions, ensuring accurate guidance for users. - Removed outdated Docker suitability checks and streamlined the assessment process for test execution environments.
117 lines
3.3 KiB
Python
117 lines
3.3 KiB
Python
import json
|
|
import time
|
|
from concurrent.futures import ThreadPoolExecutor
|
|
|
|
import pytest
|
|
|
|
|
|
def _percentile_ms(sorted_ms, p):
    """Return the p-th percentile of ascending-sorted values.

    The result is linearly interpolated between the two samples that
    bracket the fractional rank ``(n - 1) * p / 100``.

    Args:
        sorted_ms: Sequence of numbers already sorted in ascending order;
            this function does not sort it.
        p: Percentile to compute, in the closed range [0, 100].

    Returns:
        ``0.0`` for an empty sequence, the single element converted to
        ``float`` for a one-element sequence, otherwise the interpolated
        value.

    Raises:
        ValueError: If ``p`` is outside [0, 100].
    """
    # Reject out-of-range percentiles up front: a negative rank would become
    # a negative index (reading from the end of the list) or an extrapolated
    # value, and a rank above n - 1 would surface as an unrelated IndexError.
    if not 0 <= p <= 100:
        raise ValueError(f"percentile must be in [0, 100], got {p!r}")
    n = len(sorted_ms)
    if n == 0:
        return 0.0
    if n == 1:
        return float(sorted_ms[0])
    k = (n - 1) * (p / 100.0)  # fractional rank into the sorted samples
    lo = int(k)
    hi = min(lo + 1, n - 1)  # clamp so p == 100 does not index past the end
    w = k - lo  # interpolation weight towards the upper neighbour
    return sorted_ms[lo] * (1 - w) + sorted_ms[hi] * w
|
|
|
|
|
|
@pytest.mark.slow
@pytest.mark.timeout(300)
def test_nft_perf_01_single_image_latency_p95(
    warm_engine, http_client, image_small
):
    """Check that p95 latency of sequential single-image requests is under 5 s.

    Posts ``image_small`` to ``/detect`` ten times in a row, requires every
    response to be HTTP 200, prints one CSV-style line with the sorted
    per-request latencies and their p50/p95/p99, and asserts that p95 is
    below 5000 ms.

    ``warm_engine`` is requested but never referenced in the body; it is
    presumably there for its setup side effect (defined outside this file
    section -- confirm in the fixtures module).
    """
    samples_ms = []
    for _attempt in range(10):
        started = time.perf_counter()
        response = http_client.post(
            "/detect",
            files={"file": ("img.jpg", image_small, "image/jpeg")},
            timeout=120,
        )
        finished = time.perf_counter()
        assert response.status_code == 200
        samples_ms.append((finished - started) * 1000.0)

    # The percentile helper expects ascending input.
    samples_ms.sort()
    p50, p95, p99 = (_percentile_ms(samples_ms, q) for q in (50, 95, 99))

    runs_csv = ",".join(f"{sample:.2f}" for sample in samples_ms)
    summary_csv = f",p50,{p50:.2f},p95,{p95:.2f},p99,{p99:.2f}"
    print("nft_perf_01_csv,run_ms," + runs_csv + summary_csv)

    assert p95 < 5000.0
|
|
|
|
|
|
def _post_small(http_client, image_small):
    """POST ``image_small`` to ``/detect`` as a JPEG upload and return the response.

    Args:
        http_client: Object exposing ``post(url, files=..., timeout=...)``.
        image_small: Payload sent as the ``file`` multipart field under the
            filename ``img.jpg``.

    Returns:
        Whatever ``http_client.post`` returns.
    """
    upload = {"file": ("img.jpg", image_small, "image/jpeg")}
    response = http_client.post("/detect", files=upload, timeout=120)
    return response
|
|
|
|
|
|
@pytest.mark.slow
@pytest.mark.timeout(300)
def test_nft_perf_02_concurrent_throughput_queuing(
    warm_engine, http_client, image_small
):
    """Compare wall time of two versus three concurrent ``/detect`` requests.

    Sends a burst of two simultaneous requests, then a burst of three, each
    from its own thread pool, and requires every response to be HTTP 200.
    If the two-request burst finished in under 4.0 s the comparison is
    skipped; otherwise the three-request burst must take more than 0.25 s
    longer than the two-request burst.

    ``warm_engine`` is requested but never referenced in the body; it is
    presumably there for its setup side effect -- confirm in the fixtures
    module.
    """

    def timed_burst(count):
        # Fire `count` requests at once, one worker thread per request, and
        # return (elapsed seconds, list of responses).
        started = time.monotonic()
        with ThreadPoolExecutor(max_workers=count) as pool:
            pending = [
                pool.submit(_post_small, http_client, image_small)
                for _ in range(count)
            ]
            responses = [job.result() for job in pending]
        return time.monotonic() - started, responses

    wall2, rs2 = timed_burst(2)
    assert all(resp.status_code == 200 for resp in rs2)

    wall3, rs3 = timed_burst(3)
    assert all(resp.status_code == 200 for resp in rs3)

    # The skip is decided only after both bursts have run and been checked.
    if wall2 < 4.0:
        pytest.skip("wall clock too small for queuing comparison")

    assert wall3 > wall2 + 0.25
|
|
|
|
|
|
@pytest.mark.slow
@pytest.mark.timeout(300)
def test_nft_perf_03_tiling_overhead_large_image(
    warm_engine, http_client, image_small, image_large
):
    """Time a small-image request against a large-image request with a config.

    Posts ``image_small`` to ``/detect`` as a baseline, then posts
    ``image_large`` together with a JSON ``config`` form field (altitude,
    focal_length, sensor_width). Both responses must be HTTP 200, the large
    request must finish in under 120 000 ms, and it must not be more than
    500 ms faster than the small baseline. One CSV-style line with both
    timings is printed before the final assertion.

    ``warm_engine`` is requested but never referenced in the body; it is
    presumably there for its setup side effect -- confirm in the fixtures
    module.
    """

    def timed_post(filename, payload, **extra):
        # Return (response, elapsed milliseconds) for one JPEG upload.
        started = time.perf_counter()
        response = http_client.post(
            "/detect",
            files={"file": (filename, payload, "image/jpeg")},
            timeout=120,
            **extra,
        )
        return response, (time.perf_counter() - started) * 1000.0

    r_small, small_ms = timed_post("small.jpg", image_small)
    assert r_small.status_code == 200

    camera = {"altitude": 400, "focal_length": 24, "sensor_width": 23.5}
    config = json.dumps(camera)

    r_large, large_ms = timed_post(
        "large.jpg", image_large, data={"config": config}
    )
    assert r_large.status_code == 200
    assert large_ms < 120_000.0

    print(
        f"nft_perf_03_csv,baseline_small_ms,{small_ms:.2f},large_ms,{large_ms:.2f}"
    )

    # Allow up to 500 ms of jitter in favour of the large request.
    assert large_ms > small_ms - 500.0
|
|
|
|
|