diff --git a/Dockerfile.jetson b/Dockerfile.jetson index 1c95590..bd4fe57 100644 --- a/Dockerfile.jetson +++ b/Dockerfile.jetson @@ -1,4 +1,4 @@ -FROM nvcr.io/nvidia/l4t-jetpack:r36.2.0 +FROM nvcr.io/nvidia/l4t-jetpack:r36.4.0 ARG CI_COMMIT_SHA=unknown ENV AZAION_REVISION=$CI_COMMIT_SHA @@ -6,6 +6,7 @@ RUN apt-get update && apt-get install -y \ python3 python3-pip python3-dev gcc \ libgl1 libglib2.0-0 \ python3-libnvinfer python3-libnvinfer-dev \ + python3-pycuda \ && rm -rf /var/lib/apt/lists/* diff --git a/_docs/02_tasks/done/AZ-180_jetson_orin_nano_support.md b/_docs/02_tasks/done/AZ-180_jetson_orin_nano_support.md index d330e93..cf45f55 100644 --- a/_docs/02_tasks/done/AZ-180_jetson_orin_nano_support.md +++ b/_docs/02_tasks/done/AZ-180_jetson_orin_nano_support.md @@ -2,7 +2,7 @@ **Task**: AZ-180_jetson_orin_nano_support **Name**: Jetson Orin Nano Support -**Description**: Run the detection service on NVIDIA Jetson Orin Nano with a JetPack 6.x container image, INT8 engine conversion using a pre-generated calibration cache, and docker-compose configuration. +**Description**: Run the detection service on NVIDIA Jetson Orin Nano with a JetPack 6.2.x-compatible container image, INT8 engine conversion using a pre-generated calibration cache, and docker-compose configuration. **Complexity**: 5 points **Dependencies**: None **Component**: Deployment + Inference Engine @@ -75,7 +75,7 @@ Then the detections service is reachable on port 8080 ## Non-Functional Requirements **Compatibility** -- JetPack 6.x (CUDA 12.2, TensorRT 10.x) +- JetPack 6.2.x-compatible container (`nvcr.io/nvidia/l4t-jetpack:r36.4.0`, CUDA 12.6 / TensorRT 10.3 compute stack) - Jetson Orin Nano (aarch64, SM 8.7) **Reliability** diff --git a/_docs/04_deploy/containerization.md b/_docs/04_deploy/containerization.md index f446184..8373f5d 100644 --- a/_docs/04_deploy/containerization.md +++ b/_docs/04_deploy/containerization.md @@ -119,7 +119,7 @@ Already exists: `e2e/docker-compose.test.yml`. No changes needed — supports bo | Aspect | Specification | |--------|--------------| -| Base image | `nvcr.io/nvidia/l4t-base:r36.3.0` (JetPack 6.x, aarch64) | +| Base image | `nvcr.io/nvidia/l4t-jetpack:r36.4.0` (JetPack 6.2.x-compatible, aarch64) | | TensorRT | Pre-installed via JetPack — `python3-libnvinfer` apt package (NOT pip) | | PyCUDA | Pre-installed via JetPack — `python3-pycuda` apt package (NOT pip) | | Build stages | Single stage (Cython compile requires gcc) | @@ -129,7 +129,7 @@ Already exists: `e2e/docker-compose.test.yml`. No changes needed — supports bo | Runtime | Requires NVIDIA Container Runtime (`runtime: nvidia` in docker-compose) | **Jetson-specific behaviour**: -- `requirements-jetson.txt` derives from `requirements.txt` — `tensorrt` and `pycuda` are excluded from pip and provided by JetPack +- `requirements-jetson.txt` derives from `requirements.txt` — `tensorrt` and `pycuda` are excluded from pip; TensorRT and PyCUDA are installed from the JetPack/L4T apt packages in `Dockerfile.jetson` - Engine filename auto-encodes CC+SM (e.g. `azaion.cc_8.7_sm_16.engine` for Orin Nano), ensuring the Jetson engine is distinct from any x86-cached engine - INT8 is used when `azaion.int8_calib.cache` is available on the Loader service; precision suffix appended to engine filename (`*.int8.engine`); FP16 fallback when cache is absent - `docker-compose.jetson.yml` uses `runtime: nvidia` for the NVIDIA Container Runtime diff --git a/requirements-jetson.txt b/requirements-jetson.txt index 79fb685..fac7843 100644 --- a/requirements-jetson.txt +++ b/requirements-jetson.txt @@ -12,4 +12,3 @@ requests==2.32.4 loguru==0.7.3 av==14.2.0 xxhash==3.5.0 -pycuda