tuttlebr
diff --git a/‎.env
+19-15 b/‎.env
+19-15
diff --git a/‎.gitignore
+2-1 b/‎.gitignore
+2-1
diff --git a/‎.pre-commit-config.yaml
+37 b/‎.pre-commit-config.yaml
+37
diff --git a/‎README.md
+1-1 b/‎README.md
+1-1
diff --git a/‎docker-compose.yaml
+8-4 b/‎docker-compose.yaml
+8-4
diff --git a/‎docker/triton-server/Dockerfile
+6-4 b/‎docker/triton-server/Dockerfile
+6-4
diff --git a/‎docker/triton-server/facenet_model/serialize_dali.py
+7-7 b/‎docker/triton-server/facenet_model/serialize_dali.py
+7-7
diff --git a/‎docker/triton-server/fpenet_model/serialize_dali.py
+1-1 b/‎docker/triton-server/fpenet_model/serialize_dali.py
+1-1
diff --git a/‎docker/triton-server/tlt-converter.sh
+15-18 b/‎docker/triton-server/tlt-converter.sh
+15-18
diff --git a/‎triton-models/facenet/config.pbtxt
+8-4 b/‎triton-models/facenet/config.pbtxt
+8-4
diff --git a/‎triton-models/facenet_ensemble/config.pbtxt
+2-3 b/‎triton-models/facenet_ensemble/config.pbtxt
+2-3
diff --git a/‎triton-models/facenet_postprocess/1/postprocessing/postprocessor_config_pb2.py
+5-6 b/‎triton-models/facenet_postprocess/1/postprocessing/postprocessor_config_pb2.py
+5-6
diff --git a/‎triton-models/facenet_postprocess/config.pbtxt
+9-5 b/‎triton-models/facenet_postprocess/config.pbtxt
+9-5
@@ -1,24 +1,28 @@
-SUBNET=172.25.4.0/24
-TRITON_SERVER_IP=172.25.4.42
-TRITON_CLIENT_IP=172.25.4.45
-REDIS_DB_IP=172.25.4.47
-REDIS_OM_URL=redis://172.25.4.47:6379/0
-REDIS_INSIGHT_IP=172.25.4.49
+SUBNET="172.25.4.0/24"
+TRITON_SERVER_IP="172.25.4.42"
+TRITON_CLIENT_IP="172.25.4.45"
+REDIS_DB_IP="172.25.4.47"
+REDIS_OM_URL="redis://172.25.4.47:6379/0"
+REDIS_INSIGHT_IP="172.25.4.49"
 
-MAJOR_UPDATE_VERSION=23.02
-REDIS_DB_IMAGE=redislabs/redisearch:2.6.3
-DEBIAN_FRONTEND=noninteractive
-PROTOBUF_URL=https://github.com/protocolbuffers/protobuf/releases/download/v21.6/protoc-21.6-linux-x86_64.zip
+TAO_VERSION="v5.1.0_8.6.3.1_x86"
+MAJOR_UPDATE_VERSION="23.11"
+REDIS_DB_IMAGE="redislabs/redisearch:2.6.3"
+DEBIAN_FRONTEND="noninteractive"
+PROTOBUF_URL="https://github.com/protocolbuffers/protobuf/releases/download/v21.6/protoc-21.6-linux-x86_64.zip"
 
-TRT_LIB_PATH=/usr/lib/x86_64-linux-gnu
-TRT_INC_PATH=/usr/include/x86_64-linux-gnu
-CUDA_MODULE_LOADING=LAZY
+TRT_LIB_PATH="/usr/lib/x86_64-linux-gnu"
+TRT_INC_PATH="/usr/include/x86_64-linux-gnu"
+CUDA_MODULE_LOADING="LAZY"
 
-CONTAINER_IMAGE_FOLDER=/volume1/brandon/pictures
+CONTAINER_IMAGE_FOLDER="/volume1/brandon/pictures"
 MODEL_VERSION="1"
 TRITON_SERVER_URL="172.25.4.42:8001"
-HOST_IMAGE_FOLDER=/volume1/brandon/pictures
+HOST_IMAGE_FOLDER="/volume1/homes/brandon/Photos/PhotoLibrary"
 FACE_ALIGN_MODEL_NAME="facealign"
 FACE_DETECT_MODEL_NAME="facenet_ensemble"
 FPENET_MODEL_NAME="fpenet_ensemble"
 JUPYTER_ENABLE_LAB="yes"
+
+FACENET_MODEL_PATH="/volume1/brandon/models/facenet_vpruned_quantized_v2.0.1"
+FPENET_MODEL_PATH="/volume1/brandon/models/fpenet_vdeployable_v3.0"
@@ -14,4 +14,5 @@ ignore.py
 *.rdb
 *.whl
 *.log
-coco/instances.json
+coco/instances.json
+workspace/symetrical_batches.json
@@ -0,0 +1,37 @@
+repos:  # pre-commit hook sources, pinned by rev
+  - repo: https://github.com/pycqa/isort
+    rev: 5.12.0
+    hooks:
+      - id: isort
+  - repo: https://github.com/Lucas-C/pre-commit-hooks.git
+    rev: v1.1.13
+    hooks:
+      - id: remove-crlf
+        exclude: '(^|/)(third_party|book)/'  # skip only these directories; a space-padded `a | b` regex matches no path at all
+  - repo: https://github.com/pre-commit/mirrors-yapf
+    rev: v0.32.0
+    hooks:
+      - id: yapf
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v4.1.0
+    hooks:
+      - id: check-added-large-files
+        args: ['--maxkb=750']
+      - id: check-merge-conflict
+      - id: check-symlinks
+      - id: detect-private-key
+        exclude: '(^|/)(third_party|book)/'  # must still scan everything else; patterns are used with re.search, spaces are literal
+      - id: end-of-file-fixer
+      - id: check-yaml
+      - id: sort-simple-yaml
+      - id: trailing-whitespace
+  - repo: https://github.com/PyCQA/autoflake
+    rev: v1.6.1
+    hooks:
+      - id: autoflake
+        args:
+          [
+            "--in-place",
+            "--remove-all-unused-imports",
+            "--remove-unused-variables",
+          ]
@@ -168,7 +168,7 @@ docker compose build
 ### Run Model Conversion
 
 ```sh
-docker compose run triton-model-builder
+docker compose up triton-model-builder
 ```
 
 ### Start Services
 
@@ -11,9 +11,9 @@ services:
       args:
         - TRITON_VERSION=${MAJOR_UPDATE_VERSION}
         - PROTOBUF_URL=${PROTOBUF_URL}
+        - TAO_VERSION=${TAO_VERSION}
       context: docker/triton-server
     image: triton-server-image
-    shm_size: 64g
     ulimits:
       memlock: -1
       stack: 1073741824
@@ -24,9 +24,15 @@ services:
     volumes:
       - type: bind
         source: docker/triton-server/facenet_model
-        target: /tmp/facenet_model
+        target: /tmp/dali/facenet_model
       - type: bind
         source: docker/triton-server/fpenet_model
+        target: /tmp/dali/fpenet_model
+      - type: bind
+        source: ${FACENET_MODEL_PATH}
+        target: /tmp/facenet_model
+      - type: bind
+        source: ${FPENET_MODEL_PATH}
         target: /tmp/fpenet_model
       - type: bind
         source: docker/triton-server/tlt-converter.sh
@@ -37,7 +43,6 @@ services:
 
   triton-server:
     image: triton-server-image
-    shm_size: 64g
     ulimits:
       memlock: -1
       stack: 67108864
@@ -76,7 +81,6 @@ services:
         - PROTOBUF_URL=${PROTOBUF_URL}
       context: docker/triton-client
     image: triton-client
-    shm_size: 64g
     ulimits:
       memlock: -1
       stack: 67108864
 
@@ -6,6 +6,7 @@ FROM ${BASE_IMAGE} as builder
 ENV DEBIAN_FRONTEND=noninteractive
 
 # Python dependencies.
+# https://docs.nvidia.com/deeplearning/dali/user-guide/docs/installation.html#nvidia-dali
 COPY requirements.txt .
 RUN pip install -r requirements.txt \
     && pip install --extra-index-url \
@@ -20,14 +21,15 @@ RUN wget ${PROTOBUF_URL} -O proto.zip \
     && mv bin/protoc /usr/local/bin
 
 # Download and install TAO Toolkit converter: https://catalog.ngc.nvidia.com/orgs/nvidia/teams/tao/resources/tao-converter
-RUN wget --content-disposition https://api.ngc.nvidia.com/v2/resources/nvidia/tao/tao-converter/versions/v4.0.0_trt8.5.1.7_x86/zip \
-    -O tao-converter_v4.0.0_trt8.5.1.7_x86.zip \
-    && unzip tao-converter_v4.0.0_trt8.5.1.7_x86.zip \
+ARG TAO_VERSION=v5.1.0_8.6.3.1_x86
+RUN wget --content-disposition https://api.ngc.nvidia.com/v2/resources/nvidia/tao/tao-converter/versions/${TAO_VERSION}/zip \
+    -O tao-converter_${TAO_VERSION}.zip \
+    && unzip tao-converter_${TAO_VERSION}.zip \
     && mv tao-converter /opt \
     && chmod +x /opt/tao-converter
 
 ENV TRT_LIB_PATH=/usr/lib/x86_64-linux-gnu
 ENV TRT_INC_PATH=/usr/include/x86_64-linux-gnu
 ENV PATH=/opt/tao-converter:$PATH
 
-WORKDIR /opt/tritonserver
+WORKDIR /opt/tritonserver
@@ -17,14 +17,14 @@ def __init__(self):
         self.one_over_255 = 1 / 255.0
 
     def load_images(self):
-        self.image_tensor = fn.decoders.image(
-            self.raw_image_tensor, output_type=types.GRAY, device="mixed"
-        )
+        self.image_tensor = fn.decoders.image(self.raw_image_tensor,
+                                              output_type=types.GRAY,
+                                              device="mixed")
 
     def color_space_conversion(self):
-        self.image_tensor = fn.color_space_conversion(
-            self.image_tensor, image_type=types.GRAY, output_type=types.RGB
-        )
+        self.image_tensor = fn.color_space_conversion(self.image_tensor,
+                                                      image_type=types.GRAY,
+                                                      output_type=types.RGB)
 
     def resize_images(self):
         self.image_tensor = fn.resize(
@@ -37,7 +37,7 @@ def resize_images(self):
     def transpose_images(self):
         self.image_tensor = fn.transpose(self.image_tensor, perm=[2, 0, 1])
 
-    @pipeline_def(batch_size=1, num_threads=64)
+    @pipeline_def(batch_size=32, num_threads=64)
     def facenet_reshape(self):
         self.load_images()
         self.color_space_conversion()
 
@@ -40,7 +40,7 @@ def resize_slice_bbox(self):
     def transpose_images(self):
         self.image_tensor = fn.transpose(self.image_tensor, perm=[2, 0, 1])
 
-    @pipeline_def(batch_size=1, num_threads=64)
+    @pipeline_def(batch_size=32, num_threads=64)
     def fpenet_transform(self):
         self.load_images()
         self.slice_bbox()
 
@@ -1,12 +1,11 @@
 #!/bin/bash
-MIN_BATCH=1
-OPT_BATCH=1
-MAX_BATCH=1
+MIN_BATCH=1   # profile minimum; keep at 1 so batches smaller than the preferred sizes still fit the engine
+OPT_BATCH=16  # batch size the TensorRT profile is tuned for (middle value of the -p triple)
+MAX_BATCH=32  # profile maximum; keep in sync with max_batch_size in the Triton config.pbtxt files
 
-echo "Preparing FaceNet Models"
-echo "----------------------------------------------------------------------------------------------------------------"
+echo "[INFO] Preparing FaceNet Models"
 echo "[INFO] Serializing FaceNet DALI model"
-python3 /tmp/facenet_model/serialize_dali.py
+python3 /tmp/dali/facenet_model/serialize_dali.py
 echo "[INFO] FaceNet DALI model serialization complete"
 
 # https://catalog.ngc.nvidia.com/orgs/nvidia/teams/tao/models/facenet/version
@@ -17,10 +16,10 @@ echo "[INFO] FaceNet DALI model serialization complete"
 #     -d 3,416,736 \
 #     -i nchw \
 #     -e /models/facenet/1/model.trt \
-#     -c /tmp/facenet_model/facenet_vpruned_quantized_v2.0.1/int8_calibration.txt \
-#     /tmp/facenet_model/facenet_vpruned_quantized_v2.0.1/model.etlt
+#     -c /tmp/facenet_model/int8_calibration.txt \
+#     /tmp/facenet_model/model.etlt
 
-## FP32 Calibration
+## Calibration
 /opt/tao-converter \
     -k nvidia_tlt \
     -d 3,416,736 \
@@ -29,18 +28,16 @@ echo "[INFO] FaceNet DALI model serialization complete"
     -b ${MIN_BATCH} \
     -m ${MAX_BATCH} \
     -p input_1,${MIN_BATCH}x3x416x736,${OPT_BATCH}x3x416x736,${MAX_BATCH}x3x416x736 \
-    /tmp/facenet_model/facenet_vdeployable_v1.0/model.etlt
+    /tmp/facenet_model/model.etlt
 
 
 protoc -I=/models/facenet_postprocess/1/postprocessing \
     --python_out=/models/facenet_postprocess/1/postprocessing \
     /models/facenet_postprocess/1/postprocessing/postprocessor_config.proto
 echo "[INFO] Completed FaceNet Models prep"
-echo
-echo "Preparing FPENet Model"
-echo "----------------------------------------------------------------------------------------------------------------"
+echo "[INFO] Preparing FPENet Model"
 echo "[INFO] Serializing FPENet DALI model"
-python3 /tmp/fpenet_model/serialize_dali.py
+python3 /tmp/dali/fpenet_model/serialize_dali.py
 echo "[INFO] FPENet DALI model serialization complete"
 
 # https://catalog.ngc.nvidia.com/orgs/nvidia/teams/tao/models/fpenet/version
@@ -53,15 +50,15 @@ echo "[INFO] FPENet DALI model serialization complete"
 #     -i nchw \
 #     -e /models/fpenet/1/model.trt \
 #     -p input_face_images,${MIN_BATCH}x1x80x80,${OPT_BATCH}x1x80x80,${MAX_BATCH}x1x80x80 \
-#     -c /tmp/fpenet_model/fpenet_vdeployable_v3.0/int8_calibration.txt \
-#     /tmp/fpenet_model/fpenet_vdeployable_v3.0/model.etlt
+#     -c /tmp/fpenet_model/int8_calibration.txt \
+#     /tmp/fpenet_model/model.etlt
 
-## FP32 Calibration
+## Calibration
 /opt/tao-converter \
     -k nvidia_tlt \
     -o conv_keypoints_m80 \
     -d 1,80,80 \
     -i nchw \
     -e /models/fpenet/1/model.trt \
     -p input_face_images,${MIN_BATCH}x1x80x80,${OPT_BATCH}x1x80x80,${MAX_BATCH}x1x80x80 \
-    /tmp/fpenet_model/fpenet_vdeployable_v3.0/model.etlt
+    /tmp/fpenet_model/model.etlt
@@ -1,11 +1,15 @@
 name: "facenet"
 platform: "tensorrt_plan"
 default_model_filename: "model.trt"
-max_batch_size: 1
+max_batch_size: 32
+dynamic_batching {
+  preferred_batch_size: [ 8, 16, 32 ]
+  max_queue_delay_microseconds: 100
+  }
 
 instance_group [
   {
-    count: 4
+    count: 2
     kind: KIND_GPU
   }
 ]
@@ -46,9 +50,9 @@ parameters {
   }
 }
 
-parameters {        
+parameters {
   key: "license"
   value: {
       string_value: "License to use this model is covered by the Model EULA. By downloading the unpruned or pruned version of the model, you accept the terms and conditions of these licenses. https://developer.nvidia.com/deep-learning-models-license-agreement"
   }
-}
+}
@@ -1,7 +1,6 @@
 name: "facenet_ensemble"
 platform: "ensemble"
-max_batch_size: 1
-
+max_batch_size: 32
 
 input [
   {
@@ -90,4 +89,4 @@ output [
         }
       }
     ]
-  }
+  }
@@ -1,15 +1,19 @@
 name: "facenet_postprocess"
 backend: "python"
 default_model_filename: "model.py"
-max_batch_size: 1
+max_batch_size: 32
+dynamic_batching {
+  preferred_batch_size: [ 8, 16, 32 ]
+  max_queue_delay_microseconds: 100
+  }
 
 instance_group [
   {
-    count: 4
-    kind: KIND_CPU
+    count: 2
+    kind: KIND_GPU
   }
 ]
-  
+
 input [
     {
       name: "output_bbox/BiasAdd"
@@ -39,4 +43,4 @@ output [
     data_type: TYPE_FP32,
     dims: [ -1, 1 ]
   }
-]
+]
Original file line number	Diff line number	Diff line change
`@@ -1,11 +1,15 @@`
`1`	`1`	`name: "facenet"`
`2`	`2`	`platform: "tensorrt_plan"`
`3`	`3`	`default_model_filename: "model.trt"`
`4`		`-max_batch_size: 1`
	`4`	`+max_batch_size: 32`
	`5`	`+dynamic_batching {`
	`6`	`+ preferred_batch_size: [ 8, 16, 32 ]`
	`7`	`+ max_queue_delay_microseconds: 100`
	`8`	`+ }`
`5`	`9`
`6`	`10`	`instance_group [`
`7`	`11`	`{`
`8`		`- count: 4`
	`12`	`+ count: 2`
`9`	`13`	`kind: KIND_GPU`
`10`	`14`	`}`
`11`	`15`	`]`
`@@ -46,9 +50,9 @@ parameters {`
`46`	`50`	`}`
`47`	`51`	`}`
`48`	`52`
`49`		`-parameters {`
	`53`	`+parameters {`
`50`	`54`	`key: "license"`
`51`	`55`	`value: {`
`52`	`56`	`string_value: "License to use this model is covered by the Model EULA. By downloading the unpruned or pruned version of the model, you accept the terms and conditions of these licenses. https://developer.nvidia.com/deep-learning-models-license-agreement"`
`53`	`57`	`}`
`54`		`-}`
	`58`	`+}`
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,6 @@`
`1`	`1`	`name: "facenet_ensemble"`
`2`	`2`	`platform: "ensemble"`
`3`		`-max_batch_size: 1`
`4`		`-`
	`3`	`+max_batch_size: 32`
`5`	`4`
`6`	`5`	`input [`
`7`	`6`	`{`
`@@ -90,4 +89,4 @@ output [`
`90`	`89`	`}`
`91`	`90`	`}`
`92`	`91`	`]`
`93`		`- }`
	`92`	`+ }`
Original file line number	Diff line number	Diff line change
`@@ -1,15 +1,19 @@`
`1`	`1`	`name: "facenet_postprocess"`
`2`	`2`	`backend: "python"`
`3`	`3`	`default_model_filename: "model.py"`
`4`		`-max_batch_size: 1`
	`4`	`+max_batch_size: 32`
	`5`	`+dynamic_batching {`
	`6`	`+ preferred_batch_size: [ 8, 16, 32 ]`
	`7`	`+ max_queue_delay_microseconds: 100`
	`8`	`+ }`
`5`	`9`
`6`	`10`	`instance_group [`
`7`	`11`	`{`
`8`		`- count: 4`
`9`		`- kind: KIND_CPU`
	`12`	`+ count: 2`
	`13`	`+ kind: KIND_GPU`
`10`	`14`	`}`
`11`	`15`	`]`
`12`		`-`
	`16`	`+`
`13`	`17`	`input [`
`14`	`18`	`{`
`15`	`19`	`name: "output_bbox/BiasAdd"`
`@@ -39,4 +43,4 @@ output [`
`39`	`43`	`data_type: TYPE_FP32,`
`40`	`44`	`dims: [ -1, 1 ]`
`41`	`45`	`}`
`42`		`-]`
	`46`	`+]`