Upload TensorRT & ONNX Model files
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +32 -0
- benchmark_with_trtexec.sh +37 -0
- yolo_nas_pose_l_fp16.onnx +3 -0
- yolo_nas_pose_l_fp16.onnx.best.engine +3 -0
- yolo_nas_pose_l_fp16.onnx.best.engine.err +364 -0
- yolo_nas_pose_l_fp16.onnx.best.engine.log +331 -0
- yolo_nas_pose_l_fp16.onnx.engine.err +8 -0
- yolo_nas_pose_l_fp16.onnx.engine.log +91 -0
- yolo_nas_pose_l_fp16.onnx.fp16.engine +3 -0
- yolo_nas_pose_l_fp16.onnx.fp16.engine.err +423 -0
- yolo_nas_pose_l_fp16.onnx.fp16.engine.log +328 -0
- yolo_nas_pose_l_fp16.onnx.int8.engine.err +8 -0
- yolo_nas_pose_l_fp16.onnx.int8.engine.log +92 -0
- yolo_nas_pose_l_fp16.onnx.usage.txt +58 -0
- yolo_nas_pose_l_fp32.onnx +3 -0
- yolo_nas_pose_l_fp32.onnx.best.engine +3 -0
- yolo_nas_pose_l_fp32.onnx.best.engine.err +504 -0
- yolo_nas_pose_l_fp32.onnx.best.engine.log +331 -0
- yolo_nas_pose_l_fp32.onnx.engine +3 -0
- yolo_nas_pose_l_fp32.onnx.engine.err +237 -0
- yolo_nas_pose_l_fp32.onnx.engine.log +326 -0
- yolo_nas_pose_l_fp32.onnx.fp16.engine +3 -0
- yolo_nas_pose_l_fp32.onnx.fp16.engine.err +401 -0
- yolo_nas_pose_l_fp32.onnx.fp16.engine.log +328 -0
- yolo_nas_pose_l_fp32.onnx.int8.engine +3 -0
- yolo_nas_pose_l_fp32.onnx.int8.engine.err +256 -0
- yolo_nas_pose_l_fp32.onnx.int8.engine.log +332 -0
- yolo_nas_pose_l_fp32.onnx.usage.txt +58 -0
- yolo_nas_pose_l_int8.onnx +3 -0
- yolo_nas_pose_l_int8.onnx.best.engine +3 -0
- yolo_nas_pose_l_int8.onnx.best.engine.err +7 -0
- yolo_nas_pose_l_int8.onnx.best.engine.log +357 -0
- yolo_nas_pose_l_int8.onnx.engine.err +8 -0
- yolo_nas_pose_l_int8.onnx.engine.log +91 -0
- yolo_nas_pose_l_int8.onnx.fp16.engine.err +8 -0
- yolo_nas_pose_l_int8.onnx.fp16.engine.log +91 -0
- yolo_nas_pose_l_int8.onnx.int8.engine +3 -0
- yolo_nas_pose_l_int8.onnx.int8.engine.err +7 -0
- yolo_nas_pose_l_int8.onnx.int8.engine.log +357 -0
- yolo_nas_pose_l_int8.onnx.usage.txt +58 -0
- yolo_nas_pose_m_fp16.onnx +3 -0
- yolo_nas_pose_m_fp16.onnx.best.engine +3 -0
- yolo_nas_pose_m_fp16.onnx.best.engine.err +406 -0
- yolo_nas_pose_m_fp16.onnx.best.engine.log +312 -0
- yolo_nas_pose_m_fp16.onnx.engine.err +8 -0
- yolo_nas_pose_m_fp16.onnx.engine.log +91 -0
- yolo_nas_pose_m_fp16.onnx.fp16.engine +3 -0
- yolo_nas_pose_m_fp16.onnx.fp16.engine.err +348 -0
- yolo_nas_pose_m_fp16.onnx.fp16.engine.log +309 -0
- yolo_nas_pose_m_fp16.onnx.int8.engine.err +8 -0
.gitattributes
CHANGED
@@ -33,3 +33,35 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
yolo_nas_pose_l_fp16.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
37 |
+
yolo_nas_pose_l_fp16.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
38 |
+
yolo_nas_pose_l_fp32.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
39 |
+
yolo_nas_pose_l_fp32.onnx.engine filter=lfs diff=lfs merge=lfs -text
|
40 |
+
yolo_nas_pose_l_fp32.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
41 |
+
yolo_nas_pose_l_fp32.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
42 |
+
yolo_nas_pose_l_int8.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
43 |
+
yolo_nas_pose_l_int8.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
44 |
+
yolo_nas_pose_m_fp16.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
45 |
+
yolo_nas_pose_m_fp16.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
46 |
+
yolo_nas_pose_m_fp32.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
47 |
+
yolo_nas_pose_m_fp32.onnx.engine filter=lfs diff=lfs merge=lfs -text
|
48 |
+
yolo_nas_pose_m_fp32.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
49 |
+
yolo_nas_pose_m_fp32.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
50 |
+
yolo_nas_pose_m_int8.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
51 |
+
yolo_nas_pose_m_int8.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
52 |
+
yolo_nas_pose_n_fp16.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
53 |
+
yolo_nas_pose_n_fp16.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
54 |
+
yolo_nas_pose_n_fp32.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
55 |
+
yolo_nas_pose_n_fp32.onnx.engine filter=lfs diff=lfs merge=lfs -text
|
56 |
+
yolo_nas_pose_n_fp32.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
57 |
+
yolo_nas_pose_n_fp32.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
58 |
+
yolo_nas_pose_n_int8.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
59 |
+
yolo_nas_pose_n_int8.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
60 |
+
yolo_nas_pose_s_fp16.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
61 |
+
yolo_nas_pose_s_fp16.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
62 |
+
yolo_nas_pose_s_fp32.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
63 |
+
yolo_nas_pose_s_fp32.onnx.engine filter=lfs diff=lfs merge=lfs -text
|
64 |
+
yolo_nas_pose_s_fp32.onnx.fp16.engine filter=lfs diff=lfs merge=lfs -text
|
65 |
+
yolo_nas_pose_s_fp32.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
66 |
+
yolo_nas_pose_s_int8.onnx.best.engine filter=lfs diff=lfs merge=lfs -text
|
67 |
+
yolo_nas_pose_s_int8.onnx.int8.engine filter=lfs diff=lfs merge=lfs -text
|
benchmark_with_trtexec.sh
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
#!/usr/bin/env bash
#
# Build and benchmark TensorRT engines for the YOLO-NAS-Pose ONNX exports.
#
# For every model listed in onnx_models, trtexec is invoked once per
# precision mode: default (no flag), --fp16, --best and --int8.
# Each run writes into the current directory:
#   <model>.onnx[.<mode>].engine       engine path passed to --saveEngine
#   <model>.onnx[.<mode>].engine.log   trtexec stdout
#   <model>.onnx[.<mode>].engine.err   trtexec stderr
# The default-precision run has no ".<mode>" component in its file names.
#
# Usage: run from the directory that contains the .onnx files.
#   [TRTEXEC=/path/to/trtexec] ./benchmark_with_trtexec.sh
#
# NOTE: this script needs Bash (arrays); it does not run under a POSIX-only
# /bin/sh such as dash.

set -u

# Location of the trtexec binary; can be overridden from the environment.
readonly TRTEXEC="${TRTEXEC:-/usr/src/tensorrt/bin/trtexec}"

# Model base names; ".onnx" is appended when building the command line.
onnx_models=(
  "yolo_nas_pose_n_fp32"
  "yolo_nas_pose_n_fp16"
  "yolo_nas_pose_n_int8"
  "yolo_nas_pose_s_fp32"
  "yolo_nas_pose_s_fp16"
  "yolo_nas_pose_s_int8"
  "yolo_nas_pose_m_fp32"
  "yolo_nas_pose_m_fp16"
  "yolo_nas_pose_m_int8"
  "yolo_nas_pose_l_fp32"
  "yolo_nas_pose_l_fp16"
  "yolo_nas_pose_l_int8"
)

# Fail once, up front, instead of producing one "not found" .err file per run.
if ! command -v "$TRTEXEC" >/dev/null 2>&1; then
  printf 'error: trtexec not found or not executable: %s\n' "$TRTEXEC" >&2
  exit 1
fi

for onnx in "${onnx_models[@]}"; do
  for opt in "" "--fp16" "--best" "--int8"; do
    suffix=""
    args=("--onnx=${onnx}.onnx")
    if [[ -n "$opt" ]]; then
      # "--fp16" -> ".fp16"; the precision flag is only passed when non-empty,
      # so the default run does not receive an empty argument.
      suffix=".${opt#--}"
      args+=("$opt")
    fi
    engine="${onnx}.onnx${suffix}.engine"
    args+=(--avgRuns=100 --duration=15 "--saveEngine=${engine}")

    # A failing combination must not stop the sweep; report it on stderr and
    # move on to the next one.
    if ! "$TRTEXEC" "${args[@]}" >"${engine}.log" 2>"${engine}.err"; then
      printf 'warning: trtexec failed for %s (see %s.err)\n' \
        "$engine" "$engine" >&2
    fi
  done
done
|
yolo_nas_pose_l_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4da0316c679b93931da1a30d1224d280991d2350354cb8df7338b0affc154e3
|
3 |
+
size 108987993
|
yolo_nas_pose_l_fp16.onnx.best.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a88cce7911337fa5283e63dca004d66fef580a25ee5c322aad72f974c1259e3
|
3 |
+
size 57159395
|
yolo_nas_pose_l_fp16.onnx.best.engine.err
ADDED
@@ -0,0 +1,364 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-17:15:27] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-17:15:27] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-17:15:27] [W] [TRT] Calibrator is not being used. Users must provide dynamic range for all tensors that are not Int32 or Bool.
|
4 |
+
[12/28/2023-17:48:46] [W] [TRT] Tactic Device request: 4720MB Available: 2777MB. Device memory is insufficient to use tactic.
|
5 |
+
[12/28/2023-17:48:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000004.
|
6 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
7 |
+
[12/28/2023-17:48:47] [W] [TRT] Tactic Device request: 4720MB Available: 2777MB. Device memory is insufficient to use tactic.
|
8 |
+
[12/28/2023-17:48:47] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4720 detected for tactic 0x000000000000003c.
|
9 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
10 |
+
[12/28/2023-17:48:47] [W] [TRT] Tactic Device request: 4720MB Available: 2777MB. Device memory is insufficient to use tactic.
|
11 |
+
[12/28/2023-17:48:47] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000074.
|
12 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
13 |
+
[12/28/2023-17:48:52] [W] [TRT] Tactic Device request: 4706MB Available: 2784MB. Device memory is insufficient to use tactic.
|
14 |
+
[12/28/2023-17:48:53] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4706 detected for tactic 0x0000000000000004.
|
15 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
16 |
+
[12/28/2023-17:48:53] [W] [TRT] Tactic Device request: 4706MB Available: 2784MB. Device memory is insufficient to use tactic.
|
17 |
+
[12/28/2023-17:48:53] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4706 detected for tactic 0x000000000000003c.
|
18 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
19 |
+
[12/28/2023-17:48:57] [W] [TRT] Tactic Device request: 4711MB Available: 2755MB. Device memory is insufficient to use tactic.
|
20 |
+
[12/28/2023-17:48:57] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
21 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
22 |
+
[12/28/2023-17:48:58] [W] [TRT] Tactic Device request: 4711MB Available: 2755MB. Device memory is insufficient to use tactic.
|
23 |
+
[12/28/2023-17:48:58] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
24 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
25 |
+
[12/28/2023-17:48:59] [W] [TRT] Tactic Device request: 4711MB Available: 2755MB. Device memory is insufficient to use tactic.
|
26 |
+
[12/28/2023-17:48:59] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
27 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
28 |
+
[12/28/2023-17:49:04] [W] [TRT] Tactic Device request: 4702MB Available: 2754MB. Device memory is insufficient to use tactic.
|
29 |
+
[12/28/2023-17:49:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4702 detected for tactic 0x0000000000000004.
|
30 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
31 |
+
[12/28/2023-17:49:04] [W] [TRT] Tactic Device request: 4702MB Available: 2755MB. Device memory is insufficient to use tactic.
|
32 |
+
[12/28/2023-17:49:04] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4702 detected for tactic 0x000000000000003c.
|
33 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
34 |
+
[12/28/2023-17:49:08] [W] [TRT] Tactic Device request: 4711MB Available: 2711MB. Device memory is insufficient to use tactic.
|
35 |
+
[12/28/2023-17:49:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
36 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
37 |
+
[12/28/2023-17:49:09] [W] [TRT] Tactic Device request: 4711MB Available: 2711MB. Device memory is insufficient to use tactic.
|
38 |
+
[12/28/2023-17:49:09] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
39 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
40 |
+
[12/28/2023-17:49:09] [W] [TRT] Tactic Device request: 4711MB Available: 2711MB. Device memory is insufficient to use tactic.
|
41 |
+
[12/28/2023-17:49:10] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
42 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
43 |
+
[12/28/2023-17:49:15] [W] [TRT] Tactic Device request: 4702MB Available: 2710MB. Device memory is insufficient to use tactic.
|
44 |
+
[12/28/2023-17:49:15] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4702 detected for tactic 0x0000000000000004.
|
45 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
46 |
+
[12/28/2023-17:49:15] [W] [TRT] Tactic Device request: 4702MB Available: 2710MB. Device memory is insufficient to use tactic.
|
47 |
+
[12/28/2023-17:49:15] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4702 detected for tactic 0x000000000000003c.
|
48 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
49 |
+
[12/28/2023-17:56:52] [W] [TRT] Tactic Device request: 4711MB Available: 2405MB. Device memory is insufficient to use tactic.
|
50 |
+
[12/28/2023-17:56:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
51 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
52 |
+
[12/28/2023-17:56:52] [W] [TRT] Tactic Device request: 4711MB Available: 2407MB. Device memory is insufficient to use tactic.
|
53 |
+
[12/28/2023-17:56:52] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
54 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
55 |
+
[12/28/2023-17:56:52] [W] [TRT] Tactic Device request: 4711MB Available: 2407MB. Device memory is insufficient to use tactic.
|
56 |
+
[12/28/2023-17:56:52] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
57 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
58 |
+
[12/28/2023-17:56:54] [W] [TRT] Tactic Device request: 4701MB Available: 2406MB. Device memory is insufficient to use tactic.
|
59 |
+
[12/28/2023-17:56:54] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4701 detected for tactic 0x0000000000000004.
|
60 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
61 |
+
[12/28/2023-17:56:54] [W] [TRT] Tactic Device request: 4701MB Available: 2407MB. Device memory is insufficient to use tactic.
|
62 |
+
[12/28/2023-17:56:54] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4701 detected for tactic 0x000000000000003c.
|
63 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
64 |
+
[12/28/2023-17:57:13] [W] [TRT] Tactic Device request: 6275MB Available: 2406MB. Device memory is insufficient to use tactic.
|
65 |
+
[12/28/2023-17:57:13] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
66 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
67 |
+
[12/28/2023-17:57:13] [W] [TRT] Tactic Device request: 6275MB Available: 2406MB. Device memory is insufficient to use tactic.
|
68 |
+
[12/28/2023-17:57:13] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
69 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
70 |
+
[12/28/2023-17:57:13] [W] [TRT] Tactic Device request: 6275MB Available: 2406MB. Device memory is insufficient to use tactic.
|
71 |
+
[12/28/2023-17:57:13] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
72 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
73 |
+
[12/28/2023-17:57:15] [W] [TRT] Tactic Device request: 6270MB Available: 2405MB. Device memory is insufficient to use tactic.
|
74 |
+
[12/28/2023-17:57:15] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6270 detected for tactic 0x0000000000000004.
|
75 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
76 |
+
[12/28/2023-17:57:15] [W] [TRT] Tactic Device request: 6270MB Available: 2405MB. Device memory is insufficient to use tactic.
|
77 |
+
[12/28/2023-17:57:15] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6270 detected for tactic 0x000000000000003c.
|
78 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
79 |
+
[12/28/2023-18:08:00] [W] [TRT] Tactic Device request: 7056MB Available: 2739MB. Device memory is insufficient to use tactic.
|
80 |
+
[12/28/2023-18:08:00] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
81 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
82 |
+
[12/28/2023-18:08:01] [W] [TRT] Tactic Device request: 7056MB Available: 2738MB. Device memory is insufficient to use tactic.
|
83 |
+
[12/28/2023-18:08:01] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
84 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
85 |
+
[12/28/2023-18:08:01] [W] [TRT] Tactic Device request: 7056MB Available: 2738MB. Device memory is insufficient to use tactic.
|
86 |
+
[12/28/2023-18:08:01] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
87 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
88 |
+
[12/28/2023-18:08:03] [W] [TRT] Tactic Device request: 7050MB Available: 2738MB. Device memory is insufficient to use tactic.
|
89 |
+
[12/28/2023-18:08:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7050 detected for tactic 0x0000000000000004.
|
90 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
91 |
+
[12/28/2023-18:08:03] [W] [TRT] Tactic Device request: 7050MB Available: 2739MB. Device memory is insufficient to use tactic.
|
92 |
+
[12/28/2023-18:08:03] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 7050 detected for tactic 0x000000000000003c.
|
93 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
94 |
+
[12/28/2023-18:08:23] [W] [TRT] Tactic Device request: 6354MB Available: 2732MB. Device memory is insufficient to use tactic.
|
95 |
+
[12/28/2023-18:08:24] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
96 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
97 |
+
[12/28/2023-18:08:24] [W] [TRT] Tactic Device request: 6354MB Available: 2731MB. Device memory is insufficient to use tactic.
|
98 |
+
[12/28/2023-18:08:24] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
99 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
100 |
+
[12/28/2023-18:08:24] [W] [TRT] Tactic Device request: 6354MB Available: 2732MB. Device memory is insufficient to use tactic.
|
101 |
+
[12/28/2023-18:08:24] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
102 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
103 |
+
[12/28/2023-18:08:26] [W] [TRT] Tactic Device request: 6351MB Available: 2732MB. Device memory is insufficient to use tactic.
|
104 |
+
[12/28/2023-18:08:26] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6351 detected for tactic 0x0000000000000004.
|
105 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
106 |
+
[12/28/2023-18:08:26] [W] [TRT] Tactic Device request: 6351MB Available: 2732MB. Device memory is insufficient to use tactic.
|
107 |
+
[12/28/2023-18:08:26] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6351 detected for tactic 0x000000000000003c.
|
108 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
109 |
+
[12/28/2023-18:23:59] [W] [TRT] Tactic Device request: 6540MB Available: 2641MB. Device memory is insufficient to use tactic.
|
110 |
+
[12/28/2023-18:23:59] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000004.
|
111 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
112 |
+
[12/28/2023-18:23:59] [W] [TRT] Tactic Device request: 6540MB Available: 2641MB. Device memory is insufficient to use tactic.
|
113 |
+
[12/28/2023-18:23:59] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6540 detected for tactic 0x000000000000003c.
|
114 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
115 |
+
[12/28/2023-18:23:59] [W] [TRT] Tactic Device request: 6540MB Available: 2641MB. Device memory is insufficient to use tactic.
|
116 |
+
[12/28/2023-18:23:59] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000074.
|
117 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
118 |
+
[12/28/2023-18:24:01] [W] [TRT] Tactic Device request: 6538MB Available: 2642MB. Device memory is insufficient to use tactic.
|
119 |
+
[12/28/2023-18:24:01] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6538 detected for tactic 0x0000000000000004.
|
120 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
121 |
+
[12/28/2023-18:24:01] [W] [TRT] Tactic Device request: 6538MB Available: 2641MB. Device memory is insufficient to use tactic.
|
122 |
+
[12/28/2023-18:24:01] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6538 detected for tactic 0x000000000000003c.
|
123 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
124 |
+
[12/28/2023-18:32:34] [W] [TRT] Tactic Device request: 2457MB Available: 2443MB. Device memory is insufficient to use tactic.
|
125 |
+
[12/28/2023-18:32:34] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000004.
|
126 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
127 |
+
[12/28/2023-18:32:34] [W] [TRT] Tactic Device request: 2457MB Available: 2444MB. Device memory is insufficient to use tactic.
|
128 |
+
[12/28/2023-18:32:34] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
129 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
130 |
+
[12/28/2023-18:32:34] [W] [TRT] Tactic Device request: 2457MB Available: 2444MB. Device memory is insufficient to use tactic.
|
131 |
+
[12/28/2023-18:32:34] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
132 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
133 |
+
[12/28/2023-18:32:35] [W] [TRT] Tactic Device request: 2456MB Available: 2444MB. Device memory is insufficient to use tactic.
|
134 |
+
[12/28/2023-18:32:35] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2456 detected for tactic 0x0000000000000004.
|
135 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
136 |
+
[12/28/2023-18:32:35] [W] [TRT] Tactic Device request: 2456MB Available: 2444MB. Device memory is insufficient to use tactic.
|
137 |
+
[12/28/2023-18:32:35] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2456 detected for tactic 0x000000000000003c.
|
138 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
139 |
+
[12/28/2023-18:33:03] [W] [TRT] Tactic Device request: 3587MB Available: 2405MB. Device memory is insufficient to use tactic.
|
140 |
+
[12/28/2023-18:33:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
141 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
142 |
+
[12/28/2023-18:33:03] [W] [TRT] Tactic Device request: 3587MB Available: 2405MB. Device memory is insufficient to use tactic.
|
143 |
+
[12/28/2023-18:33:03] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
144 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
145 |
+
[12/28/2023-18:33:03] [W] [TRT] Tactic Device request: 3587MB Available: 2405MB. Device memory is insufficient to use tactic.
|
146 |
+
[12/28/2023-18:33:03] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
147 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
148 |
+
[12/28/2023-18:33:04] [W] [TRT] Tactic Device request: 3585MB Available: 2405MB. Device memory is insufficient to use tactic.
|
149 |
+
[12/28/2023-18:33:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3585 detected for tactic 0x0000000000000004.
|
150 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
151 |
+
[12/28/2023-18:33:04] [W] [TRT] Tactic Device request: 3585MB Available: 2405MB. Device memory is insufficient to use tactic.
|
152 |
+
[12/28/2023-18:33:04] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3585 detected for tactic 0x000000000000003c.
|
153 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
154 |
+
[12/28/2023-18:45:49] [W] [TRT] Tactic Device request: 3556MB Available: 2253MB. Device memory is insufficient to use tactic.
|
155 |
+
[12/28/2023-18:45:49] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
156 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
157 |
+
[12/28/2023-18:45:49] [W] [TRT] Tactic Device request: 3556MB Available: 2254MB. Device memory is insufficient to use tactic.
|
158 |
+
[12/28/2023-18:45:49] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
159 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
160 |
+
[12/28/2023-18:45:49] [W] [TRT] Tactic Device request: 3556MB Available: 2254MB. Device memory is insufficient to use tactic.
|
161 |
+
[12/28/2023-18:45:49] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
162 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
163 |
+
[12/28/2023-18:45:50] [W] [TRT] Tactic Device request: 3551MB Available: 2254MB. Device memory is insufficient to use tactic.
|
164 |
+
[12/28/2023-18:45:50] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3551 detected for tactic 0x0000000000000004.
|
165 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
166 |
+
[12/28/2023-18:45:50] [W] [TRT] Tactic Device request: 3551MB Available: 2254MB. Device memory is insufficient to use tactic.
|
167 |
+
[12/28/2023-18:45:50] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3551 detected for tactic 0x000000000000003c.
|
168 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
169 |
+
[12/28/2023-18:45:52] [W] [TRT] Tactic Device request: 3140MB Available: 2253MB. Device memory is insufficient to use tactic.
|
170 |
+
[12/28/2023-18:45:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000004.
|
171 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
172 |
+
[12/28/2023-18:45:52] [W] [TRT] Tactic Device request: 3140MB Available: 2253MB. Device memory is insufficient to use tactic.
|
173 |
+
[12/28/2023-18:45:52] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3140 detected for tactic 0x000000000000003c.
|
174 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
175 |
+
[12/28/2023-18:45:52] [W] [TRT] Tactic Device request: 3140MB Available: 2253MB. Device memory is insufficient to use tactic.
|
176 |
+
[12/28/2023-18:45:52] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000074.
|
177 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
178 |
+
[12/28/2023-18:45:53] [W] [TRT] Tactic Device request: 3136MB Available: 2253MB. Device memory is insufficient to use tactic.
|
179 |
+
[12/28/2023-18:45:53] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3136 detected for tactic 0x0000000000000004.
|
180 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
181 |
+
[12/28/2023-18:45:53] [W] [TRT] Tactic Device request: 3136MB Available: 2253MB. Device memory is insufficient to use tactic.
|
182 |
+
[12/28/2023-18:45:53] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3136 detected for tactic 0x000000000000003c.
|
183 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
184 |
+
[12/28/2023-18:57:51] [W] [TRT] Tactic Device request: 3161MB Available: 2021MB. Device memory is insufficient to use tactic.
|
185 |
+
[12/28/2023-18:57:51] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000004.
|
186 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
187 |
+
[12/28/2023-18:57:51] [W] [TRT] Tactic Device request: 3161MB Available: 2021MB. Device memory is insufficient to use tactic.
|
188 |
+
[12/28/2023-18:57:51] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3161 detected for tactic 0x000000000000003c.
|
189 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
190 |
+
[12/28/2023-18:57:51] [W] [TRT] Tactic Device request: 3161MB Available: 2021MB. Device memory is insufficient to use tactic.
|
191 |
+
[12/28/2023-18:57:51] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000074.
|
192 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
193 |
+
[12/28/2023-18:57:52] [W] [TRT] Tactic Device request: 3156MB Available: 2021MB. Device memory is insufficient to use tactic.
|
194 |
+
[12/28/2023-18:57:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3156 detected for tactic 0x0000000000000004.
|
195 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
196 |
+
[12/28/2023-18:57:52] [W] [TRT] Tactic Device request: 3156MB Available: 2021MB. Device memory is insufficient to use tactic.
|
197 |
+
[12/28/2023-18:57:52] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3156 detected for tactic 0x000000000000003c.
|
198 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
199 |
+
[12/28/2023-18:57:59] [W] [TRT] Tactic Device request: 4189MB Available: 2022MB. Device memory is insufficient to use tactic.
|
200 |
+
[12/28/2023-18:57:59] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000004.
|
201 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
202 |
+
[12/28/2023-18:57:59] [W] [TRT] Tactic Device request: 4189MB Available: 2015MB. Device memory is insufficient to use tactic.
|
203 |
+
[12/28/2023-18:57:59] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4189 detected for tactic 0x000000000000003c.
|
204 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
205 |
+
[12/28/2023-18:58:00] [W] [TRT] Tactic Device request: 4189MB Available: 2016MB. Device memory is insufficient to use tactic.
|
206 |
+
[12/28/2023-18:58:00] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000074.
|
207 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
208 |
+
[12/28/2023-18:58:04] [W] [TRT] Tactic Device request: 4183MB Available: 2018MB. Device memory is insufficient to use tactic.
|
209 |
+
[12/28/2023-18:58:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4183 detected for tactic 0x0000000000000004.
|
210 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
211 |
+
[12/28/2023-18:58:04] [W] [TRT] Tactic Device request: 4183MB Available: 2017MB. Device memory is insufficient to use tactic.
|
212 |
+
[12/28/2023-18:58:04] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4183 detected for tactic 0x000000000000003c.
|
213 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
214 |
+
[12/28/2023-18:58:08] [W] [TRT] Tactic Device request: 4186MB Available: 2017MB. Device memory is insufficient to use tactic.
|
215 |
+
[12/28/2023-18:58:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000004.
|
216 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
217 |
+
[12/28/2023-18:58:08] [W] [TRT] Tactic Device request: 4186MB Available: 2015MB. Device memory is insufficient to use tactic.
|
218 |
+
[12/28/2023-18:58:08] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4186 detected for tactic 0x000000000000003c.
|
219 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
220 |
+
[12/28/2023-18:58:09] [W] [TRT] Tactic Device request: 4186MB Available: 2016MB. Device memory is insufficient to use tactic.
|
221 |
+
[12/28/2023-18:58:09] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000074.
|
222 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
223 |
+
[12/28/2023-18:58:13] [W] [TRT] Tactic Device request: 4182MB Available: 2016MB. Device memory is insufficient to use tactic.
|
224 |
+
[12/28/2023-18:58:13] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4182 detected for tactic 0x0000000000000004.
|
225 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
226 |
+
[12/28/2023-18:58:13] [W] [TRT] Tactic Device request: 4182MB Available: 2015MB. Device memory is insufficient to use tactic.
|
227 |
+
[12/28/2023-18:58:13] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4182 detected for tactic 0x000000000000003c.
|
228 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
229 |
+
[12/28/2023-19:10:51] [W] [TRT] Tactic Device request: 4764MB Available: 1955MB. Device memory is insufficient to use tactic.
|
230 |
+
[12/28/2023-19:10:51] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000004.
|
231 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
232 |
+
[12/28/2023-19:10:52] [W] [TRT] Tactic Device request: 4764MB Available: 1953MB. Device memory is insufficient to use tactic.
|
233 |
+
[12/28/2023-19:10:52] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4764 detected for tactic 0x000000000000003c.
|
234 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
235 |
+
[12/28/2023-19:10:52] [W] [TRT] Tactic Device request: 4764MB Available: 1953MB. Device memory is insufficient to use tactic.
|
236 |
+
[12/28/2023-19:10:52] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000074.
|
237 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
238 |
+
[12/28/2023-19:10:53] [W] [TRT] Tactic Device request: 4761MB Available: 1954MB. Device memory is insufficient to use tactic.
|
239 |
+
[12/28/2023-19:10:53] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4761 detected for tactic 0x0000000000000004.
|
240 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
241 |
+
[12/28/2023-19:10:53] [W] [TRT] Tactic Device request: 4761MB Available: 1954MB. Device memory is insufficient to use tactic.
|
242 |
+
[12/28/2023-19:10:53] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4761 detected for tactic 0x000000000000003c.
|
243 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
244 |
+
[12/28/2023-19:11:02] [W] [TRT] Tactic Device request: 4244MB Available: 1769MB. Device memory is insufficient to use tactic.
|
245 |
+
[12/28/2023-19:11:02] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000004.
|
246 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
247 |
+
[12/28/2023-19:11:03] [W] [TRT] Tactic Device request: 4244MB Available: 1768MB. Device memory is insufficient to use tactic.
|
248 |
+
[12/28/2023-19:11:03] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4244 detected for tactic 0x000000000000003c.
|
249 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
250 |
+
[12/28/2023-19:11:04] [W] [TRT] Tactic Device request: 4244MB Available: 1775MB. Device memory is insufficient to use tactic.
|
251 |
+
[12/28/2023-19:11:04] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000074.
|
252 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
253 |
+
[12/28/2023-19:11:09] [W] [TRT] Tactic Device request: 4240MB Available: 1773MB. Device memory is insufficient to use tactic.
|
254 |
+
[12/28/2023-19:11:09] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4240 detected for tactic 0x0000000000000004.
|
255 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
256 |
+
[12/28/2023-19:11:09] [W] [TRT] Tactic Device request: 4240MB Available: 1771MB. Device memory is insufficient to use tactic.
|
257 |
+
[12/28/2023-19:11:09] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4240 detected for tactic 0x000000000000003c.
|
258 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
259 |
+
[12/28/2023-19:11:14] [W] [TRT] Tactic Device request: 4241MB Available: 1774MB. Device memory is insufficient to use tactic.
|
260 |
+
[12/28/2023-19:11:14] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000004.
|
261 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
262 |
+
[12/28/2023-19:11:15] [W] [TRT] Tactic Device request: 4241MB Available: 1772MB. Device memory is insufficient to use tactic.
|
263 |
+
[12/28/2023-19:11:15] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4241 detected for tactic 0x000000000000003c.
|
264 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
265 |
+
[12/28/2023-19:11:16] [W] [TRT] Tactic Device request: 4241MB Available: 1770MB. Device memory is insufficient to use tactic.
|
266 |
+
[12/28/2023-19:11:16] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000074.
|
267 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
268 |
+
[12/28/2023-19:11:21] [W] [TRT] Tactic Device request: 4239MB Available: 1769MB. Device memory is insufficient to use tactic.
|
269 |
+
[12/28/2023-19:11:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4239 detected for tactic 0x0000000000000004.
|
270 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
271 |
+
[12/28/2023-19:11:22] [W] [TRT] Tactic Device request: 4239MB Available: 1768MB. Device memory is insufficient to use tactic.
|
272 |
+
[12/28/2023-19:11:22] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4239 detected for tactic 0x000000000000003c.
|
273 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
274 |
+
[12/28/2023-19:25:07] [W] [TRT] Tactic Device request: 1638MB Available: 1546MB. Device memory is insufficient to use tactic.
|
275 |
+
[12/28/2023-19:25:07] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 1638 detected for tactic 0x000000000000003c.
|
276 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
277 |
+
[12/28/2023-19:25:07] [W] [TRT] Tactic Device request: 1638MB Available: 1546MB. Device memory is insufficient to use tactic.
|
278 |
+
[12/28/2023-19:25:07] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 1638 detected for tactic 0x0000000000000074.
|
279 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
280 |
+
[12/28/2023-19:25:08] [W] [TRT] Tactic Device request: 1637MB Available: 1557MB. Device memory is insufficient to use tactic.
|
281 |
+
[12/28/2023-19:25:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000004.
|
282 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
283 |
+
[12/28/2023-19:25:08] [W] [TRT] Tactic Device request: 1637MB Available: 1557MB. Device memory is insufficient to use tactic.
|
284 |
+
[12/28/2023-19:25:08] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 1637 detected for tactic 0x000000000000003c.
|
285 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
286 |
+
[12/28/2023-19:25:10] [W] [TRT] Tactic Device request: 3270MB Available: 1560MB. Device memory is insufficient to use tactic.
|
287 |
+
[12/28/2023-19:25:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000004.
|
288 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
289 |
+
[12/28/2023-19:25:10] [W] [TRT] Tactic Device request: 3270MB Available: 1560MB. Device memory is insufficient to use tactic.
|
290 |
+
[12/28/2023-19:25:10] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3270 detected for tactic 0x000000000000003c.
|
291 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
292 |
+
[12/28/2023-19:25:10] [W] [TRT] Tactic Device request: 3270MB Available: 1560MB. Device memory is insufficient to use tactic.
|
293 |
+
[12/28/2023-19:25:10] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000074.
|
294 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
295 |
+
[12/28/2023-19:25:12] [W] [TRT] Tactic Device request: 3269MB Available: 1558MB. Device memory is insufficient to use tactic.
|
296 |
+
[12/28/2023-19:25:12] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3269 detected for tactic 0x0000000000000004.
|
297 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
298 |
+
[12/28/2023-19:25:12] [W] [TRT] Tactic Device request: 3269MB Available: 1558MB. Device memory is insufficient to use tactic.
|
299 |
+
[12/28/2023-19:25:12] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3269 detected for tactic 0x000000000000003c.
|
300 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
301 |
+
[12/28/2023-19:25:15] [W] [TRT] Tactic Device request: 4377MB Available: 1563MB. Device memory is insufficient to use tactic.
|
302 |
+
[12/28/2023-19:25:15] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000004.
|
303 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
304 |
+
[12/28/2023-19:25:15] [W] [TRT] Tactic Device request: 2185MB Available: 1563MB. Device memory is insufficient to use tactic.
|
305 |
+
[12/28/2023-19:25:15] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000005.
|
306 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
307 |
+
[12/28/2023-19:25:16] [W] [TRT] Tactic Device request: 4377MB Available: 1563MB. Device memory is insufficient to use tactic.
|
308 |
+
[12/28/2023-19:25:16] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4377 detected for tactic 0x000000000000003c.
|
309 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
310 |
+
[12/28/2023-19:25:16] [W] [TRT] Tactic Device request: 2185MB Available: 1563MB. Device memory is insufficient to use tactic.
|
311 |
+
[12/28/2023-19:25:16] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2185 detected for tactic 0x000000000000003d.
|
312 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
313 |
+
[12/28/2023-19:25:16] [W] [TRT] Tactic Device request: 4377MB Available: 1561MB. Device memory is insufficient to use tactic.
|
314 |
+
[12/28/2023-19:25:16] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000074.
|
315 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
316 |
+
[12/28/2023-19:25:16] [W] [TRT] Tactic Device request: 2185MB Available: 1561MB. Device memory is insufficient to use tactic.
|
317 |
+
[12/28/2023-19:25:16] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000075.
|
318 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
319 |
+
[12/28/2023-19:25:22] [W] [TRT] Tactic Device request: 4375MB Available: 1748MB. Device memory is insufficient to use tactic.
|
320 |
+
[12/28/2023-19:25:22] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
321 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
322 |
+
[12/28/2023-19:25:22] [W] [TRT] Tactic Device request: 2183MB Available: 1748MB. Device memory is insufficient to use tactic.
|
323 |
+
[12/28/2023-19:25:22] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
324 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
325 |
+
[12/28/2023-19:25:22] [W] [TRT] Tactic Device request: 4375MB Available: 1748MB. Device memory is insufficient to use tactic.
|
326 |
+
[12/28/2023-19:25:22] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
327 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
328 |
+
[12/28/2023-19:25:22] [W] [TRT] Tactic Device request: 2183MB Available: 1749MB. Device memory is insufficient to use tactic.
|
329 |
+
[12/28/2023-19:25:22] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
330 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
331 |
+
[12/28/2023-19:25:29] [W] [TRT] Tactic Device request: 4376MB Available: 1746MB. Device memory is insufficient to use tactic.
|
332 |
+
[12/28/2023-19:25:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000004.
|
333 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
334 |
+
[12/28/2023-19:25:29] [W] [TRT] Tactic Device request: 2184MB Available: 1746MB. Device memory is insufficient to use tactic.
|
335 |
+
[12/28/2023-19:25:29] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000005.
|
336 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
337 |
+
[12/28/2023-19:25:29] [W] [TRT] Tactic Device request: 4376MB Available: 1746MB. Device memory is insufficient to use tactic.
|
338 |
+
[12/28/2023-19:25:29] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4376 detected for tactic 0x000000000000003c.
|
339 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
340 |
+
[12/28/2023-19:25:29] [W] [TRT] Tactic Device request: 2184MB Available: 1746MB. Device memory is insufficient to use tactic.
|
341 |
+
[12/28/2023-19:25:29] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2184 detected for tactic 0x000000000000003d.
|
342 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
343 |
+
[12/28/2023-19:25:30] [W] [TRT] Tactic Device request: 4376MB Available: 1746MB. Device memory is insufficient to use tactic.
|
344 |
+
[12/28/2023-19:25:30] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000074.
|
345 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
346 |
+
[12/28/2023-19:25:30] [W] [TRT] Tactic Device request: 2184MB Available: 1746MB. Device memory is insufficient to use tactic.
|
347 |
+
[12/28/2023-19:25:30] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000075.
|
348 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
349 |
+
[12/28/2023-19:25:36] [W] [TRT] Tactic Device request: 4375MB Available: 1750MB. Device memory is insufficient to use tactic.
|
350 |
+
[12/28/2023-19:25:36] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
351 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
352 |
+
[12/28/2023-19:25:36] [W] [TRT] Tactic Device request: 2183MB Available: 1750MB. Device memory is insufficient to use tactic.
|
353 |
+
[12/28/2023-19:25:36] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
354 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
355 |
+
[12/28/2023-19:25:36] [W] [TRT] Tactic Device request: 4375MB Available: 1750MB. Device memory is insufficient to use tactic.
|
356 |
+
[12/28/2023-19:25:36] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
357 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
358 |
+
[12/28/2023-19:25:36] [W] [TRT] Tactic Device request: 2183MB Available: 1750MB. Device memory is insufficient to use tactic.
|
359 |
+
[12/28/2023-19:25:36] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
360 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
361 |
+
[12/28/2023-19:26:56] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
362 |
+
[12/28/2023-19:26:56] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
363 |
+
[12/28/2023-19:26:56] [W] * GPU compute time is unstable, with coefficient of variance = 6.77541%.
|
364 |
+
[12/28/2023-19:26:56] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_fp16.onnx.best.engine.log
ADDED
@@ -0,0 +1,331 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.best.engine
|
2 |
+
[12/28/2023-17:15:16] [I] === Model Options ===
|
3 |
+
[12/28/2023-17:15:16] [I] Format: ONNX
|
4 |
+
[12/28/2023-17:15:16] [I] Model: yolo_nas_pose_l_fp16.onnx
|
5 |
+
[12/28/2023-17:15:16] [I] Output:
|
6 |
+
[12/28/2023-17:15:16] [I] === Build Options ===
|
7 |
+
[12/28/2023-17:15:16] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-17:15:16] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-17:15:16] [I] minTiming: 1
|
10 |
+
[12/28/2023-17:15:16] [I] avgTiming: 8
|
11 |
+
[12/28/2023-17:15:16] [I] Precision: FP32+FP16+INT8
|
12 |
+
[12/28/2023-17:15:16] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-17:15:16] [I] Calibration: Dynamic
|
14 |
+
[12/28/2023-17:15:16] [I] Refit: Disabled
|
15 |
+
[12/28/2023-17:15:16] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-17:15:16] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-17:15:16] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-17:15:16] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-17:15:16] [I] Build only: Disabled
|
20 |
+
[12/28/2023-17:15:16] [I] Save engine: yolo_nas_pose_l_fp16.onnx.best.engine
|
21 |
+
[12/28/2023-17:15:16] [I] Load engine:
|
22 |
+
[12/28/2023-17:15:16] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-17:15:16] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-17:15:16] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-17:15:16] [I] timingCacheFile:
|
26 |
+
[12/28/2023-17:15:16] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-17:15:16] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-17:15:16] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-17:15:16] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-17:15:16] [I] Input build shapes: model
|
31 |
+
[12/28/2023-17:15:16] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-17:15:16] [I] === System Options ===
|
33 |
+
[12/28/2023-17:15:16] [I] Device: 0
|
34 |
+
[12/28/2023-17:15:16] [I] DLACore:
|
35 |
+
[12/28/2023-17:15:16] [I] Plugins:
|
36 |
+
[12/28/2023-17:15:16] [I] === Inference Options ===
|
37 |
+
[12/28/2023-17:15:16] [I] Batch: Explicit
|
38 |
+
[12/28/2023-17:15:16] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-17:15:16] [I] Iterations: 10
|
40 |
+
[12/28/2023-17:15:16] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-17:15:16] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-17:15:16] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-17:15:16] [I] Streams: 1
|
44 |
+
[12/28/2023-17:15:16] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-17:15:16] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-17:15:16] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-17:15:16] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-17:15:16] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-17:15:16] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-17:15:16] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-17:15:16] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-17:15:16] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-17:15:16] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-17:15:16] [I] Inputs:
|
55 |
+
[12/28/2023-17:15:16] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-17:15:16] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-17:15:16] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-17:15:16] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-17:15:16] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-17:15:16] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-17:15:16] [I] Profile: Disabled
|
62 |
+
[12/28/2023-17:15:16] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-17:15:16] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-17:15:16] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-17:15:16] [I]
|
66 |
+
[12/28/2023-17:15:16] [I] === Device Information ===
|
67 |
+
[12/28/2023-17:15:16] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-17:15:16] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-17:15:16] [I] SMs: 8
|
70 |
+
[12/28/2023-17:15:16] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-17:15:16] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-17:15:16] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-17:15:16] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-17:15:16] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-17:15:16] [I]
|
76 |
+
[12/28/2023-17:15:16] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-17:15:21] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2974 (MiB)
|
78 |
+
[12/28/2023-17:15:25] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +286, now: CPU 574, GPU 3278 (MiB)
|
79 |
+
[12/28/2023-17:15:25] [I] Start parsing network model
|
80 |
+
[12/28/2023-17:15:27] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-17:15:27] [I] [TRT] Input filename: yolo_nas_pose_l_fp16.onnx
|
82 |
+
[12/28/2023-17:15:27] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-17:15:27] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-17:15:27] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-17:15:27] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-17:15:27] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-17:15:27] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-17:15:27] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-17:15:27] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-17:15:27] [I] Finish parsing network model
|
91 |
+
[12/28/2023-17:15:28] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-17:15:28] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 458) [Constant]
|
96 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 459) [Constant]
|
97 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 460) [Constant]
|
98 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
99 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
100 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
101 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
102 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
103 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
104 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
105 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
106 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
107 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
108 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
109 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
110 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
111 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
112 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
113 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
114 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
115 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
116 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
117 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
118 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
119 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
120 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
121 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
122 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
123 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
124 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
125 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
126 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
127 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
128 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
129 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
130 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
131 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
132 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
133 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
134 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
135 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
136 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
137 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
138 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
139 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
140 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
141 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
142 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
143 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
144 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
145 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
146 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
147 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
148 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
149 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
150 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
151 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
152 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
153 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
154 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
155 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
156 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
157 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
158 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
159 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
160 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
161 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
162 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
163 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
164 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv1/act/Relu_output_0 copy
|
165 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
166 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
167 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
168 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
169 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
170 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
171 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
172 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
173 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
174 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
175 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
176 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
177 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
178 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
179 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
180 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
181 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
182 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
183 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
184 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
185 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
186 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 187) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
187 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
188 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
189 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 195) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
190 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
191 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
192 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
193 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
194 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
195 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
196 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
197 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
198 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
199 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
200 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
201 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
202 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 224) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
203 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
204 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
205 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 232) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
206 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
207 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
208 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 240) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
209 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
210 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
211 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
212 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
213 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
214 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
215 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
216 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
217 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
218 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
219 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
220 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
221 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
222 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
223 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
224 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 271) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
225 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
226 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
227 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
228 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 294) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
229 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
230 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
231 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 302) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
232 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
233 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
234 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 310) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
235 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
236 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
237 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
238 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
239 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
240 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
241 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
242 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
243 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
244 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
245 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
246 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
247 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
248 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
249 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
250 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 341) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
251 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
252 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
253 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
254 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 364) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
255 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
256 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
257 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 372) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
258 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
259 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
260 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 380) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
261 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
262 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
263 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
264 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
265 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
266 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
267 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
268 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
269 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
270 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
271 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
272 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
273 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
274 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1...cast_boxes_to_fp32]}
|
275 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
276 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 462) [NMS]_1_output[DevicetoShapeHostCopy]
|
277 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
278 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
279 |
+
[12/28/2023-17:15:28] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
280 |
+
[12/28/2023-17:15:40] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +308, now: CPU 1231, GPU 3787 (MiB)
|
281 |
+
[12/28/2023-17:15:42] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +83, GPU +72, now: CPU 1314, GPU 3859 (MiB)
|
282 |
+
[12/28/2023-17:15:42] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
283 |
+
[12/28/2023-19:26:12] [I] [TRT] Total Activation Memory: 7966500352
|
284 |
+
[12/28/2023-19:26:12] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
285 |
+
[12/28/2023-19:26:29] [I] [TRT] Total Host Persistent Memory: 330912
|
286 |
+
[12/28/2023-19:26:29] [I] [TRT] Total Device Persistent Memory: 656384
|
287 |
+
[12/28/2023-19:26:29] [I] [TRT] Total Scratch Memory: 134217728
|
288 |
+
[12/28/2023-19:26:29] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 79 MiB, GPU 2398 MiB
|
289 |
+
[12/28/2023-19:26:29] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 176 steps to complete.
|
290 |
+
[12/28/2023-19:26:29] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 96.1396ms to assign 14 blocks to 176 nodes requiring 149010944 bytes.
|
291 |
+
[12/28/2023-19:26:29] [I] [TRT] Total Activation Memory: 149010944
|
292 |
+
[12/28/2023-19:26:38] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU -17, now: CPU 1718, GPU 5578 (MiB)
|
293 |
+
[12/28/2023-19:26:38] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +52, GPU +64, now: CPU 52, GPU 64 (MiB)
|
294 |
+
[12/28/2023-19:26:39] [I] Engine built in 7882.87 sec.
|
295 |
+
[12/28/2023-19:26:40] [I] [TRT] Loaded engine size: 54 MiB
|
296 |
+
[12/28/2023-19:26:41] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1299, GPU 5193 (MiB)
|
297 |
+
[12/28/2023-19:26:41] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +52, now: CPU 0, GPU 52 (MiB)
|
298 |
+
[12/28/2023-19:26:41] [I] Engine deserialized in 0.300217 sec.
|
299 |
+
[12/28/2023-19:26:41] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1300, GPU 5193 (MiB)
|
300 |
+
[12/28/2023-19:26:41] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +143, now: CPU 0, GPU 195 (MiB)
|
301 |
+
[12/28/2023-19:26:41] [I] Setting persistentCacheLimit to 0 bytes.
|
302 |
+
[12/28/2023-19:26:41] [I] Using random values for input onnx::Cast_0
|
303 |
+
[12/28/2023-19:26:41] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
304 |
+
[12/28/2023-19:26:41] [I] Using random values for output graph2_flat_predictions
|
305 |
+
[12/28/2023-19:26:41] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
306 |
+
[12/28/2023-19:26:41] [I] Starting inference
|
307 |
+
[12/28/2023-19:26:56] [I] Warmup completed 6 queries over 200 ms
|
308 |
+
[12/28/2023-19:26:56] [I] Timing trace has 703 queries over 15.0461 s
|
309 |
+
[12/28/2023-19:26:56] [I]
|
310 |
+
[12/28/2023-19:26:56] [I] === Trace details ===
|
311 |
+
[12/28/2023-19:26:56] [I] Trace averages of 100 runs:
|
312 |
+
[12/28/2023-19:26:56] [I] Average on 100 runs - GPU latency: 20.9395 ms - Host latency: 21.0535 ms (enqueue 21.0062 ms)
|
313 |
+
[12/28/2023-19:26:56] [I] Average on 100 runs - GPU latency: 21.1664 ms - Host latency: 21.2792 ms (enqueue 21.2275 ms)
|
314 |
+
[12/28/2023-19:26:56] [I] Average on 100 runs - GPU latency: 21.3262 ms - Host latency: 21.4444 ms (enqueue 21.3939 ms)
|
315 |
+
[12/28/2023-19:26:56] [I] Average on 100 runs - GPU latency: 21.3667 ms - Host latency: 21.4831 ms (enqueue 21.4306 ms)
|
316 |
+
[12/28/2023-19:26:56] [I] Average on 100 runs - GPU latency: 21.2193 ms - Host latency: 21.3339 ms (enqueue 21.2934 ms)
|
317 |
+
[12/28/2023-19:26:56] [I] Average on 100 runs - GPU latency: 21.8831 ms - Host latency: 22.0036 ms (enqueue 21.9394 ms)
|
318 |
+
[12/28/2023-19:26:56] [I] Average on 100 runs - GPU latency: 20.8839 ms - Host latency: 20.9973 ms (enqueue 20.9568 ms)
|
319 |
+
[12/28/2023-19:26:56] [I]
|
320 |
+
[12/28/2023-19:26:56] [I] === Performance summary ===
|
321 |
+
[12/28/2023-19:26:56] [I] Throughput: 46.7231 qps
|
322 |
+
[12/28/2023-19:26:56] [I] Latency: min = 19.8525 ms, max = 30.6865 ms, mean = 21.368 ms, median = 21.1562 ms, percentile(90%) = 22.2715 ms, percentile(95%) = 23.1201 ms, percentile(99%) = 28.8721 ms
|
323 |
+
[12/28/2023-19:26:56] [I] Enqueue Time: min = 19.8208 ms, max = 30.626 ms, mean = 21.3184 ms, median = 21.1201 ms, percentile(90%) = 22.2363 ms, percentile(95%) = 23.2373 ms, percentile(99%) = 28.8086 ms
|
324 |
+
[12/28/2023-19:26:56] [I] H2D Latency: min = 0.0810547 ms, max = 0.134766 ms, mean = 0.0972954 ms, median = 0.0981445 ms, percentile(90%) = 0.100098 ms, percentile(95%) = 0.100586 ms, percentile(99%) = 0.111328 ms
|
325 |
+
[12/28/2023-19:26:56] [I] GPU Compute Time: min = 19.7407 ms, max = 30.5723 ms, mean = 21.2522 ms, median = 21.042 ms, percentile(90%) = 22.1533 ms, percentile(95%) = 23.0203 ms, percentile(99%) = 28.7578 ms
|
326 |
+
[12/28/2023-19:26:56] [I] D2H Latency: min = 0.00390625 ms, max = 0.0776367 ms, mean = 0.0184049 ms, median = 0.0155029 ms, percentile(90%) = 0.0283203 ms, percentile(95%) = 0.0302734 ms, percentile(99%) = 0.046875 ms
|
327 |
+
[12/28/2023-19:26:56] [I] Total Host Walltime: 15.0461 s
|
328 |
+
[12/28/2023-19:26:56] [I] Total GPU Compute Time: 14.9403 s
|
329 |
+
[12/28/2023-19:26:56] [I] Explanations of the performance metrics are printed in the verbose logs.
|
330 |
+
[12/28/2023-19:26:56] [I]
|
331 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.best.engine
|
yolo_nas_pose_l_fp16.onnx.engine.err
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-16:09:44] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-16:09:44] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-16:09:45] [E] Error[4]: [network.cpp::validate::2925] Error Code 4: Internal Error (fp16 precision has been set for a layer or layer output, but fp16 is not configured in the builder)
|
4 |
+
[12/28/2023-16:09:45] [E] Error[2]: [builder.cpp::buildSerializedNetwork::751] Error Code 2: Internal Error (Assertion engine != nullptr failed. )
|
5 |
+
[12/28/2023-16:09:45] [E] Engine could not be created from network
|
6 |
+
[12/28/2023-16:09:45] [E] Building engine failed
|
7 |
+
[12/28/2023-16:09:45] [E] Failed to create engine from model or file.
|
8 |
+
[12/28/2023-16:09:45] [E] Engine set up failed
|
yolo_nas_pose_l_fp16.onnx.engine.log
ADDED
@@ -0,0 +1,91 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.engine
|
2 |
+
[12/28/2023-16:09:34] [I] === Model Options ===
|
3 |
+
[12/28/2023-16:09:34] [I] Format: ONNX
|
4 |
+
[12/28/2023-16:09:34] [I] Model: yolo_nas_pose_l_fp16.onnx
|
5 |
+
[12/28/2023-16:09:34] [I] Output:
|
6 |
+
[12/28/2023-16:09:34] [I] === Build Options ===
|
7 |
+
[12/28/2023-16:09:34] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-16:09:34] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-16:09:34] [I] minTiming: 1
|
10 |
+
[12/28/2023-16:09:34] [I] avgTiming: 8
|
11 |
+
[12/28/2023-16:09:34] [I] Precision: FP32
|
12 |
+
[12/28/2023-16:09:34] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-16:09:34] [I] Calibration:
|
14 |
+
[12/28/2023-16:09:34] [I] Refit: Disabled
|
15 |
+
[12/28/2023-16:09:34] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-16:09:34] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-16:09:34] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-16:09:34] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-16:09:34] [I] Build only: Disabled
|
20 |
+
[12/28/2023-16:09:34] [I] Save engine: yolo_nas_pose_l_fp16.onnx.engine
|
21 |
+
[12/28/2023-16:09:34] [I] Load engine:
|
22 |
+
[12/28/2023-16:09:34] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-16:09:34] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-16:09:34] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-16:09:34] [I] timingCacheFile:
|
26 |
+
[12/28/2023-16:09:34] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-16:09:34] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-16:09:34] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-16:09:34] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-16:09:34] [I] Input build shapes: model
|
31 |
+
[12/28/2023-16:09:34] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-16:09:34] [I] === System Options ===
|
33 |
+
[12/28/2023-16:09:34] [I] Device: 0
|
34 |
+
[12/28/2023-16:09:34] [I] DLACore:
|
35 |
+
[12/28/2023-16:09:34] [I] Plugins:
|
36 |
+
[12/28/2023-16:09:34] [I] === Inference Options ===
|
37 |
+
[12/28/2023-16:09:34] [I] Batch: Explicit
|
38 |
+
[12/28/2023-16:09:34] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-16:09:34] [I] Iterations: 10
|
40 |
+
[12/28/2023-16:09:34] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-16:09:34] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-16:09:34] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-16:09:34] [I] Streams: 1
|
44 |
+
[12/28/2023-16:09:34] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-16:09:34] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-16:09:34] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-16:09:34] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-16:09:34] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-16:09:34] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-16:09:34] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-16:09:34] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-16:09:34] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-16:09:34] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-16:09:34] [I] Inputs:
|
55 |
+
[12/28/2023-16:09:34] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-16:09:34] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-16:09:34] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-16:09:34] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-16:09:34] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-16:09:34] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-16:09:34] [I] Profile: Disabled
|
62 |
+
[12/28/2023-16:09:34] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-16:09:34] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-16:09:34] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-16:09:34] [I]
|
66 |
+
[12/28/2023-16:09:34] [I] === Device Information ===
|
67 |
+
[12/28/2023-16:09:34] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-16:09:34] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-16:09:34] [I] SMs: 8
|
70 |
+
[12/28/2023-16:09:34] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-16:09:34] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-16:09:34] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-16:09:34] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-16:09:34] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-16:09:34] [I]
|
76 |
+
[12/28/2023-16:09:34] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-16:09:39] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2974 (MiB)
|
78 |
+
[12/28/2023-16:09:43] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +283, now: CPU 574, GPU 3281 (MiB)
|
79 |
+
[12/28/2023-16:09:43] [I] Start parsing network model
|
80 |
+
[12/28/2023-16:09:44] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-16:09:44] [I] [TRT] Input filename: yolo_nas_pose_l_fp16.onnx
|
82 |
+
[12/28/2023-16:09:44] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-16:09:44] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-16:09:44] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-16:09:44] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-16:09:44] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-16:09:44] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-16:09:44] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-16:09:44] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-16:09:45] [I] Finish parsing network model
|
91 |
+
&&&& FAILED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.engine
|
yolo_nas_pose_l_fp16.onnx.fp16.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:467ff31eefb68768b955df2011c89f375ab57c09a32840d671def8b3ad75de34
|
3 |
+
size 110752021
|
yolo_nas_pose_l_fp16.onnx.fp16.engine.err
ADDED
@@ -0,0 +1,423 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-16:09:49] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-16:09:49] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-16:15:22] [W] [TRT] Tactic Device request: 4720MB Available: 3156MB. Device memory is insufficient to use tactic.
|
4 |
+
[12/28/2023-16:15:22] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000004.
|
5 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
6 |
+
[12/28/2023-16:15:23] [W] [TRT] Tactic Device request: 4720MB Available: 3155MB. Device memory is insufficient to use tactic.
|
7 |
+
[12/28/2023-16:15:23] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4720 detected for tactic 0x000000000000003c.
|
8 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
9 |
+
[12/28/2023-16:15:23] [W] [TRT] Tactic Device request: 4720MB Available: 3155MB. Device memory is insufficient to use tactic.
|
10 |
+
[12/28/2023-16:15:23] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000074.
|
11 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
12 |
+
[12/28/2023-16:15:29] [W] [TRT] Tactic Device request: 4706MB Available: 3154MB. Device memory is insufficient to use tactic.
|
13 |
+
[12/28/2023-16:15:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4706 detected for tactic 0x0000000000000004.
|
14 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
15 |
+
[12/28/2023-16:15:29] [W] [TRT] Tactic Device request: 4706MB Available: 3155MB. Device memory is insufficient to use tactic.
|
16 |
+
[12/28/2023-16:15:29] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4706 detected for tactic 0x000000000000003c.
|
17 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
18 |
+
[12/28/2023-16:15:32] [W] [TRT] Tactic Device request: 4711MB Available: 3148MB. Device memory is insufficient to use tactic.
|
19 |
+
[12/28/2023-16:15:32] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
20 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
21 |
+
[12/28/2023-16:15:32] [W] [TRT] Tactic Device request: 4711MB Available: 3147MB. Device memory is insufficient to use tactic.
|
22 |
+
[12/28/2023-16:15:32] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
23 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
24 |
+
[12/28/2023-16:15:33] [W] [TRT] Tactic Device request: 4711MB Available: 3146MB. Device memory is insufficient to use tactic.
|
25 |
+
[12/28/2023-16:15:33] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
26 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
27 |
+
[12/28/2023-16:15:38] [W] [TRT] Tactic Device request: 4702MB Available: 3147MB. Device memory is insufficient to use tactic.
|
28 |
+
[12/28/2023-16:15:38] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4702 detected for tactic 0x0000000000000004.
|
29 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
30 |
+
[12/28/2023-16:15:38] [W] [TRT] Tactic Device request: 4702MB Available: 3147MB. Device memory is insufficient to use tactic.
|
31 |
+
[12/28/2023-16:15:39] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4702 detected for tactic 0x000000000000003c.
|
32 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
33 |
+
[12/28/2023-16:20:16] [W] [TRT] Tactic Device request: 4711MB Available: 3039MB. Device memory is insufficient to use tactic.
|
34 |
+
[12/28/2023-16:20:16] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
35 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
36 |
+
[12/28/2023-16:20:16] [W] [TRT] Tactic Device request: 4711MB Available: 3039MB. Device memory is insufficient to use tactic.
|
37 |
+
[12/28/2023-16:20:16] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
38 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
39 |
+
[12/28/2023-16:20:16] [W] [TRT] Tactic Device request: 4711MB Available: 3038MB. Device memory is insufficient to use tactic.
|
40 |
+
[12/28/2023-16:20:16] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
41 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
42 |
+
[12/28/2023-16:20:18] [W] [TRT] Tactic Device request: 4701MB Available: 3039MB. Device memory is insufficient to use tactic.
|
43 |
+
[12/28/2023-16:20:18] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4701 detected for tactic 0x0000000000000004.
|
44 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
45 |
+
[12/28/2023-16:20:18] [W] [TRT] Tactic Device request: 4701MB Available: 3039MB. Device memory is insufficient to use tactic.
|
46 |
+
[12/28/2023-16:20:18] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4701 detected for tactic 0x000000000000003c.
|
47 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
48 |
+
[12/28/2023-16:20:33] [W] [TRT] Tactic Device request: 6275MB Available: 3038MB. Device memory is insufficient to use tactic.
|
49 |
+
[12/28/2023-16:20:33] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
50 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
51 |
+
[12/28/2023-16:20:33] [W] [TRT] Tactic Device request: 6275MB Available: 3039MB. Device memory is insufficient to use tactic.
|
52 |
+
[12/28/2023-16:20:33] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
53 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
54 |
+
[12/28/2023-16:20:33] [W] [TRT] Tactic Device request: 6275MB Available: 3038MB. Device memory is insufficient to use tactic.
|
55 |
+
[12/28/2023-16:20:33] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
56 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
57 |
+
[12/28/2023-16:20:35] [W] [TRT] Tactic Device request: 6270MB Available: 3039MB. Device memory is insufficient to use tactic.
|
58 |
+
[12/28/2023-16:20:35] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6270 detected for tactic 0x0000000000000004.
|
59 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
60 |
+
[12/28/2023-16:20:35] [W] [TRT] Tactic Device request: 6270MB Available: 3039MB. Device memory is insufficient to use tactic.
|
61 |
+
[12/28/2023-16:20:35] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6270 detected for tactic 0x000000000000003c.
|
62 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
63 |
+
[12/28/2023-16:27:09] [W] [TRT] Tactic Device request: 7056MB Available: 2339MB. Device memory is insufficient to use tactic.
|
64 |
+
[12/28/2023-16:27:09] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
65 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
66 |
+
[12/28/2023-16:27:09] [W] [TRT] Tactic Device request: 7056MB Available: 2340MB. Device memory is insufficient to use tactic.
|
67 |
+
[12/28/2023-16:27:09] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
68 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
69 |
+
[12/28/2023-16:27:09] [W] [TRT] Tactic Device request: 7056MB Available: 2340MB. Device memory is insufficient to use tactic.
|
70 |
+
[12/28/2023-16:27:09] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
71 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
72 |
+
[12/28/2023-16:27:11] [W] [TRT] Tactic Device request: 7050MB Available: 2338MB. Device memory is insufficient to use tactic.
|
73 |
+
[12/28/2023-16:27:11] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7050 detected for tactic 0x0000000000000004.
|
74 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
75 |
+
[12/28/2023-16:27:11] [W] [TRT] Tactic Device request: 7050MB Available: 2338MB. Device memory is insufficient to use tactic.
|
76 |
+
[12/28/2023-16:27:11] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 7050 detected for tactic 0x000000000000003c.
|
77 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
78 |
+
[12/28/2023-16:27:27] [W] [TRT] Tactic Device request: 6354MB Available: 2340MB. Device memory is insufficient to use tactic.
|
79 |
+
[12/28/2023-16:27:27] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
80 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
81 |
+
[12/28/2023-16:27:27] [W] [TRT] Tactic Device request: 6354MB Available: 2338MB. Device memory is insufficient to use tactic.
|
82 |
+
[12/28/2023-16:27:28] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
83 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
84 |
+
[12/28/2023-16:27:28] [W] [TRT] Tactic Device request: 6354MB Available: 2339MB. Device memory is insufficient to use tactic.
|
85 |
+
[12/28/2023-16:27:28] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
86 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
87 |
+
[12/28/2023-16:27:29] [W] [TRT] Tactic Device request: 6351MB Available: 2341MB. Device memory is insufficient to use tactic.
|
88 |
+
[12/28/2023-16:27:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6351 detected for tactic 0x0000000000000004.
|
89 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
90 |
+
[12/28/2023-16:27:29] [W] [TRT] Tactic Device request: 6351MB Available: 2341MB. Device memory is insufficient to use tactic.
|
91 |
+
[12/28/2023-16:27:29] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6351 detected for tactic 0x000000000000003c.
|
92 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
93 |
+
[12/28/2023-16:36:16] [W] [TRT] Tactic Device request: 2394MB Available: 2304MB. Device memory is insufficient to use tactic.
|
94 |
+
[12/28/2023-16:36:16] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000004.
|
95 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
96 |
+
[12/28/2023-16:36:16] [W] [TRT] Tactic Device request: 2394MB Available: 2304MB. Device memory is insufficient to use tactic.
|
97 |
+
[12/28/2023-16:36:16] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2394 detected for tactic 0x000000000000003c.
|
98 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
99 |
+
[12/28/2023-16:36:16] [W] [TRT] Tactic Device request: 2394MB Available: 2304MB. Device memory is insufficient to use tactic.
|
100 |
+
[12/28/2023-16:36:16] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000074.
|
101 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
102 |
+
[12/28/2023-16:36:17] [W] [TRT] Tactic Device request: 2392MB Available: 2304MB. Device memory is insufficient to use tactic.
|
103 |
+
[12/28/2023-16:36:17] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000004.
|
104 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
105 |
+
[12/28/2023-16:36:17] [W] [TRT] Tactic Device request: 2392MB Available: 2304MB. Device memory is insufficient to use tactic.
|
106 |
+
[12/28/2023-16:36:17] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2392 detected for tactic 0x000000000000003c.
|
107 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
108 |
+
[12/28/2023-16:36:17] [W] [TRT] Tactic Device request: 2392MB Available: 2304MB. Device memory is insufficient to use tactic.
|
109 |
+
[12/28/2023-16:36:17] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000074.
|
110 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
111 |
+
[12/28/2023-16:36:18] [W] [TRT] Tactic Device request: 2391MB Available: 2305MB. Device memory is insufficient to use tactic.
|
112 |
+
[12/28/2023-16:36:18] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2391 detected for tactic 0x0000000000000004.
|
113 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
114 |
+
[12/28/2023-16:36:18] [W] [TRT] Tactic Device request: 2391MB Available: 2305MB. Device memory is insufficient to use tactic.
|
115 |
+
[12/28/2023-16:36:18] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2391 detected for tactic 0x000000000000003c.
|
116 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
117 |
+
[12/28/2023-16:36:18] [W] [TRT] Tactic Device request: 2390MB Available: 2305MB. Device memory is insufficient to use tactic.
|
118 |
+
[12/28/2023-16:36:18] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000004.
|
119 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
120 |
+
[12/28/2023-16:36:18] [W] [TRT] Tactic Device request: 2390MB Available: 2305MB. Device memory is insufficient to use tactic.
|
121 |
+
[12/28/2023-16:36:18] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2390 detected for tactic 0x000000000000003c.
|
122 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
123 |
+
[12/28/2023-16:36:32] [W] [TRT] Tactic Device request: 6540MB Available: 2131MB. Device memory is insufficient to use tactic.
|
124 |
+
[12/28/2023-16:36:32] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000004.
|
125 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
126 |
+
[12/28/2023-16:36:32] [W] [TRT] Tactic Device request: 6540MB Available: 2131MB. Device memory is insufficient to use tactic.
|
127 |
+
[12/28/2023-16:36:32] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6540 detected for tactic 0x000000000000003c.
|
128 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
129 |
+
[12/28/2023-16:36:33] [W] [TRT] Tactic Device request: 6540MB Available: 2131MB. Device memory is insufficient to use tactic.
|
130 |
+
[12/28/2023-16:36:33] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000074.
|
131 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
132 |
+
[12/28/2023-16:36:34] [W] [TRT] Tactic Device request: 6538MB Available: 2131MB. Device memory is insufficient to use tactic.
|
133 |
+
[12/28/2023-16:36:34] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6538 detected for tactic 0x0000000000000004.
|
134 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
135 |
+
[12/28/2023-16:36:35] [W] [TRT] Tactic Device request: 6538MB Available: 2131MB. Device memory is insufficient to use tactic.
|
136 |
+
[12/28/2023-16:36:35] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6538 detected for tactic 0x000000000000003c.
|
137 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
138 |
+
[12/28/2023-16:36:36] [W] [TRT] Tactic Device request: 2191MB Available: 2131MB. Device memory is insufficient to use tactic.
|
139 |
+
[12/28/2023-16:36:36] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000004.
|
140 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
141 |
+
[12/28/2023-16:36:37] [W] [TRT] Tactic Device request: 2191MB Available: 2131MB. Device memory is insufficient to use tactic.
|
142 |
+
[12/28/2023-16:36:37] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2191 detected for tactic 0x000000000000003c.
|
143 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
144 |
+
[12/28/2023-16:36:38] [W] [TRT] Tactic Device request: 2191MB Available: 2131MB. Device memory is insufficient to use tactic.
|
145 |
+
[12/28/2023-16:36:38] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000074.
|
146 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
147 |
+
[12/28/2023-16:36:42] [W] [TRT] Tactic Device request: 2190MB Available: 2131MB. Device memory is insufficient to use tactic.
|
148 |
+
[12/28/2023-16:36:42] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
149 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
150 |
+
[12/28/2023-16:36:43] [W] [TRT] Tactic Device request: 2190MB Available: 2131MB. Device memory is insufficient to use tactic.
|
151 |
+
[12/28/2023-16:36:43] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
152 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
153 |
+
[12/28/2023-16:36:45] [W] [TRT] Tactic Device request: 2190MB Available: 2130MB. Device memory is insufficient to use tactic.
|
154 |
+
[12/28/2023-16:36:45] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
155 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
156 |
+
[12/28/2023-16:36:46] [W] [TRT] Tactic Device request: 2190MB Available: 2129MB. Device memory is insufficient to use tactic.
|
157 |
+
[12/28/2023-16:36:46] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
158 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
159 |
+
[12/28/2023-16:36:47] [W] [TRT] Tactic Device request: 2190MB Available: 2127MB. Device memory is insufficient to use tactic.
|
160 |
+
[12/28/2023-16:36:47] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000074.
|
161 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
162 |
+
[12/28/2023-16:36:51] [W] [TRT] Tactic Device request: 2190MB Available: 2127MB. Device memory is insufficient to use tactic.
|
163 |
+
[12/28/2023-16:36:51] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
164 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
165 |
+
[12/28/2023-16:36:52] [W] [TRT] Tactic Device request: 2190MB Available: 2126MB. Device memory is insufficient to use tactic.
|
166 |
+
[12/28/2023-16:36:52] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
167 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
168 |
+
[12/28/2023-16:41:41] [W] [TRT] Tactic Device request: 2457MB Available: 2417MB. Device memory is insufficient to use tactic.
|
169 |
+
[12/28/2023-16:41:41] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000004.
|
170 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
171 |
+
[12/28/2023-16:41:42] [W] [TRT] Tactic Device request: 2457MB Available: 2417MB. Device memory is insufficient to use tactic.
|
172 |
+
[12/28/2023-16:41:42] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
173 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
174 |
+
[12/28/2023-16:41:42] [W] [TRT] Tactic Device request: 2457MB Available: 2417MB. Device memory is insufficient to use tactic.
|
175 |
+
[12/28/2023-16:41:42] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
176 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
177 |
+
[12/28/2023-16:41:43] [W] [TRT] Tactic Device request: 2456MB Available: 2418MB. Device memory is insufficient to use tactic.
|
178 |
+
[12/28/2023-16:41:43] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2456 detected for tactic 0x0000000000000004.
|
179 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
180 |
+
[12/28/2023-16:41:43] [W] [TRT] Tactic Device request: 2456MB Available: 2418MB. Device memory is insufficient to use tactic.
|
181 |
+
[12/28/2023-16:41:43] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2456 detected for tactic 0x000000000000003c.
|
182 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
183 |
+
[12/28/2023-16:42:04] [W] [TRT] Tactic Device request: 3587MB Available: 2216MB. Device memory is insufficient to use tactic.
|
184 |
+
[12/28/2023-16:42:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
185 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
186 |
+
[12/28/2023-16:42:04] [W] [TRT] Tactic Device request: 3587MB Available: 2216MB. Device memory is insufficient to use tactic.
|
187 |
+
[12/28/2023-16:42:04] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
188 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
189 |
+
[12/28/2023-16:42:04] [W] [TRT] Tactic Device request: 3587MB Available: 2217MB. Device memory is insufficient to use tactic.
|
190 |
+
[12/28/2023-16:42:04] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
191 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
192 |
+
[12/28/2023-16:42:06] [W] [TRT] Tactic Device request: 3585MB Available: 2233MB. Device memory is insufficient to use tactic.
|
193 |
+
[12/28/2023-16:42:06] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3585 detected for tactic 0x0000000000000004.
|
194 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
195 |
+
[12/28/2023-16:42:06] [W] [TRT] Tactic Device request: 3585MB Available: 2233MB. Device memory is insufficient to use tactic.
|
196 |
+
[12/28/2023-16:42:06] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3585 detected for tactic 0x000000000000003c.
|
197 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
198 |
+
[12/28/2023-16:49:44] [W] [TRT] Tactic Device request: 3556MB Available: 1928MB. Device memory is insufficient to use tactic.
|
199 |
+
[12/28/2023-16:49:44] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
200 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
201 |
+
[12/28/2023-16:49:44] [W] [TRT] Tactic Device request: 3556MB Available: 1928MB. Device memory is insufficient to use tactic.
|
202 |
+
[12/28/2023-16:49:44] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
203 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
204 |
+
[12/28/2023-16:49:44] [W] [TRT] Tactic Device request: 3556MB Available: 1928MB. Device memory is insufficient to use tactic.
|
205 |
+
[12/28/2023-16:49:44] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
206 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
207 |
+
[12/28/2023-16:49:45] [W] [TRT] Tactic Device request: 3551MB Available: 1929MB. Device memory is insufficient to use tactic.
|
208 |
+
[12/28/2023-16:49:45] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3551 detected for tactic 0x0000000000000004.
|
209 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
210 |
+
[12/28/2023-16:49:45] [W] [TRT] Tactic Device request: 3551MB Available: 1929MB. Device memory is insufficient to use tactic.
|
211 |
+
[12/28/2023-16:49:45] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3551 detected for tactic 0x000000000000003c.
|
212 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
213 |
+
[12/28/2023-16:49:46] [W] [TRT] Tactic Device request: 3140MB Available: 1930MB. Device memory is insufficient to use tactic.
|
214 |
+
[12/28/2023-16:49:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000004.
|
215 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
216 |
+
[12/28/2023-16:49:46] [W] [TRT] Tactic Device request: 3140MB Available: 1929MB. Device memory is insufficient to use tactic.
|
217 |
+
[12/28/2023-16:49:46] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3140 detected for tactic 0x000000000000003c.
|
218 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
219 |
+
[12/28/2023-16:49:46] [W] [TRT] Tactic Device request: 3140MB Available: 1929MB. Device memory is insufficient to use tactic.
|
220 |
+
[12/28/2023-16:49:46] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000074.
|
221 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
222 |
+
[12/28/2023-16:49:47] [W] [TRT] Tactic Device request: 3136MB Available: 1929MB. Device memory is insufficient to use tactic.
|
223 |
+
[12/28/2023-16:49:48] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3136 detected for tactic 0x0000000000000004.
|
224 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
225 |
+
[12/28/2023-16:49:48] [W] [TRT] Tactic Device request: 3136MB Available: 1929MB. Device memory is insufficient to use tactic.
|
226 |
+
[12/28/2023-16:49:48] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3136 detected for tactic 0x000000000000003c.
|
227 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
228 |
+
[12/28/2023-16:56:57] [W] [TRT] Tactic Device request: 3161MB Available: 2194MB. Device memory is insufficient to use tactic.
|
229 |
+
[12/28/2023-16:56:57] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000004.
|
230 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
231 |
+
[12/28/2023-16:56:57] [W] [TRT] Tactic Device request: 3161MB Available: 2194MB. Device memory is insufficient to use tactic.
|
232 |
+
[12/28/2023-16:56:57] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3161 detected for tactic 0x000000000000003c.
|
233 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
234 |
+
[12/28/2023-16:56:57] [W] [TRT] Tactic Device request: 3161MB Available: 2194MB. Device memory is insufficient to use tactic.
|
235 |
+
[12/28/2023-16:56:57] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000074.
|
236 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
237 |
+
[12/28/2023-16:56:58] [W] [TRT] Tactic Device request: 3156MB Available: 2195MB. Device memory is insufficient to use tactic.
|
238 |
+
[12/28/2023-16:56:58] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3156 detected for tactic 0x0000000000000004.
|
239 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
240 |
+
[12/28/2023-16:56:58] [W] [TRT] Tactic Device request: 3156MB Available: 2195MB. Device memory is insufficient to use tactic.
|
241 |
+
[12/28/2023-16:56:58] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3156 detected for tactic 0x000000000000003c.
|
242 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
243 |
+
[12/28/2023-16:57:03] [W] [TRT] Tactic Device request: 4189MB Available: 2194MB. Device memory is insufficient to use tactic.
|
244 |
+
[12/28/2023-16:57:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000004.
|
245 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
246 |
+
[12/28/2023-16:57:03] [W] [TRT] Tactic Device request: 4189MB Available: 2194MB. Device memory is insufficient to use tactic.
|
247 |
+
[12/28/2023-16:57:03] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4189 detected for tactic 0x000000000000003c.
|
248 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
249 |
+
[12/28/2023-16:57:04] [W] [TRT] Tactic Device request: 4189MB Available: 2193MB. Device memory is insufficient to use tactic.
|
250 |
+
[12/28/2023-16:57:04] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000074.
|
251 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
252 |
+
[12/28/2023-16:57:08] [W] [TRT] Tactic Device request: 4183MB Available: 2193MB. Device memory is insufficient to use tactic.
|
253 |
+
[12/28/2023-16:57:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4183 detected for tactic 0x0000000000000004.
|
254 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
255 |
+
[12/28/2023-16:57:08] [W] [TRT] Tactic Device request: 4183MB Available: 2193MB. Device memory is insufficient to use tactic.
|
256 |
+
[12/28/2023-16:57:08] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4183 detected for tactic 0x000000000000003c.
|
257 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
258 |
+
[12/28/2023-16:57:10] [W] [TRT] Tactic Device request: 4186MB Available: 2194MB. Device memory is insufficient to use tactic.
|
259 |
+
[12/28/2023-16:57:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000004.
|
260 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
261 |
+
[12/28/2023-16:57:11] [W] [TRT] Tactic Device request: 4186MB Available: 2194MB. Device memory is insufficient to use tactic.
|
262 |
+
[12/28/2023-16:57:11] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4186 detected for tactic 0x000000000000003c.
|
263 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
264 |
+
[12/28/2023-16:57:11] [W] [TRT] Tactic Device request: 4186MB Available: 2194MB. Device memory is insufficient to use tactic.
|
265 |
+
[12/28/2023-16:57:11] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000074.
|
266 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
267 |
+
[12/28/2023-16:57:15] [W] [TRT] Tactic Device request: 4182MB Available: 2193MB. Device memory is insufficient to use tactic.
|
268 |
+
[12/28/2023-16:57:15] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4182 detected for tactic 0x0000000000000004.
|
269 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
270 |
+
[12/28/2023-16:57:16] [W] [TRT] Tactic Device request: 4182MB Available: 2194MB. Device memory is insufficient to use tactic.
|
271 |
+
[12/28/2023-16:57:16] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4182 detected for tactic 0x000000000000003c.
|
272 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
273 |
+
[12/28/2023-17:05:02] [W] [TRT] Tactic Device request: 4764MB Available: 2303MB. Device memory is insufficient to use tactic.
|
274 |
+
[12/28/2023-17:05:02] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000004.
|
275 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
276 |
+
[12/28/2023-17:05:02] [W] [TRT] Tactic Device request: 4764MB Available: 2303MB. Device memory is insufficient to use tactic.
|
277 |
+
[12/28/2023-17:05:02] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4764 detected for tactic 0x000000000000003c.
|
278 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
279 |
+
[12/28/2023-17:05:02] [W] [TRT] Tactic Device request: 4764MB Available: 2303MB. Device memory is insufficient to use tactic.
|
280 |
+
[12/28/2023-17:05:02] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000074.
|
281 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
282 |
+
[12/28/2023-17:05:04] [W] [TRT] Tactic Device request: 4761MB Available: 2316MB. Device memory is insufficient to use tactic.
|
283 |
+
[12/28/2023-17:05:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4761 detected for tactic 0x0000000000000004.
|
284 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
285 |
+
[12/28/2023-17:05:04] [W] [TRT] Tactic Device request: 4761MB Available: 2317MB. Device memory is insufficient to use tactic.
|
286 |
+
[12/28/2023-17:05:04] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4761 detected for tactic 0x000000000000003c.
|
287 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
288 |
+
[12/28/2023-17:05:10] [W] [TRT] Tactic Device request: 4244MB Available: 2261MB. Device memory is insufficient to use tactic.
|
289 |
+
[12/28/2023-17:05:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000004.
|
290 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
291 |
+
[12/28/2023-17:05:11] [W] [TRT] Tactic Device request: 4244MB Available: 1947MB. Device memory is insufficient to use tactic.
|
292 |
+
[12/28/2023-17:05:11] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4244 detected for tactic 0x000000000000003c.
|
293 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
294 |
+
[12/28/2023-17:05:12] [W] [TRT] Tactic Device request: 4244MB Available: 1942MB. Device memory is insufficient to use tactic.
|
295 |
+
[12/28/2023-17:05:12] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000074.
|
296 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
297 |
+
[12/28/2023-17:05:17] [W] [TRT] Tactic Device request: 4240MB Available: 1944MB. Device memory is insufficient to use tactic.
|
298 |
+
[12/28/2023-17:05:17] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4240 detected for tactic 0x0000000000000004.
|
299 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
300 |
+
[12/28/2023-17:05:17] [W] [TRT] Tactic Device request: 4240MB Available: 1931MB. Device memory is insufficient to use tactic.
|
301 |
+
[12/28/2023-17:05:17] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4240 detected for tactic 0x000000000000003c.
|
302 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
303 |
+
[12/28/2023-17:05:20] [W] [TRT] Tactic Device request: 4241MB Available: 1926MB. Device memory is insufficient to use tactic.
|
304 |
+
[12/28/2023-17:05:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000004.
|
305 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
306 |
+
[12/28/2023-17:05:21] [W] [TRT] Tactic Device request: 4241MB Available: 1894MB. Device memory is insufficient to use tactic.
|
307 |
+
[12/28/2023-17:05:21] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4241 detected for tactic 0x000000000000003c.
|
308 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
309 |
+
[12/28/2023-17:05:22] [W] [TRT] Tactic Device request: 4241MB Available: 1891MB. Device memory is insufficient to use tactic.
|
310 |
+
[12/28/2023-17:05:22] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000074.
|
311 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
312 |
+
[12/28/2023-17:05:27] [W] [TRT] Tactic Device request: 4239MB Available: 1889MB. Device memory is insufficient to use tactic.
|
313 |
+
[12/28/2023-17:05:27] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4239 detected for tactic 0x0000000000000004.
|
314 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
315 |
+
[12/28/2023-17:05:27] [W] [TRT] Tactic Device request: 4239MB Available: 1877MB. Device memory is insufficient to use tactic.
|
316 |
+
[12/28/2023-17:05:27] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4239 detected for tactic 0x000000000000003c.
|
317 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
318 |
+
[12/28/2023-17:06:08] [W] [TRT] Tactic Device request: 1637MB Available: 1622MB. Device memory is insufficient to use tactic.
|
319 |
+
[12/28/2023-17:06:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000004.
|
320 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
321 |
+
[12/28/2023-17:06:08] [W] [TRT] Tactic Device request: 1637MB Available: 1622MB. Device memory is insufficient to use tactic.
|
322 |
+
[12/28/2023-17:06:08] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 1637 detected for tactic 0x000000000000003c.
|
323 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
324 |
+
[12/28/2023-17:06:08] [W] [TRT] Tactic Device request: 1637MB Available: 1622MB. Device memory is insufficient to use tactic.
|
325 |
+
[12/28/2023-17:06:08] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000074.
|
326 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
327 |
+
[12/28/2023-17:06:09] [W] [TRT] Tactic Device request: 1636MB Available: 1622MB. Device memory is insufficient to use tactic.
|
328 |
+
[12/28/2023-17:06:09] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1636 detected for tactic 0x0000000000000004.
|
329 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
330 |
+
[12/28/2023-17:06:09] [W] [TRT] Tactic Device request: 1636MB Available: 1622MB. Device memory is insufficient to use tactic.
|
331 |
+
[12/28/2023-17:06:09] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 1636 detected for tactic 0x000000000000003c.
|
332 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
333 |
+
[12/28/2023-17:13:44] [W] [TRT] Tactic Device request: 1638MB Available: 1488MB. Device memory is insufficient to use tactic.
|
334 |
+
[12/28/2023-17:13:44] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 1638 detected for tactic 0x000000000000003c.
|
335 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
336 |
+
[12/28/2023-17:13:44] [W] [TRT] Tactic Device request: 1638MB Available: 1488MB. Device memory is insufficient to use tactic.
|
337 |
+
[12/28/2023-17:13:44] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 1638 detected for tactic 0x0000000000000074.
|
338 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
339 |
+
[12/28/2023-17:13:44] [W] [TRT] Tactic Device request: 1637MB Available: 1489MB. Device memory is insufficient to use tactic.
|
340 |
+
[12/28/2023-17:13:44] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000004.
|
341 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
342 |
+
[12/28/2023-17:13:45] [W] [TRT] Tactic Device request: 1637MB Available: 1489MB. Device memory is insufficient to use tactic.
|
343 |
+
[12/28/2023-17:13:45] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 1637 detected for tactic 0x000000000000003c.
|
344 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
345 |
+
[12/28/2023-17:13:46] [W] [TRT] Tactic Device request: 3270MB Available: 1488MB. Device memory is insufficient to use tactic.
|
346 |
+
[12/28/2023-17:13:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000004.
|
347 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
348 |
+
[12/28/2023-17:13:46] [W] [TRT] Tactic Device request: 3270MB Available: 1488MB. Device memory is insufficient to use tactic.
|
349 |
+
[12/28/2023-17:13:46] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3270 detected for tactic 0x000000000000003c.
|
350 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
351 |
+
[12/28/2023-17:13:46] [W] [TRT] Tactic Device request: 3270MB Available: 1488MB. Device memory is insufficient to use tactic.
|
352 |
+
[12/28/2023-17:13:46] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000074.
|
353 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
354 |
+
[12/28/2023-17:13:47] [W] [TRT] Tactic Device request: 3269MB Available: 1519MB. Device memory is insufficient to use tactic.
|
355 |
+
[12/28/2023-17:13:47] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3269 detected for tactic 0x0000000000000004.
|
356 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
357 |
+
[12/28/2023-17:13:47] [W] [TRT] Tactic Device request: 3269MB Available: 1518MB. Device memory is insufficient to use tactic.
|
358 |
+
[12/28/2023-17:13:47] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3269 detected for tactic 0x000000000000003c.
|
359 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
360 |
+
[12/28/2023-17:13:50] [W] [TRT] Tactic Device request: 4377MB Available: 1700MB. Device memory is insufficient to use tactic.
|
361 |
+
[12/28/2023-17:13:50] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000004.
|
362 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
363 |
+
[12/28/2023-17:13:50] [W] [TRT] Tactic Device request: 2185MB Available: 1700MB. Device memory is insufficient to use tactic.
|
364 |
+
[12/28/2023-17:13:50] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000005.
|
365 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
366 |
+
[12/28/2023-17:13:50] [W] [TRT] Tactic Device request: 4377MB Available: 1700MB. Device memory is insufficient to use tactic.
|
367 |
+
[12/28/2023-17:13:50] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4377 detected for tactic 0x000000000000003c.
|
368 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
369 |
+
[12/28/2023-17:13:50] [W] [TRT] Tactic Device request: 2185MB Available: 1699MB. Device memory is insufficient to use tactic.
|
370 |
+
[12/28/2023-17:13:50] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2185 detected for tactic 0x000000000000003d.
|
371 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
372 |
+
[12/28/2023-17:13:51] [W] [TRT] Tactic Device request: 4377MB Available: 1699MB. Device memory is insufficient to use tactic.
|
373 |
+
[12/28/2023-17:13:51] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000074.
|
374 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
375 |
+
[12/28/2023-17:13:51] [W] [TRT] Tactic Device request: 2185MB Available: 1699MB. Device memory is insufficient to use tactic.
|
376 |
+
[12/28/2023-17:13:51] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000075.
|
377 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
378 |
+
[12/28/2023-17:13:56] [W] [TRT] Tactic Device request: 4375MB Available: 1824MB. Device memory is insufficient to use tactic.
|
379 |
+
[12/28/2023-17:13:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
380 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
381 |
+
[12/28/2023-17:13:56] [W] [TRT] Tactic Device request: 2183MB Available: 1824MB. Device memory is insufficient to use tactic.
|
382 |
+
[12/28/2023-17:13:57] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
383 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
384 |
+
[12/28/2023-17:13:57] [W] [TRT] Tactic Device request: 4375MB Available: 1824MB. Device memory is insufficient to use tactic.
|
385 |
+
[12/28/2023-17:13:57] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
386 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
387 |
+
[12/28/2023-17:13:57] [W] [TRT] Tactic Device request: 2183MB Available: 1824MB. Device memory is insufficient to use tactic.
|
388 |
+
[12/28/2023-17:13:57] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
389 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
390 |
+
[12/28/2023-17:14:01] [W] [TRT] Tactic Device request: 4376MB Available: 1823MB. Device memory is insufficient to use tactic.
|
391 |
+
[12/28/2023-17:14:01] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000004.
|
392 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
393 |
+
[12/28/2023-17:14:01] [W] [TRT] Tactic Device request: 2184MB Available: 1823MB. Device memory is insufficient to use tactic.
|
394 |
+
[12/28/2023-17:14:01] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000005.
|
395 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
396 |
+
[12/28/2023-17:14:01] [W] [TRT] Tactic Device request: 4376MB Available: 1823MB. Device memory is insufficient to use tactic.
|
397 |
+
[12/28/2023-17:14:01] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4376 detected for tactic 0x000000000000003c.
|
398 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
399 |
+
[12/28/2023-17:14:01] [W] [TRT] Tactic Device request: 2184MB Available: 1823MB. Device memory is insufficient to use tactic.
|
400 |
+
[12/28/2023-17:14:01] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2184 detected for tactic 0x000000000000003d.
|
401 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
402 |
+
[12/28/2023-17:14:01] [W] [TRT] Tactic Device request: 4376MB Available: 1822MB. Device memory is insufficient to use tactic.
|
403 |
+
[12/28/2023-17:14:01] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000074.
|
404 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
405 |
+
[12/28/2023-17:14:01] [W] [TRT] Tactic Device request: 2184MB Available: 1823MB. Device memory is insufficient to use tactic.
|
406 |
+
[12/28/2023-17:14:01] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000075.
|
407 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
408 |
+
[12/28/2023-17:14:07] [W] [TRT] Tactic Device request: 4375MB Available: 1822MB. Device memory is insufficient to use tactic.
|
409 |
+
[12/28/2023-17:14:07] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
410 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
411 |
+
[12/28/2023-17:14:07] [W] [TRT] Tactic Device request: 2183MB Available: 1822MB. Device memory is insufficient to use tactic.
|
412 |
+
[12/28/2023-17:14:07] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
413 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
414 |
+
[12/28/2023-17:14:07] [W] [TRT] Tactic Device request: 4375MB Available: 1822MB. Device memory is insufficient to use tactic.
|
415 |
+
[12/28/2023-17:14:07] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
416 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
417 |
+
[12/28/2023-17:14:07] [W] [TRT] Tactic Device request: 2183MB Available: 1821MB. Device memory is insufficient to use tactic.
|
418 |
+
[12/28/2023-17:14:07] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
419 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
420 |
+
[12/28/2023-17:15:12] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
421 |
+
[12/28/2023-17:15:12] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
422 |
+
[12/28/2023-17:15:12] [W] * GPU compute time is unstable, with coefficient of variance = 5.39183%.
|
423 |
+
[12/28/2023-17:15:12] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_fp16.onnx.fp16.engine.log
ADDED
@@ -0,0 +1,328 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.fp16.engine
|
2 |
+
[12/28/2023-16:09:46] [I] === Model Options ===
|
3 |
+
[12/28/2023-16:09:46] [I] Format: ONNX
|
4 |
+
[12/28/2023-16:09:46] [I] Model: yolo_nas_pose_l_fp16.onnx
|
5 |
+
[12/28/2023-16:09:46] [I] Output:
|
6 |
+
[12/28/2023-16:09:46] [I] === Build Options ===
|
7 |
+
[12/28/2023-16:09:46] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-16:09:46] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-16:09:46] [I] minTiming: 1
|
10 |
+
[12/28/2023-16:09:46] [I] avgTiming: 8
|
11 |
+
[12/28/2023-16:09:46] [I] Precision: FP32+FP16
|
12 |
+
[12/28/2023-16:09:46] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-16:09:46] [I] Calibration:
|
14 |
+
[12/28/2023-16:09:46] [I] Refit: Disabled
|
15 |
+
[12/28/2023-16:09:46] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-16:09:46] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-16:09:46] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-16:09:46] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-16:09:46] [I] Build only: Disabled
|
20 |
+
[12/28/2023-16:09:46] [I] Save engine: yolo_nas_pose_l_fp16.onnx.fp16.engine
|
21 |
+
[12/28/2023-16:09:46] [I] Load engine:
|
22 |
+
[12/28/2023-16:09:46] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-16:09:46] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-16:09:46] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-16:09:46] [I] timingCacheFile:
|
26 |
+
[12/28/2023-16:09:46] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-16:09:46] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-16:09:46] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-16:09:46] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-16:09:46] [I] Input build shapes: model
|
31 |
+
[12/28/2023-16:09:46] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-16:09:46] [I] === System Options ===
|
33 |
+
[12/28/2023-16:09:46] [I] Device: 0
|
34 |
+
[12/28/2023-16:09:46] [I] DLACore:
|
35 |
+
[12/28/2023-16:09:46] [I] Plugins:
|
36 |
+
[12/28/2023-16:09:46] [I] === Inference Options ===
|
37 |
+
[12/28/2023-16:09:46] [I] Batch: Explicit
|
38 |
+
[12/28/2023-16:09:46] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-16:09:46] [I] Iterations: 10
|
40 |
+
[12/28/2023-16:09:46] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-16:09:46] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-16:09:46] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-16:09:46] [I] Streams: 1
|
44 |
+
[12/28/2023-16:09:46] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-16:09:46] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-16:09:46] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-16:09:46] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-16:09:46] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-16:09:46] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-16:09:46] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-16:09:46] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-16:09:46] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-16:09:46] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-16:09:46] [I] Inputs:
|
55 |
+
[12/28/2023-16:09:46] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-16:09:46] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-16:09:46] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-16:09:46] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-16:09:46] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-16:09:46] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-16:09:46] [I] Profile: Disabled
|
62 |
+
[12/28/2023-16:09:46] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-16:09:46] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-16:09:46] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-16:09:46] [I]
|
66 |
+
[12/28/2023-16:09:46] [I] === Device Information ===
|
67 |
+
[12/28/2023-16:09:46] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-16:09:46] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-16:09:46] [I] SMs: 8
|
70 |
+
[12/28/2023-16:09:46] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-16:09:46] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-16:09:46] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-16:09:46] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-16:09:46] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-16:09:46] [I]
|
76 |
+
[12/28/2023-16:09:46] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-16:09:46] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2974 (MiB)
|
78 |
+
[12/28/2023-16:09:49] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +283, now: CPU 574, GPU 3280 (MiB)
|
79 |
+
[12/28/2023-16:09:49] [I] Start parsing network model
|
80 |
+
[12/28/2023-16:09:49] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-16:09:49] [I] [TRT] Input filename: yolo_nas_pose_l_fp16.onnx
|
82 |
+
[12/28/2023-16:09:49] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-16:09:49] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-16:09:49] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-16:09:49] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-16:09:49] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-16:09:49] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-16:09:49] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-16:09:49] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-16:09:49] [I] Finish parsing network model
|
91 |
+
[12/28/2023-16:09:50] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-16:09:50] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 458) [Constant]
|
96 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 459) [Constant]
|
97 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 460) [Constant]
|
98 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
99 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
100 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
101 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
102 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
103 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
104 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
105 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
106 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
107 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
108 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
109 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
110 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
111 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
112 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
113 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
114 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
115 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
116 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
117 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
118 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
119 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
120 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
121 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
122 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
123 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
124 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
125 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
126 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
127 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
128 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
129 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
130 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
131 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
132 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
133 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
134 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
135 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
136 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
137 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
138 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
139 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
140 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
141 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
142 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
143 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
144 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
145 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
146 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
147 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
148 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
149 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
150 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
151 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
152 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
153 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
154 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
155 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
156 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
157 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
158 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
159 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
160 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
161 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
162 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
163 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
164 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv1/act/Relu_output_0 copy
|
165 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
166 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
167 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
168 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
169 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
170 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
171 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
172 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
173 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
174 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
175 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
176 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
177 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
178 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
179 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
180 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
181 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
182 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
183 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
184 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
185 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
186 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 187) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
187 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
188 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
189 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 195) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
190 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
191 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
192 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
193 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
194 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
195 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
196 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
197 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
198 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
199 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
200 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
201 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
202 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 224) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
203 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
204 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
205 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 232) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
206 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
207 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
208 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 240) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
209 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
210 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
211 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
212 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
213 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
214 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
215 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
216 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
217 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
218 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
219 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
220 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
221 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
222 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
223 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
224 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 271) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
225 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
226 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
227 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
228 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 294) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
229 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
230 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
231 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 302) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
232 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
233 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
234 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 310) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
235 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
236 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
237 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
238 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
239 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
240 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
241 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
242 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
243 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
244 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
245 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
246 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
247 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
248 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
249 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
250 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 341) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
251 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
252 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
253 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
254 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 364) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
255 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
256 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
257 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 372) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
258 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
259 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
260 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 380) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
261 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
262 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
263 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
264 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
265 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
266 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
267 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
268 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
269 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
270 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
271 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
272 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
273 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
274 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1...cast_boxes_to_fp32]}
|
275 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
276 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 462) [NMS]_1_output[DevicetoShapeHostCopy]
|
277 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
278 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
279 |
+
[12/28/2023-16:09:50] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
280 |
+
[12/28/2023-16:10:01] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +353, now: CPU 1231, GPU 3827 (MiB)
|
281 |
+
[12/28/2023-16:10:03] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +82, GPU +65, now: CPU 1313, GPU 3892 (MiB)
|
282 |
+
[12/28/2023-16:10:03] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
283 |
+
[12/28/2023-17:14:35] [I] [TRT] Total Activation Memory: 8058785792
|
284 |
+
[12/28/2023-17:14:35] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
285 |
+
[12/28/2023-17:14:49] [I] [TRT] Total Host Persistent Memory: 387328
|
286 |
+
[12/28/2023-17:14:49] [I] [TRT] Total Device Persistent Memory: 51712
|
287 |
+
[12/28/2023-17:14:49] [I] [TRT] Total Scratch Memory: 134217728
|
288 |
+
[12/28/2023-17:14:49] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 69 MiB, GPU 2131 MiB
|
289 |
+
[12/28/2023-17:14:49] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 196 steps to complete.
|
290 |
+
[12/28/2023-17:14:49] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 90.8216ms to assign 13 blocks to 196 nodes requiring 160489472 bytes.
|
291 |
+
[12/28/2023-17:14:49] [I] [TRT] Total Activation Memory: 160489472
|
292 |
+
[12/28/2023-17:14:55] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU -16, now: CPU 1661, GPU 5679 (MiB)
|
293 |
+
[12/28/2023-17:14:55] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +16, GPU +128, now: CPU 16, GPU 128 (MiB)
|
294 |
+
[12/28/2023-17:14:55] [I] Engine built in 3909.9 sec.
|
295 |
+
[12/28/2023-17:14:56] [I] [TRT] Loaded engine size: 105 MiB
|
296 |
+
[12/28/2023-17:14:56] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1347, GPU 5281 (MiB)
|
297 |
+
[12/28/2023-17:14:56] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +103, now: CPU 0, GPU 103 (MiB)
|
298 |
+
[12/28/2023-17:14:56] [I] Engine deserialized in 0.281193 sec.
|
299 |
+
[12/28/2023-17:14:56] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU -1, now: CPU 1348, GPU 5280 (MiB)
|
300 |
+
[12/28/2023-17:14:56] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +154, now: CPU 0, GPU 257 (MiB)
|
301 |
+
[12/28/2023-17:14:56] [I] Setting persistentCacheLimit to 0 bytes.
|
302 |
+
[12/28/2023-17:14:56] [I] Using random values for input onnx::Cast_0
|
303 |
+
[12/28/2023-17:14:56] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
304 |
+
[12/28/2023-17:14:56] [I] Using random values for output graph2_flat_predictions
|
305 |
+
[12/28/2023-17:14:56] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
306 |
+
[12/28/2023-17:14:56] [I] Starting inference
|
307 |
+
[12/28/2023-17:15:12] [I] Warmup completed 1 queries over 200 ms
|
308 |
+
[12/28/2023-17:15:12] [I] Timing trace has 446 queries over 15.0628 s
|
309 |
+
[12/28/2023-17:15:12] [I]
|
310 |
+
[12/28/2023-17:15:12] [I] === Trace details ===
|
311 |
+
[12/28/2023-17:15:12] [I] Trace averages of 100 runs:
|
312 |
+
[12/28/2023-17:15:12] [I] Average on 100 runs - GPU latency: 33.8846 ms - Host latency: 34.0014 ms (enqueue 33.9409 ms)
|
313 |
+
[12/28/2023-17:15:12] [I] Average on 100 runs - GPU latency: 33.6823 ms - Host latency: 33.7942 ms (enqueue 33.7436 ms)
|
314 |
+
[12/28/2023-17:15:12] [I] Average on 100 runs - GPU latency: 33.5307 ms - Host latency: 33.6433 ms (enqueue 33.5802 ms)
|
315 |
+
[12/28/2023-17:15:12] [I] Average on 100 runs - GPU latency: 33.377 ms - Host latency: 33.4884 ms (enqueue 33.4514 ms)
|
316 |
+
[12/28/2023-17:15:12] [I]
|
317 |
+
[12/28/2023-17:15:12] [I] === Performance summary ===
|
318 |
+
[12/28/2023-17:15:12] [I] Throughput: 29.6093 qps
|
319 |
+
[12/28/2023-17:15:12] [I] Latency: min = 31.7529 ms, max = 44.1514 ms, mean = 33.7469 ms, median = 33.4268 ms, percentile(90%) = 34.5583 ms, percentile(95%) = 37.8339 ms, percentile(99%) = 42.0027 ms
|
320 |
+
[12/28/2023-17:15:12] [I] Enqueue Time: min = 31.7227 ms, max = 44.1133 ms, mean = 33.6924 ms, median = 33.4424 ms, percentile(90%) = 34.3545 ms, percentile(95%) = 37.7542 ms, percentile(99%) = 41.9526 ms
|
321 |
+
[12/28/2023-17:15:12] [I] H2D Latency: min = 0.0800781 ms, max = 0.114746 ms, mean = 0.0954138 ms, median = 0.0969238 ms, percentile(90%) = 0.100098 ms, percentile(95%) = 0.100586 ms, percentile(99%) = 0.103027 ms
|
322 |
+
[12/28/2023-17:15:12] [I] GPU Compute Time: min = 31.6406 ms, max = 44.0381 ms, mean = 33.6343 ms, median = 33.311 ms, percentile(90%) = 34.4478 ms, percentile(95%) = 37.7091 ms, percentile(99%) = 41.8918 ms
|
323 |
+
[12/28/2023-17:15:12] [I] D2H Latency: min = 0.00292969 ms, max = 0.0541992 ms, mean = 0.017179 ms, median = 0.0146484 ms, percentile(90%) = 0.0290527 ms, percentile(95%) = 0.0314941 ms, percentile(99%) = 0.0361328 ms
|
324 |
+
[12/28/2023-17:15:12] [I] Total Host Walltime: 15.0628 s
|
325 |
+
[12/28/2023-17:15:12] [I] Total GPU Compute Time: 15.0009 s
|
326 |
+
[12/28/2023-17:15:12] [I] Explanations of the performance metrics are printed in the verbose logs.
|
327 |
+
[12/28/2023-17:15:12] [I]
|
328 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.fp16.engine
|
yolo_nas_pose_l_fp16.onnx.int8.engine.err
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-19:27:13] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-19:27:13] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-19:27:13] [E] Error[4]: [network.cpp::validate::2925] Error Code 4: Internal Error (fp16 precision has been set for a layer or layer output, but fp16 is not configured in the builder)
|
4 |
+
[12/28/2023-19:27:13] [E] Error[2]: [builder.cpp::buildSerializedNetwork::751] Error Code 2: Internal Error (Assertion engine != nullptr failed. )
|
5 |
+
[12/28/2023-19:27:13] [E] Engine could not be created from network
|
6 |
+
[12/28/2023-19:27:13] [E] Building engine failed
|
7 |
+
[12/28/2023-19:27:13] [E] Failed to create engine from model or file.
|
8 |
+
[12/28/2023-19:27:13] [E] Engine set up failed
|
yolo_nas_pose_l_fp16.onnx.int8.engine.log
ADDED
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --int8 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.int8.engine
|
2 |
+
[12/28/2023-19:27:02] [I] === Model Options ===
|
3 |
+
[12/28/2023-19:27:02] [I] Format: ONNX
|
4 |
+
[12/28/2023-19:27:02] [I] Model: yolo_nas_pose_l_fp16.onnx
|
5 |
+
[12/28/2023-19:27:02] [I] Output:
|
6 |
+
[12/28/2023-19:27:02] [I] === Build Options ===
|
7 |
+
[12/28/2023-19:27:02] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-19:27:02] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-19:27:02] [I] minTiming: 1
|
10 |
+
[12/28/2023-19:27:02] [I] avgTiming: 8
|
11 |
+
[12/28/2023-19:27:02] [I] Precision: FP32+INT8
|
12 |
+
[12/28/2023-19:27:02] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-19:27:02] [I] Calibration: Dynamic
|
14 |
+
[12/28/2023-19:27:02] [I] Refit: Disabled
|
15 |
+
[12/28/2023-19:27:02] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-19:27:02] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-19:27:02] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-19:27:02] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-19:27:02] [I] Build only: Disabled
|
20 |
+
[12/28/2023-19:27:02] [I] Save engine: yolo_nas_pose_l_fp16.onnx.int8.engine
|
21 |
+
[12/28/2023-19:27:02] [I] Load engine:
|
22 |
+
[12/28/2023-19:27:02] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-19:27:02] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-19:27:02] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-19:27:02] [I] timingCacheFile:
|
26 |
+
[12/28/2023-19:27:02] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-19:27:02] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-19:27:02] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-19:27:02] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-19:27:02] [I] Input build shapes: model
|
31 |
+
[12/28/2023-19:27:02] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-19:27:02] [I] === System Options ===
|
33 |
+
[12/28/2023-19:27:02] [I] Device: 0
|
34 |
+
[12/28/2023-19:27:02] [I] DLACore:
|
35 |
+
[12/28/2023-19:27:02] [I] Plugins:
|
36 |
+
[12/28/2023-19:27:02] [I] === Inference Options ===
|
37 |
+
[12/28/2023-19:27:02] [I] Batch: Explicit
|
38 |
+
[12/28/2023-19:27:02] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-19:27:02] [I] Iterations: 10
|
40 |
+
[12/28/2023-19:27:02] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-19:27:02] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-19:27:02] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-19:27:02] [I] Streams: 1
|
44 |
+
[12/28/2023-19:27:02] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-19:27:02] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-19:27:02] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-19:27:02] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-19:27:02] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-19:27:02] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-19:27:02] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-19:27:02] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-19:27:02] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-19:27:02] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-19:27:02] [I] Inputs:
|
55 |
+
[12/28/2023-19:27:02] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-19:27:02] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-19:27:02] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-19:27:02] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-19:27:02] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-19:27:02] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-19:27:02] [I] Profile: Disabled
|
62 |
+
[12/28/2023-19:27:02] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-19:27:02] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-19:27:02] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-19:27:02] [I]
|
66 |
+
[12/28/2023-19:27:02] [I] === Device Information ===
|
67 |
+
[12/28/2023-19:27:02] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-19:27:02] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-19:27:02] [I] SMs: 8
|
70 |
+
[12/28/2023-19:27:02] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-19:27:02] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-19:27:02] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-19:27:02] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-19:27:02] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-19:27:02] [I]
|
76 |
+
[12/28/2023-19:27:02] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-19:27:07] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2837 (MiB)
|
78 |
+
[12/28/2023-19:27:11] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +285, now: CPU 574, GPU 3142 (MiB)
|
79 |
+
[12/28/2023-19:27:11] [I] Start parsing network model
|
80 |
+
[12/28/2023-19:27:12] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-19:27:12] [I] [TRT] Input filename: yolo_nas_pose_l_fp16.onnx
|
82 |
+
[12/28/2023-19:27:12] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-19:27:12] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-19:27:12] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-19:27:12] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-19:27:12] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-19:27:12] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-19:27:12] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-19:27:12] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-19:27:13] [I] Finish parsing network model
|
91 |
+
[12/28/2023-19:27:13] [I] FP32 and INT8 precisions have been specified - more performance might be enabled by additionally specifying --fp16 or --best
|
92 |
+
&&&& FAILED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp16.onnx --int8 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp16.onnx.int8.engine
|
yolo_nas_pose_l_fp16.onnx.usage.txt
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
Model exported successfully to yolo_nas_pose_l_fp16.onnx
|
3 |
+
Model expects input image of shape [1, 3, 640, 640]
|
4 |
+
Input image dtype is torch.uint8
|
5 |
+
|
6 |
+
Exported model already contains preprocessing (normalization) step, so you don't need to do it manually.
|
7 |
+
Preprocessing steps to be applied to input image are:
|
8 |
+
Sequential(
|
9 |
+
(0): CastTensorTo(dtype=torch.float16)
|
10 |
+
(1): ChannelSelect(channels_indexes=tensor([2, 1, 0], device='cuda:0'))
|
11 |
+
(2): ApplyMeanStd(mean=[0.], scale=[255.])
|
12 |
+
)
|
13 |
+
|
14 |
+
|
15 |
+
Exported model contains postprocessing (NMS) step with the following parameters:
|
16 |
+
num_pre_nms_predictions=1000
|
17 |
+
max_predictions_per_image=10
|
18 |
+
nms_threshold=0.5
|
19 |
+
confidence_threshold=0.15
|
20 |
+
output_predictions_format=flat
|
21 |
+
|
22 |
+
|
23 |
+
Exported model is in ONNX format and can be used with ONNXRuntime
|
24 |
+
To run inference with ONNXRuntime, please use the following code snippet:
|
25 |
+
|
26 |
+
import onnxruntime
|
27 |
+
import numpy as np
|
28 |
+
session = onnxruntime.InferenceSession("yolo_nas_pose_l_fp16.onnx", providers=["CUDAExecutionProvider", "CPUExecutionProvider"])
|
29 |
+
inputs = [o.name for o in session.get_inputs()]
|
30 |
+
outputs = [o.name for o in session.get_outputs()]
|
31 |
+
|
32 |
+
example_input_image = np.zeros((1, 3, 640, 640)).astype(np.uint8)
|
33 |
+
predictions = session.run(outputs, {inputs[0]: example_input_image})
|
34 |
+
|
35 |
+
Exported model can also be used with TensorRT
|
36 |
+
To run inference with TensorRT, please see TensorRT deployment documentation
|
37 |
+
You can benchmark the model using the following code snippet:
|
38 |
+
|
39 |
+
trtexec --onnx=yolo_nas_pose_l_fp16.onnx --fp16 --avgRuns=100 --duration=15
|
40 |
+
|
41 |
+
|
42 |
+
Exported model has predictions in flat format:
|
43 |
+
|
44 |
+
# flat_predictions is a 2D array of [N,K] shape
|
45 |
+
# Each row represents (image_index, x_min, y_min, x_max, y_max, confidence, joints...)
|
46 |
+
# Please note all values are floats, so you have to convert them to integers if needed
|
47 |
+
|
48 |
+
[flat_predictions] = predictions
|
49 |
+
pred_bboxes = flat_predictions[:, 1:5]
|
50 |
+
pred_scores = flat_predictions[:, 5]
|
51 |
+
pred_joints = flat_predictions[:, 6:].reshape((len(pred_bboxes), -1, 3))
|
52 |
+
for i in range(len(pred_bboxes)):
|
53 |
+
confidence = pred_scores[i]
|
54 |
+
x_min, y_min, x_max, y_max = pred_bboxes[i]
|
55 |
+
print(f"Detected pose with confidence={confidence}, x_min={x_min}, y_min={y_min}, x_max={x_max}, y_max={y_max}")
|
56 |
+
for joint_index, (x, y, confidence) in enumerate(pred_joints[i]):
|
57 |
+
print(f"Joint {joint_index} has coordinates x={x}, y={y}, confidence={confidence}")
|
58 |
+
|
yolo_nas_pose_l_fp32.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfd7c12de1275152ce64af33b734c74c085ed45403fb2722385718850a71f363
|
3 |
+
size 217830699
|
yolo_nas_pose_l_fp32.onnx.best.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea7e820c1d67f86f3b4c5749752351cb53d4f31886b72214b78d0621b27957f
|
3 |
+
size 57142878
|
yolo_nas_pose_l_fp32.onnx.best.engine.err
ADDED
@@ -0,0 +1,504 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-12:58:51] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-12:58:51] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-12:58:51] [W] [TRT] Calibrator is not being used. Users must provide dynamic range for all tensors that are not Int32 or Bool.
|
4 |
+
[12/28/2023-13:32:07] [W] [TRT] Tactic Device request: 4720MB Available: 2945MB. Device memory is insufficient to use tactic.
|
5 |
+
[12/28/2023-13:32:07] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000004.
|
6 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
7 |
+
[12/28/2023-13:32:07] [W] [TRT] Tactic Device request: 4720MB Available: 2943MB. Device memory is insufficient to use tactic.
|
8 |
+
[12/28/2023-13:32:07] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4720 detected for tactic 0x000000000000003c.
|
9 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
10 |
+
[12/28/2023-13:32:08] [W] [TRT] Tactic Device request: 4720MB Available: 2943MB. Device memory is insufficient to use tactic.
|
11 |
+
[12/28/2023-13:32:08] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000074.
|
12 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
13 |
+
[12/28/2023-13:32:13] [W] [TRT] Tactic Device request: 4706MB Available: 2945MB. Device memory is insufficient to use tactic.
|
14 |
+
[12/28/2023-13:32:13] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4706 detected for tactic 0x0000000000000004.
|
15 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
16 |
+
[12/28/2023-13:32:14] [W] [TRT] Tactic Device request: 4706MB Available: 2944MB. Device memory is insufficient to use tactic.
|
17 |
+
[12/28/2023-13:32:14] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4706 detected for tactic 0x000000000000003c.
|
18 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
19 |
+
[12/28/2023-13:32:18] [W] [TRT] Tactic Device request: 4711MB Available: 2921MB. Device memory is insufficient to use tactic.
|
20 |
+
[12/28/2023-13:32:18] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
21 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
22 |
+
[12/28/2023-13:32:19] [W] [TRT] Tactic Device request: 4711MB Available: 2920MB. Device memory is insufficient to use tactic.
|
23 |
+
[12/28/2023-13:32:19] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
24 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
25 |
+
[12/28/2023-13:32:19] [W] [TRT] Tactic Device request: 4711MB Available: 2919MB. Device memory is insufficient to use tactic.
|
26 |
+
[12/28/2023-13:32:19] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
27 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
28 |
+
[12/28/2023-13:32:24] [W] [TRT] Tactic Device request: 4702MB Available: 2920MB. Device memory is insufficient to use tactic.
|
29 |
+
[12/28/2023-13:32:24] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4702 detected for tactic 0x0000000000000004.
|
30 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
31 |
+
[12/28/2023-13:32:25] [W] [TRT] Tactic Device request: 4702MB Available: 2921MB. Device memory is insufficient to use tactic.
|
32 |
+
[12/28/2023-13:32:25] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4702 detected for tactic 0x000000000000003c.
|
33 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
34 |
+
[12/28/2023-13:32:29] [W] [TRT] Tactic Device request: 4711MB Available: 2875MB. Device memory is insufficient to use tactic.
|
35 |
+
[12/28/2023-13:32:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
36 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
37 |
+
[12/28/2023-13:32:30] [W] [TRT] Tactic Device request: 4711MB Available: 2875MB. Device memory is insufficient to use tactic.
|
38 |
+
[12/28/2023-13:32:30] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
39 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
40 |
+
[12/28/2023-13:32:30] [W] [TRT] Tactic Device request: 4711MB Available: 2874MB. Device memory is insufficient to use tactic.
|
41 |
+
[12/28/2023-13:32:30] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
42 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
43 |
+
[12/28/2023-13:32:35] [W] [TRT] Tactic Device request: 4702MB Available: 2874MB. Device memory is insufficient to use tactic.
|
44 |
+
[12/28/2023-13:32:35] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4702 detected for tactic 0x0000000000000004.
|
45 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
46 |
+
[12/28/2023-13:32:36] [W] [TRT] Tactic Device request: 4702MB Available: 2874MB. Device memory is insufficient to use tactic.
|
47 |
+
[12/28/2023-13:32:36] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4702 detected for tactic 0x000000000000003c.
|
48 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
49 |
+
[12/28/2023-13:40:10] [W] [TRT] Tactic Device request: 4711MB Available: 2317MB. Device memory is insufficient to use tactic.
|
50 |
+
[12/28/2023-13:40:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
51 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
52 |
+
[12/28/2023-13:40:10] [W] [TRT] Tactic Device request: 4711MB Available: 2317MB. Device memory is insufficient to use tactic.
|
53 |
+
[12/28/2023-13:40:11] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
54 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
55 |
+
[12/28/2023-13:40:11] [W] [TRT] Tactic Device request: 4711MB Available: 2317MB. Device memory is insufficient to use tactic.
|
56 |
+
[12/28/2023-13:40:11] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
57 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
58 |
+
[12/28/2023-13:40:13] [W] [TRT] Tactic Device request: 4701MB Available: 2317MB. Device memory is insufficient to use tactic.
|
59 |
+
[12/28/2023-13:40:13] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4701 detected for tactic 0x0000000000000004.
|
60 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
61 |
+
[12/28/2023-13:40:13] [W] [TRT] Tactic Device request: 4701MB Available: 2316MB. Device memory is insufficient to use tactic.
|
62 |
+
[12/28/2023-13:40:13] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4701 detected for tactic 0x000000000000003c.
|
63 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
64 |
+
[12/28/2023-13:40:32] [W] [TRT] Tactic Device request: 6275MB Available: 2317MB. Device memory is insufficient to use tactic.
|
65 |
+
[12/28/2023-13:40:32] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
66 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
67 |
+
[12/28/2023-13:40:32] [W] [TRT] Tactic Device request: 6275MB Available: 2317MB. Device memory is insufficient to use tactic.
|
68 |
+
[12/28/2023-13:40:32] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
69 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
70 |
+
[12/28/2023-13:40:32] [W] [TRT] Tactic Device request: 6275MB Available: 2317MB. Device memory is insufficient to use tactic.
|
71 |
+
[12/28/2023-13:40:32] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
72 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
73 |
+
[12/28/2023-13:40:34] [W] [TRT] Tactic Device request: 6270MB Available: 2318MB. Device memory is insufficient to use tactic.
|
74 |
+
[12/28/2023-13:40:34] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6270 detected for tactic 0x0000000000000004.
|
75 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
76 |
+
[12/28/2023-13:40:34] [W] [TRT] Tactic Device request: 6270MB Available: 2318MB. Device memory is insufficient to use tactic.
|
77 |
+
[12/28/2023-13:40:34] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6270 detected for tactic 0x000000000000003c.
|
78 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
79 |
+
[12/28/2023-13:51:21] [W] [TRT] Tactic Device request: 7056MB Available: 2081MB. Device memory is insufficient to use tactic.
|
80 |
+
[12/28/2023-13:51:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
81 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
82 |
+
[12/28/2023-13:51:21] [W] [TRT] Tactic Device request: 7056MB Available: 2081MB. Device memory is insufficient to use tactic.
|
83 |
+
[12/28/2023-13:51:21] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
84 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
85 |
+
[12/28/2023-13:51:21] [W] [TRT] Tactic Device request: 7056MB Available: 2081MB. Device memory is insufficient to use tactic.
|
86 |
+
[12/28/2023-13:51:21] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
87 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
88 |
+
[12/28/2023-13:51:23] [W] [TRT] Tactic Device request: 7050MB Available: 2080MB. Device memory is insufficient to use tactic.
|
89 |
+
[12/28/2023-13:51:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7050 detected for tactic 0x0000000000000004.
|
90 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
91 |
+
[12/28/2023-13:51:23] [W] [TRT] Tactic Device request: 7050MB Available: 2079MB. Device memory is insufficient to use tactic.
|
92 |
+
[12/28/2023-13:51:23] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 7050 detected for tactic 0x000000000000003c.
|
93 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
94 |
+
[12/28/2023-13:51:44] [W] [TRT] Tactic Device request: 6354MB Available: 2081MB. Device memory is insufficient to use tactic.
|
95 |
+
[12/28/2023-13:51:44] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
96 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
97 |
+
[12/28/2023-13:51:45] [W] [TRT] Tactic Device request: 6354MB Available: 2081MB. Device memory is insufficient to use tactic.
|
98 |
+
[12/28/2023-13:51:45] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
99 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
100 |
+
[12/28/2023-13:51:45] [W] [TRT] Tactic Device request: 6354MB Available: 2081MB. Device memory is insufficient to use tactic.
|
101 |
+
[12/28/2023-13:51:45] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
102 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
103 |
+
[12/28/2023-13:51:47] [W] [TRT] Tactic Device request: 6351MB Available: 2080MB. Device memory is insufficient to use tactic.
|
104 |
+
[12/28/2023-13:51:47] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6351 detected for tactic 0x0000000000000004.
|
105 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
106 |
+
[12/28/2023-13:51:47] [W] [TRT] Tactic Device request: 6351MB Available: 2080MB. Device memory is insufficient to use tactic.
|
107 |
+
[12/28/2023-13:51:47] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6351 detected for tactic 0x000000000000003c.
|
108 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
109 |
+
[12/28/2023-13:51:49] [W] [TRT] Tactic Device request: 2127MB Available: 2079MB. Device memory is insufficient to use tactic.
|
110 |
+
[12/28/2023-13:51:49] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2127 detected for tactic 0x0000000000000004.
|
111 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
112 |
+
[12/28/2023-13:51:50] [W] [TRT] Tactic Device request: 2127MB Available: 2078MB. Device memory is insufficient to use tactic.
|
113 |
+
[12/28/2023-13:51:50] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2127 detected for tactic 0x000000000000003c.
|
114 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
115 |
+
[12/28/2023-13:51:50] [W] [TRT] Tactic Device request: 2127MB Available: 2078MB. Device memory is insufficient to use tactic.
|
116 |
+
[12/28/2023-13:51:50] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2127 detected for tactic 0x0000000000000074.
|
117 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
118 |
+
[12/28/2023-13:51:53] [W] [TRT] Tactic Device request: 2124MB Available: 2081MB. Device memory is insufficient to use tactic.
|
119 |
+
[12/28/2023-13:51:53] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2124 detected for tactic 0x0000000000000004.
|
120 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
121 |
+
[12/28/2023-13:51:53] [W] [TRT] Tactic Device request: 2124MB Available: 2072MB. Device memory is insufficient to use tactic.
|
122 |
+
[12/28/2023-13:51:53] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2124 detected for tactic 0x000000000000003c.
|
123 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
124 |
+
[12/28/2023-13:51:56] [W] [TRT] Tactic Device request: 2125MB Available: 2070MB. Device memory is insufficient to use tactic.
|
125 |
+
[12/28/2023-13:51:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2125 detected for tactic 0x0000000000000004.
|
126 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
127 |
+
[12/28/2023-13:51:56] [W] [TRT] Tactic Device request: 2125MB Available: 2052MB. Device memory is insufficient to use tactic.
|
128 |
+
[12/28/2023-13:51:56] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2125 detected for tactic 0x000000000000003c.
|
129 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
130 |
+
[12/28/2023-13:51:57] [W] [TRT] Tactic Device request: 2125MB Available: 2052MB. Device memory is insufficient to use tactic.
|
131 |
+
[12/28/2023-13:51:57] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2125 detected for tactic 0x0000000000000074.
|
132 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
133 |
+
[12/28/2023-13:51:59] [W] [TRT] Tactic Device request: 2124MB Available: 2053MB. Device memory is insufficient to use tactic.
|
134 |
+
[12/28/2023-13:51:59] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2124 detected for tactic 0x0000000000000004.
|
135 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
136 |
+
[12/28/2023-13:52:00] [W] [TRT] Tactic Device request: 2124MB Available: 2051MB. Device memory is insufficient to use tactic.
|
137 |
+
[12/28/2023-13:52:00] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2124 detected for tactic 0x000000000000003c.
|
138 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
139 |
+
[12/28/2023-13:52:02] [W] [TRT] Tactic Device request: 2125MB Available: 2051MB. Device memory is insufficient to use tactic.
|
140 |
+
[12/28/2023-13:52:02] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2125 detected for tactic 0x0000000000000004.
|
141 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
142 |
+
[12/28/2023-13:52:03] [W] [TRT] Tactic Device request: 2125MB Available: 2051MB. Device memory is insufficient to use tactic.
|
143 |
+
[12/28/2023-13:52:03] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2125 detected for tactic 0x000000000000003c.
|
144 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
145 |
+
[12/28/2023-13:52:03] [W] [TRT] Tactic Device request: 2125MB Available: 2051MB. Device memory is insufficient to use tactic.
|
146 |
+
[12/28/2023-13:52:03] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2125 detected for tactic 0x0000000000000074.
|
147 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
148 |
+
[12/28/2023-13:52:06] [W] [TRT] Tactic Device request: 2124MB Available: 2039MB. Device memory is insufficient to use tactic.
|
149 |
+
[12/28/2023-13:52:06] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2124 detected for tactic 0x0000000000000004.
|
150 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
151 |
+
[12/28/2023-13:52:06] [W] [TRT] Tactic Device request: 2124MB Available: 2038MB. Device memory is insufficient to use tactic.
|
152 |
+
[12/28/2023-13:52:06] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2124 detected for tactic 0x000000000000003c.
|
153 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
154 |
+
[12/28/2023-14:06:20] [W] [TRT] Tactic Device request: 2394MB Available: 1765MB. Device memory is insufficient to use tactic.
|
155 |
+
[12/28/2023-14:06:20] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000004.
|
156 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
157 |
+
[12/28/2023-14:06:20] [W] [TRT] Tactic Device request: 2394MB Available: 1764MB. Device memory is insufficient to use tactic.
|
158 |
+
[12/28/2023-14:06:20] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2394 detected for tactic 0x000000000000003c.
|
159 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
160 |
+
[12/28/2023-14:06:20] [W] [TRT] Tactic Device request: 2394MB Available: 1764MB. Device memory is insufficient to use tactic.
|
161 |
+
[12/28/2023-14:06:20] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000074.
|
162 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
163 |
+
[12/28/2023-14:06:21] [W] [TRT] Tactic Device request: 2392MB Available: 1765MB. Device memory is insufficient to use tactic.
|
164 |
+
[12/28/2023-14:06:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000004.
|
165 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
166 |
+
[12/28/2023-14:06:21] [W] [TRT] Tactic Device request: 2392MB Available: 1764MB. Device memory is insufficient to use tactic.
|
167 |
+
[12/28/2023-14:06:21] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2392 detected for tactic 0x000000000000003c.
|
168 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
169 |
+
[12/28/2023-14:06:21] [W] [TRT] Tactic Device request: 2392MB Available: 1764MB. Device memory is insufficient to use tactic.
|
170 |
+
[12/28/2023-14:06:21] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000074.
|
171 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
172 |
+
[12/28/2023-14:06:22] [W] [TRT] Tactic Device request: 2391MB Available: 1764MB. Device memory is insufficient to use tactic.
|
173 |
+
[12/28/2023-14:06:22] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2391 detected for tactic 0x0000000000000004.
|
174 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
175 |
+
[12/28/2023-14:06:23] [W] [TRT] Tactic Device request: 2391MB Available: 1763MB. Device memory is insufficient to use tactic.
|
176 |
+
[12/28/2023-14:06:23] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2391 detected for tactic 0x000000000000003c.
|
177 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
178 |
+
[12/28/2023-14:06:23] [W] [TRT] Tactic Device request: 2390MB Available: 1763MB. Device memory is insufficient to use tactic.
|
179 |
+
[12/28/2023-14:06:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000004.
|
180 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
181 |
+
[12/28/2023-14:06:23] [W] [TRT] Tactic Device request: 2390MB Available: 1763MB. Device memory is insufficient to use tactic.
|
182 |
+
[12/28/2023-14:06:23] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2390 detected for tactic 0x000000000000003c.
|
183 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
184 |
+
[12/28/2023-14:06:41] [W] [TRT] Tactic Device request: 6540MB Available: 1782MB. Device memory is insufficient to use tactic.
|
185 |
+
[12/28/2023-14:06:41] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000004.
|
186 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
187 |
+
[12/28/2023-14:06:41] [W] [TRT] Tactic Device request: 6540MB Available: 1781MB. Device memory is insufficient to use tactic.
|
188 |
+
[12/28/2023-14:06:41] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6540 detected for tactic 0x000000000000003c.
|
189 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
190 |
+
[12/28/2023-14:06:42] [W] [TRT] Tactic Device request: 6540MB Available: 1781MB. Device memory is insufficient to use tactic.
|
191 |
+
[12/28/2023-14:06:42] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000074.
|
192 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
193 |
+
[12/28/2023-14:06:44] [W] [TRT] Tactic Device request: 6538MB Available: 1781MB. Device memory is insufficient to use tactic.
|
194 |
+
[12/28/2023-14:06:44] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6538 detected for tactic 0x0000000000000004.
|
195 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
196 |
+
[12/28/2023-14:06:44] [W] [TRT] Tactic Device request: 6538MB Available: 1781MB. Device memory is insufficient to use tactic.
|
197 |
+
[12/28/2023-14:06:44] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6538 detected for tactic 0x000000000000003c.
|
198 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
199 |
+
[12/28/2023-14:06:47] [W] [TRT] Tactic Device request: 2191MB Available: 1783MB. Device memory is insufficient to use tactic.
|
200 |
+
[12/28/2023-14:06:47] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000004.
|
201 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
202 |
+
[12/28/2023-14:06:48] [W] [TRT] Tactic Device request: 2191MB Available: 1783MB. Device memory is insufficient to use tactic.
|
203 |
+
[12/28/2023-14:06:48] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2191 detected for tactic 0x000000000000003c.
|
204 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
205 |
+
[12/28/2023-14:06:48] [W] [TRT] Tactic Device request: 2191MB Available: 1782MB. Device memory is insufficient to use tactic.
|
206 |
+
[12/28/2023-14:06:49] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000074.
|
207 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
208 |
+
[12/28/2023-14:06:52] [W] [TRT] Tactic Device request: 2190MB Available: 1779MB. Device memory is insufficient to use tactic.
|
209 |
+
[12/28/2023-14:06:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
210 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
211 |
+
[12/28/2023-14:06:53] [W] [TRT] Tactic Device request: 2190MB Available: 1779MB. Device memory is insufficient to use tactic.
|
212 |
+
[12/28/2023-14:06:53] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
213 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
214 |
+
[12/28/2023-14:06:57] [W] [TRT] Tactic Device request: 2190MB Available: 1780MB. Device memory is insufficient to use tactic.
|
215 |
+
[12/28/2023-14:06:57] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
216 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
217 |
+
[12/28/2023-14:06:58] [W] [TRT] Tactic Device request: 2190MB Available: 1778MB. Device memory is insufficient to use tactic.
|
218 |
+
[12/28/2023-14:06:58] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
219 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
220 |
+
[12/28/2023-14:06:59] [W] [TRT] Tactic Device request: 2190MB Available: 1775MB. Device memory is insufficient to use tactic.
|
221 |
+
[12/28/2023-14:06:59] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000074.
|
222 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
223 |
+
[12/28/2023-14:07:03] [W] [TRT] Tactic Device request: 2190MB Available: 1778MB. Device memory is insufficient to use tactic.
|
224 |
+
[12/28/2023-14:07:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
225 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
226 |
+
[12/28/2023-14:07:03] [W] [TRT] Tactic Device request: 2190MB Available: 1777MB. Device memory is insufficient to use tactic.
|
227 |
+
[12/28/2023-14:07:03] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
228 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
229 |
+
[12/28/2023-14:07:08] [W] [TRT] Tactic Device request: 2190MB Available: 1778MB. Device memory is insufficient to use tactic.
|
230 |
+
[12/28/2023-14:07:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
231 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
232 |
+
[12/28/2023-14:07:09] [W] [TRT] Tactic Device request: 2190MB Available: 1779MB. Device memory is insufficient to use tactic.
|
233 |
+
[12/28/2023-14:07:09] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
234 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
235 |
+
[12/28/2023-14:07:09] [W] [TRT] Tactic Device request: 2190MB Available: 1778MB. Device memory is insufficient to use tactic.
|
236 |
+
[12/28/2023-14:07:09] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000074.
|
237 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
238 |
+
[12/28/2023-14:07:13] [W] [TRT] Tactic Device request: 2190MB Available: 1778MB. Device memory is insufficient to use tactic.
|
239 |
+
[12/28/2023-14:07:13] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
240 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
241 |
+
[12/28/2023-14:07:14] [W] [TRT] Tactic Device request: 2190MB Available: 1776MB. Device memory is insufficient to use tactic.
|
242 |
+
[12/28/2023-14:07:14] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
243 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
244 |
+
[12/28/2023-14:15:03] [W] [TRT] Tactic Device request: 2457MB Available: 2222MB. Device memory is insufficient to use tactic.
|
245 |
+
[12/28/2023-14:15:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000004.
|
246 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
247 |
+
[12/28/2023-14:15:03] [W] [TRT] Tactic Device request: 2457MB Available: 2222MB. Device memory is insufficient to use tactic.
|
248 |
+
[12/28/2023-14:15:03] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
249 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
250 |
+
[12/28/2023-14:15:03] [W] [TRT] Tactic Device request: 2457MB Available: 2222MB. Device memory is insufficient to use tactic.
|
251 |
+
[12/28/2023-14:15:03] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
252 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
253 |
+
[12/28/2023-14:15:05] [W] [TRT] Tactic Device request: 2456MB Available: 2224MB. Device memory is insufficient to use tactic.
|
254 |
+
[12/28/2023-14:15:05] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2456 detected for tactic 0x0000000000000004.
|
255 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
256 |
+
[12/28/2023-14:15:05] [W] [TRT] Tactic Device request: 2456MB Available: 2224MB. Device memory is insufficient to use tactic.
|
257 |
+
[12/28/2023-14:15:05] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2456 detected for tactic 0x000000000000003c.
|
258 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
259 |
+
[12/28/2023-14:15:32] [W] [TRT] Tactic Device request: 3587MB Available: 1846MB. Device memory is insufficient to use tactic.
|
260 |
+
[12/28/2023-14:15:32] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
261 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
262 |
+
[12/28/2023-14:15:32] [W] [TRT] Tactic Device request: 3587MB Available: 1846MB. Device memory is insufficient to use tactic.
|
263 |
+
[12/28/2023-14:15:32] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
264 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
265 |
+
[12/28/2023-14:15:32] [W] [TRT] Tactic Device request: 3587MB Available: 1846MB. Device memory is insufficient to use tactic.
|
266 |
+
[12/28/2023-14:15:32] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
267 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
268 |
+
[12/28/2023-14:15:33] [W] [TRT] Tactic Device request: 3585MB Available: 1846MB. Device memory is insufficient to use tactic.
|
269 |
+
[12/28/2023-14:15:33] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3585 detected for tactic 0x0000000000000004.
|
270 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
271 |
+
[12/28/2023-14:15:34] [W] [TRT] Tactic Device request: 3585MB Available: 1846MB. Device memory is insufficient to use tactic.
|
272 |
+
[12/28/2023-14:15:34] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3585 detected for tactic 0x000000000000003c.
|
273 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
274 |
+
[12/28/2023-14:28:21] [W] [TRT] Tactic Device request: 3556MB Available: 1715MB. Device memory is insufficient to use tactic.
|
275 |
+
[12/28/2023-14:28:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
276 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
277 |
+
[12/28/2023-14:28:21] [W] [TRT] Tactic Device request: 3556MB Available: 1715MB. Device memory is insufficient to use tactic.
|
278 |
+
[12/28/2023-14:28:21] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
279 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
280 |
+
[12/28/2023-14:28:22] [W] [TRT] Tactic Device request: 3556MB Available: 1714MB. Device memory is insufficient to use tactic.
|
281 |
+
[12/28/2023-14:28:22] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
282 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
283 |
+
[12/28/2023-14:28:23] [W] [TRT] Tactic Device request: 3551MB Available: 1715MB. Device memory is insufficient to use tactic.
|
284 |
+
[12/28/2023-14:28:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3551 detected for tactic 0x0000000000000004.
|
285 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
286 |
+
[12/28/2023-14:28:23] [W] [TRT] Tactic Device request: 3551MB Available: 1715MB. Device memory is insufficient to use tactic.
|
287 |
+
[12/28/2023-14:28:23] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3551 detected for tactic 0x000000000000003c.
|
288 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
289 |
+
[12/28/2023-14:28:25] [W] [TRT] Tactic Device request: 3140MB Available: 1715MB. Device memory is insufficient to use tactic.
|
290 |
+
[12/28/2023-14:28:25] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000004.
|
291 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
292 |
+
[12/28/2023-14:28:25] [W] [TRT] Tactic Device request: 3140MB Available: 1715MB. Device memory is insufficient to use tactic.
|
293 |
+
[12/28/2023-14:28:25] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3140 detected for tactic 0x000000000000003c.
|
294 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
295 |
+
[12/28/2023-14:28:25] [W] [TRT] Tactic Device request: 3140MB Available: 1715MB. Device memory is insufficient to use tactic.
|
296 |
+
[12/28/2023-14:28:25] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000074.
|
297 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
298 |
+
[12/28/2023-14:28:26] [W] [TRT] Tactic Device request: 3136MB Available: 1715MB. Device memory is insufficient to use tactic.
|
299 |
+
[12/28/2023-14:28:26] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3136 detected for tactic 0x0000000000000004.
|
300 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
301 |
+
[12/28/2023-14:28:26] [W] [TRT] Tactic Device request: 3136MB Available: 1715MB. Device memory is insufficient to use tactic.
|
302 |
+
[12/28/2023-14:28:26] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3136 detected for tactic 0x000000000000003c.
|
303 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
304 |
+
[12/28/2023-14:40:35] [W] [TRT] Tactic Device request: 3161MB Available: 2110MB. Device memory is insufficient to use tactic.
|
305 |
+
[12/28/2023-14:40:35] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000004.
|
306 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
307 |
+
[12/28/2023-14:40:36] [W] [TRT] Tactic Device request: 3161MB Available: 2110MB. Device memory is insufficient to use tactic.
|
308 |
+
[12/28/2023-14:40:36] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3161 detected for tactic 0x000000000000003c.
|
309 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
310 |
+
[12/28/2023-14:40:36] [W] [TRT] Tactic Device request: 3161MB Available: 2110MB. Device memory is insufficient to use tactic.
|
311 |
+
[12/28/2023-14:40:36] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000074.
|
312 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
313 |
+
[12/28/2023-14:40:37] [W] [TRT] Tactic Device request: 3156MB Available: 2109MB. Device memory is insufficient to use tactic.
|
314 |
+
[12/28/2023-14:40:37] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3156 detected for tactic 0x0000000000000004.
|
315 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
316 |
+
[12/28/2023-14:40:37] [W] [TRT] Tactic Device request: 3156MB Available: 2109MB. Device memory is insufficient to use tactic.
|
317 |
+
[12/28/2023-14:40:37] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3156 detected for tactic 0x000000000000003c.
|
318 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
319 |
+
[12/28/2023-14:40:43] [W] [TRT] Tactic Device request: 4189MB Available: 2109MB. Device memory is insufficient to use tactic.
|
320 |
+
[12/28/2023-14:40:44] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000004.
|
321 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
322 |
+
[12/28/2023-14:40:44] [W] [TRT] Tactic Device request: 4189MB Available: 2088MB. Device memory is insufficient to use tactic.
|
323 |
+
[12/28/2023-14:40:44] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4189 detected for tactic 0x000000000000003c.
|
324 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
325 |
+
[12/28/2023-14:40:44] [W] [TRT] Tactic Device request: 4189MB Available: 2087MB. Device memory is insufficient to use tactic.
|
326 |
+
[12/28/2023-14:40:44] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000074.
|
327 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
328 |
+
[12/28/2023-14:40:49] [W] [TRT] Tactic Device request: 4183MB Available: 2085MB. Device memory is insufficient to use tactic.
|
329 |
+
[12/28/2023-14:40:49] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4183 detected for tactic 0x0000000000000004.
|
330 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
331 |
+
[12/28/2023-14:40:49] [W] [TRT] Tactic Device request: 4183MB Available: 2082MB. Device memory is insufficient to use tactic.
|
332 |
+
[12/28/2023-14:40:49] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4183 detected for tactic 0x000000000000003c.
|
333 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
334 |
+
[12/28/2023-14:40:52] [W] [TRT] Tactic Device request: 4186MB Available: 2082MB. Device memory is insufficient to use tactic.
|
335 |
+
[12/28/2023-14:40:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000004.
|
336 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
337 |
+
[12/28/2023-14:40:53] [W] [TRT] Tactic Device request: 4186MB Available: 2061MB. Device memory is insufficient to use tactic.
|
338 |
+
[12/28/2023-14:40:53] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4186 detected for tactic 0x000000000000003c.
|
339 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
340 |
+
[12/28/2023-14:40:53] [W] [TRT] Tactic Device request: 4186MB Available: 2060MB. Device memory is insufficient to use tactic.
|
341 |
+
[12/28/2023-14:40:53] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000074.
|
342 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
343 |
+
[12/28/2023-14:40:57] [W] [TRT] Tactic Device request: 4182MB Available: 2059MB. Device memory is insufficient to use tactic.
|
344 |
+
[12/28/2023-14:40:57] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4182 detected for tactic 0x0000000000000004.
|
345 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
346 |
+
[12/28/2023-14:40:58] [W] [TRT] Tactic Device request: 4182MB Available: 2054MB. Device memory is insufficient to use tactic.
|
347 |
+
[12/28/2023-14:40:58] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4182 detected for tactic 0x000000000000003c.
|
348 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
349 |
+
[12/28/2023-14:53:46] [W] [TRT] Tactic Device request: 4764MB Available: 2038MB. Device memory is insufficient to use tactic.
|
350 |
+
[12/28/2023-14:53:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000004.
|
351 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
352 |
+
[12/28/2023-14:53:46] [W] [TRT] Tactic Device request: 4764MB Available: 2038MB. Device memory is insufficient to use tactic.
|
353 |
+
[12/28/2023-14:53:46] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4764 detected for tactic 0x000000000000003c.
|
354 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
355 |
+
[12/28/2023-14:53:46] [W] [TRT] Tactic Device request: 4764MB Available: 2039MB. Device memory is insufficient to use tactic.
|
356 |
+
[12/28/2023-14:53:46] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000074.
|
357 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
358 |
+
[12/28/2023-14:53:48] [W] [TRT] Tactic Device request: 4761MB Available: 2038MB. Device memory is insufficient to use tactic.
|
359 |
+
[12/28/2023-14:53:48] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4761 detected for tactic 0x0000000000000004.
|
360 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
361 |
+
[12/28/2023-14:53:48] [W] [TRT] Tactic Device request: 4761MB Available: 2038MB. Device memory is insufficient to use tactic.
|
362 |
+
[12/28/2023-14:53:48] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4761 detected for tactic 0x000000000000003c.
|
363 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
364 |
+
[12/28/2023-14:53:56] [W] [TRT] Tactic Device request: 4244MB Available: 1833MB. Device memory is insufficient to use tactic.
|
365 |
+
[12/28/2023-14:53:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000004.
|
366 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
367 |
+
[12/28/2023-14:53:57] [W] [TRT] Tactic Device request: 4244MB Available: 1504MB. Device memory is insufficient to use tactic.
|
368 |
+
[12/28/2023-14:53:57] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4244 detected for tactic 0x000000000000003c.
|
369 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
370 |
+
[12/28/2023-14:53:58] [W] [TRT] Tactic Device request: 4244MB Available: 1500MB. Device memory is insufficient to use tactic.
|
371 |
+
[12/28/2023-14:53:58] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000074.
|
372 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
373 |
+
[12/28/2023-14:54:03] [W] [TRT] Tactic Device request: 4240MB Available: 1498MB. Device memory is insufficient to use tactic.
|
374 |
+
[12/28/2023-14:54:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4240 detected for tactic 0x0000000000000004.
|
375 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
376 |
+
[12/28/2023-14:54:03] [W] [TRT] Tactic Device request: 4240MB Available: 1494MB. Device memory is insufficient to use tactic.
|
377 |
+
[12/28/2023-14:54:03] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4240 detected for tactic 0x000000000000003c.
|
378 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
379 |
+
[12/28/2023-14:54:08] [W] [TRT] Tactic Device request: 4241MB Available: 1553MB. Device memory is insufficient to use tactic.
|
380 |
+
[12/28/2023-14:54:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000004.
|
381 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
382 |
+
[12/28/2023-14:54:09] [W] [TRT] Tactic Device request: 4241MB Available: 1514MB. Device memory is insufficient to use tactic.
|
383 |
+
[12/28/2023-14:54:09] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4241 detected for tactic 0x000000000000003c.
|
384 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
385 |
+
[12/28/2023-14:54:10] [W] [TRT] Tactic Device request: 4241MB Available: 1508MB. Device memory is insufficient to use tactic.
|
386 |
+
[12/28/2023-14:54:10] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000074.
|
387 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
388 |
+
[12/28/2023-14:54:14] [W] [TRT] Tactic Device request: 4239MB Available: 1510MB. Device memory is insufficient to use tactic.
|
389 |
+
[12/28/2023-14:54:14] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4239 detected for tactic 0x0000000000000004.
|
390 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
391 |
+
[12/28/2023-14:54:15] [W] [TRT] Tactic Device request: 4239MB Available: 1496MB. Device memory is insufficient to use tactic.
|
392 |
+
[12/28/2023-14:54:15] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4239 detected for tactic 0x000000000000003c.
|
393 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
394 |
+
[12/28/2023-14:55:04] [W] [TRT] Tactic Device request: 1637MB Available: 1234MB. Device memory is insufficient to use tactic.
|
395 |
+
[12/28/2023-14:55:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000004.
|
396 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
397 |
+
[12/28/2023-14:55:04] [W] [TRT] Tactic Device request: 1637MB Available: 1234MB. Device memory is insufficient to use tactic.
|
398 |
+
[12/28/2023-14:55:04] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 1637 detected for tactic 0x000000000000003c.
|
399 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
400 |
+
[12/28/2023-14:55:04] [W] [TRT] Tactic Device request: 1637MB Available: 1234MB. Device memory is insufficient to use tactic.
|
401 |
+
[12/28/2023-14:55:04] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000074.
|
402 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
403 |
+
[12/28/2023-14:55:05] [W] [TRT] Tactic Device request: 1636MB Available: 1268MB. Device memory is insufficient to use tactic.
|
404 |
+
[12/28/2023-14:55:05] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1636 detected for tactic 0x0000000000000004.
|
405 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
406 |
+
[12/28/2023-14:55:05] [W] [TRT] Tactic Device request: 1636MB Available: 1268MB. Device memory is insufficient to use tactic.
|
407 |
+
[12/28/2023-14:55:05] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 1636 detected for tactic 0x000000000000003c.
|
408 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
409 |
+
[12/28/2023-15:08:11] [W] [TRT] Tactic Device request: 1638MB Available: 1062MB. Device memory is insufficient to use tactic.
|
410 |
+
[12/28/2023-15:08:12] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 1638 detected for tactic 0x000000000000003c.
|
411 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
412 |
+
[12/28/2023-15:08:12] [W] [TRT] Tactic Device request: 1638MB Available: 1063MB. Device memory is insufficient to use tactic.
|
413 |
+
[12/28/2023-15:08:12] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 1638 detected for tactic 0x0000000000000074.
|
414 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
415 |
+
[12/28/2023-15:08:14] [W] [TRT] Tactic Device request: 1637MB Available: 1065MB. Device memory is insufficient to use tactic.
|
416 |
+
[12/28/2023-15:08:14] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000004.
|
417 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
418 |
+
[12/28/2023-15:08:14] [W] [TRT] Tactic Device request: 1637MB Available: 1065MB. Device memory is insufficient to use tactic.
|
419 |
+
[12/28/2023-15:08:14] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 1637 detected for tactic 0x000000000000003c.
|
420 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
421 |
+
[12/28/2023-15:08:16] [W] [TRT] Tactic Device request: 3270MB Available: 1064MB. Device memory is insufficient to use tactic.
|
422 |
+
[12/28/2023-15:08:16] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000004.
|
423 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
424 |
+
[12/28/2023-15:08:17] [W] [TRT] Tactic Device request: 3270MB Available: 1064MB. Device memory is insufficient to use tactic.
|
425 |
+
[12/28/2023-15:08:17] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3270 detected for tactic 0x000000000000003c.
|
426 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
427 |
+
[12/28/2023-15:08:17] [W] [TRT] Tactic Device request: 3270MB Available: 1064MB. Device memory is insufficient to use tactic.
|
428 |
+
[12/28/2023-15:08:17] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000074.
|
429 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
430 |
+
[12/28/2023-15:08:18] [W] [TRT] Tactic Device request: 3269MB Available: 1063MB. Device memory is insufficient to use tactic.
|
431 |
+
[12/28/2023-15:08:18] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3269 detected for tactic 0x0000000000000004.
|
432 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
433 |
+
[12/28/2023-15:08:19] [W] [TRT] Tactic Device request: 3269MB Available: 1063MB. Device memory is insufficient to use tactic.
|
434 |
+
[12/28/2023-15:08:19] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3269 detected for tactic 0x000000000000003c.
|
435 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
436 |
+
[12/28/2023-15:08:22] [W] [TRT] Tactic Device request: 4377MB Available: 1060MB. Device memory is insufficient to use tactic.
|
437 |
+
[12/28/2023-15:08:22] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000004.
|
438 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
439 |
+
[12/28/2023-15:08:22] [W] [TRT] Tactic Device request: 2185MB Available: 1060MB. Device memory is insufficient to use tactic.
|
440 |
+
[12/28/2023-15:08:22] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000005.
|
441 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
442 |
+
[12/28/2023-15:08:23] [W] [TRT] Tactic Device request: 4377MB Available: 1061MB. Device memory is insufficient to use tactic.
|
443 |
+
[12/28/2023-15:08:23] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4377 detected for tactic 0x000000000000003c.
|
444 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
445 |
+
[12/28/2023-15:08:23] [W] [TRT] Tactic Device request: 2185MB Available: 1061MB. Device memory is insufficient to use tactic.
|
446 |
+
[12/28/2023-15:08:23] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2185 detected for tactic 0x000000000000003d.
|
447 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
448 |
+
[12/28/2023-15:08:23] [W] [TRT] Tactic Device request: 4377MB Available: 1060MB. Device memory is insufficient to use tactic.
|
449 |
+
[12/28/2023-15:08:23] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000074.
|
450 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
451 |
+
[12/28/2023-15:08:23] [W] [TRT] Tactic Device request: 2185MB Available: 1060MB. Device memory is insufficient to use tactic.
|
452 |
+
[12/28/2023-15:08:23] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000075.
|
453 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
454 |
+
[12/28/2023-15:08:29] [W] [TRT] Tactic Device request: 4375MB Available: 1059MB. Device memory is insufficient to use tactic.
|
455 |
+
[12/28/2023-15:08:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
456 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
457 |
+
[12/28/2023-15:08:29] [W] [TRT] Tactic Device request: 2183MB Available: 1059MB. Device memory is insufficient to use tactic.
|
458 |
+
[12/28/2023-15:08:29] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
459 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
460 |
+
[12/28/2023-15:08:29] [W] [TRT] Tactic Device request: 4375MB Available: 1058MB. Device memory is insufficient to use tactic.
|
461 |
+
[12/28/2023-15:08:29] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
462 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
463 |
+
[12/28/2023-15:08:29] [W] [TRT] Tactic Device request: 2183MB Available: 1058MB. Device memory is insufficient to use tactic.
|
464 |
+
[12/28/2023-15:08:29] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
465 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
466 |
+
[12/28/2023-15:08:36] [W] [TRT] Tactic Device request: 4376MB Available: 1050MB. Device memory is insufficient to use tactic.
|
467 |
+
[12/28/2023-15:08:36] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000004.
|
468 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
469 |
+
[12/28/2023-15:08:36] [W] [TRT] Tactic Device request: 2184MB Available: 1049MB. Device memory is insufficient to use tactic.
|
470 |
+
[12/28/2023-15:08:36] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000005.
|
471 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
472 |
+
[12/28/2023-15:08:36] [W] [TRT] Tactic Device request: 4376MB Available: 1037MB. Device memory is insufficient to use tactic.
|
473 |
+
[12/28/2023-15:08:36] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4376 detected for tactic 0x000000000000003c.
|
474 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
475 |
+
[12/28/2023-15:08:36] [W] [TRT] Tactic Device request: 2184MB Available: 1037MB. Device memory is insufficient to use tactic.
|
476 |
+
[12/28/2023-15:08:36] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2184 detected for tactic 0x000000000000003d.
|
477 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
478 |
+
[12/28/2023-15:08:37] [W] [TRT] Tactic Device request: 4376MB Available: 1036MB. Device memory is insufficient to use tactic.
|
479 |
+
[12/28/2023-15:08:37] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000074.
|
480 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
481 |
+
[12/28/2023-15:08:37] [W] [TRT] Tactic Device request: 2184MB Available: 1036MB. Device memory is insufficient to use tactic.
|
482 |
+
[12/28/2023-15:08:37] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000075.
|
483 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
484 |
+
[12/28/2023-15:08:42] [W] [TRT] Tactic Device request: 4375MB Available: 1058MB. Device memory is insufficient to use tactic.
|
485 |
+
[12/28/2023-15:08:42] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
486 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
487 |
+
[12/28/2023-15:08:42] [W] [TRT] Tactic Device request: 2183MB Available: 1058MB. Device memory is insufficient to use tactic.
|
488 |
+
[12/28/2023-15:08:42] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
489 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
490 |
+
[12/28/2023-15:08:43] [W] [TRT] Tactic Device request: 4375MB Available: 1058MB. Device memory is insufficient to use tactic.
|
491 |
+
[12/28/2023-15:08:43] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
492 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
493 |
+
[12/28/2023-15:08:43] [W] [TRT] Tactic Device request: 2183MB Available: 1058MB. Device memory is insufficient to use tactic.
|
494 |
+
[12/28/2023-15:08:43] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
495 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
496 |
+
[12/28/2023-15:09:47] [W] [TRT] TensorRT encountered issues when converting weights between types and that could affect accuracy.
|
497 |
+
[12/28/2023-15:09:47] [W] [TRT] If this is not the desired behavior, please modify the weights or retrain with regularization to adjust the magnitude of the weights.
|
498 |
+
[12/28/2023-15:09:47] [W] [TRT] Check verbose logs for the list of affected weights.
|
499 |
+
[12/28/2023-15:09:47] [W] [TRT] - 114 weights are affected by this issue: Detected subnormal FP16 values.
|
500 |
+
[12/28/2023-15:09:47] [W] [TRT] - 40 weights are affected by this issue: Detected values less than smallest positive FP16 subnormal value and converted them to the FP16 minimum subnormalized value.
|
501 |
+
[12/28/2023-15:10:04] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
502 |
+
[12/28/2023-15:10:04] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
503 |
+
[12/28/2023-15:10:04] [W] * GPU compute time is unstable, with coefficient of variance = 7.00146%.
|
504 |
+
[12/28/2023-15:10:04] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_fp32.onnx.best.engine.log
ADDED
@@ -0,0 +1,331 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.best.engine
|
2 |
+
[12/28/2023-12:58:38] [I] === Model Options ===
|
3 |
+
[12/28/2023-12:58:38] [I] Format: ONNX
|
4 |
+
[12/28/2023-12:58:38] [I] Model: yolo_nas_pose_l_fp32.onnx
|
5 |
+
[12/28/2023-12:58:38] [I] Output:
|
6 |
+
[12/28/2023-12:58:38] [I] === Build Options ===
|
7 |
+
[12/28/2023-12:58:38] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-12:58:38] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-12:58:38] [I] minTiming: 1
|
10 |
+
[12/28/2023-12:58:38] [I] avgTiming: 8
|
11 |
+
[12/28/2023-12:58:38] [I] Precision: FP32+FP16+INT8
|
12 |
+
[12/28/2023-12:58:38] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-12:58:38] [I] Calibration: Dynamic
|
14 |
+
[12/28/2023-12:58:38] [I] Refit: Disabled
|
15 |
+
[12/28/2023-12:58:38] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-12:58:38] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-12:58:38] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-12:58:38] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-12:58:38] [I] Build only: Disabled
|
20 |
+
[12/28/2023-12:58:38] [I] Save engine: yolo_nas_pose_l_fp32.onnx.best.engine
|
21 |
+
[12/28/2023-12:58:38] [I] Load engine:
|
22 |
+
[12/28/2023-12:58:38] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-12:58:38] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-12:58:38] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-12:58:38] [I] timingCacheFile:
|
26 |
+
[12/28/2023-12:58:38] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-12:58:38] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-12:58:38] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-12:58:38] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-12:58:38] [I] Input build shapes: model
|
31 |
+
[12/28/2023-12:58:38] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-12:58:38] [I] === System Options ===
|
33 |
+
[12/28/2023-12:58:38] [I] Device: 0
|
34 |
+
[12/28/2023-12:58:38] [I] DLACore:
|
35 |
+
[12/28/2023-12:58:38] [I] Plugins:
|
36 |
+
[12/28/2023-12:58:38] [I] === Inference Options ===
|
37 |
+
[12/28/2023-12:58:38] [I] Batch: Explicit
|
38 |
+
[12/28/2023-12:58:38] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-12:58:38] [I] Iterations: 10
|
40 |
+
[12/28/2023-12:58:38] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-12:58:38] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-12:58:38] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-12:58:38] [I] Streams: 1
|
44 |
+
[12/28/2023-12:58:38] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-12:58:38] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-12:58:38] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-12:58:38] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-12:58:38] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-12:58:38] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-12:58:38] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-12:58:38] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-12:58:38] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-12:58:38] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-12:58:38] [I] Inputs:
|
55 |
+
[12/28/2023-12:58:38] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-12:58:38] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-12:58:38] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-12:58:38] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-12:58:38] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-12:58:38] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-12:58:38] [I] Profile: Disabled
|
62 |
+
[12/28/2023-12:58:38] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-12:58:38] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-12:58:38] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-12:58:38] [I]
|
66 |
+
[12/28/2023-12:58:38] [I] === Device Information ===
|
67 |
+
[12/28/2023-12:58:38] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-12:58:38] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-12:58:38] [I] SMs: 8
|
70 |
+
[12/28/2023-12:58:38] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-12:58:38] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-12:58:38] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-12:58:38] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-12:58:38] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-12:58:38] [I]
|
76 |
+
[12/28/2023-12:58:38] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-12:58:43] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 3010 (MiB)
|
78 |
+
[12/28/2023-12:58:48] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +283, now: CPU 574, GPU 3313 (MiB)
|
79 |
+
[12/28/2023-12:58:48] [I] Start parsing network model
|
80 |
+
[12/28/2023-12:58:51] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-12:58:51] [I] [TRT] Input filename: yolo_nas_pose_l_fp32.onnx
|
82 |
+
[12/28/2023-12:58:51] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-12:58:51] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-12:58:51] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-12:58:51] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-12:58:51] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-12:58:51] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-12:58:51] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-12:58:51] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-12:58:51] [I] Finish parsing network model
|
91 |
+
[12/28/2023-12:58:52] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-12:58:52] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 455) [Constant]
|
96 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 456) [Constant]
|
97 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 457) [Constant]
|
98 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
99 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
100 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
101 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
102 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
103 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
104 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
105 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
106 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
107 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
108 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
109 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
110 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
111 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
112 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
113 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
114 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
115 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
116 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
117 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
118 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
119 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
120 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
121 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
122 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
123 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
124 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
125 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
126 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
127 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
128 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
129 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
130 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
131 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
132 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
133 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
134 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
135 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
136 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
137 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
138 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
139 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
140 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
141 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
142 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
143 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
144 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
145 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
146 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
147 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
148 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
149 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
150 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
151 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
152 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
153 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
154 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
155 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
156 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
157 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
158 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
159 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
160 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
161 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
162 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
163 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
164 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv1/act/Relu_output_0 copy
|
165 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
166 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
167 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
168 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
169 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
170 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
171 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
172 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
173 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
174 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
175 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
176 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
177 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
178 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
179 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
180 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
181 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
182 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
183 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
184 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
185 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
186 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 187) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
187 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
188 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
189 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 195) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
190 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
191 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
192 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
193 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
194 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
195 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
196 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
197 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
198 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
199 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
200 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
201 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
202 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 224) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
203 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
204 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
205 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 232) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
206 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
207 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
208 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 240) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
209 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
210 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
211 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
212 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
213 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
214 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
215 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
216 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
217 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
218 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
219 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
220 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
221 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
222 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
223 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
224 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 271) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
225 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
226 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
227 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
228 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 294) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
229 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
230 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
231 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 302) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
232 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
233 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
234 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 310) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
235 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
236 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
237 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
238 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
239 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
240 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
241 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
242 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
243 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
244 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
245 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
246 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
247 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
248 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
249 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
250 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 341) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
251 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
252 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
253 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
254 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 364) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
255 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
256 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
257 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 372) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
258 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
259 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
260 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 380) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
261 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
262 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
263 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
264 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
265 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
266 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
267 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
268 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
269 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
270 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
271 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
272 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
273 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
274 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1.../post_process/Reshape_2]}
|
275 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
276 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 459) [NMS]_1_output[DevicetoShapeHostCopy]
|
277 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
278 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
279 |
+
[12/28/2023-12:58:52] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
280 |
+
[12/28/2023-12:59:03] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +411, now: CPU 1351, GPU 3918 (MiB)
|
281 |
+
[12/28/2023-12:59:05] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +82, GPU +80, now: CPU 1433, GPU 3998 (MiB)
|
282 |
+
[12/28/2023-12:59:05] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
283 |
+
[12/28/2023-15:09:20] [I] [TRT] Total Activation Memory: 7964877312
|
284 |
+
[12/28/2023-15:09:20] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
285 |
+
[12/28/2023-15:09:38] [I] [TRT] Total Host Persistent Memory: 331680
|
286 |
+
[12/28/2023-15:09:38] [I] [TRT] Total Device Persistent Memory: 38912
|
287 |
+
[12/28/2023-15:09:38] [I] [TRT] Total Scratch Memory: 134217728
|
288 |
+
[12/28/2023-15:09:38] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 88 MiB, GPU 2110 MiB
|
289 |
+
[12/28/2023-15:09:38] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 176 steps to complete.
|
290 |
+
[12/28/2023-15:09:38] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 114.49ms to assign 14 blocks to 176 nodes requiring 147384320 bytes.
|
291 |
+
[12/28/2023-15:09:38] [I] [TRT] Total Activation Memory: 147384320
|
292 |
+
[12/28/2023-15:09:47] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU -15, now: CPU 1838, GPU 5747 (MiB)
|
293 |
+
[12/28/2023-15:09:47] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +53, GPU +64, now: CPU 53, GPU 64 (MiB)
|
294 |
+
[12/28/2023-15:09:48] [I] Engine built in 7870.12 sec.
|
295 |
+
[12/28/2023-15:09:48] [I] [TRT] Loaded engine size: 54 MiB
|
296 |
+
[12/28/2023-15:09:48] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1299, GPU 5509 (MiB)
|
297 |
+
[12/28/2023-15:09:48] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +52, now: CPU 0, GPU 52 (MiB)
|
298 |
+
[12/28/2023-15:09:48] [I] Engine deserialized in 0.136755 sec.
|
299 |
+
[12/28/2023-15:09:48] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1300, GPU 5509 (MiB)
|
300 |
+
[12/28/2023-15:09:48] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +140, now: CPU 0, GPU 192 (MiB)
|
301 |
+
[12/28/2023-15:09:48] [I] Setting persistentCacheLimit to 0 bytes.
|
302 |
+
[12/28/2023-15:09:48] [I] Using random values for input onnx::Cast_0
|
303 |
+
[12/28/2023-15:09:48] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
304 |
+
[12/28/2023-15:09:48] [I] Using random values for output graph2_flat_predictions
|
305 |
+
[12/28/2023-15:09:48] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
306 |
+
[12/28/2023-15:09:48] [I] Starting inference
|
307 |
+
[12/28/2023-15:10:04] [I] Warmup completed 2 queries over 200 ms
|
308 |
+
[12/28/2023-15:10:04] [I] Timing trace has 712 queries over 15.0201 s
|
309 |
+
[12/28/2023-15:10:04] [I]
|
310 |
+
[12/28/2023-15:10:04] [I] === Trace details ===
|
311 |
+
[12/28/2023-15:10:04] [I] Trace averages of 100 runs:
|
312 |
+
[12/28/2023-15:10:04] [I] Average on 100 runs - GPU latency: 21.1141 ms - Host latency: 21.2281 ms (enqueue 21.1848 ms)
|
313 |
+
[12/28/2023-15:10:04] [I] Average on 100 runs - GPU latency: 21.2938 ms - Host latency: 21.4086 ms (enqueue 21.3535 ms)
|
314 |
+
[12/28/2023-15:10:04] [I] Average on 100 runs - GPU latency: 20.5876 ms - Host latency: 20.6987 ms (enqueue 20.679 ms)
|
315 |
+
[12/28/2023-15:10:04] [I] Average on 100 runs - GPU latency: 20.9284 ms - Host latency: 21.0399 ms (enqueue 20.9968 ms)
|
316 |
+
[12/28/2023-15:10:04] [I] Average on 100 runs - GPU latency: 21.3846 ms - Host latency: 21.5023 ms (enqueue 21.4432 ms)
|
317 |
+
[12/28/2023-15:10:04] [I] Average on 100 runs - GPU latency: 20.5315 ms - Host latency: 20.6422 ms (enqueue 20.6192 ms)
|
318 |
+
[12/28/2023-15:10:04] [I] Average on 100 runs - GPU latency: 20.7566 ms - Host latency: 20.8657 ms (enqueue 20.8177 ms)
|
319 |
+
[12/28/2023-15:10:04] [I]
|
320 |
+
[12/28/2023-15:10:04] [I] === Performance summary ===
|
321 |
+
[12/28/2023-15:10:04] [I] Throughput: 47.4032 qps
|
322 |
+
[12/28/2023-15:10:04] [I] Latency: min = 19.6377 ms, max = 32.405 ms, mean = 21.0632 ms, median = 20.583 ms, percentile(90%) = 21.897 ms, percentile(95%) = 23.0127 ms, percentile(99%) = 29.6182 ms
|
323 |
+
[12/28/2023-15:10:04] [I] Enqueue Time: min = 19.6035 ms, max = 33.8328 ms, mean = 21.0211 ms, median = 20.5366 ms, percentile(90%) = 21.8384 ms, percentile(95%) = 22.998 ms, percentile(99%) = 29.0708 ms
|
324 |
+
[12/28/2023-15:10:04] [I] H2D Latency: min = 0.0800781 ms, max = 0.128906 ms, mean = 0.0964459 ms, median = 0.097168 ms, percentile(90%) = 0.0991211 ms, percentile(95%) = 0.0996094 ms, percentile(99%) = 0.110474 ms
|
325 |
+
[12/28/2023-15:10:04] [I] GPU Compute Time: min = 19.5264 ms, max = 32.2937 ms, mean = 20.9506 ms, median = 20.4727 ms, percentile(90%) = 21.7739 ms, percentile(95%) = 22.8984 ms, percentile(99%) = 29.5049 ms
|
326 |
+
[12/28/2023-15:10:04] [I] D2H Latency: min = 0.00341797 ms, max = 0.0615234 ms, mean = 0.0161761 ms, median = 0.0136719 ms, percentile(90%) = 0.0258789 ms, percentile(95%) = 0.0273438 ms, percentile(99%) = 0.03125 ms
|
327 |
+
[12/28/2023-15:10:04] [I] Total Host Walltime: 15.0201 s
|
328 |
+
[12/28/2023-15:10:04] [I] Total GPU Compute Time: 14.9168 s
|
329 |
+
[12/28/2023-15:10:04] [I] Explanations of the performance metrics are printed in the verbose logs.
|
330 |
+
[12/28/2023-15:10:04] [I]
|
331 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.best.engine
|
yolo_nas_pose_l_fp32.onnx.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41ae49ee96e19ad3d8bfede2728e2c7fb331aa5a1d99fc7b5e139b10ec687299
|
3 |
+
size 219687473
|
yolo_nas_pose_l_fp32.onnx.engine.err
ADDED
@@ -0,0 +1,237 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-11:29:23] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-11:29:23] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-11:30:52] [W] [TRT] Tactic Device request: 4720MB Available: 2387MB. Device memory is insufficient to use tactic.
|
4 |
+
[12/28/2023-11:30:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000004.
|
5 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
6 |
+
[12/28/2023-11:30:53] [W] [TRT] Tactic Device request: 4720MB Available: 2388MB. Device memory is insufficient to use tactic.
|
7 |
+
[12/28/2023-11:30:53] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4720 detected for tactic 0x000000000000003c.
|
8 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
9 |
+
[12/28/2023-11:30:54] [W] [TRT] Tactic Device request: 4720MB Available: 2389MB. Device memory is insufficient to use tactic.
|
10 |
+
[12/28/2023-11:30:54] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000074.
|
11 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
12 |
+
[12/28/2023-11:30:59] [W] [TRT] Tactic Device request: 4711MB Available: 2388MB. Device memory is insufficient to use tactic.
|
13 |
+
[12/28/2023-11:30:59] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
14 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
15 |
+
[12/28/2023-11:31:00] [W] [TRT] Tactic Device request: 4711MB Available: 2388MB. Device memory is insufficient to use tactic.
|
16 |
+
[12/28/2023-11:31:00] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
17 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
18 |
+
[12/28/2023-11:31:00] [W] [TRT] Tactic Device request: 4711MB Available: 2389MB. Device memory is insufficient to use tactic.
|
19 |
+
[12/28/2023-11:31:00] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
20 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
21 |
+
[12/28/2023-11:32:39] [W] [TRT] Tactic Device request: 4711MB Available: 2349MB. Device memory is insufficient to use tactic.
|
22 |
+
[12/28/2023-11:32:39] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
23 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
24 |
+
[12/28/2023-11:32:39] [W] [TRT] Tactic Device request: 4711MB Available: 2348MB. Device memory is insufficient to use tactic.
|
25 |
+
[12/28/2023-11:32:39] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
26 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
27 |
+
[12/28/2023-11:32:39] [W] [TRT] Tactic Device request: 4711MB Available: 2349MB. Device memory is insufficient to use tactic.
|
28 |
+
[12/28/2023-11:32:39] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
29 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
30 |
+
[12/28/2023-11:32:51] [W] [TRT] Tactic Device request: 6275MB Available: 2347MB. Device memory is insufficient to use tactic.
|
31 |
+
[12/28/2023-11:32:51] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
32 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
33 |
+
[12/28/2023-11:32:51] [W] [TRT] Tactic Device request: 6275MB Available: 2348MB. Device memory is insufficient to use tactic.
|
34 |
+
[12/28/2023-11:32:51] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
35 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
36 |
+
[12/28/2023-11:32:51] [W] [TRT] Tactic Device request: 6275MB Available: 2350MB. Device memory is insufficient to use tactic.
|
37 |
+
[12/28/2023-11:32:51] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
38 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
39 |
+
[12/28/2023-11:35:14] [W] [TRT] Tactic Device request: 7056MB Available: 2331MB. Device memory is insufficient to use tactic.
|
40 |
+
[12/28/2023-11:35:14] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
41 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
42 |
+
[12/28/2023-11:35:14] [W] [TRT] Tactic Device request: 7056MB Available: 2330MB. Device memory is insufficient to use tactic.
|
43 |
+
[12/28/2023-11:35:14] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
44 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
45 |
+
[12/28/2023-11:35:15] [W] [TRT] Tactic Device request: 7056MB Available: 2330MB. Device memory is insufficient to use tactic.
|
46 |
+
[12/28/2023-11:35:15] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
47 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
48 |
+
[12/28/2023-11:35:27] [W] [TRT] Tactic Device request: 6354MB Available: 2331MB. Device memory is insufficient to use tactic.
|
49 |
+
[12/28/2023-11:35:27] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
50 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
51 |
+
[12/28/2023-11:35:27] [W] [TRT] Tactic Device request: 6354MB Available: 2331MB. Device memory is insufficient to use tactic.
|
52 |
+
[12/28/2023-11:35:27] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
53 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
54 |
+
[12/28/2023-11:35:27] [W] [TRT] Tactic Device request: 6354MB Available: 2331MB. Device memory is insufficient to use tactic.
|
55 |
+
[12/28/2023-11:35:27] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
56 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
57 |
+
[12/28/2023-11:38:31] [W] [TRT] Tactic Device request: 2394MB Available: 2273MB. Device memory is insufficient to use tactic.
|
58 |
+
[12/28/2023-11:38:31] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000004.
|
59 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
60 |
+
[12/28/2023-11:38:31] [W] [TRT] Tactic Device request: 2394MB Available: 2273MB. Device memory is insufficient to use tactic.
|
61 |
+
[12/28/2023-11:38:31] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2394 detected for tactic 0x000000000000003c.
|
62 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
63 |
+
[12/28/2023-11:38:31] [W] [TRT] Tactic Device request: 2394MB Available: 2273MB. Device memory is insufficient to use tactic.
|
64 |
+
[12/28/2023-11:38:31] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000074.
|
65 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
66 |
+
[12/28/2023-11:38:32] [W] [TRT] Tactic Device request: 2392MB Available: 2272MB. Device memory is insufficient to use tactic.
|
67 |
+
[12/28/2023-11:38:32] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000004.
|
68 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
69 |
+
[12/28/2023-11:38:32] [W] [TRT] Tactic Device request: 2392MB Available: 2272MB. Device memory is insufficient to use tactic.
|
70 |
+
[12/28/2023-11:38:32] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2392 detected for tactic 0x000000000000003c.
|
71 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
72 |
+
[12/28/2023-11:38:32] [W] [TRT] Tactic Device request: 2392MB Available: 2272MB. Device memory is insufficient to use tactic.
|
73 |
+
[12/28/2023-11:38:32] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000074.
|
74 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
75 |
+
[12/28/2023-11:38:41] [W] [TRT] Tactic Device request: 6540MB Available: 2263MB. Device memory is insufficient to use tactic.
|
76 |
+
[12/28/2023-11:38:41] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000004.
|
77 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
78 |
+
[12/28/2023-11:38:42] [W] [TRT] Tactic Device request: 6540MB Available: 2262MB. Device memory is insufficient to use tactic.
|
79 |
+
[12/28/2023-11:38:42] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6540 detected for tactic 0x000000000000003c.
|
80 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
81 |
+
[12/28/2023-11:38:42] [W] [TRT] Tactic Device request: 6540MB Available: 2262MB. Device memory is insufficient to use tactic.
|
82 |
+
[12/28/2023-11:38:42] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000074.
|
83 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
84 |
+
[12/28/2023-11:38:46] [W] [TRT] Tactic Device request: 2191MB Available: 2163MB. Device memory is insufficient to use tactic.
|
85 |
+
[12/28/2023-11:38:46] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2191 detected for tactic 0x000000000000003c.
|
86 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
87 |
+
[12/28/2023-11:38:47] [W] [TRT] Tactic Device request: 2191MB Available: 2160MB. Device memory is insufficient to use tactic.
|
88 |
+
[12/28/2023-11:38:47] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000074.
|
89 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
90 |
+
[12/28/2023-11:38:51] [W] [TRT] Tactic Device request: 2190MB Available: 2161MB. Device memory is insufficient to use tactic.
|
91 |
+
[12/28/2023-11:38:51] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
92 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
93 |
+
[12/28/2023-11:38:52] [W] [TRT] Tactic Device request: 2190MB Available: 2161MB. Device memory is insufficient to use tactic.
|
94 |
+
[12/28/2023-11:38:52] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
95 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
96 |
+
[12/28/2023-11:38:53] [W] [TRT] Tactic Device request: 2190MB Available: 2161MB. Device memory is insufficient to use tactic.
|
97 |
+
[12/28/2023-11:38:53] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000074.
|
98 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
99 |
+
[12/28/2023-11:40:32] [W] [TRT] Tactic Device request: 2457MB Available: 2131MB. Device memory is insufficient to use tactic.
|
100 |
+
[12/28/2023-11:40:32] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000004.
|
101 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
102 |
+
[12/28/2023-11:40:32] [W] [TRT] Tactic Device request: 2457MB Available: 2131MB. Device memory is insufficient to use tactic.
|
103 |
+
[12/28/2023-11:40:32] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
104 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
105 |
+
[12/28/2023-11:40:32] [W] [TRT] Tactic Device request: 2457MB Available: 2131MB. Device memory is insufficient to use tactic.
|
106 |
+
[12/28/2023-11:40:32] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
107 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
108 |
+
[12/28/2023-11:40:46] [W] [TRT] Tactic Device request: 3587MB Available: 2158MB. Device memory is insufficient to use tactic.
|
109 |
+
[12/28/2023-11:40:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
110 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
111 |
+
[12/28/2023-11:40:46] [W] [TRT] Tactic Device request: 3587MB Available: 2158MB. Device memory is insufficient to use tactic.
|
112 |
+
[12/28/2023-11:40:46] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
113 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
114 |
+
[12/28/2023-11:40:46] [W] [TRT] Tactic Device request: 3587MB Available: 2158MB. Device memory is insufficient to use tactic.
|
115 |
+
[12/28/2023-11:40:46] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
116 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
117 |
+
[12/28/2023-11:43:23] [W] [TRT] Tactic Device request: 3556MB Available: 2179MB. Device memory is insufficient to use tactic.
|
118 |
+
[12/28/2023-11:43:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
119 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
120 |
+
[12/28/2023-11:43:23] [W] [TRT] Tactic Device request: 3556MB Available: 2179MB. Device memory is insufficient to use tactic.
|
121 |
+
[12/28/2023-11:43:23] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
122 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
123 |
+
[12/28/2023-11:43:23] [W] [TRT] Tactic Device request: 3556MB Available: 2179MB. Device memory is insufficient to use tactic.
|
124 |
+
[12/28/2023-11:43:23] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
125 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
126 |
+
[12/28/2023-11:43:24] [W] [TRT] Tactic Device request: 3140MB Available: 2178MB. Device memory is insufficient to use tactic.
|
127 |
+
[12/28/2023-11:43:24] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000004.
|
128 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
129 |
+
[12/28/2023-11:43:24] [W] [TRT] Tactic Device request: 3140MB Available: 2178MB. Device memory is insufficient to use tactic.
|
130 |
+
[12/28/2023-11:43:24] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3140 detected for tactic 0x000000000000003c.
|
131 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
132 |
+
[12/28/2023-11:43:24] [W] [TRT] Tactic Device request: 3140MB Available: 2178MB. Device memory is insufficient to use tactic.
|
133 |
+
[12/28/2023-11:43:24] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000074.
|
134 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
135 |
+
[12/28/2023-11:45:43] [W] [TRT] Tactic Device request: 3161MB Available: 2140MB. Device memory is insufficient to use tactic.
|
136 |
+
[12/28/2023-11:45:43] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000004.
|
137 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
138 |
+
[12/28/2023-11:45:43] [W] [TRT] Tactic Device request: 3161MB Available: 2140MB. Device memory is insufficient to use tactic.
|
139 |
+
[12/28/2023-11:45:43] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3161 detected for tactic 0x000000000000003c.
|
140 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
141 |
+
[12/28/2023-11:45:43] [W] [TRT] Tactic Device request: 3161MB Available: 2140MB. Device memory is insufficient to use tactic.
|
142 |
+
[12/28/2023-11:45:43] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000074.
|
143 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
144 |
+
[12/28/2023-11:45:46] [W] [TRT] Tactic Device request: 4189MB Available: 2138MB. Device memory is insufficient to use tactic.
|
145 |
+
[12/28/2023-11:45:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000004.
|
146 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
147 |
+
[12/28/2023-11:45:47] [W] [TRT] Tactic Device request: 4189MB Available: 2138MB. Device memory is insufficient to use tactic.
|
148 |
+
[12/28/2023-11:45:47] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4189 detected for tactic 0x000000000000003c.
|
149 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
150 |
+
[12/28/2023-11:45:47] [W] [TRT] Tactic Device request: 4189MB Available: 2140MB. Device memory is insufficient to use tactic.
|
151 |
+
[12/28/2023-11:45:47] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000074.
|
152 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
153 |
+
[12/28/2023-11:45:51] [W] [TRT] Tactic Device request: 4186MB Available: 2139MB. Device memory is insufficient to use tactic.
|
154 |
+
[12/28/2023-11:45:51] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000004.
|
155 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
156 |
+
[12/28/2023-11:45:52] [W] [TRT] Tactic Device request: 4186MB Available: 2139MB. Device memory is insufficient to use tactic.
|
157 |
+
[12/28/2023-11:45:52] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4186 detected for tactic 0x000000000000003c.
|
158 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
159 |
+
[12/28/2023-11:45:52] [W] [TRT] Tactic Device request: 4186MB Available: 2138MB. Device memory is insufficient to use tactic.
|
160 |
+
[12/28/2023-11:45:52] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000074.
|
161 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
162 |
+
[12/28/2023-11:48:34] [W] [TRT] Tactic Device request: 4764MB Available: 2088MB. Device memory is insufficient to use tactic.
|
163 |
+
[12/28/2023-11:48:34] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000004.
|
164 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
165 |
+
[12/28/2023-11:48:34] [W] [TRT] Tactic Device request: 4764MB Available: 2088MB. Device memory is insufficient to use tactic.
|
166 |
+
[12/28/2023-11:48:34] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4764 detected for tactic 0x000000000000003c.
|
167 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
168 |
+
[12/28/2023-11:48:34] [W] [TRT] Tactic Device request: 4764MB Available: 2088MB. Device memory is insufficient to use tactic.
|
169 |
+
[12/28/2023-11:48:34] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000074.
|
170 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
171 |
+
[12/28/2023-11:48:39] [W] [TRT] Tactic Device request: 4244MB Available: 2088MB. Device memory is insufficient to use tactic.
|
172 |
+
[12/28/2023-11:48:39] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000004.
|
173 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
174 |
+
[12/28/2023-11:48:40] [W] [TRT] Tactic Device request: 4244MB Available: 2081MB. Device memory is insufficient to use tactic.
|
175 |
+
[12/28/2023-11:48:40] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4244 detected for tactic 0x000000000000003c.
|
176 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
177 |
+
[12/28/2023-11:48:41] [W] [TRT] Tactic Device request: 4244MB Available: 2080MB. Device memory is insufficient to use tactic.
|
178 |
+
[12/28/2023-11:48:41] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000074.
|
179 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
180 |
+
[12/28/2023-11:48:46] [W] [TRT] Tactic Device request: 4241MB Available: 2082MB. Device memory is insufficient to use tactic.
|
181 |
+
[12/28/2023-11:48:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000004.
|
182 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
183 |
+
[12/28/2023-11:48:47] [W] [TRT] Tactic Device request: 4241MB Available: 2080MB. Device memory is insufficient to use tactic.
|
184 |
+
[12/28/2023-11:48:47] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4241 detected for tactic 0x000000000000003c.
|
185 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
186 |
+
[12/28/2023-11:48:48] [W] [TRT] Tactic Device request: 4241MB Available: 2080MB. Device memory is insufficient to use tactic.
|
187 |
+
[12/28/2023-11:48:48] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000074.
|
188 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
189 |
+
[12/28/2023-11:51:58] [W] [TRT] Tactic Device request: 3270MB Available: 2043MB. Device memory is insufficient to use tactic.
|
190 |
+
[12/28/2023-11:51:58] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000004.
|
191 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
192 |
+
[12/28/2023-11:51:58] [W] [TRT] Tactic Device request: 3270MB Available: 2043MB. Device memory is insufficient to use tactic.
|
193 |
+
[12/28/2023-11:51:58] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3270 detected for tactic 0x000000000000003c.
|
194 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
195 |
+
[12/28/2023-11:51:58] [W] [TRT] Tactic Device request: 3270MB Available: 2043MB. Device memory is insufficient to use tactic.
|
196 |
+
[12/28/2023-11:51:58] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000074.
|
197 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
198 |
+
[12/28/2023-11:52:01] [W] [TRT] Tactic Device request: 4377MB Available: 2039MB. Device memory is insufficient to use tactic.
|
199 |
+
[12/28/2023-11:52:01] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000004.
|
200 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
201 |
+
[12/28/2023-11:52:01] [W] [TRT] Tactic Device request: 2185MB Available: 2039MB. Device memory is insufficient to use tactic.
|
202 |
+
[12/28/2023-11:52:01] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000005.
|
203 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
204 |
+
[12/28/2023-11:52:01] [W] [TRT] Tactic Device request: 4377MB Available: 2039MB. Device memory is insufficient to use tactic.
|
205 |
+
[12/28/2023-11:52:01] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4377 detected for tactic 0x000000000000003c.
|
206 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
207 |
+
[12/28/2023-11:52:01] [W] [TRT] Tactic Device request: 2185MB Available: 2039MB. Device memory is insufficient to use tactic.
|
208 |
+
[12/28/2023-11:52:01] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2185 detected for tactic 0x000000000000003d.
|
209 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
210 |
+
[12/28/2023-11:52:02] [W] [TRT] Tactic Device request: 4377MB Available: 2039MB. Device memory is insufficient to use tactic.
|
211 |
+
[12/28/2023-11:52:02] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000074.
|
212 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
213 |
+
[12/28/2023-11:52:02] [W] [TRT] Tactic Device request: 2185MB Available: 2038MB. Device memory is insufficient to use tactic.
|
214 |
+
[12/28/2023-11:52:02] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000075.
|
215 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
216 |
+
[12/28/2023-11:52:09] [W] [TRT] Tactic Device request: 4376MB Available: 2038MB. Device memory is insufficient to use tactic.
|
217 |
+
[12/28/2023-11:52:09] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000004.
|
218 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
219 |
+
[12/28/2023-11:52:09] [W] [TRT] Tactic Device request: 2184MB Available: 2038MB. Device memory is insufficient to use tactic.
|
220 |
+
[12/28/2023-11:52:09] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000005.
|
221 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
222 |
+
[12/28/2023-11:52:09] [W] [TRT] Tactic Device request: 4376MB Available: 2038MB. Device memory is insufficient to use tactic.
|
223 |
+
[12/28/2023-11:52:09] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4376 detected for tactic 0x000000000000003c.
|
224 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
225 |
+
[12/28/2023-11:52:09] [W] [TRT] Tactic Device request: 2184MB Available: 2038MB. Device memory is insufficient to use tactic.
|
226 |
+
[12/28/2023-11:52:09] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2184 detected for tactic 0x000000000000003d.
|
227 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
228 |
+
[12/28/2023-11:52:09] [W] [TRT] Tactic Device request: 4376MB Available: 2037MB. Device memory is insufficient to use tactic.
|
229 |
+
[12/28/2023-11:52:09] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000074.
|
230 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
231 |
+
[12/28/2023-11:52:09] [W] [TRT] Tactic Device request: 2184MB Available: 2038MB. Device memory is insufficient to use tactic.
|
232 |
+
[12/28/2023-11:52:09] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000075.
|
233 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
234 |
+
[12/28/2023-11:52:51] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
235 |
+
[12/28/2023-11:52:51] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
236 |
+
[12/28/2023-11:52:51] [W] * GPU compute time is unstable, with coefficient of variance = 4.81745%.
|
237 |
+
[12/28/2023-11:52:51] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_fp32.onnx.engine.log
ADDED
@@ -0,0 +1,326 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.engine
|
2 |
+
[12/28/2023-11:29:16] [I] === Model Options ===
|
3 |
+
[12/28/2023-11:29:16] [I] Format: ONNX
|
4 |
+
[12/28/2023-11:29:16] [I] Model: yolo_nas_pose_l_fp32.onnx
|
5 |
+
[12/28/2023-11:29:16] [I] Output:
|
6 |
+
[12/28/2023-11:29:16] [I] === Build Options ===
|
7 |
+
[12/28/2023-11:29:16] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-11:29:16] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-11:29:16] [I] minTiming: 1
|
10 |
+
[12/28/2023-11:29:16] [I] avgTiming: 8
|
11 |
+
[12/28/2023-11:29:16] [I] Precision: FP32
|
12 |
+
[12/28/2023-11:29:16] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-11:29:16] [I] Calibration:
|
14 |
+
[12/28/2023-11:29:16] [I] Refit: Disabled
|
15 |
+
[12/28/2023-11:29:16] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-11:29:16] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-11:29:16] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-11:29:16] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-11:29:16] [I] Build only: Disabled
|
20 |
+
[12/28/2023-11:29:16] [I] Save engine: yolo_nas_pose_l_fp32.onnx.engine
|
21 |
+
[12/28/2023-11:29:16] [I] Load engine:
|
22 |
+
[12/28/2023-11:29:16] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-11:29:16] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-11:29:16] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-11:29:16] [I] timingCacheFile:
|
26 |
+
[12/28/2023-11:29:16] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-11:29:16] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-11:29:16] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-11:29:16] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-11:29:16] [I] Input build shapes: model
|
31 |
+
[12/28/2023-11:29:16] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-11:29:16] [I] === System Options ===
|
33 |
+
[12/28/2023-11:29:16] [I] Device: 0
|
34 |
+
[12/28/2023-11:29:16] [I] DLACore:
|
35 |
+
[12/28/2023-11:29:16] [I] Plugins:
|
36 |
+
[12/28/2023-11:29:16] [I] === Inference Options ===
|
37 |
+
[12/28/2023-11:29:16] [I] Batch: Explicit
|
38 |
+
[12/28/2023-11:29:16] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-11:29:16] [I] Iterations: 10
|
40 |
+
[12/28/2023-11:29:16] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-11:29:16] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-11:29:16] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-11:29:16] [I] Streams: 1
|
44 |
+
[12/28/2023-11:29:16] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-11:29:16] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-11:29:16] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-11:29:16] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-11:29:16] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-11:29:16] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-11:29:16] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-11:29:16] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-11:29:16] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-11:29:16] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-11:29:16] [I] Inputs:
|
55 |
+
[12/28/2023-11:29:16] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-11:29:16] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-11:29:16] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-11:29:16] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-11:29:16] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-11:29:16] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-11:29:16] [I] Profile: Disabled
|
62 |
+
[12/28/2023-11:29:16] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-11:29:16] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-11:29:16] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-11:29:16] [I]
|
66 |
+
[12/28/2023-11:29:16] [I] === Device Information ===
|
67 |
+
[12/28/2023-11:29:16] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-11:29:16] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-11:29:16] [I] SMs: 8
|
70 |
+
[12/28/2023-11:29:16] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-11:29:16] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-11:29:16] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-11:29:16] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-11:29:16] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-11:29:16] [I]
|
76 |
+
[12/28/2023-11:29:16] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-11:29:17] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 3132 (MiB)
|
78 |
+
[12/28/2023-11:29:20] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +424, now: CPU 574, GPU 3573 (MiB)
|
79 |
+
[12/28/2023-11:29:20] [I] Start parsing network model
|
80 |
+
[12/28/2023-11:29:23] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-11:29:23] [I] [TRT] Input filename: yolo_nas_pose_l_fp32.onnx
|
82 |
+
[12/28/2023-11:29:23] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-11:29:23] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-11:29:23] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-11:29:23] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-11:29:23] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-11:29:23] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-11:29:23] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-11:29:23] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-11:29:23] [I] Finish parsing network model
|
91 |
+
[12/28/2023-11:29:23] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-11:29:23] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 455) [Constant]
|
96 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 456) [Constant]
|
97 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 457) [Constant]
|
98 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
99 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
100 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
101 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
102 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
103 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
104 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
105 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
106 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
107 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
108 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
109 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
110 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
111 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
112 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
113 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
114 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
115 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
116 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
117 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
118 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
119 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
120 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
121 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
122 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
123 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
124 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
125 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
126 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
127 |
+
[12/28/2023-11:29:23] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
128 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
129 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
130 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
131 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
132 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
133 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
134 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
135 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
136 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
137 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
138 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
139 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
140 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
141 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
142 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
143 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
144 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
145 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
146 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
147 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
148 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
149 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
150 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
151 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
152 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
153 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
154 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
155 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
156 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
157 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
158 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
159 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
160 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
161 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
162 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
163 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
164 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv1/act/Relu_output_0 copy
|
165 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
166 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
167 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
168 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
169 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
170 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
171 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
172 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
173 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
174 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
175 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
176 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
177 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
178 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
179 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
180 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
181 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
182 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
183 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
184 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
185 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
186 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 187) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
187 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
188 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
189 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 195) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
190 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
191 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
192 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
193 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
194 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
195 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
196 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
197 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
198 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
199 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
200 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
201 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
202 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 224) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
203 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
204 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
205 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 232) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
206 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
207 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
208 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 240) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
209 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
210 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
211 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
212 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
213 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
214 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
215 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
216 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
217 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
218 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
219 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
220 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
221 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
222 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
223 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
224 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 271) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
225 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
226 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
227 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
228 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 294) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
229 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
230 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
231 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 302) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
232 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
233 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
234 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 310) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
235 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
236 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
237 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
238 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
239 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
240 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
241 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
242 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
243 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
244 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
245 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
246 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
247 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
248 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
249 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
250 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 341) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
251 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
252 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
253 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
254 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 364) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
255 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
256 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
257 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 372) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
258 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
259 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
260 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 380) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
261 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
262 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
263 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
264 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
265 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
266 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
267 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
268 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
269 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
270 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
271 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
272 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
273 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
274 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1.../post_process/Reshape_2]}
|
275 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
276 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 459) [NMS]_1_output[DevicetoShapeHostCopy]
|
277 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
278 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
279 |
+
[12/28/2023-11:29:24] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
280 |
+
[12/28/2023-11:29:25] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +763, now: CPU 1350, GPU 4631 (MiB)
|
281 |
+
[12/28/2023-11:29:25] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +83, GPU +131, now: CPU 1433, GPU 4762 (MiB)
|
282 |
+
[12/28/2023-11:29:25] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
283 |
+
[12/28/2023-11:52:24] [I] [TRT] Total Activation Memory: 8308511744
|
284 |
+
[12/28/2023-11:52:24] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
285 |
+
[12/28/2023-11:52:32] [I] [TRT] Total Host Persistent Memory: 380944
|
286 |
+
[12/28/2023-11:52:32] [I] [TRT] Total Device Persistent Memory: 656384
|
287 |
+
[12/28/2023-11:52:32] [I] [TRT] Total Scratch Memory: 134217728
|
288 |
+
[12/28/2023-11:52:32] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 49 MiB, GPU 2207 MiB
|
289 |
+
[12/28/2023-11:52:32] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 216 steps to complete.
|
290 |
+
[12/28/2023-11:52:32] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 108.365ms to assign 15 blocks to 216 nodes requiring 188319232 bytes.
|
291 |
+
[12/28/2023-11:52:32] [I] [TRT] Total Activation Memory: 188319232
|
292 |
+
[12/28/2023-11:52:34] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1778, GPU 5584 (MiB)
|
293 |
+
[12/28/2023-11:52:34] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +31, GPU +256, now: CPU 31, GPU 256 (MiB)
|
294 |
+
[12/28/2023-11:52:35] [I] Engine built in 1398.12 sec.
|
295 |
+
[12/28/2023-11:52:35] [I] [TRT] Loaded engine size: 209 MiB
|
296 |
+
[12/28/2023-11:52:36] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1451, GPU 4904 (MiB)
|
297 |
+
[12/28/2023-11:52:36] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +208, now: CPU 0, GPU 208 (MiB)
|
298 |
+
[12/28/2023-11:52:36] [I] Engine deserialized in 0.328264 sec.
|
299 |
+
[12/28/2023-11:52:36] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1451, GPU 4904 (MiB)
|
300 |
+
[12/28/2023-11:52:36] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +180, now: CPU 0, GPU 388 (MiB)
|
301 |
+
[12/28/2023-11:52:36] [I] Setting persistentCacheLimit to 0 bytes.
|
302 |
+
[12/28/2023-11:52:36] [I] Using random values for input onnx::Cast_0
|
303 |
+
[12/28/2023-11:52:36] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
304 |
+
[12/28/2023-11:52:36] [I] Using random values for output graph2_flat_predictions
|
305 |
+
[12/28/2023-11:52:36] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
306 |
+
[12/28/2023-11:52:36] [I] Starting inference
|
307 |
+
[12/28/2023-11:52:51] [I] Warmup completed 3 queries over 200 ms
|
308 |
+
[12/28/2023-11:52:51] [I] Timing trace has 228 queries over 15.134 s
|
309 |
+
[12/28/2023-11:52:51] [I]
|
310 |
+
[12/28/2023-11:52:51] [I] === Trace details ===
|
311 |
+
[12/28/2023-11:52:51] [I] Trace averages of 100 runs:
|
312 |
+
[12/28/2023-11:52:51] [I] Average on 100 runs - GPU latency: 66.5633 ms - Host latency: 66.6799 ms (enqueue 66.6144 ms)
|
313 |
+
[12/28/2023-11:52:51] [I] Average on 100 runs - GPU latency: 65.9454 ms - Host latency: 66.065 ms (enqueue 66.0061 ms)
|
314 |
+
[12/28/2023-11:52:51] [I]
|
315 |
+
[12/28/2023-11:52:51] [I] === Performance summary ===
|
316 |
+
[12/28/2023-11:52:51] [I] Throughput: 15.0654 qps
|
317 |
+
[12/28/2023-11:52:51] [I] Latency: min = 63.8037 ms, max = 84.0011 ms, mean = 66.3393 ms, median = 65.521 ms, percentile(90%) = 67.4297 ms, percentile(95%) = 76.3467 ms, percentile(99%) = 78.6501 ms
|
318 |
+
[12/28/2023-11:52:51] [I] Enqueue Time: min = 63.7715 ms, max = 83.9532 ms, mean = 66.2756 ms, median = 65.4399 ms, percentile(90%) = 68.3887 ms, percentile(95%) = 76.9697 ms, percentile(99%) = 78.6002 ms
|
319 |
+
[12/28/2023-11:52:51] [I] H2D Latency: min = 0.081543 ms, max = 0.12793 ms, mean = 0.0942483 ms, median = 0.0947266 ms, percentile(90%) = 0.0976562 ms, percentile(95%) = 0.0986328 ms, percentile(99%) = 0.112305 ms
|
320 |
+
[12/28/2023-11:52:51] [I] GPU Compute Time: min = 63.6914 ms, max = 83.8763 ms, mean = 66.222 ms, median = 65.4058 ms, percentile(90%) = 67.313 ms, percentile(95%) = 76.2305 ms, percentile(99%) = 78.5333 ms
|
321 |
+
[12/28/2023-11:52:51] [I] D2H Latency: min = 0.00390625 ms, max = 0.0869141 ms, mean = 0.023145 ms, median = 0.0244141 ms, percentile(90%) = 0.0336914 ms, percentile(95%) = 0.0390625 ms, percentile(99%) = 0.0546875 ms
|
322 |
+
[12/28/2023-11:52:51] [I] Total Host Walltime: 15.134 s
|
323 |
+
[12/28/2023-11:52:51] [I] Total GPU Compute Time: 15.0986 s
|
324 |
+
[12/28/2023-11:52:51] [I] Explanations of the performance metrics are printed in the verbose logs.
|
325 |
+
[12/28/2023-11:52:51] [I]
|
326 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.engine
|
yolo_nas_pose_l_fp32.onnx.fp16.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3274fec20ea219c10bcdf044022eedcd2ced07cc929ad0b5f08c625d5fdf12b4
|
3 |
+
size 110783531
|
yolo_nas_pose_l_fp32.onnx.fp16.engine.err
ADDED
@@ -0,0 +1,401 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-11:53:03] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-11:53:03] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-11:58:20] [W] [TRT] Tactic Device request: 4720MB Available: 2406MB. Device memory is insufficient to use tactic.
|
4 |
+
[12/28/2023-11:58:20] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000004.
|
5 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
6 |
+
[12/28/2023-11:58:20] [W] [TRT] Tactic Device request: 4720MB Available: 2407MB. Device memory is insufficient to use tactic.
|
7 |
+
[12/28/2023-11:58:20] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4720 detected for tactic 0x000000000000003c.
|
8 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
9 |
+
[12/28/2023-11:58:21] [W] [TRT] Tactic Device request: 4720MB Available: 2407MB. Device memory is insufficient to use tactic.
|
10 |
+
[12/28/2023-11:58:21] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000074.
|
11 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
12 |
+
[12/28/2023-11:58:27] [W] [TRT] Tactic Device request: 4706MB Available: 2408MB. Device memory is insufficient to use tactic.
|
13 |
+
[12/28/2023-11:58:27] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4706 detected for tactic 0x0000000000000004.
|
14 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
15 |
+
[12/28/2023-11:58:27] [W] [TRT] Tactic Device request: 4706MB Available: 2408MB. Device memory is insufficient to use tactic.
|
16 |
+
[12/28/2023-11:58:28] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4706 detected for tactic 0x000000000000003c.
|
17 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
18 |
+
[12/28/2023-11:58:30] [W] [TRT] Tactic Device request: 4711MB Available: 2408MB. Device memory is insufficient to use tactic.
|
19 |
+
[12/28/2023-11:58:30] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
20 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
21 |
+
[12/28/2023-11:58:31] [W] [TRT] Tactic Device request: 4711MB Available: 2407MB. Device memory is insufficient to use tactic.
|
22 |
+
[12/28/2023-11:58:31] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
23 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
24 |
+
[12/28/2023-11:58:32] [W] [TRT] Tactic Device request: 4711MB Available: 2407MB. Device memory is insufficient to use tactic.
|
25 |
+
[12/28/2023-11:58:32] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
26 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
27 |
+
[12/28/2023-11:58:37] [W] [TRT] Tactic Device request: 4702MB Available: 2407MB. Device memory is insufficient to use tactic.
|
28 |
+
[12/28/2023-11:58:37] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4702 detected for tactic 0x0000000000000004.
|
29 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
30 |
+
[12/28/2023-11:58:38] [W] [TRT] Tactic Device request: 4702MB Available: 2407MB. Device memory is insufficient to use tactic.
|
31 |
+
[12/28/2023-11:58:38] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4702 detected for tactic 0x000000000000003c.
|
32 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
33 |
+
[12/28/2023-12:03:21] [W] [TRT] Tactic Device request: 4711MB Available: 2283MB. Device memory is insufficient to use tactic.
|
34 |
+
[12/28/2023-12:03:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
35 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
36 |
+
[12/28/2023-12:03:21] [W] [TRT] Tactic Device request: 4711MB Available: 2282MB. Device memory is insufficient to use tactic.
|
37 |
+
[12/28/2023-12:03:21] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
38 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
39 |
+
[12/28/2023-12:03:21] [W] [TRT] Tactic Device request: 4711MB Available: 2282MB. Device memory is insufficient to use tactic.
|
40 |
+
[12/28/2023-12:03:21] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
41 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
42 |
+
[12/28/2023-12:03:23] [W] [TRT] Tactic Device request: 4701MB Available: 2281MB. Device memory is insufficient to use tactic.
|
43 |
+
[12/28/2023-12:03:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4701 detected for tactic 0x0000000000000004.
|
44 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
45 |
+
[12/28/2023-12:03:23] [W] [TRT] Tactic Device request: 4701MB Available: 2281MB. Device memory is insufficient to use tactic.
|
46 |
+
[12/28/2023-12:03:23] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4701 detected for tactic 0x000000000000003c.
|
47 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
48 |
+
[12/28/2023-12:03:40] [W] [TRT] Tactic Device request: 6275MB Available: 2278MB. Device memory is insufficient to use tactic.
|
49 |
+
[12/28/2023-12:03:41] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
50 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
51 |
+
[12/28/2023-12:03:41] [W] [TRT] Tactic Device request: 6275MB Available: 2277MB. Device memory is insufficient to use tactic.
|
52 |
+
[12/28/2023-12:03:41] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
53 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
54 |
+
[12/28/2023-12:03:41] [W] [TRT] Tactic Device request: 6275MB Available: 2278MB. Device memory is insufficient to use tactic.
|
55 |
+
[12/28/2023-12:03:41] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
56 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
57 |
+
[12/28/2023-12:03:43] [W] [TRT] Tactic Device request: 6270MB Available: 2276MB. Device memory is insufficient to use tactic.
|
58 |
+
[12/28/2023-12:03:43] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6270 detected for tactic 0x0000000000000004.
|
59 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
60 |
+
[12/28/2023-12:03:43] [W] [TRT] Tactic Device request: 6270MB Available: 2276MB. Device memory is insufficient to use tactic.
|
61 |
+
[12/28/2023-12:03:43] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6270 detected for tactic 0x000000000000003c.
|
62 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
63 |
+
[12/28/2023-12:10:19] [W] [TRT] Tactic Device request: 7056MB Available: 2319MB. Device memory is insufficient to use tactic.
|
64 |
+
[12/28/2023-12:10:19] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
65 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
66 |
+
[12/28/2023-12:10:19] [W] [TRT] Tactic Device request: 7056MB Available: 2319MB. Device memory is insufficient to use tactic.
|
67 |
+
[12/28/2023-12:10:19] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
68 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
69 |
+
[12/28/2023-12:10:19] [W] [TRT] Tactic Device request: 7056MB Available: 2319MB. Device memory is insufficient to use tactic.
|
70 |
+
[12/28/2023-12:10:19] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
71 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
72 |
+
[12/28/2023-12:10:21] [W] [TRT] Tactic Device request: 7050MB Available: 2320MB. Device memory is insufficient to use tactic.
|
73 |
+
[12/28/2023-12:10:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7050 detected for tactic 0x0000000000000004.
|
74 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
75 |
+
[12/28/2023-12:10:21] [W] [TRT] Tactic Device request: 7050MB Available: 2320MB. Device memory is insufficient to use tactic.
|
76 |
+
[12/28/2023-12:10:21] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 7050 detected for tactic 0x000000000000003c.
|
77 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
78 |
+
[12/28/2023-12:10:37] [W] [TRT] Tactic Device request: 6354MB Available: 2321MB. Device memory is insufficient to use tactic.
|
79 |
+
[12/28/2023-12:10:37] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
80 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
81 |
+
[12/28/2023-12:10:38] [W] [TRT] Tactic Device request: 6354MB Available: 2320MB. Device memory is insufficient to use tactic.
|
82 |
+
[12/28/2023-12:10:38] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
83 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
84 |
+
[12/28/2023-12:10:38] [W] [TRT] Tactic Device request: 6354MB Available: 2320MB. Device memory is insufficient to use tactic.
|
85 |
+
[12/28/2023-12:10:38] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
86 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
87 |
+
[12/28/2023-12:10:39] [W] [TRT] Tactic Device request: 6351MB Available: 2320MB. Device memory is insufficient to use tactic.
|
88 |
+
[12/28/2023-12:10:39] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6351 detected for tactic 0x0000000000000004.
|
89 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
90 |
+
[12/28/2023-12:10:39] [W] [TRT] Tactic Device request: 6351MB Available: 2320MB. Device memory is insufficient to use tactic.
|
91 |
+
[12/28/2023-12:10:39] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6351 detected for tactic 0x000000000000003c.
|
92 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
93 |
+
[12/28/2023-12:19:26] [W] [TRT] Tactic Device request: 2394MB Available: 2151MB. Device memory is insufficient to use tactic.
|
94 |
+
[12/28/2023-12:19:26] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000004.
|
95 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
96 |
+
[12/28/2023-12:19:26] [W] [TRT] Tactic Device request: 2394MB Available: 2151MB. Device memory is insufficient to use tactic.
|
97 |
+
[12/28/2023-12:19:26] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2394 detected for tactic 0x000000000000003c.
|
98 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
99 |
+
[12/28/2023-12:19:26] [W] [TRT] Tactic Device request: 2394MB Available: 2151MB. Device memory is insufficient to use tactic.
|
100 |
+
[12/28/2023-12:19:26] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000074.
|
101 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
102 |
+
[12/28/2023-12:19:27] [W] [TRT] Tactic Device request: 2392MB Available: 2151MB. Device memory is insufficient to use tactic.
|
103 |
+
[12/28/2023-12:19:27] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000004.
|
104 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
105 |
+
[12/28/2023-12:19:27] [W] [TRT] Tactic Device request: 2392MB Available: 2150MB. Device memory is insufficient to use tactic.
|
106 |
+
[12/28/2023-12:19:27] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2392 detected for tactic 0x000000000000003c.
|
107 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
108 |
+
[12/28/2023-12:19:27] [W] [TRT] Tactic Device request: 2392MB Available: 2150MB. Device memory is insufficient to use tactic.
|
109 |
+
[12/28/2023-12:19:27] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000074.
|
110 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
111 |
+
[12/28/2023-12:19:28] [W] [TRT] Tactic Device request: 2391MB Available: 2150MB. Device memory is insufficient to use tactic.
|
112 |
+
[12/28/2023-12:19:28] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2391 detected for tactic 0x0000000000000004.
|
113 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
114 |
+
[12/28/2023-12:19:28] [W] [TRT] Tactic Device request: 2391MB Available: 2150MB. Device memory is insufficient to use tactic.
|
115 |
+
[12/28/2023-12:19:28] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2391 detected for tactic 0x000000000000003c.
|
116 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
117 |
+
[12/28/2023-12:19:28] [W] [TRT] Tactic Device request: 2390MB Available: 2150MB. Device memory is insufficient to use tactic.
|
118 |
+
[12/28/2023-12:19:28] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000004.
|
119 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
120 |
+
[12/28/2023-12:19:29] [W] [TRT] Tactic Device request: 2390MB Available: 2150MB. Device memory is insufficient to use tactic.
|
121 |
+
[12/28/2023-12:19:29] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2390 detected for tactic 0x000000000000003c.
|
122 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
123 |
+
[12/28/2023-12:19:43] [W] [TRT] Tactic Device request: 6540MB Available: 2123MB. Device memory is insufficient to use tactic.
|
124 |
+
[12/28/2023-12:19:43] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000004.
|
125 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
126 |
+
[12/28/2023-12:19:43] [W] [TRT] Tactic Device request: 6540MB Available: 2122MB. Device memory is insufficient to use tactic.
|
127 |
+
[12/28/2023-12:19:43] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6540 detected for tactic 0x000000000000003c.
|
128 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
129 |
+
[12/28/2023-12:19:43] [W] [TRT] Tactic Device request: 6540MB Available: 2122MB. Device memory is insufficient to use tactic.
|
130 |
+
[12/28/2023-12:19:43] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000074.
|
131 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
132 |
+
[12/28/2023-12:19:45] [W] [TRT] Tactic Device request: 6538MB Available: 2121MB. Device memory is insufficient to use tactic.
|
133 |
+
[12/28/2023-12:19:45] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6538 detected for tactic 0x0000000000000004.
|
134 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
135 |
+
[12/28/2023-12:19:45] [W] [TRT] Tactic Device request: 6538MB Available: 2122MB. Device memory is insufficient to use tactic.
|
136 |
+
[12/28/2023-12:19:45] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6538 detected for tactic 0x000000000000003c.
|
137 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
138 |
+
[12/28/2023-12:19:47] [W] [TRT] Tactic Device request: 2191MB Available: 2122MB. Device memory is insufficient to use tactic.
|
139 |
+
[12/28/2023-12:19:47] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000004.
|
140 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
141 |
+
[12/28/2023-12:19:48] [W] [TRT] Tactic Device request: 2191MB Available: 2123MB. Device memory is insufficient to use tactic.
|
142 |
+
[12/28/2023-12:19:48] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2191 detected for tactic 0x000000000000003c.
|
143 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
144 |
+
[12/28/2023-12:19:49] [W] [TRT] Tactic Device request: 2191MB Available: 2122MB. Device memory is insufficient to use tactic.
|
145 |
+
[12/28/2023-12:19:49] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000074.
|
146 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
147 |
+
[12/28/2023-12:19:52] [W] [TRT] Tactic Device request: 2190MB Available: 2123MB. Device memory is insufficient to use tactic.
|
148 |
+
[12/28/2023-12:19:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
149 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
150 |
+
[12/28/2023-12:19:53] [W] [TRT] Tactic Device request: 2190MB Available: 2123MB. Device memory is insufficient to use tactic.
|
151 |
+
[12/28/2023-12:19:53] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
152 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
153 |
+
[12/28/2023-12:19:56] [W] [TRT] Tactic Device request: 2190MB Available: 2128MB. Device memory is insufficient to use tactic.
|
154 |
+
[12/28/2023-12:19:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
155 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
156 |
+
[12/28/2023-12:19:57] [W] [TRT] Tactic Device request: 2190MB Available: 2123MB. Device memory is insufficient to use tactic.
|
157 |
+
[12/28/2023-12:19:57] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
158 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
159 |
+
[12/28/2023-12:19:58] [W] [TRT] Tactic Device request: 2190MB Available: 2122MB. Device memory is insufficient to use tactic.
|
160 |
+
[12/28/2023-12:19:58] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000074.
|
161 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
162 |
+
[12/28/2023-12:20:02] [W] [TRT] Tactic Device request: 2190MB Available: 2125MB. Device memory is insufficient to use tactic.
|
163 |
+
[12/28/2023-12:20:02] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
164 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
165 |
+
[12/28/2023-12:20:02] [W] [TRT] Tactic Device request: 2190MB Available: 2122MB. Device memory is insufficient to use tactic.
|
166 |
+
[12/28/2023-12:20:02] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
167 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
168 |
+
[12/28/2023-12:24:51] [W] [TRT] Tactic Device request: 2457MB Available: 2244MB. Device memory is insufficient to use tactic.
|
169 |
+
[12/28/2023-12:24:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000004.
|
170 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
171 |
+
[12/28/2023-12:24:52] [W] [TRT] Tactic Device request: 2457MB Available: 2244MB. Device memory is insufficient to use tactic.
|
172 |
+
[12/28/2023-12:24:52] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
173 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
174 |
+
[12/28/2023-12:24:52] [W] [TRT] Tactic Device request: 2457MB Available: 2244MB. Device memory is insufficient to use tactic.
|
175 |
+
[12/28/2023-12:24:52] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
176 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
177 |
+
[12/28/2023-12:24:53] [W] [TRT] Tactic Device request: 2456MB Available: 2245MB. Device memory is insufficient to use tactic.
|
178 |
+
[12/28/2023-12:24:53] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2456 detected for tactic 0x0000000000000004.
|
179 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
180 |
+
[12/28/2023-12:24:53] [W] [TRT] Tactic Device request: 2456MB Available: 2245MB. Device memory is insufficient to use tactic.
|
181 |
+
[12/28/2023-12:24:53] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2456 detected for tactic 0x000000000000003c.
|
182 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
183 |
+
[12/28/2023-12:25:14] [W] [TRT] Tactic Device request: 3587MB Available: 2175MB. Device memory is insufficient to use tactic.
|
184 |
+
[12/28/2023-12:25:14] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
185 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
186 |
+
[12/28/2023-12:25:14] [W] [TRT] Tactic Device request: 3587MB Available: 2176MB. Device memory is insufficient to use tactic.
|
187 |
+
[12/28/2023-12:25:14] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
188 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
189 |
+
[12/28/2023-12:25:14] [W] [TRT] Tactic Device request: 3587MB Available: 2176MB. Device memory is insufficient to use tactic.
|
190 |
+
[12/28/2023-12:25:15] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
191 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
192 |
+
[12/28/2023-12:25:16] [W] [TRT] Tactic Device request: 3585MB Available: 2176MB. Device memory is insufficient to use tactic.
|
193 |
+
[12/28/2023-12:25:16] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3585 detected for tactic 0x0000000000000004.
|
194 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
195 |
+
[12/28/2023-12:25:16] [W] [TRT] Tactic Device request: 3585MB Available: 2176MB. Device memory is insufficient to use tactic.
|
196 |
+
[12/28/2023-12:25:16] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3585 detected for tactic 0x000000000000003c.
|
197 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
198 |
+
[12/28/2023-12:32:54] [W] [TRT] Tactic Device request: 3556MB Available: 2050MB. Device memory is insufficient to use tactic.
|
199 |
+
[12/28/2023-12:32:54] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
200 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
201 |
+
[12/28/2023-12:32:54] [W] [TRT] Tactic Device request: 3556MB Available: 2051MB. Device memory is insufficient to use tactic.
|
202 |
+
[12/28/2023-12:32:54] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
203 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
204 |
+
[12/28/2023-12:32:54] [W] [TRT] Tactic Device request: 3556MB Available: 2049MB. Device memory is insufficient to use tactic.
|
205 |
+
[12/28/2023-12:32:54] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
206 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
207 |
+
[12/28/2023-12:32:55] [W] [TRT] Tactic Device request: 3551MB Available: 2050MB. Device memory is insufficient to use tactic.
|
208 |
+
[12/28/2023-12:32:55] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3551 detected for tactic 0x0000000000000004.
|
209 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
210 |
+
[12/28/2023-12:32:55] [W] [TRT] Tactic Device request: 3551MB Available: 2050MB. Device memory is insufficient to use tactic.
|
211 |
+
[12/28/2023-12:32:55] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3551 detected for tactic 0x000000000000003c.
|
212 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
213 |
+
[12/28/2023-12:32:56] [W] [TRT] Tactic Device request: 3140MB Available: 2051MB. Device memory is insufficient to use tactic.
|
214 |
+
[12/28/2023-12:32:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000004.
|
215 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
216 |
+
[12/28/2023-12:32:56] [W] [TRT] Tactic Device request: 3140MB Available: 2050MB. Device memory is insufficient to use tactic.
|
217 |
+
[12/28/2023-12:32:56] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3140 detected for tactic 0x000000000000003c.
|
218 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
219 |
+
[12/28/2023-12:32:56] [W] [TRT] Tactic Device request: 3140MB Available: 2050MB. Device memory is insufficient to use tactic.
|
220 |
+
[12/28/2023-12:32:56] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000074.
|
221 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
222 |
+
[12/28/2023-12:32:57] [W] [TRT] Tactic Device request: 3136MB Available: 2051MB. Device memory is insufficient to use tactic.
|
223 |
+
[12/28/2023-12:32:57] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3136 detected for tactic 0x0000000000000004.
|
224 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
225 |
+
[12/28/2023-12:32:57] [W] [TRT] Tactic Device request: 3136MB Available: 2051MB. Device memory is insufficient to use tactic.
|
226 |
+
[12/28/2023-12:32:57] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3136 detected for tactic 0x000000000000003c.
|
227 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
228 |
+
[12/28/2023-12:40:09] [W] [TRT] Tactic Device request: 3161MB Available: 2255MB. Device memory is insufficient to use tactic.
|
229 |
+
[12/28/2023-12:40:09] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000004.
|
230 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
231 |
+
[12/28/2023-12:40:09] [W] [TRT] Tactic Device request: 3161MB Available: 2255MB. Device memory is insufficient to use tactic.
|
232 |
+
[12/28/2023-12:40:09] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3161 detected for tactic 0x000000000000003c.
|
233 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
234 |
+
[12/28/2023-12:40:09] [W] [TRT] Tactic Device request: 3161MB Available: 2255MB. Device memory is insufficient to use tactic.
|
235 |
+
[12/28/2023-12:40:09] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000074.
|
236 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
237 |
+
[12/28/2023-12:40:10] [W] [TRT] Tactic Device request: 3156MB Available: 2253MB. Device memory is insufficient to use tactic.
|
238 |
+
[12/28/2023-12:40:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3156 detected for tactic 0x0000000000000004.
|
239 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
240 |
+
[12/28/2023-12:40:10] [W] [TRT] Tactic Device request: 3156MB Available: 2254MB. Device memory is insufficient to use tactic.
|
241 |
+
[12/28/2023-12:40:10] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3156 detected for tactic 0x000000000000003c.
|
242 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
243 |
+
[12/28/2023-12:40:14] [W] [TRT] Tactic Device request: 4189MB Available: 2253MB. Device memory is insufficient to use tactic.
|
244 |
+
[12/28/2023-12:40:14] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000004.
|
245 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
246 |
+
[12/28/2023-12:40:15] [W] [TRT] Tactic Device request: 4189MB Available: 2253MB. Device memory is insufficient to use tactic.
|
247 |
+
[12/28/2023-12:40:15] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4189 detected for tactic 0x000000000000003c.
|
248 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
249 |
+
[12/28/2023-12:40:15] [W] [TRT] Tactic Device request: 4189MB Available: 2254MB. Device memory is insufficient to use tactic.
|
250 |
+
[12/28/2023-12:40:15] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000074.
|
251 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
252 |
+
[12/28/2023-12:40:19] [W] [TRT] Tactic Device request: 4183MB Available: 2255MB. Device memory is insufficient to use tactic.
|
253 |
+
[12/28/2023-12:40:20] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4183 detected for tactic 0x0000000000000004.
|
254 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
255 |
+
[12/28/2023-12:40:20] [W] [TRT] Tactic Device request: 4183MB Available: 2255MB. Device memory is insufficient to use tactic.
|
256 |
+
[12/28/2023-12:40:20] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4183 detected for tactic 0x000000000000003c.
|
257 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
258 |
+
[12/28/2023-12:40:22] [W] [TRT] Tactic Device request: 4186MB Available: 2255MB. Device memory is insufficient to use tactic.
|
259 |
+
[12/28/2023-12:40:22] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000004.
|
260 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
261 |
+
[12/28/2023-12:40:22] [W] [TRT] Tactic Device request: 4186MB Available: 2254MB. Device memory is insufficient to use tactic.
|
262 |
+
[12/28/2023-12:40:22] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4186 detected for tactic 0x000000000000003c.
|
263 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
264 |
+
[12/28/2023-12:40:23] [W] [TRT] Tactic Device request: 4186MB Available: 2254MB. Device memory is insufficient to use tactic.
|
265 |
+
[12/28/2023-12:40:23] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000074.
|
266 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
267 |
+
[12/28/2023-12:40:27] [W] [TRT] Tactic Device request: 4182MB Available: 2254MB. Device memory is insufficient to use tactic.
|
268 |
+
[12/28/2023-12:40:27] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4182 detected for tactic 0x0000000000000004.
|
269 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
270 |
+
[12/28/2023-12:40:27] [W] [TRT] Tactic Device request: 4182MB Available: 2253MB. Device memory is insufficient to use tactic.
|
271 |
+
[12/28/2023-12:40:27] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4182 detected for tactic 0x000000000000003c.
|
272 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
273 |
+
[12/28/2023-12:48:15] [W] [TRT] Tactic Device request: 4764MB Available: 2271MB. Device memory is insufficient to use tactic.
|
274 |
+
[12/28/2023-12:48:15] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000004.
|
275 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
276 |
+
[12/28/2023-12:48:15] [W] [TRT] Tactic Device request: 4764MB Available: 2271MB. Device memory is insufficient to use tactic.
|
277 |
+
[12/28/2023-12:48:15] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4764 detected for tactic 0x000000000000003c.
|
278 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
279 |
+
[12/28/2023-12:48:15] [W] [TRT] Tactic Device request: 4764MB Available: 2269MB. Device memory is insufficient to use tactic.
|
280 |
+
[12/28/2023-12:48:15] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000074.
|
281 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
282 |
+
[12/28/2023-12:48:17] [W] [TRT] Tactic Device request: 4761MB Available: 2268MB. Device memory is insufficient to use tactic.
|
283 |
+
[12/28/2023-12:48:17] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4761 detected for tactic 0x0000000000000004.
|
284 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
285 |
+
[12/28/2023-12:48:17] [W] [TRT] Tactic Device request: 4761MB Available: 2265MB. Device memory is insufficient to use tactic.
|
286 |
+
[12/28/2023-12:48:17] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4761 detected for tactic 0x000000000000003c.
|
287 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
288 |
+
[12/28/2023-12:48:23] [W] [TRT] Tactic Device request: 4244MB Available: 2235MB. Device memory is insufficient to use tactic.
|
289 |
+
[12/28/2023-12:48:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000004.
|
290 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
291 |
+
[12/28/2023-12:48:24] [W] [TRT] Tactic Device request: 4244MB Available: 1911MB. Device memory is insufficient to use tactic.
|
292 |
+
[12/28/2023-12:48:24] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4244 detected for tactic 0x000000000000003c.
|
293 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
294 |
+
[12/28/2023-12:48:24] [W] [TRT] Tactic Device request: 4244MB Available: 1909MB. Device memory is insufficient to use tactic.
|
295 |
+
[12/28/2023-12:48:25] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000074.
|
296 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
297 |
+
[12/28/2023-12:48:29] [W] [TRT] Tactic Device request: 4240MB Available: 1905MB. Device memory is insufficient to use tactic.
|
298 |
+
[12/28/2023-12:48:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4240 detected for tactic 0x0000000000000004.
|
299 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
300 |
+
[12/28/2023-12:48:30] [W] [TRT] Tactic Device request: 4240MB Available: 1896MB. Device memory is insufficient to use tactic.
|
301 |
+
[12/28/2023-12:48:30] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4240 detected for tactic 0x000000000000003c.
|
302 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
303 |
+
[12/28/2023-12:48:33] [W] [TRT] Tactic Device request: 4241MB Available: 1892MB. Device memory is insufficient to use tactic.
|
304 |
+
[12/28/2023-12:48:33] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000004.
|
305 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
306 |
+
[12/28/2023-12:48:34] [W] [TRT] Tactic Device request: 4241MB Available: 1864MB. Device memory is insufficient to use tactic.
|
307 |
+
[12/28/2023-12:48:34] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4241 detected for tactic 0x000000000000003c.
|
308 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
309 |
+
[12/28/2023-12:48:35] [W] [TRT] Tactic Device request: 4241MB Available: 1860MB. Device memory is insufficient to use tactic.
|
310 |
+
[12/28/2023-12:48:35] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000074.
|
311 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
312 |
+
[12/28/2023-12:48:39] [W] [TRT] Tactic Device request: 4239MB Available: 1857MB. Device memory is insufficient to use tactic.
|
313 |
+
[12/28/2023-12:48:39] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4239 detected for tactic 0x0000000000000004.
|
314 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
315 |
+
[12/28/2023-12:48:40] [W] [TRT] Tactic Device request: 4239MB Available: 1845MB. Device memory is insufficient to use tactic.
|
316 |
+
[12/28/2023-12:48:40] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4239 detected for tactic 0x000000000000003c.
|
317 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
318 |
+
[12/28/2023-12:57:07] [W] [TRT] Tactic Device request: 3270MB Available: 1684MB. Device memory is insufficient to use tactic.
|
319 |
+
[12/28/2023-12:57:07] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000004.
|
320 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
321 |
+
[12/28/2023-12:57:07] [W] [TRT] Tactic Device request: 3270MB Available: 1684MB. Device memory is insufficient to use tactic.
|
322 |
+
[12/28/2023-12:57:07] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3270 detected for tactic 0x000000000000003c.
|
323 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
324 |
+
[12/28/2023-12:57:07] [W] [TRT] Tactic Device request: 3270MB Available: 1684MB. Device memory is insufficient to use tactic.
|
325 |
+
[12/28/2023-12:57:07] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000074.
|
326 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
327 |
+
[12/28/2023-12:57:08] [W] [TRT] Tactic Device request: 3269MB Available: 1684MB. Device memory is insufficient to use tactic.
|
328 |
+
[12/28/2023-12:57:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3269 detected for tactic 0x0000000000000004.
|
329 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
330 |
+
[12/28/2023-12:57:09] [W] [TRT] Tactic Device request: 3269MB Available: 1684MB. Device memory is insufficient to use tactic.
|
331 |
+
[12/28/2023-12:57:09] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3269 detected for tactic 0x000000000000003c.
|
332 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
333 |
+
[12/28/2023-12:57:11] [W] [TRT] Tactic Device request: 4377MB Available: 1680MB. Device memory is insufficient to use tactic.
|
334 |
+
[12/28/2023-12:57:11] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000004.
|
335 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
336 |
+
[12/28/2023-12:57:11] [W] [TRT] Tactic Device request: 2185MB Available: 1680MB. Device memory is insufficient to use tactic.
|
337 |
+
[12/28/2023-12:57:11] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000005.
|
338 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
339 |
+
[12/28/2023-12:57:11] [W] [TRT] Tactic Device request: 4377MB Available: 1680MB. Device memory is insufficient to use tactic.
|
340 |
+
[12/28/2023-12:57:11] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4377 detected for tactic 0x000000000000003c.
|
341 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
342 |
+
[12/28/2023-12:57:11] [W] [TRT] Tactic Device request: 2185MB Available: 1680MB. Device memory is insufficient to use tactic.
|
343 |
+
[12/28/2023-12:57:11] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2185 detected for tactic 0x000000000000003d.
|
344 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
345 |
+
[12/28/2023-12:57:12] [W] [TRT] Tactic Device request: 4377MB Available: 1680MB. Device memory is insufficient to use tactic.
|
346 |
+
[12/28/2023-12:57:12] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000074.
|
347 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
348 |
+
[12/28/2023-12:57:12] [W] [TRT] Tactic Device request: 2185MB Available: 1680MB. Device memory is insufficient to use tactic.
|
349 |
+
[12/28/2023-12:57:12] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000075.
|
350 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
351 |
+
[12/28/2023-12:57:17] [W] [TRT] Tactic Device request: 4375MB Available: 1680MB. Device memory is insufficient to use tactic.
|
352 |
+
[12/28/2023-12:57:17] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
353 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
354 |
+
[12/28/2023-12:57:18] [W] [TRT] Tactic Device request: 2183MB Available: 1680MB. Device memory is insufficient to use tactic.
|
355 |
+
[12/28/2023-12:57:18] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
356 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
357 |
+
[12/28/2023-12:57:18] [W] [TRT] Tactic Device request: 4375MB Available: 1680MB. Device memory is insufficient to use tactic.
|
358 |
+
[12/28/2023-12:57:18] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
359 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
360 |
+
[12/28/2023-12:57:18] [W] [TRT] Tactic Device request: 2183MB Available: 1680MB. Device memory is insufficient to use tactic.
|
361 |
+
[12/28/2023-12:57:18] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
362 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
363 |
+
[12/28/2023-12:57:22] [W] [TRT] Tactic Device request: 4376MB Available: 1680MB. Device memory is insufficient to use tactic.
|
364 |
+
[12/28/2023-12:57:22] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000004.
|
365 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
366 |
+
[12/28/2023-12:57:22] [W] [TRT] Tactic Device request: 2184MB Available: 1680MB. Device memory is insufficient to use tactic.
|
367 |
+
[12/28/2023-12:57:22] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000005.
|
368 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
369 |
+
[12/28/2023-12:57:22] [W] [TRT] Tactic Device request: 4376MB Available: 1679MB. Device memory is insufficient to use tactic.
|
370 |
+
[12/28/2023-12:57:22] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4376 detected for tactic 0x000000000000003c.
|
371 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
372 |
+
[12/28/2023-12:57:22] [W] [TRT] Tactic Device request: 2184MB Available: 1679MB. Device memory is insufficient to use tactic.
|
373 |
+
[12/28/2023-12:57:22] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2184 detected for tactic 0x000000000000003d.
|
374 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
375 |
+
[12/28/2023-12:57:23] [W] [TRT] Tactic Device request: 4376MB Available: 1679MB. Device memory is insufficient to use tactic.
|
376 |
+
[12/28/2023-12:57:23] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000074.
|
377 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
378 |
+
[12/28/2023-12:57:23] [W] [TRT] Tactic Device request: 2184MB Available: 1679MB. Device memory is insufficient to use tactic.
|
379 |
+
[12/28/2023-12:57:23] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000075.
|
380 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
381 |
+
[12/28/2023-12:57:28] [W] [TRT] Tactic Device request: 4375MB Available: 1679MB. Device memory is insufficient to use tactic.
|
382 |
+
[12/28/2023-12:57:28] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4375 detected for tactic 0x0000000000000004.
|
383 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
384 |
+
[12/28/2023-12:57:28] [W] [TRT] Tactic Device request: 2183MB Available: 1679MB. Device memory is insufficient to use tactic.
|
385 |
+
[12/28/2023-12:57:28] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2183 detected for tactic 0x0000000000000005.
|
386 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
387 |
+
[12/28/2023-12:57:29] [W] [TRT] Tactic Device request: 4375MB Available: 1679MB. Device memory is insufficient to use tactic.
|
388 |
+
[12/28/2023-12:57:29] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4375 detected for tactic 0x000000000000003c.
|
389 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
390 |
+
[12/28/2023-12:57:29] [W] [TRT] Tactic Device request: 2183MB Available: 1679MB. Device memory is insufficient to use tactic.
|
391 |
+
[12/28/2023-12:57:29] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2183 detected for tactic 0x000000000000003d.
|
392 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
393 |
+
[12/28/2023-12:58:16] [W] [TRT] TensorRT encountered issues when converting weights between types and that could affect accuracy.
|
394 |
+
[12/28/2023-12:58:16] [W] [TRT] If this is not the desired behavior, please modify the weights or retrain with regularization to adjust the magnitude of the weights.
|
395 |
+
[12/28/2023-12:58:16] [W] [TRT] Check verbose logs for the list of affected weights.
|
396 |
+
[12/28/2023-12:58:16] [W] [TRT] - 114 weights are affected by this issue: Detected subnormal FP16 values.
|
397 |
+
[12/28/2023-12:58:16] [W] [TRT] - 40 weights are affected by this issue: Detected values less than smallest positive FP16 subnormal value and converted them to the FP16 minimum subnormalized value.
|
398 |
+
[12/28/2023-12:58:33] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
399 |
+
[12/28/2023-12:58:33] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
400 |
+
[12/28/2023-12:58:33] [W] * GPU compute time is unstable, with coefficient of variance = 5.80641%.
|
401 |
+
[12/28/2023-12:58:33] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_fp32.onnx.fp16.engine.log
ADDED
@@ -0,0 +1,328 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.fp16.engine
|
2 |
+
[12/28/2023-11:52:55] [I] === Model Options ===
|
3 |
+
[12/28/2023-11:52:55] [I] Format: ONNX
|
4 |
+
[12/28/2023-11:52:55] [I] Model: yolo_nas_pose_l_fp32.onnx
|
5 |
+
[12/28/2023-11:52:55] [I] Output:
|
6 |
+
[12/28/2023-11:52:55] [I] === Build Options ===
|
7 |
+
[12/28/2023-11:52:55] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-11:52:55] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-11:52:55] [I] minTiming: 1
|
10 |
+
[12/28/2023-11:52:55] [I] avgTiming: 8
|
11 |
+
[12/28/2023-11:52:55] [I] Precision: FP32+FP16
|
12 |
+
[12/28/2023-11:52:55] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-11:52:55] [I] Calibration:
|
14 |
+
[12/28/2023-11:52:55] [I] Refit: Disabled
|
15 |
+
[12/28/2023-11:52:55] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-11:52:55] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-11:52:55] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-11:52:55] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-11:52:55] [I] Build only: Disabled
|
20 |
+
[12/28/2023-11:52:55] [I] Save engine: yolo_nas_pose_l_fp32.onnx.fp16.engine
|
21 |
+
[12/28/2023-11:52:55] [I] Load engine:
|
22 |
+
[12/28/2023-11:52:55] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-11:52:55] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-11:52:55] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-11:52:55] [I] timingCacheFile:
|
26 |
+
[12/28/2023-11:52:55] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-11:52:55] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-11:52:55] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-11:52:55] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-11:52:55] [I] Input build shapes: model
|
31 |
+
[12/28/2023-11:52:55] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-11:52:55] [I] === System Options ===
|
33 |
+
[12/28/2023-11:52:55] [I] Device: 0
|
34 |
+
[12/28/2023-11:52:55] [I] DLACore:
|
35 |
+
[12/28/2023-11:52:55] [I] Plugins:
|
36 |
+
[12/28/2023-11:52:55] [I] === Inference Options ===
|
37 |
+
[12/28/2023-11:52:55] [I] Batch: Explicit
|
38 |
+
[12/28/2023-11:52:55] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-11:52:55] [I] Iterations: 10
|
40 |
+
[12/28/2023-11:52:55] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-11:52:55] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-11:52:55] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-11:52:55] [I] Streams: 1
|
44 |
+
[12/28/2023-11:52:55] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-11:52:55] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-11:52:55] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-11:52:55] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-11:52:55] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-11:52:55] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-11:52:55] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-11:52:55] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-11:52:55] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-11:52:55] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-11:52:55] [I] Inputs:
|
55 |
+
[12/28/2023-11:52:55] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-11:52:55] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-11:52:55] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-11:52:55] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-11:52:55] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-11:52:55] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-11:52:55] [I] Profile: Disabled
|
62 |
+
[12/28/2023-11:52:55] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-11:52:55] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-11:52:55] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-11:52:55] [I]
|
66 |
+
[12/28/2023-11:52:55] [I] === Device Information ===
|
67 |
+
[12/28/2023-11:52:55] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-11:52:55] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-11:52:55] [I] SMs: 8
|
70 |
+
[12/28/2023-11:52:55] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-11:52:55] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-11:52:55] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-11:52:55] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-11:52:55] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-11:52:55] [I]
|
76 |
+
[12/28/2023-11:52:55] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-11:52:56] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 3001 (MiB)
|
78 |
+
[12/28/2023-11:52:59] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +283, now: CPU 574, GPU 3306 (MiB)
|
79 |
+
[12/28/2023-11:52:59] [I] Start parsing network model
|
80 |
+
[12/28/2023-11:53:02] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-11:53:02] [I] [TRT] Input filename: yolo_nas_pose_l_fp32.onnx
|
82 |
+
[12/28/2023-11:53:02] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-11:53:02] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-11:53:02] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-11:53:02] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-11:53:02] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-11:53:02] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-11:53:02] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-11:53:02] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-11:53:03] [I] Finish parsing network model
|
91 |
+
[12/28/2023-11:53:04] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-11:53:04] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 455) [Constant]
|
96 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 456) [Constant]
|
97 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 457) [Constant]
|
98 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
99 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
100 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
101 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
102 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
103 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
104 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
105 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
106 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
107 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
108 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
109 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
110 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
111 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
112 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
113 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
114 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
115 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
116 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
117 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
118 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
119 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
120 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
121 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
122 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
123 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
124 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
125 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
126 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
127 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
128 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
129 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
130 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
131 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
132 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
133 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
134 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
135 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
136 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
137 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
138 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
139 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
140 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
141 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
142 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
143 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
144 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
145 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
146 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
147 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
148 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
149 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
150 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
151 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
152 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
153 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
154 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
155 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
156 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
157 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
158 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
159 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
160 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
161 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
162 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
163 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
164 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv1/act/Relu_output_0 copy
|
165 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
166 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
167 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
168 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
169 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
170 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
171 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
172 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
173 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
174 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
175 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
176 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
177 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
178 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
179 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
180 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
181 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
182 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
183 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
184 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
185 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
186 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 187) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
187 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
188 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
189 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 195) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
190 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
191 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
192 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
193 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
194 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
195 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
196 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
197 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
198 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
199 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
200 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
201 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
202 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 224) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
203 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
204 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
205 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 232) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
206 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
207 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
208 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 240) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
209 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
210 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
211 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
212 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
213 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
214 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
215 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
216 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
217 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
218 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
219 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
220 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
221 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
222 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
223 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
224 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 271) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
225 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
226 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
227 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
228 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 294) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
229 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
230 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
231 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 302) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
232 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
233 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
234 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 310) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
235 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
236 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
237 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
238 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
239 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
240 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
241 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
242 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
243 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
244 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
245 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
246 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
247 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
248 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
249 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
250 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 341) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
251 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
252 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
253 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
254 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 364) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
255 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
256 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
257 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 372) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
258 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
259 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
260 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 380) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
261 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
262 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
263 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
264 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
265 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
266 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
267 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
268 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
269 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
270 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
271 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
272 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
273 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
274 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1.../post_process/Reshape_2]}
|
275 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
276 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 459) [NMS]_1_output[DevicetoShapeHostCopy]
|
277 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
278 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
279 |
+
[12/28/2023-11:53:04] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
280 |
+
[12/28/2023-11:53:10] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +444, now: CPU 1350, GPU 4042 (MiB)
|
281 |
+
[12/28/2023-11:53:11] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +83, GPU +74, now: CPU 1433, GPU 4116 (MiB)
|
282 |
+
[12/28/2023-11:53:11] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
283 |
+
[12/28/2023-12:57:56] [I] [TRT] Total Activation Memory: 8060146176
|
284 |
+
[12/28/2023-12:57:56] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
285 |
+
[12/28/2023-12:58:10] [I] [TRT] Total Host Persistent Memory: 376864
|
286 |
+
[12/28/2023-12:58:10] [I] [TRT] Total Device Persistent Memory: 61440
|
287 |
+
[12/28/2023-12:58:10] [I] [TRT] Total Scratch Memory: 134217728
|
288 |
+
[12/28/2023-12:58:10] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 139 MiB, GPU 2131 MiB
|
289 |
+
[12/28/2023-12:58:10] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 209 steps to complete.
|
290 |
+
[12/28/2023-12:58:10] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 267.621ms to assign 16 blocks to 209 nodes requiring 160521216 bytes.
|
291 |
+
[12/28/2023-12:58:10] [I] [TRT] Total Activation Memory: 160521216
|
292 |
+
[12/28/2023-12:58:16] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +1, GPU +0, now: CPU 1885, GPU 5668 (MiB)
|
293 |
+
[12/28/2023-12:58:16] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +104, GPU +128, now: CPU 104, GPU 128 (MiB)
|
294 |
+
[12/28/2023-12:58:17] [I] Engine built in 3922.11 sec.
|
295 |
+
[12/28/2023-12:58:17] [I] [TRT] Loaded engine size: 105 MiB
|
296 |
+
[12/28/2023-12:58:18] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1347, GPU 5215 (MiB)
|
297 |
+
[12/28/2023-12:58:18] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +103, now: CPU 0, GPU 103 (MiB)
|
298 |
+
[12/28/2023-12:58:18] [I] Engine deserialized in 0.277587 sec.
|
299 |
+
[12/28/2023-12:58:18] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1348, GPU 5215 (MiB)
|
300 |
+
[12/28/2023-12:58:18] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +154, now: CPU 0, GPU 257 (MiB)
|
301 |
+
[12/28/2023-12:58:18] [I] Setting persistentCacheLimit to 0 bytes.
|
302 |
+
[12/28/2023-12:58:18] [I] Using random values for input onnx::Cast_0
|
303 |
+
[12/28/2023-12:58:18] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
304 |
+
[12/28/2023-12:58:18] [I] Using random values for output graph2_flat_predictions
|
305 |
+
[12/28/2023-12:58:18] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
306 |
+
[12/28/2023-12:58:18] [I] Starting inference
|
307 |
+
[12/28/2023-12:58:33] [I] Warmup completed 2 queries over 200 ms
|
308 |
+
[12/28/2023-12:58:33] [I] Timing trace has 437 queries over 15.0687 s
|
309 |
+
[12/28/2023-12:58:33] [I]
|
310 |
+
[12/28/2023-12:58:33] [I] === Trace details ===
|
311 |
+
[12/28/2023-12:58:33] [I] Trace averages of 100 runs:
|
312 |
+
[12/28/2023-12:58:33] [I] Average on 100 runs - GPU latency: 34.2122 ms - Host latency: 34.3209 ms (enqueue 34.261 ms)
|
313 |
+
[12/28/2023-12:58:33] [I] Average on 100 runs - GPU latency: 34.6286 ms - Host latency: 34.7419 ms (enqueue 34.6733 ms)
|
314 |
+
[12/28/2023-12:58:33] [I] Average on 100 runs - GPU latency: 34.32 ms - Host latency: 34.4264 ms (enqueue 34.3737 ms)
|
315 |
+
[12/28/2023-12:58:33] [I] Average on 100 runs - GPU latency: 34.1213 ms - Host latency: 34.2258 ms (enqueue 34.1666 ms)
|
316 |
+
[12/28/2023-12:58:33] [I]
|
317 |
+
[12/28/2023-12:58:33] [I] === Performance summary ===
|
318 |
+
[12/28/2023-12:58:33] [I] Throughput: 29.0005 qps
|
319 |
+
[12/28/2023-12:58:33] [I] Latency: min = 32.0405 ms, max = 46.5195 ms, mean = 34.4576 ms, median = 34.021 ms, percentile(90%) = 35.2378 ms, percentile(95%) = 37.8905 ms, percentile(99%) = 44.1553 ms
|
320 |
+
[12/28/2023-12:58:33] [I] Enqueue Time: min = 32.0081 ms, max = 46.4473 ms, mean = 34.3937 ms, median = 33.9883 ms, percentile(90%) = 35.166 ms, percentile(95%) = 37.6458 ms, percentile(99%) = 44.0703 ms
|
321 |
+
[12/28/2023-12:58:33] [I] H2D Latency: min = 0.0800781 ms, max = 0.119629 ms, mean = 0.0890405 ms, median = 0.0893555 ms, percentile(90%) = 0.0913086 ms, percentile(95%) = 0.0917969 ms, percentile(99%) = 0.103516 ms
|
322 |
+
[12/28/2023-12:58:33] [I] GPU Compute Time: min = 31.9365 ms, max = 46.3989 ms, mean = 34.3493 ms, median = 33.9121 ms, percentile(90%) = 35.1299 ms, percentile(95%) = 37.7999 ms, percentile(99%) = 44.0645 ms
|
323 |
+
[12/28/2023-12:58:33] [I] D2H Latency: min = 0.00292969 ms, max = 0.0566406 ms, mean = 0.0192997 ms, median = 0.0175781 ms, percentile(90%) = 0.0292969 ms, percentile(95%) = 0.03125 ms, percentile(99%) = 0.0371094 ms
|
324 |
+
[12/28/2023-12:58:33] [I] Total Host Walltime: 15.0687 s
|
325 |
+
[12/28/2023-12:58:33] [I] Total GPU Compute Time: 15.0106 s
|
326 |
+
[12/28/2023-12:58:33] [I] Explanations of the performance metrics are printed in the verbose logs.
|
327 |
+
[12/28/2023-12:58:33] [I]
|
328 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.fp16.engine
|
yolo_nas_pose_l_fp32.onnx.int8.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48058cfe18fb0bfcfbf2822e4ac65f9801a49f738a3d6718eff46f2237aeee33
|
3 |
+
size 57073047
|
yolo_nas_pose_l_fp32.onnx.int8.engine.err
ADDED
@@ -0,0 +1,256 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-15:10:20] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-15:10:20] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-15:10:21] [W] [TRT] Calibrator is not being used. Users must provide dynamic range for all tensors that are not Int32 or Bool.
|
4 |
+
[12/28/2023-15:17:13] [W] [TRT] Tactic Device request: 4720MB Available: 2708MB. Device memory is insufficient to use tactic.
|
5 |
+
[12/28/2023-15:17:13] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000004.
|
6 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
7 |
+
[12/28/2023-15:17:14] [W] [TRT] Tactic Device request: 4720MB Available: 2708MB. Device memory is insufficient to use tactic.
|
8 |
+
[12/28/2023-15:17:14] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4720 detected for tactic 0x000000000000003c.
|
9 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
10 |
+
[12/28/2023-15:17:14] [W] [TRT] Tactic Device request: 4720MB Available: 2707MB. Device memory is insufficient to use tactic.
|
11 |
+
[12/28/2023-15:17:14] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4720 detected for tactic 0x0000000000000074.
|
12 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
13 |
+
[12/28/2023-15:17:21] [W] [TRT] Tactic Device request: 4711MB Available: 2698MB. Device memory is insufficient to use tactic.
|
14 |
+
[12/28/2023-15:17:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
15 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
16 |
+
[12/28/2023-15:17:22] [W] [TRT] Tactic Device request: 4711MB Available: 2697MB. Device memory is insufficient to use tactic.
|
17 |
+
[12/28/2023-15:17:22] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
18 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
19 |
+
[12/28/2023-15:17:22] [W] [TRT] Tactic Device request: 4711MB Available: 2702MB. Device memory is insufficient to use tactic.
|
20 |
+
[12/28/2023-15:17:22] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
21 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
22 |
+
[12/28/2023-15:17:29] [W] [TRT] Tactic Device request: 4711MB Available: 2688MB. Device memory is insufficient to use tactic.
|
23 |
+
[12/28/2023-15:17:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
24 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
25 |
+
[12/28/2023-15:17:30] [W] [TRT] Tactic Device request: 4711MB Available: 2689MB. Device memory is insufficient to use tactic.
|
26 |
+
[12/28/2023-15:17:30] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
27 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
28 |
+
[12/28/2023-15:17:30] [W] [TRT] Tactic Device request: 4711MB Available: 2689MB. Device memory is insufficient to use tactic.
|
29 |
+
[12/28/2023-15:17:30] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
30 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
31 |
+
[12/28/2023-15:21:24] [W] [TRT] Tactic Device request: 4711MB Available: 2366MB. Device memory is insufficient to use tactic.
|
32 |
+
[12/28/2023-15:21:24] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
33 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
34 |
+
[12/28/2023-15:21:24] [W] [TRT] Tactic Device request: 4711MB Available: 2366MB. Device memory is insufficient to use tactic.
|
35 |
+
[12/28/2023-15:21:24] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
36 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
37 |
+
[12/28/2023-15:21:24] [W] [TRT] Tactic Device request: 4711MB Available: 2366MB. Device memory is insufficient to use tactic.
|
38 |
+
[12/28/2023-15:21:24] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
39 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
40 |
+
[12/28/2023-15:21:39] [W] [TRT] Tactic Device request: 6275MB Available: 2366MB. Device memory is insufficient to use tactic.
|
41 |
+
[12/28/2023-15:21:39] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
42 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
43 |
+
[12/28/2023-15:21:39] [W] [TRT] Tactic Device request: 6275MB Available: 2366MB. Device memory is insufficient to use tactic.
|
44 |
+
[12/28/2023-15:21:39] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
45 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
46 |
+
[12/28/2023-15:21:39] [W] [TRT] Tactic Device request: 6275MB Available: 2366MB. Device memory is insufficient to use tactic.
|
47 |
+
[12/28/2023-15:21:39] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
48 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
49 |
+
[12/28/2023-15:27:20] [W] [TRT] Tactic Device request: 7056MB Available: 2259MB. Device memory is insufficient to use tactic.
|
50 |
+
[12/28/2023-15:27:20] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
51 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
52 |
+
[12/28/2023-15:27:20] [W] [TRT] Tactic Device request: 7056MB Available: 2257MB. Device memory is insufficient to use tactic.
|
53 |
+
[12/28/2023-15:27:20] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
54 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
55 |
+
[12/28/2023-15:27:20] [W] [TRT] Tactic Device request: 7056MB Available: 2257MB. Device memory is insufficient to use tactic.
|
56 |
+
[12/28/2023-15:27:20] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
57 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
58 |
+
[12/28/2023-15:27:36] [W] [TRT] Tactic Device request: 6354MB Available: 2258MB. Device memory is insufficient to use tactic.
|
59 |
+
[12/28/2023-15:27:36] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
60 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
61 |
+
[12/28/2023-15:27:36] [W] [TRT] Tactic Device request: 6354MB Available: 2258MB. Device memory is insufficient to use tactic.
|
62 |
+
[12/28/2023-15:27:36] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
63 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
64 |
+
[12/28/2023-15:27:36] [W] [TRT] Tactic Device request: 6354MB Available: 2258MB. Device memory is insufficient to use tactic.
|
65 |
+
[12/28/2023-15:27:36] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
66 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
67 |
+
[12/28/2023-15:35:28] [W] [TRT] Tactic Device request: 2394MB Available: 2120MB. Device memory is insufficient to use tactic.
|
68 |
+
[12/28/2023-15:35:28] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000004.
|
69 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
70 |
+
[12/28/2023-15:35:28] [W] [TRT] Tactic Device request: 2394MB Available: 2120MB. Device memory is insufficient to use tactic.
|
71 |
+
[12/28/2023-15:35:28] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2394 detected for tactic 0x000000000000003c.
|
72 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
73 |
+
[12/28/2023-15:35:28] [W] [TRT] Tactic Device request: 2394MB Available: 2120MB. Device memory is insufficient to use tactic.
|
74 |
+
[12/28/2023-15:35:28] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000074.
|
75 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
76 |
+
[12/28/2023-15:35:29] [W] [TRT] Tactic Device request: 2392MB Available: 2120MB. Device memory is insufficient to use tactic.
|
77 |
+
[12/28/2023-15:35:29] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000004.
|
78 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
79 |
+
[12/28/2023-15:35:29] [W] [TRT] Tactic Device request: 2392MB Available: 2120MB. Device memory is insufficient to use tactic.
|
80 |
+
[12/28/2023-15:35:29] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2392 detected for tactic 0x000000000000003c.
|
81 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
82 |
+
[12/28/2023-15:35:29] [W] [TRT] Tactic Device request: 2392MB Available: 2120MB. Device memory is insufficient to use tactic.
|
83 |
+
[12/28/2023-15:35:29] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000074.
|
84 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
85 |
+
[12/28/2023-15:35:42] [W] [TRT] Tactic Device request: 6540MB Available: 2103MB. Device memory is insufficient to use tactic.
|
86 |
+
[12/28/2023-15:35:42] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000004.
|
87 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
88 |
+
[12/28/2023-15:35:42] [W] [TRT] Tactic Device request: 6540MB Available: 2103MB. Device memory is insufficient to use tactic.
|
89 |
+
[12/28/2023-15:35:42] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6540 detected for tactic 0x000000000000003c.
|
90 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
91 |
+
[12/28/2023-15:35:42] [W] [TRT] Tactic Device request: 6540MB Available: 2103MB. Device memory is insufficient to use tactic.
|
92 |
+
[12/28/2023-15:35:42] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6540 detected for tactic 0x0000000000000074.
|
93 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
94 |
+
[12/28/2023-15:35:46] [W] [TRT] Tactic Device request: 2191MB Available: 2103MB. Device memory is insufficient to use tactic.
|
95 |
+
[12/28/2023-15:35:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000004.
|
96 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
97 |
+
[12/28/2023-15:35:47] [W] [TRT] Tactic Device request: 2191MB Available: 2102MB. Device memory is insufficient to use tactic.
|
98 |
+
[12/28/2023-15:35:47] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2191 detected for tactic 0x000000000000003c.
|
99 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
100 |
+
[12/28/2023-15:35:48] [W] [TRT] Tactic Device request: 2191MB Available: 2100MB. Device memory is insufficient to use tactic.
|
101 |
+
[12/28/2023-15:35:48] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2191 detected for tactic 0x0000000000000074.
|
102 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
103 |
+
[12/28/2023-15:35:53] [W] [TRT] Tactic Device request: 2190MB Available: 2102MB. Device memory is insufficient to use tactic.
|
104 |
+
[12/28/2023-15:35:53] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
105 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
106 |
+
[12/28/2023-15:35:54] [W] [TRT] Tactic Device request: 2190MB Available: 2099MB. Device memory is insufficient to use tactic.
|
107 |
+
[12/28/2023-15:35:54] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
108 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
109 |
+
[12/28/2023-15:35:55] [W] [TRT] Tactic Device request: 2190MB Available: 2100MB. Device memory is insufficient to use tactic.
|
110 |
+
[12/28/2023-15:35:55] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000074.
|
111 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
112 |
+
[12/28/2023-15:36:01] [W] [TRT] Tactic Device request: 2190MB Available: 2100MB. Device memory is insufficient to use tactic.
|
113 |
+
[12/28/2023-15:36:01] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000004.
|
114 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
115 |
+
[12/28/2023-15:36:02] [W] [TRT] Tactic Device request: 2190MB Available: 2100MB. Device memory is insufficient to use tactic.
|
116 |
+
[12/28/2023-15:36:02] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2190 detected for tactic 0x000000000000003c.
|
117 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
118 |
+
[12/28/2023-15:36:03] [W] [TRT] Tactic Device request: 2190MB Available: 2099MB. Device memory is insufficient to use tactic.
|
119 |
+
[12/28/2023-15:36:03] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2190 detected for tactic 0x0000000000000074.
|
120 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
121 |
+
[12/28/2023-15:40:03] [W] [TRT] Tactic Device request: 2457MB Available: 2339MB. Device memory is insufficient to use tactic.
|
122 |
+
[12/28/2023-15:40:03] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
123 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
124 |
+
[12/28/2023-15:40:03] [W] [TRT] Tactic Device request: 2457MB Available: 2339MB. Device memory is insufficient to use tactic.
|
125 |
+
[12/28/2023-15:40:03] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
126 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
127 |
+
[12/28/2023-15:40:23] [W] [TRT] Tactic Device request: 3587MB Available: 2337MB. Device memory is insufficient to use tactic.
|
128 |
+
[12/28/2023-15:40:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
129 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
130 |
+
[12/28/2023-15:40:23] [W] [TRT] Tactic Device request: 3587MB Available: 2337MB. Device memory is insufficient to use tactic.
|
131 |
+
[12/28/2023-15:40:23] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
132 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
133 |
+
[12/28/2023-15:40:23] [W] [TRT] Tactic Device request: 3587MB Available: 2337MB. Device memory is insufficient to use tactic.
|
134 |
+
[12/28/2023-15:40:23] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
135 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
136 |
+
[12/28/2023-15:47:03] [W] [TRT] Tactic Device request: 3556MB Available: 2223MB. Device memory is insufficient to use tactic.
|
137 |
+
[12/28/2023-15:47:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
138 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
139 |
+
[12/28/2023-15:47:03] [W] [TRT] Tactic Device request: 3556MB Available: 2223MB. Device memory is insufficient to use tactic.
|
140 |
+
[12/28/2023-15:47:03] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
141 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
142 |
+
[12/28/2023-15:47:03] [W] [TRT] Tactic Device request: 3556MB Available: 2223MB. Device memory is insufficient to use tactic.
|
143 |
+
[12/28/2023-15:47:03] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
144 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
145 |
+
[12/28/2023-15:47:05] [W] [TRT] Tactic Device request: 3140MB Available: 2192MB. Device memory is insufficient to use tactic.
|
146 |
+
[12/28/2023-15:47:05] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000004.
|
147 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
148 |
+
[12/28/2023-15:47:05] [W] [TRT] Tactic Device request: 3140MB Available: 2191MB. Device memory is insufficient to use tactic.
|
149 |
+
[12/28/2023-15:47:05] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3140 detected for tactic 0x000000000000003c.
|
150 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
151 |
+
[12/28/2023-15:47:06] [W] [TRT] Tactic Device request: 3140MB Available: 2191MB. Device memory is insufficient to use tactic.
|
152 |
+
[12/28/2023-15:47:06] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3140 detected for tactic 0x0000000000000074.
|
153 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
154 |
+
[12/28/2023-15:53:21] [W] [TRT] Tactic Device request: 3161MB Available: 2119MB. Device memory is insufficient to use tactic.
|
155 |
+
[12/28/2023-15:53:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000004.
|
156 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
157 |
+
[12/28/2023-15:53:21] [W] [TRT] Tactic Device request: 3161MB Available: 2119MB. Device memory is insufficient to use tactic.
|
158 |
+
[12/28/2023-15:53:21] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3161 detected for tactic 0x000000000000003c.
|
159 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
160 |
+
[12/28/2023-15:53:21] [W] [TRT] Tactic Device request: 3161MB Available: 2119MB. Device memory is insufficient to use tactic.
|
161 |
+
[12/28/2023-15:53:21] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3161 detected for tactic 0x0000000000000074.
|
162 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
163 |
+
[12/28/2023-15:53:26] [W] [TRT] Tactic Device request: 4189MB Available: 2117MB. Device memory is insufficient to use tactic.
|
164 |
+
[12/28/2023-15:53:26] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000004.
|
165 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
166 |
+
[12/28/2023-15:53:27] [W] [TRT] Tactic Device request: 4189MB Available: 2101MB. Device memory is insufficient to use tactic.
|
167 |
+
[12/28/2023-15:53:27] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4189 detected for tactic 0x000000000000003c.
|
168 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
169 |
+
[12/28/2023-15:53:27] [W] [TRT] Tactic Device request: 4189MB Available: 2101MB. Device memory is insufficient to use tactic.
|
170 |
+
[12/28/2023-15:53:27] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4189 detected for tactic 0x0000000000000074.
|
171 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
172 |
+
[12/28/2023-15:53:33] [W] [TRT] Tactic Device request: 4186MB Available: 2099MB. Device memory is insufficient to use tactic.
|
173 |
+
[12/28/2023-15:53:33] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000004.
|
174 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
175 |
+
[12/28/2023-15:53:33] [W] [TRT] Tactic Device request: 4186MB Available: 2099MB. Device memory is insufficient to use tactic.
|
176 |
+
[12/28/2023-15:53:33] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4186 detected for tactic 0x000000000000003c.
|
177 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
178 |
+
[12/28/2023-15:53:33] [W] [TRT] Tactic Device request: 4186MB Available: 2099MB. Device memory is insufficient to use tactic.
|
179 |
+
[12/28/2023-15:53:34] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4186 detected for tactic 0x0000000000000074.
|
180 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
181 |
+
[12/28/2023-16:00:19] [W] [TRT] Tactic Device request: 4764MB Available: 2172MB. Device memory is insufficient to use tactic.
|
182 |
+
[12/28/2023-16:00:19] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000004.
|
183 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
184 |
+
[12/28/2023-16:00:19] [W] [TRT] Tactic Device request: 4764MB Available: 2170MB. Device memory is insufficient to use tactic.
|
185 |
+
[12/28/2023-16:00:19] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4764 detected for tactic 0x000000000000003c.
|
186 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
187 |
+
[12/28/2023-16:00:19] [W] [TRT] Tactic Device request: 4764MB Available: 2170MB. Device memory is insufficient to use tactic.
|
188 |
+
[12/28/2023-16:00:19] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4764 detected for tactic 0x0000000000000074.
|
189 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
190 |
+
[12/28/2023-16:00:26] [W] [TRT] Tactic Device request: 4244MB Available: 2030MB. Device memory is insufficient to use tactic.
|
191 |
+
[12/28/2023-16:00:26] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000004.
|
192 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
193 |
+
[12/28/2023-16:00:27] [W] [TRT] Tactic Device request: 4244MB Available: 1979MB. Device memory is insufficient to use tactic.
|
194 |
+
[12/28/2023-16:00:27] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4244 detected for tactic 0x000000000000003c.
|
195 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
196 |
+
[12/28/2023-16:00:28] [W] [TRT] Tactic Device request: 4244MB Available: 1979MB. Device memory is insufficient to use tactic.
|
197 |
+
[12/28/2023-16:00:28] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4244 detected for tactic 0x0000000000000074.
|
198 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
199 |
+
[12/28/2023-16:00:35] [W] [TRT] Tactic Device request: 4241MB Available: 1980MB. Device memory is insufficient to use tactic.
|
200 |
+
[12/28/2023-16:00:35] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000004.
|
201 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
202 |
+
[12/28/2023-16:00:36] [W] [TRT] Tactic Device request: 4241MB Available: 1980MB. Device memory is insufficient to use tactic.
|
203 |
+
[12/28/2023-16:00:36] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4241 detected for tactic 0x000000000000003c.
|
204 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
205 |
+
[12/28/2023-16:00:37] [W] [TRT] Tactic Device request: 4241MB Available: 1979MB. Device memory is insufficient to use tactic.
|
206 |
+
[12/28/2023-16:00:37] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4241 detected for tactic 0x0000000000000074.
|
207 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
208 |
+
[12/28/2023-16:08:17] [W] [TRT] Tactic Device request: 3270MB Available: 1808MB. Device memory is insufficient to use tactic.
|
209 |
+
[12/28/2023-16:08:17] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000004.
|
210 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
211 |
+
[12/28/2023-16:08:17] [W] [TRT] Tactic Device request: 3270MB Available: 1808MB. Device memory is insufficient to use tactic.
|
212 |
+
[12/28/2023-16:08:17] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3270 detected for tactic 0x000000000000003c.
|
213 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
214 |
+
[12/28/2023-16:08:17] [W] [TRT] Tactic Device request: 3270MB Available: 1808MB. Device memory is insufficient to use tactic.
|
215 |
+
[12/28/2023-16:08:17] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3270 detected for tactic 0x0000000000000074.
|
216 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
217 |
+
[12/28/2023-16:08:21] [W] [TRT] Tactic Device request: 4377MB Available: 1804MB. Device memory is insufficient to use tactic.
|
218 |
+
[12/28/2023-16:08:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000004.
|
219 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
220 |
+
[12/28/2023-16:08:21] [W] [TRT] Tactic Device request: 2185MB Available: 1804MB. Device memory is insufficient to use tactic.
|
221 |
+
[12/28/2023-16:08:21] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000005.
|
222 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
223 |
+
[12/28/2023-16:08:21] [W] [TRT] Tactic Device request: 4377MB Available: 1804MB. Device memory is insufficient to use tactic.
|
224 |
+
[12/28/2023-16:08:21] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4377 detected for tactic 0x000000000000003c.
|
225 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
226 |
+
[12/28/2023-16:08:21] [W] [TRT] Tactic Device request: 2185MB Available: 1804MB. Device memory is insufficient to use tactic.
|
227 |
+
[12/28/2023-16:08:21] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2185 detected for tactic 0x000000000000003d.
|
228 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
229 |
+
[12/28/2023-16:08:22] [W] [TRT] Tactic Device request: 4377MB Available: 1803MB. Device memory is insufficient to use tactic.
|
230 |
+
[12/28/2023-16:08:22] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4377 detected for tactic 0x0000000000000074.
|
231 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
232 |
+
[12/28/2023-16:08:22] [W] [TRT] Tactic Device request: 2185MB Available: 1803MB. Device memory is insufficient to use tactic.
|
233 |
+
[12/28/2023-16:08:22] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2185 detected for tactic 0x0000000000000075.
|
234 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
235 |
+
[12/28/2023-16:08:31] [W] [TRT] Tactic Device request: 4376MB Available: 1803MB. Device memory is insufficient to use tactic.
|
236 |
+
[12/28/2023-16:08:31] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000004.
|
237 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
238 |
+
[12/28/2023-16:08:31] [W] [TRT] Tactic Device request: 2184MB Available: 1803MB. Device memory is insufficient to use tactic.
|
239 |
+
[12/28/2023-16:08:31] [W] [TRT] Skipping tactic 4 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000005.
|
240 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
241 |
+
[12/28/2023-16:08:31] [W] [TRT] Tactic Device request: 4376MB Available: 1803MB. Device memory is insufficient to use tactic.
|
242 |
+
[12/28/2023-16:08:31] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4376 detected for tactic 0x000000000000003c.
|
243 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
244 |
+
[12/28/2023-16:08:31] [W] [TRT] Tactic Device request: 2184MB Available: 1803MB. Device memory is insufficient to use tactic.
|
245 |
+
[12/28/2023-16:08:31] [W] [TRT] Skipping tactic 10 due to insufficient memory on requested size of 2184 detected for tactic 0x000000000000003d.
|
246 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
247 |
+
[12/28/2023-16:08:32] [W] [TRT] Tactic Device request: 4376MB Available: 1803MB. Device memory is insufficient to use tactic.
|
248 |
+
[12/28/2023-16:08:32] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4376 detected for tactic 0x0000000000000074.
|
249 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
250 |
+
[12/28/2023-16:08:32] [W] [TRT] Tactic Device request: 2184MB Available: 1803MB. Device memory is insufficient to use tactic.
|
251 |
+
[12/28/2023-16:08:32] [W] [TRT] Skipping tactic 16 due to insufficient memory on requested size of 2184 detected for tactic 0x0000000000000075.
|
252 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
253 |
+
[12/28/2023-16:09:30] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
254 |
+
[12/28/2023-16:09:30] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
255 |
+
[12/28/2023-16:09:30] [W] * GPU compute time is unstable, with coefficient of variance = 6.6527%.
|
256 |
+
[12/28/2023-16:09:30] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_fp32.onnx.int8.engine.log
ADDED
@@ -0,0 +1,332 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --int8 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.int8.engine
|
2 |
+
[12/28/2023-15:10:07] [I] === Model Options ===
|
3 |
+
[12/28/2023-15:10:07] [I] Format: ONNX
|
4 |
+
[12/28/2023-15:10:07] [I] Model: yolo_nas_pose_l_fp32.onnx
|
5 |
+
[12/28/2023-15:10:07] [I] Output:
|
6 |
+
[12/28/2023-15:10:07] [I] === Build Options ===
|
7 |
+
[12/28/2023-15:10:07] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-15:10:07] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-15:10:07] [I] minTiming: 1
|
10 |
+
[12/28/2023-15:10:07] [I] avgTiming: 8
|
11 |
+
[12/28/2023-15:10:07] [I] Precision: FP32+INT8
|
12 |
+
[12/28/2023-15:10:07] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-15:10:07] [I] Calibration: Dynamic
|
14 |
+
[12/28/2023-15:10:07] [I] Refit: Disabled
|
15 |
+
[12/28/2023-15:10:07] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-15:10:07] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-15:10:07] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-15:10:07] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-15:10:07] [I] Build only: Disabled
|
20 |
+
[12/28/2023-15:10:07] [I] Save engine: yolo_nas_pose_l_fp32.onnx.int8.engine
|
21 |
+
[12/28/2023-15:10:07] [I] Load engine:
|
22 |
+
[12/28/2023-15:10:07] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-15:10:07] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-15:10:07] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-15:10:07] [I] timingCacheFile:
|
26 |
+
[12/28/2023-15:10:07] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-15:10:07] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-15:10:07] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-15:10:07] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-15:10:07] [I] Input build shapes: model
|
31 |
+
[12/28/2023-15:10:07] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-15:10:07] [I] === System Options ===
|
33 |
+
[12/28/2023-15:10:07] [I] Device: 0
|
34 |
+
[12/28/2023-15:10:07] [I] DLACore:
|
35 |
+
[12/28/2023-15:10:07] [I] Plugins:
|
36 |
+
[12/28/2023-15:10:07] [I] === Inference Options ===
|
37 |
+
[12/28/2023-15:10:07] [I] Batch: Explicit
|
38 |
+
[12/28/2023-15:10:07] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-15:10:07] [I] Iterations: 10
|
40 |
+
[12/28/2023-15:10:07] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-15:10:07] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-15:10:07] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-15:10:07] [I] Streams: 1
|
44 |
+
[12/28/2023-15:10:07] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-15:10:07] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-15:10:07] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-15:10:07] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-15:10:07] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-15:10:07] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-15:10:07] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-15:10:07] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-15:10:07] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-15:10:07] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-15:10:07] [I] Inputs:
|
55 |
+
[12/28/2023-15:10:07] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-15:10:07] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-15:10:07] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-15:10:07] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-15:10:07] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-15:10:07] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-15:10:07] [I] Profile: Disabled
|
62 |
+
[12/28/2023-15:10:07] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-15:10:07] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-15:10:07] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-15:10:07] [I]
|
66 |
+
[12/28/2023-15:10:07] [I] === Device Information ===
|
67 |
+
[12/28/2023-15:10:07] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-15:10:07] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-15:10:07] [I] SMs: 8
|
70 |
+
[12/28/2023-15:10:07] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-15:10:07] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-15:10:07] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-15:10:07] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-15:10:07] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-15:10:07] [I]
|
76 |
+
[12/28/2023-15:10:07] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-15:10:12] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 3019 (MiB)
|
78 |
+
[12/28/2023-15:10:17] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +286, now: CPU 574, GPU 3326 (MiB)
|
79 |
+
[12/28/2023-15:10:17] [I] Start parsing network model
|
80 |
+
[12/28/2023-15:10:20] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-15:10:20] [I] [TRT] Input filename: yolo_nas_pose_l_fp32.onnx
|
82 |
+
[12/28/2023-15:10:20] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-15:10:20] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-15:10:20] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-15:10:20] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-15:10:20] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-15:10:20] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-15:10:20] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-15:10:20] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-15:10:21] [I] Finish parsing network model
|
91 |
+
[12/28/2023-15:10:21] [I] FP32 and INT8 precisions have been specified - more performance might be enabled by additionally specifying --fp16 or --best
|
92 |
+
[12/28/2023-15:10:21] [I] [TRT] ---------- Layers Running on DLA ----------
|
93 |
+
[12/28/2023-15:10:21] [I] [TRT] ---------- Layers Running on GPU ----------
|
94 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
95 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
96 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 455) [Constant]
|
97 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 456) [Constant]
|
98 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 457) [Constant]
|
99 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
100 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
101 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
102 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
103 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
104 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
105 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
106 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
107 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
108 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
109 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
110 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
111 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
112 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
113 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
114 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
115 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
116 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
117 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
118 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
119 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
120 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
121 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
122 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
123 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
124 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
125 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
126 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
127 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
128 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
129 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
130 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
131 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
132 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
133 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
134 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
135 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
136 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
137 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
138 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
139 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
140 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
141 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
142 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
143 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
144 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
145 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
146 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
147 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
148 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
149 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
150 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
151 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
152 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
153 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
154 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
155 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
156 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
157 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
158 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
159 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
160 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
161 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
162 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
163 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
164 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
165 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv1/act/Relu_output_0 copy
|
166 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
167 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
168 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
169 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
170 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
171 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
172 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
173 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
174 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
175 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
176 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
177 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
178 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
179 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
180 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
181 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
182 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
183 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
184 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
185 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
186 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
187 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 187) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
188 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
189 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
190 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 195) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
191 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
192 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
193 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
194 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
195 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
196 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
197 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
198 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
199 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
200 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
201 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
202 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
203 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 224) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
204 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
205 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
206 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 232) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
207 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
208 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
209 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 240) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
210 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
211 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
212 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
213 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
214 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
215 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
216 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
217 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
218 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
219 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
220 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
221 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
222 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
223 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
224 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
225 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 271) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
226 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
227 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
228 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
229 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 294) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
230 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
231 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
232 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 302) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
233 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
234 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
235 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 310) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
236 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
237 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
238 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
239 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
240 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
241 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
242 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
243 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
244 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
245 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
246 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
247 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
248 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
249 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
250 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
251 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 341) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
252 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
253 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
254 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
255 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 364) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
256 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
257 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
258 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 372) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
259 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/act/Relu
|
260 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/act/Relu
|
261 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 380) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
262 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
263 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
264 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
265 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
266 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
267 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
268 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
269 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
270 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
271 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
272 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
273 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
274 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
275 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1.../post_process/Reshape_2]}
|
276 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
277 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 459) [NMS]_1_output[DevicetoShapeHostCopy]
|
278 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
279 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
280 |
+
[12/28/2023-15:10:21] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
281 |
+
[12/28/2023-15:10:35] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +335, now: CPU 1351, GPU 3954 (MiB)
|
282 |
+
[12/28/2023-15:10:37] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +82, GPU +63, now: CPU 1433, GPU 4017 (MiB)
|
283 |
+
[12/28/2023-15:10:37] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
284 |
+
[12/28/2023-16:08:54] [I] [TRT] Total Activation Memory: 7959592448
|
285 |
+
[12/28/2023-16:08:54] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
286 |
+
[12/28/2023-16:09:08] [I] [TRT] Total Host Persistent Memory: 331808
|
287 |
+
[12/28/2023-16:09:08] [I] [TRT] Total Device Persistent Memory: 38912
|
288 |
+
[12/28/2023-16:09:08] [I] [TRT] Total Scratch Memory: 134217728
|
289 |
+
[12/28/2023-16:09:08] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 88 MiB, GPU 2461 MiB
|
290 |
+
[12/28/2023-16:09:08] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 160 steps to complete.
|
291 |
+
[12/28/2023-16:09:08] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 55.0722ms to assign 13 blocks to 160 nodes requiring 147361280 bytes.
|
292 |
+
[12/28/2023-16:09:08] [I] [TRT] Total Activation Memory: 147361280
|
293 |
+
[12/28/2023-16:09:13] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU -1, now: CPU 1835, GPU 5360 (MiB)
|
294 |
+
[12/28/2023-16:09:13] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +52, GPU +64, now: CPU 52, GPU 64 (MiB)
|
295 |
+
[12/28/2023-16:09:14] [I] Engine built in 3546.25 sec.
|
296 |
+
[12/28/2023-16:09:14] [I] [TRT] Loaded engine size: 54 MiB
|
297 |
+
[12/28/2023-16:09:15] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1299, GPU 5007 (MiB)
|
298 |
+
[12/28/2023-16:09:15] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +52, now: CPU 0, GPU 52 (MiB)
|
299 |
+
[12/28/2023-16:09:15] [I] Engine deserialized in 0.128069 sec.
|
300 |
+
[12/28/2023-16:09:15] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +1, GPU +0, now: CPU 1300, GPU 5007 (MiB)
|
301 |
+
[12/28/2023-16:09:15] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +140, now: CPU 0, GPU 192 (MiB)
|
302 |
+
[12/28/2023-16:09:15] [I] Setting persistentCacheLimit to 0 bytes.
|
303 |
+
[12/28/2023-16:09:15] [I] Using random values for input onnx::Cast_0
|
304 |
+
[12/28/2023-16:09:15] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
305 |
+
[12/28/2023-16:09:15] [I] Using random values for output graph2_flat_predictions
|
306 |
+
[12/28/2023-16:09:15] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
307 |
+
[12/28/2023-16:09:15] [I] Starting inference
|
308 |
+
[12/28/2023-16:09:30] [I] Warmup completed 3 queries over 200 ms
|
309 |
+
[12/28/2023-16:09:30] [I] Timing trace has 720 queries over 15.0291 s
|
310 |
+
[12/28/2023-16:09:30] [I]
|
311 |
+
[12/28/2023-16:09:30] [I] === Trace details ===
|
312 |
+
[12/28/2023-16:09:30] [I] Trace averages of 100 runs:
|
313 |
+
[12/28/2023-16:09:30] [I] Average on 100 runs - GPU latency: 20.9331 ms - Host latency: 21.0491 ms (enqueue 20.9849 ms)
|
314 |
+
[12/28/2023-16:09:30] [I] Average on 100 runs - GPU latency: 20.3949 ms - Host latency: 20.5041 ms (enqueue 20.4581 ms)
|
315 |
+
[12/28/2023-16:09:30] [I] Average on 100 runs - GPU latency: 20.9551 ms - Host latency: 21.0733 ms (enqueue 21.0198 ms)
|
316 |
+
[12/28/2023-16:09:30] [I] Average on 100 runs - GPU latency: 20.8394 ms - Host latency: 20.9537 ms (enqueue 20.8945 ms)
|
317 |
+
[12/28/2023-16:09:30] [I] Average on 100 runs - GPU latency: 20.4666 ms - Host latency: 20.5773 ms (enqueue 20.5432 ms)
|
318 |
+
[12/28/2023-16:09:30] [I] Average on 100 runs - GPU latency: 20.689 ms - Host latency: 20.8023 ms (enqueue 20.7502 ms)
|
319 |
+
[12/28/2023-16:09:30] [I] Average on 100 runs - GPU latency: 20.7472 ms - Host latency: 20.8614 ms (enqueue 20.8134 ms)
|
320 |
+
[12/28/2023-16:09:30] [I]
|
321 |
+
[12/28/2023-16:09:30] [I] === Performance summary ===
|
322 |
+
[12/28/2023-16:09:30] [I] Throughput: 47.9071 qps
|
323 |
+
[12/28/2023-16:09:30] [I] Latency: min = 19.4119 ms, max = 30.8398 ms, mean = 20.8421 ms, median = 20.7168 ms, percentile(90%) = 21.5566 ms, percentile(95%) = 22.2598 ms, percentile(99%) = 28.5723 ms
|
324 |
+
[12/28/2023-16:09:30] [I] Enqueue Time: min = 19.3838 ms, max = 30.7852 ms, mean = 20.7908 ms, median = 20.6725 ms, percentile(90%) = 21.4995 ms, percentile(95%) = 22.1094 ms, percentile(99%) = 28.5068 ms
|
325 |
+
[12/28/2023-16:09:30] [I] H2D Latency: min = 0.0800781 ms, max = 0.133301 ms, mean = 0.0950138 ms, median = 0.0957031 ms, percentile(90%) = 0.0981445 ms, percentile(95%) = 0.0986328 ms, percentile(99%) = 0.0996094 ms
|
326 |
+
[12/28/2023-16:09:30] [I] GPU Compute Time: min = 19.304 ms, max = 30.7158 ms, mean = 20.7286 ms, median = 20.5989 ms, percentile(90%) = 21.4419 ms, percentile(95%) = 22.1621 ms, percentile(99%) = 28.4521 ms
|
327 |
+
[12/28/2023-16:09:30] [I] D2H Latency: min = 0.00292969 ms, max = 0.0688477 ms, mean = 0.0184459 ms, median = 0.0166016 ms, percentile(90%) = 0.0273438 ms, percentile(95%) = 0.0288086 ms, percentile(99%) = 0.0444336 ms
|
328 |
+
[12/28/2023-16:09:30] [I] Total Host Walltime: 15.0291 s
|
329 |
+
[12/28/2023-16:09:30] [I] Total GPU Compute Time: 14.9246 s
|
330 |
+
[12/28/2023-16:09:30] [I] Explanations of the performance metrics are printed in the verbose logs.
|
331 |
+
[12/28/2023-16:09:30] [I]
|
332 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_fp32.onnx --int8 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_fp32.onnx.int8.engine
|
yolo_nas_pose_l_fp32.onnx.usage.txt
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
Model exported successfully to yolo_nas_pose_l_fp32.onnx
|
3 |
+
Model expects input image of shape [1, 3, 640, 640]
|
4 |
+
Input image dtype is torch.uint8
|
5 |
+
|
6 |
+
Exported model already contains preprocessing (normalization) step, so you don't need to do it manually.
|
7 |
+
Preprocessing steps to be applied to input image are:
|
8 |
+
Sequential(
|
9 |
+
(0): CastTensorTo(dtype=torch.float32)
|
10 |
+
(1): ChannelSelect(channels_indexes=tensor([2, 1, 0]))
|
11 |
+
(2): ApplyMeanStd(mean=[0.], scale=[255.])
|
12 |
+
)
|
13 |
+
|
14 |
+
|
15 |
+
Exported model contains postprocessing (NMS) step with the following parameters:
|
16 |
+
num_pre_nms_predictions=1000
|
17 |
+
max_predictions_per_image=10
|
18 |
+
nms_threshold=0.5
|
19 |
+
confidence_threshold=0.15
|
20 |
+
output_predictions_format=flat
|
21 |
+
|
22 |
+
|
23 |
+
Exported model is in ONNX format and can be used with ONNXRuntime
|
24 |
+
To run inference with ONNXRuntime, please use the following code snippet:
|
25 |
+
|
26 |
+
import onnxruntime
|
27 |
+
import numpy as np
|
28 |
+
session = onnxruntime.InferenceSession("yolo_nas_pose_l_fp32.onnx", providers=["CUDAExecutionProvider", "CPUExecutionProvider"])
|
29 |
+
inputs = [o.name for o in session.get_inputs()]
|
30 |
+
outputs = [o.name for o in session.get_outputs()]
|
31 |
+
|
32 |
+
example_input_image = np.zeros((1, 3, 640, 640)).astype(np.uint8)
|
33 |
+
predictions = session.run(outputs, {inputs[0]: example_input_image})
|
34 |
+
|
35 |
+
Exported model can also be used with TensorRT
|
36 |
+
To run inference with TensorRT, please see TensorRT deployment documentation
|
37 |
+
You can benchmark the model using the following code snippet:
|
38 |
+
|
39 |
+
trtexec --onnx=yolo_nas_pose_l_fp32.onnx --fp16 --avgRuns=100 --duration=15
|
40 |
+
|
41 |
+
|
42 |
+
Exported model has predictions in flat format:
|
43 |
+
|
44 |
+
# flat_predictions is a 2D array of [N,K] shape
|
45 |
+
# Each row represents (image_index, x_min, y_min, x_max, y_max, confidence, joints...)
|
46 |
+
# Please note all values are floats, so you have to convert them to integers if needed
|
47 |
+
|
48 |
+
[flat_predictions] = predictions
|
49 |
+
pred_bboxes = flat_predictions[:, 1:5]
|
50 |
+
pred_scores = flat_predictions[:, 5]
|
51 |
+
pred_joints = flat_predictions[:, 6:].reshape((len(pred_bboxes), -1, 3))
|
52 |
+
for i in range(len(pred_bboxes)):
|
53 |
+
confidence = pred_scores[i]
|
54 |
+
x_min, y_min, x_max, y_max = pred_bboxes[i]
|
55 |
+
print(f"Detected pose with confidence={confidence}, x_min={x_min}, y_min={y_min}, x_max={x_max}, y_max={y_max}")
|
56 |
+
for joint_index, (x, y, confidence) in enumerate(pred_joints[i]):
|
57 |
+
print(f"Joint {joint_index} has coordinates x={x}, y={y}, confidence={confidence}")
|
58 |
+
|
yolo_nas_pose_l_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3acfcfd2f63c649f1a6695ff7c3a77dbfb67f654592ddf1abb8f5d32c2efd0cb
|
3 |
+
size 218735221
|
yolo_nas_pose_l_int8.onnx.best.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6be26b88c524b32a7fe99eeaa6166ae80bd428e90d7f45b24317115286e1c80
|
3 |
+
size 57269617
|
yolo_nas_pose_l_int8.onnx.best.engine.err
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-19:27:37] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-19:27:37] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-19:27:42] [W] [TRT] Calibrator won't be used in explicit precision mode. Use quantization aware training to generate network with Quantize/Dequantize nodes.
|
4 |
+
[12/28/2023-20:16:25] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
5 |
+
[12/28/2023-20:16:25] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
6 |
+
[12/28/2023-20:16:25] [W] * GPU compute time is unstable, with coefficient of variance = 6.69708%.
|
7 |
+
[12/28/2023-20:16:25] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_int8.onnx.best.engine.log
ADDED
@@ -0,0 +1,357 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.best.engine
|
2 |
+
[12/28/2023-19:27:34] [I] === Model Options ===
|
3 |
+
[12/28/2023-19:27:34] [I] Format: ONNX
|
4 |
+
[12/28/2023-19:27:34] [I] Model: yolo_nas_pose_l_int8.onnx
|
5 |
+
[12/28/2023-19:27:34] [I] Output:
|
6 |
+
[12/28/2023-19:27:34] [I] === Build Options ===
|
7 |
+
[12/28/2023-19:27:34] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-19:27:34] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-19:27:34] [I] minTiming: 1
|
10 |
+
[12/28/2023-19:27:34] [I] avgTiming: 8
|
11 |
+
[12/28/2023-19:27:34] [I] Precision: FP32+FP16+INT8
|
12 |
+
[12/28/2023-19:27:34] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-19:27:34] [I] Calibration: Dynamic
|
14 |
+
[12/28/2023-19:27:34] [I] Refit: Disabled
|
15 |
+
[12/28/2023-19:27:34] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-19:27:34] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-19:27:34] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-19:27:34] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-19:27:34] [I] Build only: Disabled
|
20 |
+
[12/28/2023-19:27:34] [I] Save engine: yolo_nas_pose_l_int8.onnx.best.engine
|
21 |
+
[12/28/2023-19:27:34] [I] Load engine:
|
22 |
+
[12/28/2023-19:27:34] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-19:27:34] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-19:27:34] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-19:27:34] [I] timingCacheFile:
|
26 |
+
[12/28/2023-19:27:34] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-19:27:34] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-19:27:34] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-19:27:34] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-19:27:34] [I] Input build shapes: model
|
31 |
+
[12/28/2023-19:27:34] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-19:27:34] [I] === System Options ===
|
33 |
+
[12/28/2023-19:27:34] [I] Device: 0
|
34 |
+
[12/28/2023-19:27:34] [I] DLACore:
|
35 |
+
[12/28/2023-19:27:34] [I] Plugins:
|
36 |
+
[12/28/2023-19:27:34] [I] === Inference Options ===
|
37 |
+
[12/28/2023-19:27:34] [I] Batch: Explicit
|
38 |
+
[12/28/2023-19:27:34] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-19:27:34] [I] Iterations: 10
|
40 |
+
[12/28/2023-19:27:34] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-19:27:34] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-19:27:34] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-19:27:34] [I] Streams: 1
|
44 |
+
[12/28/2023-19:27:34] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-19:27:34] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-19:27:34] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-19:27:34] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-19:27:34] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-19:27:34] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-19:27:34] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-19:27:34] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-19:27:34] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-19:27:34] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-19:27:34] [I] Inputs:
|
55 |
+
[12/28/2023-19:27:34] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-19:27:34] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-19:27:34] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-19:27:34] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-19:27:34] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-19:27:34] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-19:27:34] [I] Profile: Disabled
|
62 |
+
[12/28/2023-19:27:34] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-19:27:34] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-19:27:34] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-19:27:34] [I]
|
66 |
+
[12/28/2023-19:27:34] [I] === Device Information ===
|
67 |
+
[12/28/2023-19:27:34] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-19:27:34] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-19:27:34] [I] SMs: 8
|
70 |
+
[12/28/2023-19:27:34] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-19:27:34] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-19:27:34] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-19:27:34] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-19:27:34] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-19:27:34] [I]
|
76 |
+
[12/28/2023-19:27:34] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-19:27:35] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2833 (MiB)
|
78 |
+
[12/28/2023-19:27:37] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +284, now: CPU 574, GPU 3138 (MiB)
|
79 |
+
[12/28/2023-19:27:37] [I] Start parsing network model
|
80 |
+
[12/28/2023-19:27:37] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-19:27:37] [I] [TRT] Input filename: yolo_nas_pose_l_int8.onnx
|
82 |
+
[12/28/2023-19:27:37] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-19:27:37] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-19:27:37] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-19:27:37] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-19:27:37] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-19:27:37] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-19:27:37] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-19:27:37] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-19:27:42] [I] Finish parsing network model
|
91 |
+
[12/28/2023-19:27:47] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-19:27:47] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 1417) [Constant]
|
96 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 1418) [Constant]
|
97 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 1419) [Constant]
|
98 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stem/conv/rbr_reparam/_input_quantizer/QuantizeLinear
|
99 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stem.conv.rbr_reparam.weight + /model/backbone/stem/conv/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stem/conv/rbr_reparam/Conv
|
100 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.downsample.rbr_reparam.weight + /model/backbone/stage1/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/downsample/rbr_reparam/Conv
|
101 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.conv2.conv.weight + /model/backbone/stage1/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/conv2/conv/Conv
|
102 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.conv1.conv.weight + /model/backbone/stage1/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/conv1/conv/Conv
|
103 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
104 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
105 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
106 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 557) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
107 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
108 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
109 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
110 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 573) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
111 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
112 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
113 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.conv3.conv.weight + /model/backbone/stage1/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/conv3/conv/Conv
|
114 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.reduce_skip2.conv.weight + /model/neck/neck2/reduce_skip2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/reduce_skip2/conv/Conv
|
115 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.downsample.rbr_reparam.weight + /model/backbone/stage2/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/downsample/rbr_reparam/Conv
|
116 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.downsample.conv.weight + /model/neck/neck2/downsample/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/downsample/conv/Conv
|
117 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.conv2.conv.weight + /model/backbone/stage2/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/conv2/conv/Conv
|
118 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.conv1.conv.weight + /model/backbone/stage2/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/conv1/conv/Conv
|
119 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
120 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
121 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
122 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 620) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
123 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
124 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
125 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
126 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 636) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
127 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
128 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
129 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
130 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 652) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
131 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_2
|
132 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
133 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
134 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.conv3.conv.weight + /model/backbone/stage2/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/conv3/conv/Conv
|
135 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.reduce_skip2.conv.weight + /model/neck/neck1/reduce_skip2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/reduce_skip2/conv/Conv || model.neck.neck2.reduce_skip1.conv.weight + /model/neck/neck2/reduce_skip1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/reduce_skip1/conv/Conv
|
136 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.downsample.rbr_reparam.weight + /model/backbone/stage3/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/downsample/rbr_reparam/Conv
|
137 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.downsample.conv.weight + /model/neck/neck1/downsample/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/downsample/conv/Conv
|
138 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.conv2.conv.weight + /model/backbone/stage3/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/conv2/conv/Conv
|
139 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.conv1.conv.weight + /model/backbone/stage3/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/conv1/conv/Conv
|
140 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
141 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
142 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
143 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 702) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
144 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
145 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
146 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
147 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 718) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
148 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
149 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
150 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
151 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 734) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
152 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
153 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.3.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv
|
154 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.3.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv
|
155 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 750) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
156 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
157 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.4.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv
|
158 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.4.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv
|
159 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 766) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
160 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_4
|
161 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_2
|
162 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
163 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
164 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.conv3.conv.weight + /model/backbone/stage3/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/conv3/conv/Conv
|
165 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.reduce_skip1.conv.weight + /model/neck/neck1/reduce_skip1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/reduce_skip1/conv/Conv
|
166 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.downsample.rbr_reparam.weight + /model/backbone/stage4/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/downsample/rbr_reparam/Conv
|
167 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.conv2.conv.weight + /model/backbone/stage4/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/conv2/conv/Conv
|
168 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.conv1.conv.weight + /model/backbone/stage4/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/conv1/conv/Conv
|
169 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
170 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
171 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
172 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 806) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
173 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
174 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
175 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
176 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 822) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
177 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
178 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
179 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.conv3.conv.weight + /model/backbone/stage4/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/conv3/conv/Conv
|
180 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.context_module.cv1.conv.weight + /model/backbone/context_module/cv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/context_module/cv1/conv/Conv
|
181 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
182 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
183 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
184 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/m.2/MaxPool_output_0 copy
|
185 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.context_module.cv2.conv.weight + /model/backbone/context_module/cv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/context_module/cv2/conv/Conv
|
186 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.conv.conv.weight + /model/neck/neck1/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/conv/conv/Conv
|
187 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] DECONVOLUTION: model.neck.neck1.upsample.weight + /model/neck/neck1/upsample/_weight_quantizer/QuantizeLinear + /model/neck/neck1/upsample/ConvTranspose
|
188 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.reduce_after_concat.conv.weight + /model/neck/neck1/reduce_after_concat/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/reduce_after_concat/conv/Conv
|
189 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.conv2.conv.weight + /model/neck/neck1/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/conv2/conv/Conv
|
190 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.conv1.conv.weight + /model/neck/neck1/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/conv1/conv/Conv
|
191 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
192 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
193 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
194 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 887) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
195 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
196 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
197 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
198 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 903) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
199 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
200 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
201 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
202 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 919) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
203 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
204 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.3.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv
|
205 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.3.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv
|
206 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 935) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
207 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.conv3.conv.weight + /model/neck/neck1/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/conv3/conv/Conv
|
208 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.conv.conv.weight + /model/neck/neck2/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/conv/conv/Conv
|
209 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] DECONVOLUTION: model.neck.neck2.upsample.weight + /model/neck/neck2/upsample/_weight_quantizer/QuantizeLinear + /model/neck/neck2/upsample/ConvTranspose
|
210 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/Concat_/model/neck/neck2/reduce_skip1/act/Relu_output_0_clone_1 copy
|
211 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.reduce_after_concat.conv.weight + /model/neck/neck2/reduce_after_concat/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/reduce_after_concat/conv/Conv
|
212 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.conv2.conv.weight + /model/neck/neck2/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/conv2/conv/Conv
|
213 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.conv1.conv.weight + /model/neck/neck2/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/conv1/conv/Conv
|
214 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
215 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
216 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
217 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 984) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
218 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
219 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
220 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
221 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 1000) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
222 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
223 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
224 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
225 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 1016) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
226 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
227 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.3.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv
|
228 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.3.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv
|
229 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 1032) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
230 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.conv3.conv.weight + /model/neck/neck2/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/conv3/conv/Conv
|
231 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.bbox_stem.seq.conv.weight + /model/heads/head1/bbox_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/bbox_stem/seq/conv/Conv || model.heads.head1.pose_stem.seq.conv.weight + /model/heads/head1/pose_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_stem/seq/conv/Conv
|
232 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.conv.conv.weight + /model/neck/neck3/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/conv/conv/Conv
|
233 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.reg_convs.0.seq.conv.weight + /model/heads/head1/reg_convs/reg_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv || model.heads.head1.cls_convs.0.seq.conv.weight + /model/heads/head1/cls_convs/cls_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv
|
234 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.pose_convs.0.seq.conv.weight + /model/heads/head1/pose_convs/pose_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv
|
235 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.conv2.conv.weight + /model/neck/neck3/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/conv2/conv/Conv
|
236 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.conv1.conv.weight + /model/neck/neck3/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/conv1/conv/Conv
|
237 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.cls_pred.weight + /model/heads/head1/cls_pred/_weight_quantizer/QuantizeLinear + /model/heads/head1/cls_pred/Conv
|
238 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.reg_pred.weight + /model/heads/head1/reg_pred/_weight_quantizer/QuantizeLinear + /model/heads/head1/reg_pred/Conv
|
239 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.pose_convs.1.seq.conv.weight + /model/heads/head1/pose_convs/pose_convs.1/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv
|
240 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/_input_quantizer/QuantizeLinear
|
241 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
242 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.pose_pred.weight + /model/heads/head1/pose_pred/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_pred/Conv
|
243 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.0.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv
|
244 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
245 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.0.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv
|
246 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
247 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 1097) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
248 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/_input_quantizer/QuantizeLinear
|
249 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.1.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv
|
250 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.1.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv
|
251 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 1138) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
252 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/_input_quantizer/QuantizeLinear
|
253 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.2.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv
|
254 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.2.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv
|
255 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 1154) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
256 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/_input_quantizer/QuantizeLinear
|
257 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.3.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv
|
258 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.3.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv
|
259 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 1170) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
260 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.conv3.conv.weight + /model/neck/neck3/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/conv3/conv/Conv
|
261 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_stem.seq.conv.weight + /model/heads/head2/pose_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_stem/seq/conv/Conv || model.heads.head2.bbox_stem.seq.conv.weight + /model/heads/head2/bbox_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/bbox_stem/seq/conv/Conv
|
262 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.conv.conv.weight + /model/neck/neck4/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/conv/conv/Conv
|
263 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.reg_convs.0.seq.conv.weight + /model/heads/head2/reg_convs/reg_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv || model.heads.head2.cls_convs.0.seq.conv.weight + /model/heads/head2/cls_convs/cls_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv
|
264 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_convs.0.seq.conv.weight + /model/heads/head2/pose_convs/pose_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv
|
265 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.conv2.conv.weight + /model/neck/neck4/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/conv2/conv/Conv
|
266 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.conv1.conv.weight + /model/neck/neck4/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/conv1/conv/Conv
|
267 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.cls_pred.weight + /model/heads/head2/cls_pred/_weight_quantizer/QuantizeLinear + /model/heads/head2/cls_pred/Conv
|
268 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.reg_pred.weight + /model/heads/head2/reg_pred/_weight_quantizer/QuantizeLinear + /model/heads/head2/reg_pred/Conv
|
269 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_convs.1.seq.conv.weight + /model/heads/head2/pose_convs/pose_convs.1/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv
|
270 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/_input_quantizer/QuantizeLinear
|
271 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
272 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_pred.weight + /model/heads/head2/pose_pred/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_pred/Conv
|
273 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.0.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv
|
274 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
275 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.0.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv
|
276 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
277 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 1235) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
278 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/_input_quantizer/QuantizeLinear
|
279 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.1.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv
|
280 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.1.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv
|
281 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 1276) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
282 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/_input_quantizer/QuantizeLinear
|
283 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.2.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv
|
284 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.2.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv
|
285 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 1292) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
286 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/_input_quantizer/QuantizeLinear
|
287 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.3.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv
|
288 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.3.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv
|
289 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 1308) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
290 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.conv3.conv.weight + /model/neck/neck4/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/conv3/conv/Conv
|
291 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.bbox_stem.seq.conv.weight + /model/heads/head3/bbox_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/bbox_stem/seq/conv/Conv || model.heads.head3.pose_stem.seq.conv.weight + /model/heads/head3/pose_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_stem/seq/conv/Conv
|
292 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.reg_convs.0.seq.conv.weight + /model/heads/head3/reg_convs/reg_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv || model.heads.head3.cls_convs.0.seq.conv.weight + /model/heads/head3/cls_convs/cls_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv
|
293 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_convs.0.seq.conv.weight + /model/heads/head3/pose_convs/pose_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv
|
294 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.cls_pred.weight + /model/heads/head3/cls_pred/_weight_quantizer/QuantizeLinear + /model/heads/head3/cls_pred/Conv
|
295 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.reg_pred.weight + /model/heads/head3/reg_pred/_weight_quantizer/QuantizeLinear + /model/heads/head3/reg_pred/Conv
|
296 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_convs.1.seq.conv.weight + /model/heads/head3/pose_convs/pose_convs.1/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv
|
297 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
298 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_convs.2.seq.conv.weight + /model/heads/head3/pose_convs/pose_convs.2/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv
|
299 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
300 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_pred.weight + /model/heads/head3/pose_pred/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_pred/Conv
|
301 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
302 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1.../post_process/Reshape_2]}
|
303 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] NMS: batched_nms_274
|
304 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 1421) [NMS]_1_output[DevicetoShapeHostCopy]
|
305 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
306 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
307 |
+
[12/28/2023-19:27:47] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
308 |
+
[12/28/2023-19:28:00] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +418, now: CPU 1532, GPU 3937 (MiB)
|
309 |
+
[12/28/2023-19:28:02] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +83, GPU +79, now: CPU 1615, GPU 4016 (MiB)
|
310 |
+
[12/28/2023-19:28:02] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
311 |
+
[12/28/2023-20:15:51] [I] [TRT] Total Activation Memory: 7994521088
|
312 |
+
[12/28/2023-20:15:51] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
313 |
+
[12/28/2023-20:16:04] [I] [TRT] Total Host Persistent Memory: 355104
|
314 |
+
[12/28/2023-20:16:04] [I] [TRT] Total Device Persistent Memory: 38912
|
315 |
+
[12/28/2023-20:16:04] [I] [TRT] Total Scratch Memory: 134217728
|
316 |
+
[12/28/2023-20:16:04] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 264 MiB, GPU 454 MiB
|
317 |
+
[12/28/2023-20:16:04] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 188 steps to complete.
|
318 |
+
[12/28/2023-20:16:04] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 61.0389ms to assign 14 blocks to 188 nodes requiring 156376576 bytes.
|
319 |
+
[12/28/2023-20:16:04] [I] [TRT] Total Activation Memory: 156376576
|
320 |
+
[12/28/2023-20:16:09] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 2003, GPU 5524 (MiB)
|
321 |
+
[12/28/2023-20:16:09] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +52, GPU +64, now: CPU 52, GPU 64 (MiB)
|
322 |
+
[12/28/2023-20:16:09] [I] Engine built in 2915.03 sec.
|
323 |
+
[12/28/2023-20:16:09] [I] [TRT] Loaded engine size: 54 MiB
|
324 |
+
[12/28/2023-20:16:10] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1288, GPU 5322 (MiB)
|
325 |
+
[12/28/2023-20:16:10] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +52, now: CPU 0, GPU 52 (MiB)
|
326 |
+
[12/28/2023-20:16:10] [I] Engine deserialized in 0.222476 sec.
|
327 |
+
[12/28/2023-20:16:10] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1289, GPU 5322 (MiB)
|
328 |
+
[12/28/2023-20:16:10] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +149, now: CPU 0, GPU 201 (MiB)
|
329 |
+
[12/28/2023-20:16:10] [I] Setting persistentCacheLimit to 0 bytes.
|
330 |
+
[12/28/2023-20:16:10] [I] Using random values for input onnx::Cast_0
|
331 |
+
[12/28/2023-20:16:10] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
332 |
+
[12/28/2023-20:16:10] [I] Using random values for output graph2_flat_predictions
|
333 |
+
[12/28/2023-20:16:10] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
334 |
+
[12/28/2023-20:16:10] [I] Starting inference
|
335 |
+
[12/28/2023-20:16:25] [I] Warmup completed 7 queries over 200 ms
|
336 |
+
[12/28/2023-20:16:25] [I] Timing trace has 556 queries over 15.0394 s
|
337 |
+
[12/28/2023-20:16:25] [I]
|
338 |
+
[12/28/2023-20:16:25] [I] === Trace details ===
|
339 |
+
[12/28/2023-20:16:25] [I] Trace averages of 100 runs:
|
340 |
+
[12/28/2023-20:16:25] [I] Average on 100 runs - GPU latency: 27.1478 ms - Host latency: 27.2648 ms (enqueue 27.2126 ms)
|
341 |
+
[12/28/2023-20:16:25] [I] Average on 100 runs - GPU latency: 26.6955 ms - Host latency: 26.8082 ms (enqueue 26.7744 ms)
|
342 |
+
[12/28/2023-20:16:25] [I] Average on 100 runs - GPU latency: 27.0859 ms - Host latency: 27.1971 ms (enqueue 27.1502 ms)
|
343 |
+
[12/28/2023-20:16:25] [I] Average on 100 runs - GPU latency: 26.5486 ms - Host latency: 26.6622 ms (enqueue 26.6226 ms)
|
344 |
+
[12/28/2023-20:16:25] [I] Average on 100 runs - GPU latency: 26.938 ms - Host latency: 27.049 ms (enqueue 27.01 ms)
|
345 |
+
[12/28/2023-20:16:25] [I]
|
346 |
+
[12/28/2023-20:16:25] [I] === Performance summary ===
|
347 |
+
[12/28/2023-20:16:25] [I] Throughput: 36.9695 qps
|
348 |
+
[12/28/2023-20:16:25] [I] Latency: min = 24.9229 ms, max = 40.8822 ms, mean = 27.0196 ms, median = 26.4901 ms, percentile(90%) = 27.7676 ms, percentile(95%) = 29.9111 ms, percentile(99%) = 36.0352 ms
|
349 |
+
[12/28/2023-20:16:25] [I] Enqueue Time: min = 24.9536 ms, max = 40.8246 ms, mean = 26.9763 ms, median = 26.46 ms, percentile(90%) = 27.5393 ms, percentile(95%) = 30.0479 ms, percentile(99%) = 36.1467 ms
|
350 |
+
[12/28/2023-20:16:25] [I] H2D Latency: min = 0.0800781 ms, max = 0.117188 ms, mean = 0.0969461 ms, median = 0.0976562 ms, percentile(90%) = 0.100098 ms, percentile(95%) = 0.100586 ms, percentile(99%) = 0.101562 ms
|
351 |
+
[12/28/2023-20:16:25] [I] GPU Compute Time: min = 24.8271 ms, max = 40.7577 ms, mean = 26.9066 ms, median = 26.3784 ms, percentile(90%) = 27.6466 ms, percentile(95%) = 29.7852 ms, percentile(99%) = 35.9219 ms
|
352 |
+
[12/28/2023-20:16:25] [I] D2H Latency: min = 0.00292969 ms, max = 0.079834 ms, mean = 0.0159901 ms, median = 0.0146484 ms, percentile(90%) = 0.0258789 ms, percentile(95%) = 0.0291748 ms, percentile(99%) = 0.036377 ms
|
353 |
+
[12/28/2023-20:16:25] [I] Total Host Walltime: 15.0394 s
|
354 |
+
[12/28/2023-20:16:25] [I] Total GPU Compute Time: 14.9601 s
|
355 |
+
[12/28/2023-20:16:25] [I] Explanations of the performance metrics are printed in the verbose logs.
|
356 |
+
[12/28/2023-20:16:25] [I]
|
357 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.best.engine
|
yolo_nas_pose_l_int8.onnx.engine.err
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-19:27:20] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-19:27:20] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-19:27:24] [E] Error[4]: [network.cpp::validate::2922] Error Code 4: Internal Error (Int8 precision has been set for a layer or layer output, but int8 is not configured in the builder)
|
4 |
+
[12/28/2023-19:27:24] [E] Error[2]: [builder.cpp::buildSerializedNetwork::751] Error Code 2: Internal Error (Assertion engine != nullptr failed. )
|
5 |
+
[12/28/2023-19:27:24] [E] Engine could not be created from network
|
6 |
+
[12/28/2023-19:27:24] [E] Building engine failed
|
7 |
+
[12/28/2023-19:27:24] [E] Failed to create engine from model or file.
|
8 |
+
[12/28/2023-19:27:24] [E] Engine set up failed
|
yolo_nas_pose_l_int8.onnx.engine.log
ADDED
@@ -0,0 +1,91 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.engine
|
2 |
+
[12/28/2023-19:27:14] [I] === Model Options ===
|
3 |
+
[12/28/2023-19:27:14] [I] Format: ONNX
|
4 |
+
[12/28/2023-19:27:14] [I] Model: yolo_nas_pose_l_int8.onnx
|
5 |
+
[12/28/2023-19:27:14] [I] Output:
|
6 |
+
[12/28/2023-19:27:14] [I] === Build Options ===
|
7 |
+
[12/28/2023-19:27:14] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-19:27:14] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-19:27:14] [I] minTiming: 1
|
10 |
+
[12/28/2023-19:27:14] [I] avgTiming: 8
|
11 |
+
[12/28/2023-19:27:14] [I] Precision: FP32
|
12 |
+
[12/28/2023-19:27:14] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-19:27:14] [I] Calibration:
|
14 |
+
[12/28/2023-19:27:14] [I] Refit: Disabled
|
15 |
+
[12/28/2023-19:27:14] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-19:27:14] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-19:27:14] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-19:27:14] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-19:27:14] [I] Build only: Disabled
|
20 |
+
[12/28/2023-19:27:14] [I] Save engine: yolo_nas_pose_l_int8.onnx.engine
|
21 |
+
[12/28/2023-19:27:14] [I] Load engine:
|
22 |
+
[12/28/2023-19:27:14] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-19:27:14] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-19:27:14] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-19:27:14] [I] timingCacheFile:
|
26 |
+
[12/28/2023-19:27:14] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-19:27:14] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-19:27:14] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-19:27:14] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-19:27:14] [I] Input build shapes: model
|
31 |
+
[12/28/2023-19:27:14] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-19:27:14] [I] === System Options ===
|
33 |
+
[12/28/2023-19:27:14] [I] Device: 0
|
34 |
+
[12/28/2023-19:27:14] [I] DLACore:
|
35 |
+
[12/28/2023-19:27:14] [I] Plugins:
|
36 |
+
[12/28/2023-19:27:14] [I] === Inference Options ===
|
37 |
+
[12/28/2023-19:27:14] [I] Batch: Explicit
|
38 |
+
[12/28/2023-19:27:14] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-19:27:14] [I] Iterations: 10
|
40 |
+
[12/28/2023-19:27:14] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-19:27:14] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-19:27:14] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-19:27:14] [I] Streams: 1
|
44 |
+
[12/28/2023-19:27:14] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-19:27:14] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-19:27:14] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-19:27:14] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-19:27:14] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-19:27:14] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-19:27:14] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-19:27:14] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-19:27:14] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-19:27:14] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-19:27:14] [I] Inputs:
|
55 |
+
[12/28/2023-19:27:14] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-19:27:14] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-19:27:14] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-19:27:14] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-19:27:14] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-19:27:14] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-19:27:14] [I] Profile: Disabled
|
62 |
+
[12/28/2023-19:27:14] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-19:27:14] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-19:27:14] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-19:27:14] [I]
|
66 |
+
[12/28/2023-19:27:14] [I] === Device Information ===
|
67 |
+
[12/28/2023-19:27:14] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-19:27:14] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-19:27:14] [I] SMs: 8
|
70 |
+
[12/28/2023-19:27:14] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-19:27:14] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-19:27:14] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-19:27:14] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-19:27:14] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-19:27:14] [I]
|
76 |
+
[12/28/2023-19:27:14] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-19:27:14] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2835 (MiB)
|
78 |
+
[12/28/2023-19:27:17] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +286, now: CPU 574, GPU 3142 (MiB)
|
79 |
+
[12/28/2023-19:27:17] [I] Start parsing network model
|
80 |
+
[12/28/2023-19:27:20] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-19:27:20] [I] [TRT] Input filename: yolo_nas_pose_l_int8.onnx
|
82 |
+
[12/28/2023-19:27:20] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-19:27:20] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-19:27:20] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-19:27:20] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-19:27:20] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-19:27:20] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-19:27:20] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-19:27:20] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-19:27:24] [I] Finish parsing network model
|
91 |
+
&&&& FAILED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.engine
|
yolo_nas_pose_l_int8.onnx.fp16.engine.err
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-19:27:29] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-19:27:29] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-19:27:33] [E] Error[4]: [network.cpp::validate::2922] Error Code 4: Internal Error (Int8 precision has been set for a layer or layer output, but int8 is not configured in the builder)
|
4 |
+
[12/28/2023-19:27:33] [E] Error[2]: [builder.cpp::buildSerializedNetwork::751] Error Code 2: Internal Error (Assertion engine != nullptr failed. )
|
5 |
+
[12/28/2023-19:27:33] [E] Engine could not be created from network
|
6 |
+
[12/28/2023-19:27:33] [E] Building engine failed
|
7 |
+
[12/28/2023-19:27:33] [E] Failed to create engine from model or file.
|
8 |
+
[12/28/2023-19:27:33] [E] Engine set up failed
|
yolo_nas_pose_l_int8.onnx.fp16.engine.log
ADDED
@@ -0,0 +1,91 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.fp16.engine
|
2 |
+
[12/28/2023-19:27:25] [I] === Model Options ===
|
3 |
+
[12/28/2023-19:27:25] [I] Format: ONNX
|
4 |
+
[12/28/2023-19:27:25] [I] Model: yolo_nas_pose_l_int8.onnx
|
5 |
+
[12/28/2023-19:27:25] [I] Output:
|
6 |
+
[12/28/2023-19:27:25] [I] === Build Options ===
|
7 |
+
[12/28/2023-19:27:25] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-19:27:25] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-19:27:25] [I] minTiming: 1
|
10 |
+
[12/28/2023-19:27:25] [I] avgTiming: 8
|
11 |
+
[12/28/2023-19:27:25] [I] Precision: FP32+FP16
|
12 |
+
[12/28/2023-19:27:25] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-19:27:25] [I] Calibration:
|
14 |
+
[12/28/2023-19:27:25] [I] Refit: Disabled
|
15 |
+
[12/28/2023-19:27:25] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-19:27:25] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-19:27:25] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-19:27:25] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-19:27:25] [I] Build only: Disabled
|
20 |
+
[12/28/2023-19:27:25] [I] Save engine: yolo_nas_pose_l_int8.onnx.fp16.engine
|
21 |
+
[12/28/2023-19:27:25] [I] Load engine:
|
22 |
+
[12/28/2023-19:27:25] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-19:27:25] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-19:27:25] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-19:27:25] [I] timingCacheFile:
|
26 |
+
[12/28/2023-19:27:25] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-19:27:25] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-19:27:25] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-19:27:25] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-19:27:25] [I] Input build shapes: model
|
31 |
+
[12/28/2023-19:27:25] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-19:27:25] [I] === System Options ===
|
33 |
+
[12/28/2023-19:27:25] [I] Device: 0
|
34 |
+
[12/28/2023-19:27:25] [I] DLACore:
|
35 |
+
[12/28/2023-19:27:25] [I] Plugins:
|
36 |
+
[12/28/2023-19:27:25] [I] === Inference Options ===
|
37 |
+
[12/28/2023-19:27:25] [I] Batch: Explicit
|
38 |
+
[12/28/2023-19:27:25] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-19:27:25] [I] Iterations: 10
|
40 |
+
[12/28/2023-19:27:25] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-19:27:25] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-19:27:25] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-19:27:25] [I] Streams: 1
|
44 |
+
[12/28/2023-19:27:25] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-19:27:25] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-19:27:25] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-19:27:25] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-19:27:25] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-19:27:25] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-19:27:25] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-19:27:25] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-19:27:25] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-19:27:25] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-19:27:25] [I] Inputs:
|
55 |
+
[12/28/2023-19:27:25] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-19:27:25] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-19:27:25] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-19:27:25] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-19:27:25] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-19:27:25] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-19:27:25] [I] Profile: Disabled
|
62 |
+
[12/28/2023-19:27:25] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-19:27:25] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-19:27:25] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-19:27:25] [I]
|
66 |
+
[12/28/2023-19:27:25] [I] === Device Information ===
|
67 |
+
[12/28/2023-19:27:25] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-19:27:25] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-19:27:25] [I] SMs: 8
|
70 |
+
[12/28/2023-19:27:25] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-19:27:25] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-19:27:25] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-19:27:25] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-19:27:25] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-19:27:25] [I]
|
76 |
+
[12/28/2023-19:27:25] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-19:27:26] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2833 (MiB)
|
78 |
+
[12/28/2023-19:27:28] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +284, now: CPU 574, GPU 3139 (MiB)
|
79 |
+
[12/28/2023-19:27:28] [I] Start parsing network model
|
80 |
+
[12/28/2023-19:27:29] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-19:27:29] [I] [TRT] Input filename: yolo_nas_pose_l_int8.onnx
|
82 |
+
[12/28/2023-19:27:29] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-19:27:29] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-19:27:29] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-19:27:29] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-19:27:29] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-19:27:29] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-19:27:29] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-19:27:29] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-19:27:33] [I] Finish parsing network model
|
91 |
+
&&&& FAILED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.fp16.engine
|
yolo_nas_pose_l_int8.onnx.int8.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0437c2287a6331143c0b7181c0ce945e117b29eae0d9755f226919acbe4a8cff
|
3 |
+
size 57433967
|
yolo_nas_pose_l_int8.onnx.int8.engine.err
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-20:16:35] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-20:16:35] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-20:16:40] [W] [TRT] Calibrator won't be used in explicit precision mode. Use quantization aware training to generate network with Quantize/Dequantize nodes.
|
4 |
+
[12/28/2023-20:31:04] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
5 |
+
[12/28/2023-20:31:04] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
6 |
+
[12/28/2023-20:31:04] [W] * GPU compute time is unstable, with coefficient of variance = 6.47493%.
|
7 |
+
[12/28/2023-20:31:04] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_l_int8.onnx.int8.engine.log
ADDED
@@ -0,0 +1,357 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --int8 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.int8.engine
|
2 |
+
[12/28/2023-20:16:29] [I] === Model Options ===
|
3 |
+
[12/28/2023-20:16:29] [I] Format: ONNX
|
4 |
+
[12/28/2023-20:16:29] [I] Model: yolo_nas_pose_l_int8.onnx
|
5 |
+
[12/28/2023-20:16:29] [I] Output:
|
6 |
+
[12/28/2023-20:16:29] [I] === Build Options ===
|
7 |
+
[12/28/2023-20:16:29] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-20:16:29] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-20:16:29] [I] minTiming: 1
|
10 |
+
[12/28/2023-20:16:29] [I] avgTiming: 8
|
11 |
+
[12/28/2023-20:16:29] [I] Precision: FP32+INT8
|
12 |
+
[12/28/2023-20:16:29] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-20:16:29] [I] Calibration: Dynamic
|
14 |
+
[12/28/2023-20:16:29] [I] Refit: Disabled
|
15 |
+
[12/28/2023-20:16:29] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-20:16:29] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-20:16:29] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-20:16:29] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-20:16:29] [I] Build only: Disabled
|
20 |
+
[12/28/2023-20:16:29] [I] Save engine: yolo_nas_pose_l_int8.onnx.int8.engine
|
21 |
+
[12/28/2023-20:16:29] [I] Load engine:
|
22 |
+
[12/28/2023-20:16:29] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-20:16:29] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-20:16:29] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-20:16:29] [I] timingCacheFile:
|
26 |
+
[12/28/2023-20:16:29] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-20:16:29] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-20:16:29] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-20:16:29] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-20:16:29] [I] Input build shapes: model
|
31 |
+
[12/28/2023-20:16:29] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-20:16:29] [I] === System Options ===
|
33 |
+
[12/28/2023-20:16:29] [I] Device: 0
|
34 |
+
[12/28/2023-20:16:29] [I] DLACore:
|
35 |
+
[12/28/2023-20:16:29] [I] Plugins:
|
36 |
+
[12/28/2023-20:16:29] [I] === Inference Options ===
|
37 |
+
[12/28/2023-20:16:29] [I] Batch: Explicit
|
38 |
+
[12/28/2023-20:16:29] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-20:16:29] [I] Iterations: 10
|
40 |
+
[12/28/2023-20:16:29] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-20:16:29] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-20:16:29] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-20:16:29] [I] Streams: 1
|
44 |
+
[12/28/2023-20:16:29] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-20:16:29] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-20:16:29] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-20:16:29] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-20:16:29] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-20:16:29] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-20:16:29] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-20:16:29] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-20:16:29] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-20:16:29] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-20:16:29] [I] Inputs:
|
55 |
+
[12/28/2023-20:16:29] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-20:16:29] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-20:16:29] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-20:16:29] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-20:16:29] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-20:16:29] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-20:16:29] [I] Profile: Disabled
|
62 |
+
[12/28/2023-20:16:29] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-20:16:29] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-20:16:29] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-20:16:29] [I]
|
66 |
+
[12/28/2023-20:16:29] [I] === Device Information ===
|
67 |
+
[12/28/2023-20:16:29] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-20:16:29] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-20:16:29] [I] SMs: 8
|
70 |
+
[12/28/2023-20:16:29] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-20:16:29] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-20:16:29] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-20:16:29] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-20:16:29] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-20:16:29] [I]
|
76 |
+
[12/28/2023-20:16:29] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-20:16:29] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2967 (MiB)
|
78 |
+
[12/28/2023-20:16:33] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +283, now: CPU 574, GPU 3271 (MiB)
|
79 |
+
[12/28/2023-20:16:33] [I] Start parsing network model
|
80 |
+
[12/28/2023-20:16:35] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-20:16:35] [I] [TRT] Input filename: yolo_nas_pose_l_int8.onnx
|
82 |
+
[12/28/2023-20:16:35] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-20:16:35] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-20:16:35] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-20:16:35] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-20:16:35] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-20:16:35] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-20:16:35] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-20:16:35] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-20:16:40] [I] Finish parsing network model
|
91 |
+
[12/28/2023-20:16:40] [I] FP32 and INT8 precisions have been specified - more performance might be enabled by additionally specifying --fp16 or --best
|
92 |
+
[12/28/2023-20:16:45] [I] [TRT] ---------- Layers Running on DLA ----------
|
93 |
+
[12/28/2023-20:16:45] [I] [TRT] ---------- Layers Running on GPU ----------
|
94 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
95 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
96 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 1417) [Constant]
|
97 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 1418) [Constant]
|
98 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 1419) [Constant]
|
99 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stem/conv/rbr_reparam/_input_quantizer/QuantizeLinear
|
100 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stem.conv.rbr_reparam.weight + /model/backbone/stem/conv/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stem/conv/rbr_reparam/Conv
|
101 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.downsample.rbr_reparam.weight + /model/backbone/stage1/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/downsample/rbr_reparam/Conv
|
102 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.conv2.conv.weight + /model/backbone/stage1/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/conv2/conv/Conv
|
103 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.conv1.conv.weight + /model/backbone/stage1/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/conv1/conv/Conv
|
104 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
105 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
106 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
107 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 557) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
108 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
109 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
110 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
111 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 573) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
112 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
113 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
114 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage1.blocks.conv3.conv.weight + /model/backbone/stage1/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage1/blocks/conv3/conv/Conv
|
115 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.reduce_skip2.conv.weight + /model/neck/neck2/reduce_skip2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/reduce_skip2/conv/Conv
|
116 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.downsample.rbr_reparam.weight + /model/backbone/stage2/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/downsample/rbr_reparam/Conv
|
117 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.downsample.conv.weight + /model/neck/neck2/downsample/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/downsample/conv/Conv
|
118 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.conv2.conv.weight + /model/backbone/stage2/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/conv2/conv/Conv
|
119 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.conv1.conv.weight + /model/backbone/stage2/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/conv1/conv/Conv
|
120 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
121 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
122 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
123 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 620) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
124 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
125 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
126 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
127 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 636) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
128 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
129 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
130 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
131 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 652) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
132 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_2
|
133 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
134 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
135 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage2.blocks.conv3.conv.weight + /model/backbone/stage2/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage2/blocks/conv3/conv/Conv
|
136 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.reduce_skip2.conv.weight + /model/neck/neck1/reduce_skip2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/reduce_skip2/conv/Conv || model.neck.neck2.reduce_skip1.conv.weight + /model/neck/neck2/reduce_skip1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/reduce_skip1/conv/Conv
|
137 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.downsample.rbr_reparam.weight + /model/backbone/stage3/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/downsample/rbr_reparam/Conv
|
138 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.downsample.conv.weight + /model/neck/neck1/downsample/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/downsample/conv/Conv
|
139 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.conv2.conv.weight + /model/backbone/stage3/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/conv2/conv/Conv
|
140 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.conv1.conv.weight + /model/backbone/stage3/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/conv1/conv/Conv
|
141 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
142 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
143 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
144 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 702) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
145 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
146 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
147 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
148 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 718) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
149 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
150 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
151 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
152 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 734) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
153 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
154 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.3.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv
|
155 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.3.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv
|
156 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 750) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
157 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
158 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.4.cv1.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv
|
159 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.bottlenecks.4.cv2.rbr_reparam.weight + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv
|
160 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 766) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
161 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_4
|
162 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_2
|
163 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
164 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
165 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage3.blocks.conv3.conv.weight + /model/backbone/stage3/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage3/blocks/conv3/conv/Conv
|
166 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.reduce_skip1.conv.weight + /model/neck/neck1/reduce_skip1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/reduce_skip1/conv/Conv
|
167 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.downsample.rbr_reparam.weight + /model/backbone/stage4/downsample/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/downsample/rbr_reparam/Conv
|
168 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.conv2.conv.weight + /model/backbone/stage4/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/conv2/conv/Conv
|
169 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.conv1.conv.weight + /model/backbone/stage4/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/conv1/conv/Conv
|
170 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
171 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
172 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
173 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 806) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
174 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
175 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
176 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
177 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 822) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
178 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_1
|
179 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv3/conv/_input_quantizer/QuantizeLinear_clone_0
|
180 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.stage4.blocks.conv3.conv.weight + /model/backbone/stage4/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/backbone/stage4/blocks/conv3/conv/Conv
|
181 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.context_module.cv1.conv.weight + /model/backbone/context_module/cv1/conv/_weight_quantizer/QuantizeLinear + /model/backbone/context_module/cv1/conv/Conv
|
182 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
183 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
184 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
185 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/m.2/MaxPool_output_0 copy
|
186 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.backbone.context_module.cv2.conv.weight + /model/backbone/context_module/cv2/conv/_weight_quantizer/QuantizeLinear + /model/backbone/context_module/cv2/conv/Conv
|
187 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.conv.conv.weight + /model/neck/neck1/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/conv/conv/Conv
|
188 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] DECONVOLUTION: model.neck.neck1.upsample.weight + /model/neck/neck1/upsample/_weight_quantizer/QuantizeLinear + /model/neck/neck1/upsample/ConvTranspose
|
189 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.reduce_after_concat.conv.weight + /model/neck/neck1/reduce_after_concat/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/reduce_after_concat/conv/Conv
|
190 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.conv2.conv.weight + /model/neck/neck1/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/conv2/conv/Conv
|
191 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.conv1.conv.weight + /model/neck/neck1/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/conv1/conv/Conv
|
192 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
193 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
194 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
195 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 887) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
196 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
197 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
198 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
199 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 903) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
200 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
201 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
202 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
203 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.2.alpha + (Unnamed Layer* 919) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.2/Add)
|
204 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
205 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.3.cv1.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv
|
206 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.bottlenecks.3.cv2.rbr_reparam.weight + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv
|
207 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.3.alpha + (Unnamed Layer* 935) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.3/Add)
|
208 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck1.blocks.conv3.conv.weight + /model/neck/neck1/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck1/blocks/conv3/conv/Conv
|
209 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.conv.conv.weight + /model/neck/neck2/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/conv/conv/Conv
|
210 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] DECONVOLUTION: model.neck.neck2.upsample.weight + /model/neck/neck2/upsample/_weight_quantizer/QuantizeLinear + /model/neck/neck2/upsample/ConvTranspose
|
211 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/Concat_/model/neck/neck2/reduce_skip1/act/Relu_output_0_clone_1 copy
|
212 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.reduce_after_concat.conv.weight + /model/neck/neck2/reduce_after_concat/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/reduce_after_concat/conv/Conv
|
213 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.conv2.conv.weight + /model/neck/neck2/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/conv2/conv/Conv
|
214 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.conv1.conv.weight + /model/neck/neck2/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/conv1/conv/Conv
|
215 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
216 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.0.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv
|
217 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.0.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv
|
218 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 984) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
219 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
220 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.1.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv
|
221 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.1.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv
|
222 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 1000) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
223 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
224 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.2.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv
|
225 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.2.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv
|
226 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 1016) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
227 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_input_quantizer/QuantizeLinear
|
228 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.3.cv1.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv
|
229 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.bottlenecks.3.cv2.rbr_reparam.weight + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv
|
230 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.3.alpha + (Unnamed Layer* 1032) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.3/Add)
|
231 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck2.blocks.conv3.conv.weight + /model/neck/neck2/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck2/blocks/conv3/conv/Conv
|
232 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.bbox_stem.seq.conv.weight + /model/heads/head1/bbox_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/bbox_stem/seq/conv/Conv || model.heads.head1.pose_stem.seq.conv.weight + /model/heads/head1/pose_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_stem/seq/conv/Conv
|
233 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.conv.conv.weight + /model/neck/neck3/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/conv/conv/Conv
|
234 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.reg_convs.0.seq.conv.weight + /model/heads/head1/reg_convs/reg_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv || model.heads.head1.cls_convs.0.seq.conv.weight + /model/heads/head1/cls_convs/cls_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv
|
235 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.pose_convs.0.seq.conv.weight + /model/heads/head1/pose_convs/pose_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv
|
236 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.conv2.conv.weight + /model/neck/neck3/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/conv2/conv/Conv
|
237 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.conv1.conv.weight + /model/neck/neck3/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/conv1/conv/Conv
|
238 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.cls_pred.weight + /model/heads/head1/cls_pred/_weight_quantizer/QuantizeLinear + /model/heads/head1/cls_pred/Conv
|
239 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.reg_pred.weight + /model/heads/head1/reg_pred/_weight_quantizer/QuantizeLinear + /model/heads/head1/reg_pred/Conv
|
240 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.pose_convs.1.seq.conv.weight + /model/heads/head1/pose_convs/pose_convs.1/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv
|
241 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/_input_quantizer/QuantizeLinear
|
242 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
243 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head1.pose_pred.weight + /model/heads/head1/pose_pred/_weight_quantizer/QuantizeLinear + /model/heads/head1/pose_pred/Conv
|
244 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.0.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv
|
245 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
246 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.0.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv
|
247 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
248 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 1097) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
249 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/_input_quantizer/QuantizeLinear
|
250 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.1.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv
|
251 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.1.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv
|
252 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 1138) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
253 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/_input_quantizer/QuantizeLinear
|
254 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.2.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv
|
255 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.2.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv
|
256 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 1154) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.2/Add)
|
257 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/_input_quantizer/QuantizeLinear
|
258 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.3.cv1.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv
|
259 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.bottlenecks.3.cv2.conv.weight + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv
|
260 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 1170) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.3/Add)
|
261 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck3.blocks.conv3.conv.weight + /model/neck/neck3/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck3/blocks/conv3/conv/Conv
|
262 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_stem.seq.conv.weight + /model/heads/head2/pose_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_stem/seq/conv/Conv || model.heads.head2.bbox_stem.seq.conv.weight + /model/heads/head2/bbox_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/bbox_stem/seq/conv/Conv
|
263 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.conv.conv.weight + /model/neck/neck4/conv/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/conv/conv/Conv
|
264 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.reg_convs.0.seq.conv.weight + /model/heads/head2/reg_convs/reg_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv || model.heads.head2.cls_convs.0.seq.conv.weight + /model/heads/head2/cls_convs/cls_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv
|
265 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_convs.0.seq.conv.weight + /model/heads/head2/pose_convs/pose_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv
|
266 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.conv2.conv.weight + /model/neck/neck4/blocks/conv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/conv2/conv/Conv
|
267 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.conv1.conv.weight + /model/neck/neck4/blocks/conv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/conv1/conv/Conv
|
268 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.cls_pred.weight + /model/heads/head2/cls_pred/_weight_quantizer/QuantizeLinear + /model/heads/head2/cls_pred/Conv
|
269 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.reg_pred.weight + /model/heads/head2/reg_pred/_weight_quantizer/QuantizeLinear + /model/heads/head2/reg_pred/Conv
|
270 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_convs.1.seq.conv.weight + /model/heads/head2/pose_convs/pose_convs.1/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv
|
271 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/_input_quantizer/QuantizeLinear
|
272 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
273 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head2.pose_pred.weight + /model/heads/head2/pose_pred/_weight_quantizer/QuantizeLinear + /model/heads/head2/pose_pred/Conv
|
274 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.0.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv
|
275 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
276 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.0.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv
|
277 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
278 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 1235) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
279 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/_input_quantizer/QuantizeLinear
|
280 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.1.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv
|
281 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.1.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv
|
282 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 1276) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
283 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/_input_quantizer/QuantizeLinear
|
284 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.2.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv
|
285 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.2.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv
|
286 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 1292) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
287 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/_input_quantizer/QuantizeLinear
|
288 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.3.cv1.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv1/conv/Conv
|
289 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.bottlenecks.3.cv2.conv.weight + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/cv2/conv/Conv
|
290 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.3.alpha + (Unnamed Layer* 1308) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.3/Add)
|
291 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.neck.neck4.blocks.conv3.conv.weight + /model/neck/neck4/blocks/conv3/conv/_weight_quantizer/QuantizeLinear + /model/neck/neck4/blocks/conv3/conv/Conv
|
292 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.bbox_stem.seq.conv.weight + /model/heads/head3/bbox_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/bbox_stem/seq/conv/Conv || model.heads.head3.pose_stem.seq.conv.weight + /model/heads/head3/pose_stem/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_stem/seq/conv/Conv
|
293 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.reg_convs.0.seq.conv.weight + /model/heads/head3/reg_convs/reg_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv || model.heads.head3.cls_convs.0.seq.conv.weight + /model/heads/head3/cls_convs/cls_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv
|
294 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_convs.0.seq.conv.weight + /model/heads/head3/pose_convs/pose_convs.0/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv
|
295 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.cls_pred.weight + /model/heads/head3/cls_pred/_weight_quantizer/QuantizeLinear + /model/heads/head3/cls_pred/Conv
|
296 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.reg_pred.weight + /model/heads/head3/reg_pred/_weight_quantizer/QuantizeLinear + /model/heads/head3/reg_pred/Conv
|
297 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_convs.1.seq.conv.weight + /model/heads/head3/pose_convs/pose_convs.1/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv
|
298 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
299 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_convs.2.seq.conv.weight + /model/heads/head3/pose_convs/pose_convs.2/seq/conv/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv
|
300 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
301 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: model.heads.head3.pose_pred.weight + /model/heads/head3/pose_pred/_weight_quantizer/QuantizeLinear + /model/heads/head3/pose_pred/Conv
|
302 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
303 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1.../post_process/Reshape_2]}
|
304 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] NMS: batched_nms_274
|
305 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 1421) [NMS]_1_output[DevicetoShapeHostCopy]
|
306 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
307 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
308 |
+
[12/28/2023-20:16:45] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
309 |
+
[12/28/2023-20:16:46] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +481, now: CPU 1532, GPU 4180 (MiB)
|
310 |
+
[12/28/2023-20:16:47] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +83, GPU +76, now: CPU 1615, GPU 4256 (MiB)
|
311 |
+
[12/28/2023-20:16:47] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
312 |
+
[12/28/2023-20:30:40] [I] [TRT] Total Activation Memory: 8076738048
|
313 |
+
[12/28/2023-20:30:40] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
314 |
+
[12/28/2023-20:30:46] [I] [TRT] Total Host Persistent Memory: 355104
|
315 |
+
[12/28/2023-20:30:46] [I] [TRT] Total Device Persistent Memory: 38912
|
316 |
+
[12/28/2023-20:30:46] [I] [TRT] Total Scratch Memory: 134217728
|
317 |
+
[12/28/2023-20:30:46] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 264 MiB, GPU 132 MiB
|
318 |
+
[12/28/2023-20:30:46] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 194 steps to complete.
|
319 |
+
[12/28/2023-20:30:46] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 71.4503ms to assign 13 blocks to 194 nodes requiring 183278080 bytes.
|
320 |
+
[12/28/2023-20:30:46] [I] [TRT] Total Activation Memory: 183278080
|
321 |
+
[12/28/2023-20:30:48] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +1, GPU +7, now: CPU 2003, GPU 5811 (MiB)
|
322 |
+
[12/28/2023-20:30:48] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +52, GPU +64, now: CPU 52, GPU 64 (MiB)
|
323 |
+
[12/28/2023-20:30:48] [I] Engine built in 859.207 sec.
|
324 |
+
[12/28/2023-20:30:48] [I] [TRT] Loaded engine size: 54 MiB
|
325 |
+
[12/28/2023-20:30:48] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +11, now: CPU 1289, GPU 5551 (MiB)
|
326 |
+
[12/28/2023-20:30:48] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +52, now: CPU 0, GPU 52 (MiB)
|
327 |
+
[12/28/2023-20:30:48] [I] Engine deserialized in 0.183216 sec.
|
328 |
+
[12/28/2023-20:30:49] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +6, now: CPU 1289, GPU 5551 (MiB)
|
329 |
+
[12/28/2023-20:30:49] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +175, now: CPU 0, GPU 227 (MiB)
|
330 |
+
[12/28/2023-20:30:49] [I] Setting persistentCacheLimit to 0 bytes.
|
331 |
+
[12/28/2023-20:30:49] [I] Using random values for input onnx::Cast_0
|
332 |
+
[12/28/2023-20:30:49] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
333 |
+
[12/28/2023-20:30:49] [I] Using random values for output graph2_flat_predictions
|
334 |
+
[12/28/2023-20:30:49] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
335 |
+
[12/28/2023-20:30:49] [I] Starting inference
|
336 |
+
[12/28/2023-20:31:04] [I] Warmup completed 5 queries over 200 ms
|
337 |
+
[12/28/2023-20:31:04] [I] Timing trace has 467 queries over 15.0803 s
|
338 |
+
[12/28/2023-20:31:04] [I]
|
339 |
+
[12/28/2023-20:31:04] [I] === Trace details ===
|
340 |
+
[12/28/2023-20:31:04] [I] Trace averages of 100 runs:
|
341 |
+
[12/28/2023-20:31:04] [I] Average on 100 runs - GPU latency: 32.4935 ms - Host latency: 32.6124 ms (enqueue 32.5531 ms)
|
342 |
+
[12/28/2023-20:31:04] [I] Average on 100 runs - GPU latency: 32.0289 ms - Host latency: 32.1442 ms (enqueue 32.092 ms)
|
343 |
+
[12/28/2023-20:31:04] [I] Average on 100 runs - GPU latency: 31.9715 ms - Host latency: 32.0855 ms (enqueue 32.0299 ms)
|
344 |
+
[12/28/2023-20:31:04] [I] Average on 100 runs - GPU latency: 32.1741 ms - Host latency: 32.2872 ms (enqueue 32.2448 ms)
|
345 |
+
[12/28/2023-20:31:04] [I]
|
346 |
+
[12/28/2023-20:31:04] [I] === Performance summary ===
|
347 |
+
[12/28/2023-20:31:04] [I] Throughput: 30.9676 qps
|
348 |
+
[12/28/2023-20:31:04] [I] Latency: min = 29.5527 ms, max = 48.669 ms, mean = 32.255 ms, median = 31.8447 ms, percentile(90%) = 33.2435 ms, percentile(95%) = 35.3904 ms, percentile(99%) = 42.4307 ms
|
349 |
+
[12/28/2023-20:31:04] [I] Enqueue Time: min = 29.5156 ms, max = 48.6032 ms, mean = 32.204 ms, median = 31.8164 ms, percentile(90%) = 32.9639 ms, percentile(95%) = 35.3633 ms, percentile(99%) = 42.3721 ms
|
350 |
+
[12/28/2023-20:31:04] [I] H2D Latency: min = 0.0800781 ms, max = 0.116211 ms, mean = 0.0943801 ms, median = 0.0952148 ms, percentile(90%) = 0.0976562 ms, percentile(95%) = 0.0981445 ms, percentile(99%) = 0.107422 ms
|
351 |
+
[12/28/2023-20:31:04] [I] GPU Compute Time: min = 29.4414 ms, max = 48.5475 ms, mean = 32.1403 ms, median = 31.7275 ms, percentile(90%) = 33.1393 ms, percentile(95%) = 35.2798 ms, percentile(99%) = 42.3066 ms
|
352 |
+
[12/28/2023-20:31:04] [I] D2H Latency: min = 0.00292969 ms, max = 0.0655518 ms, mean = 0.0203297 ms, median = 0.0205078 ms, percentile(90%) = 0.0288086 ms, percentile(95%) = 0.03125 ms, percentile(99%) = 0.0375977 ms
|
353 |
+
[12/28/2023-20:31:04] [I] Total Host Walltime: 15.0803 s
|
354 |
+
[12/28/2023-20:31:04] [I] Total GPU Compute Time: 15.0095 s
|
355 |
+
[12/28/2023-20:31:04] [I] Explanations of the performance metrics are printed in the verbose logs.
|
356 |
+
[12/28/2023-20:31:04] [I]
|
357 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_l_int8.onnx --int8 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_l_int8.onnx.int8.engine
|
yolo_nas_pose_l_int8.onnx.usage.txt
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
Model exported successfully to yolo_nas_pose_l_int8.onnx
|
3 |
+
Model expects input image of shape [1, 3, 640, 640]
|
4 |
+
Input image dtype is torch.uint8
|
5 |
+
|
6 |
+
Exported model already contains preprocessing (normalization) step, so you don't need to do it manually.
|
7 |
+
Preprocessing steps to be applied to input image are:
|
8 |
+
Sequential(
|
9 |
+
(0): CastTensorTo(dtype=torch.float32)
|
10 |
+
(1): ChannelSelect(channels_indexes=tensor([2, 1, 0]))
|
11 |
+
(2): ApplyMeanStd(mean=[0.], scale=[255.])
|
12 |
+
)
|
13 |
+
|
14 |
+
|
15 |
+
Exported model contains postprocessing (NMS) step with the following parameters:
|
16 |
+
num_pre_nms_predictions=1000
|
17 |
+
max_predictions_per_image=10
|
18 |
+
nms_threshold=0.5
|
19 |
+
confidence_threshold=0.15
|
20 |
+
output_predictions_format=flat
|
21 |
+
|
22 |
+
|
23 |
+
Exported model is in ONNX format and can be used with ONNXRuntime
|
24 |
+
To run inference with ONNXRuntime, please use the following code snippet:
|
25 |
+
|
26 |
+
import onnxruntime
|
27 |
+
import numpy as np
|
28 |
+
session = onnxruntime.InferenceSession("yolo_nas_pose_l_int8.onnx", providers=["CUDAExecutionProvider", "CPUExecutionProvider"])
|
29 |
+
inputs = [o.name for o in session.get_inputs()]
|
30 |
+
outputs = [o.name for o in session.get_outputs()]
|
31 |
+
|
32 |
+
example_input_image = np.zeros((1, 3, 640, 640)).astype(np.uint8)
|
33 |
+
predictions = session.run(outputs, {inputs[0]: example_input_image})
|
34 |
+
|
35 |
+
Exported model can also be used with TensorRT
|
36 |
+
To run inference with TensorRT, please see TensorRT deployment documentation
|
37 |
+
You can benchmark the model using the following code snippet:
|
38 |
+
|
39 |
+
trtexec --onnx=yolo_nas_pose_l_int8.onnx --int8 --avgRuns=100 --duration=15
|
40 |
+
|
41 |
+
|
42 |
+
Exported model has predictions in flat format:
|
43 |
+
|
44 |
+
# flat_predictions is a 2D array of [N,K] shape
|
45 |
+
# Each row represents (image_index, x_min, y_min, x_max, y_max, confidence, joints...)
|
46 |
+
# Please note all values are floats, so you have to convert them to integers if needed
|
47 |
+
|
48 |
+
[flat_predictions] = predictions
|
49 |
+
pred_bboxes = flat_predictions[:, 1:5]
|
50 |
+
pred_scores = flat_predictions[:, 5]
|
51 |
+
pred_joints = flat_predictions[:, 6:].reshape((len(pred_bboxes), -1, 3))
|
52 |
+
for i in range(len(pred_bboxes)):
|
53 |
+
confidence = pred_scores[i]
|
54 |
+
x_min, y_min, x_max, y_max = pred_bboxes[i]
|
55 |
+
print(f"Detected pose with confidence={confidence}, x_min={x_min}, y_min={y_min}, x_max={x_max}, y_max={y_max}")
|
56 |
+
for joint_index, (x, y, confidence) in enumerate(pred_joints[i]):
|
57 |
+
print(f"Joint {joint_index} has coordinates x={x}, y={y}, confidence={confidence}")
|
58 |
+
|
yolo_nas_pose_m_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7674809abd50d8acbab6500f1b7ad6cb0103539e6102066d7695160b9b0f8413
|
3 |
+
size 78063545
|
yolo_nas_pose_m_fp16.onnx.best.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d694deef0e1f970fb285d669185a1984b38cb587324b7c380b896a02794431ae
|
3 |
+
size 41498155
|
yolo_nas_pose_m_fp16.onnx.best.engine.err
ADDED
@@ -0,0 +1,406 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-08:45:30] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-08:45:30] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-08:45:30] [W] [TRT] Calibrator is not being used. Users must provide dynamic range for all tensors that are not Int32 or Bool.
|
4 |
+
[12/28/2023-09:13:06] [W] [TRT] Tactic Device request: 6262MB Available: 3108MB. Device memory is insufficient to use tactic.
|
5 |
+
[12/28/2023-09:13:07] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6262 detected for tactic 0x0000000000000004.
|
6 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
7 |
+
[12/28/2023-09:13:07] [W] [TRT] Tactic Device request: 6262MB Available: 3107MB. Device memory is insufficient to use tactic.
|
8 |
+
[12/28/2023-09:13:07] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6262 detected for tactic 0x000000000000003c.
|
9 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
10 |
+
[12/28/2023-09:13:07] [W] [TRT] Tactic Device request: 6262MB Available: 3106MB. Device memory is insufficient to use tactic.
|
11 |
+
[12/28/2023-09:13:07] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6262 detected for tactic 0x0000000000000074.
|
12 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
13 |
+
[12/28/2023-09:13:09] [W] [TRT] Tactic Device request: 6251MB Available: 3131MB. Device memory is insufficient to use tactic.
|
14 |
+
[12/28/2023-09:13:09] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6251 detected for tactic 0x0000000000000004.
|
15 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
16 |
+
[12/28/2023-09:13:09] [W] [TRT] Tactic Device request: 6251MB Available: 3131MB. Device memory is insufficient to use tactic.
|
17 |
+
[12/28/2023-09:13:09] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6251 detected for tactic 0x000000000000003c.
|
18 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
19 |
+
[12/28/2023-09:21:25] [W] [TRT] Tactic Device request: 4711MB Available: 2436MB. Device memory is insufficient to use tactic.
|
20 |
+
[12/28/2023-09:21:25] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
21 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
22 |
+
[12/28/2023-09:21:25] [W] [TRT] Tactic Device request: 4711MB Available: 2436MB. Device memory is insufficient to use tactic.
|
23 |
+
[12/28/2023-09:21:26] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
24 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
25 |
+
[12/28/2023-09:21:26] [W] [TRT] Tactic Device request: 4711MB Available: 2437MB. Device memory is insufficient to use tactic.
|
26 |
+
[12/28/2023-09:21:26] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
27 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
28 |
+
[12/28/2023-09:21:27] [W] [TRT] Tactic Device request: 4701MB Available: 2436MB. Device memory is insufficient to use tactic.
|
29 |
+
[12/28/2023-09:21:27] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4701 detected for tactic 0x0000000000000004.
|
30 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
31 |
+
[12/28/2023-09:21:27] [W] [TRT] Tactic Device request: 4701MB Available: 2436MB. Device memory is insufficient to use tactic.
|
32 |
+
[12/28/2023-09:21:27] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4701 detected for tactic 0x000000000000003c.
|
33 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
34 |
+
[12/28/2023-09:21:47] [W] [TRT] Tactic Device request: 6275MB Available: 2435MB. Device memory is insufficient to use tactic.
|
35 |
+
[12/28/2023-09:21:47] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
36 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
37 |
+
[12/28/2023-09:21:47] [W] [TRT] Tactic Device request: 6275MB Available: 2435MB. Device memory is insufficient to use tactic.
|
38 |
+
[12/28/2023-09:21:47] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
39 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
40 |
+
[12/28/2023-09:21:47] [W] [TRT] Tactic Device request: 6275MB Available: 2435MB. Device memory is insufficient to use tactic.
|
41 |
+
[12/28/2023-09:21:47] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
42 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
43 |
+
[12/28/2023-09:21:49] [W] [TRT] Tactic Device request: 6270MB Available: 2436MB. Device memory is insufficient to use tactic.
|
44 |
+
[12/28/2023-09:21:49] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6270 detected for tactic 0x0000000000000004.
|
45 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
46 |
+
[12/28/2023-09:21:49] [W] [TRT] Tactic Device request: 6270MB Available: 2436MB. Device memory is insufficient to use tactic.
|
47 |
+
[12/28/2023-09:21:49] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6270 detected for tactic 0x000000000000003c.
|
48 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
49 |
+
[12/28/2023-09:32:33] [W] [TRT] Tactic Device request: 7056MB Available: 2270MB. Device memory is insufficient to use tactic.
|
50 |
+
[12/28/2023-09:32:33] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
51 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
52 |
+
[12/28/2023-09:32:33] [W] [TRT] Tactic Device request: 7056MB Available: 2270MB. Device memory is insufficient to use tactic.
|
53 |
+
[12/28/2023-09:32:33] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
54 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
55 |
+
[12/28/2023-09:32:33] [W] [TRT] Tactic Device request: 7056MB Available: 2270MB. Device memory is insufficient to use tactic.
|
56 |
+
[12/28/2023-09:32:33] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
57 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
58 |
+
[12/28/2023-09:32:35] [W] [TRT] Tactic Device request: 7050MB Available: 2269MB. Device memory is insufficient to use tactic.
|
59 |
+
[12/28/2023-09:32:35] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7050 detected for tactic 0x0000000000000004.
|
60 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
61 |
+
[12/28/2023-09:32:35] [W] [TRT] Tactic Device request: 7050MB Available: 2269MB. Device memory is insufficient to use tactic.
|
62 |
+
[12/28/2023-09:32:35] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 7050 detected for tactic 0x000000000000003c.
|
63 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
64 |
+
[12/28/2023-09:32:56] [W] [TRT] Tactic Device request: 6354MB Available: 2266MB. Device memory is insufficient to use tactic.
|
65 |
+
[12/28/2023-09:32:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
66 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
67 |
+
[12/28/2023-09:32:56] [W] [TRT] Tactic Device request: 6354MB Available: 2266MB. Device memory is insufficient to use tactic.
|
68 |
+
[12/28/2023-09:32:56] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
69 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
70 |
+
[12/28/2023-09:32:56] [W] [TRT] Tactic Device request: 6354MB Available: 2267MB. Device memory is insufficient to use tactic.
|
71 |
+
[12/28/2023-09:32:56] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
72 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
73 |
+
[12/28/2023-09:32:58] [W] [TRT] Tactic Device request: 6351MB Available: 2267MB. Device memory is insufficient to use tactic.
|
74 |
+
[12/28/2023-09:32:58] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6351 detected for tactic 0x0000000000000004.
|
75 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
76 |
+
[12/28/2023-09:32:58] [W] [TRT] Tactic Device request: 6351MB Available: 2267MB. Device memory is insufficient to use tactic.
|
77 |
+
[12/28/2023-09:32:58] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6351 detected for tactic 0x000000000000003c.
|
78 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
79 |
+
[12/28/2023-09:47:49] [W] [TRT] Tactic Device request: 2394MB Available: 2107MB. Device memory is insufficient to use tactic.
|
80 |
+
[12/28/2023-09:47:50] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2394 detected for tactic 0x000000000000003c.
|
81 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
82 |
+
[12/28/2023-09:47:50] [W] [TRT] Tactic Device request: 2394MB Available: 2107MB. Device memory is insufficient to use tactic.
|
83 |
+
[12/28/2023-09:47:50] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000074.
|
84 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
85 |
+
[12/28/2023-09:47:50] [W] [TRT] Tactic Device request: 2392MB Available: 2105MB. Device memory is insufficient to use tactic.
|
86 |
+
[12/28/2023-09:47:50] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000004.
|
87 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
88 |
+
[12/28/2023-09:47:51] [W] [TRT] Tactic Device request: 2392MB Available: 2105MB. Device memory is insufficient to use tactic.
|
89 |
+
[12/28/2023-09:47:51] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2392 detected for tactic 0x000000000000003c.
|
90 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
91 |
+
[12/28/2023-09:47:51] [W] [TRT] Tactic Device request: 2392MB Available: 2105MB. Device memory is insufficient to use tactic.
|
92 |
+
[12/28/2023-09:47:51] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000074.
|
93 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
94 |
+
[12/28/2023-09:47:52] [W] [TRT] Tactic Device request: 2391MB Available: 2105MB. Device memory is insufficient to use tactic.
|
95 |
+
[12/28/2023-09:47:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2391 detected for tactic 0x0000000000000004.
|
96 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
97 |
+
[12/28/2023-09:47:52] [W] [TRT] Tactic Device request: 2391MB Available: 2105MB. Device memory is insufficient to use tactic.
|
98 |
+
[12/28/2023-09:47:52] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2391 detected for tactic 0x000000000000003c.
|
99 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
100 |
+
[12/28/2023-09:47:52] [W] [TRT] Tactic Device request: 2390MB Available: 2105MB. Device memory is insufficient to use tactic.
|
101 |
+
[12/28/2023-09:47:52] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000004.
|
102 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
103 |
+
[12/28/2023-09:47:52] [W] [TRT] Tactic Device request: 2390MB Available: 2105MB. Device memory is insufficient to use tactic.
|
104 |
+
[12/28/2023-09:47:52] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2390 detected for tactic 0x000000000000003c.
|
105 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
106 |
+
[12/28/2023-09:48:10] [W] [TRT] Tactic Device request: 4906MB Available: 2087MB. Device memory is insufficient to use tactic.
|
107 |
+
[12/28/2023-09:48:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4906 detected for tactic 0x0000000000000004.
|
108 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
109 |
+
[12/28/2023-09:48:10] [W] [TRT] Tactic Device request: 4906MB Available: 2087MB. Device memory is insufficient to use tactic.
|
110 |
+
[12/28/2023-09:48:10] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4906 detected for tactic 0x000000000000003c.
|
111 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
112 |
+
[12/28/2023-09:48:10] [W] [TRT] Tactic Device request: 4906MB Available: 2087MB. Device memory is insufficient to use tactic.
|
113 |
+
[12/28/2023-09:48:10] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4906 detected for tactic 0x0000000000000074.
|
114 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
115 |
+
[12/28/2023-09:48:12] [W] [TRT] Tactic Device request: 4905MB Available: 2088MB. Device memory is insufficient to use tactic.
|
116 |
+
[12/28/2023-09:48:12] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4905 detected for tactic 0x0000000000000004.
|
117 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
118 |
+
[12/28/2023-09:48:12] [W] [TRT] Tactic Device request: 4905MB Available: 2088MB. Device memory is insufficient to use tactic.
|
119 |
+
[12/28/2023-09:48:12] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4905 detected for tactic 0x000000000000003c.
|
120 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
121 |
+
[12/28/2023-09:56:12] [W] [TRT] Tactic Device request: 4906MB Available: 1978MB. Device memory is insufficient to use tactic.
|
122 |
+
[12/28/2023-09:56:12] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4906 detected for tactic 0x0000000000000004.
|
123 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
124 |
+
[12/28/2023-09:56:12] [W] [TRT] Tactic Device request: 4906MB Available: 1978MB. Device memory is insufficient to use tactic.
|
125 |
+
[12/28/2023-09:56:12] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4906 detected for tactic 0x000000000000003c.
|
126 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
127 |
+
[12/28/2023-09:56:12] [W] [TRT] Tactic Device request: 4906MB Available: 1978MB. Device memory is insufficient to use tactic.
|
128 |
+
[12/28/2023-09:56:12] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4906 detected for tactic 0x0000000000000074.
|
129 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
130 |
+
[12/28/2023-09:56:13] [W] [TRT] Tactic Device request: 4905MB Available: 1977MB. Device memory is insufficient to use tactic.
|
131 |
+
[12/28/2023-09:56:14] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4905 detected for tactic 0x0000000000000004.
|
132 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
133 |
+
[12/28/2023-09:56:14] [W] [TRT] Tactic Device request: 4905MB Available: 1977MB. Device memory is insufficient to use tactic.
|
134 |
+
[12/28/2023-09:56:14] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4905 detected for tactic 0x000000000000003c.
|
135 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
136 |
+
[12/28/2023-09:56:16] [W] [TRT] Tactic Device request: 2457MB Available: 1978MB. Device memory is insufficient to use tactic.
|
137 |
+
[12/28/2023-09:56:16] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000004.
|
138 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
139 |
+
[12/28/2023-09:56:16] [W] [TRT] Tactic Device request: 2457MB Available: 1977MB. Device memory is insufficient to use tactic.
|
140 |
+
[12/28/2023-09:56:16] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
141 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
142 |
+
[12/28/2023-09:56:16] [W] [TRT] Tactic Device request: 2457MB Available: 1978MB. Device memory is insufficient to use tactic.
|
143 |
+
[12/28/2023-09:56:16] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
144 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
145 |
+
[12/28/2023-09:56:18] [W] [TRT] Tactic Device request: 2456MB Available: 1978MB. Device memory is insufficient to use tactic.
|
146 |
+
[12/28/2023-09:56:18] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2456 detected for tactic 0x0000000000000004.
|
147 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
148 |
+
[12/28/2023-09:56:18] [W] [TRT] Tactic Device request: 2456MB Available: 1978MB. Device memory is insufficient to use tactic.
|
149 |
+
[12/28/2023-09:56:18] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2456 detected for tactic 0x000000000000003c.
|
150 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
151 |
+
[12/28/2023-09:56:46] [W] [TRT] Tactic Device request: 3587MB Available: 1952MB. Device memory is insufficient to use tactic.
|
152 |
+
[12/28/2023-09:56:46] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
153 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
154 |
+
[12/28/2023-09:56:46] [W] [TRT] Tactic Device request: 3587MB Available: 1952MB. Device memory is insufficient to use tactic.
|
155 |
+
[12/28/2023-09:56:46] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
156 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
157 |
+
[12/28/2023-09:56:46] [W] [TRT] Tactic Device request: 3587MB Available: 1952MB. Device memory is insufficient to use tactic.
|
158 |
+
[12/28/2023-09:56:46] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
159 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
160 |
+
[12/28/2023-09:56:47] [W] [TRT] Tactic Device request: 3585MB Available: 1951MB. Device memory is insufficient to use tactic.
|
161 |
+
[12/28/2023-09:56:47] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3585 detected for tactic 0x0000000000000004.
|
162 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
163 |
+
[12/28/2023-09:56:47] [W] [TRT] Tactic Device request: 3585MB Available: 1951MB. Device memory is insufficient to use tactic.
|
164 |
+
[12/28/2023-09:56:47] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3585 detected for tactic 0x000000000000003c.
|
165 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
166 |
+
[12/28/2023-09:56:49] [W] [TRT] Tactic Device request: 2385MB Available: 1949MB. Device memory is insufficient to use tactic.
|
167 |
+
[12/28/2023-09:56:49] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2385 detected for tactic 0x0000000000000004.
|
168 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
169 |
+
[12/28/2023-09:56:49] [W] [TRT] Tactic Device request: 2385MB Available: 1949MB. Device memory is insufficient to use tactic.
|
170 |
+
[12/28/2023-09:56:49] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2385 detected for tactic 0x000000000000003c.
|
171 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
172 |
+
[12/28/2023-09:56:49] [W] [TRT] Tactic Device request: 2385MB Available: 1949MB. Device memory is insufficient to use tactic.
|
173 |
+
[12/28/2023-09:56:49] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2385 detected for tactic 0x0000000000000074.
|
174 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
175 |
+
[12/28/2023-09:56:50] [W] [TRT] Tactic Device request: 2384MB Available: 1950MB. Device memory is insufficient to use tactic.
|
176 |
+
[12/28/2023-09:56:50] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2384 detected for tactic 0x0000000000000004.
|
177 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
178 |
+
[12/28/2023-09:56:50] [W] [TRT] Tactic Device request: 2384MB Available: 1950MB. Device memory is insufficient to use tactic.
|
179 |
+
[12/28/2023-09:56:50] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2384 detected for tactic 0x000000000000003c.
|
180 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
181 |
+
[12/28/2023-10:05:05] [W] [TRT] Tactic Device request: 3556MB Available: 1897MB. Device memory is insufficient to use tactic.
|
182 |
+
[12/28/2023-10:05:05] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
183 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
184 |
+
[12/28/2023-10:05:05] [W] [TRT] Tactic Device request: 3556MB Available: 1897MB. Device memory is insufficient to use tactic.
|
185 |
+
[12/28/2023-10:05:05] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
186 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
187 |
+
[12/28/2023-10:05:05] [W] [TRT] Tactic Device request: 3556MB Available: 1897MB. Device memory is insufficient to use tactic.
|
188 |
+
[12/28/2023-10:05:05] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
189 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
190 |
+
[12/28/2023-10:05:06] [W] [TRT] Tactic Device request: 3551MB Available: 1897MB. Device memory is insufficient to use tactic.
|
191 |
+
[12/28/2023-10:05:06] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3551 detected for tactic 0x0000000000000004.
|
192 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
193 |
+
[12/28/2023-10:05:06] [W] [TRT] Tactic Device request: 3551MB Available: 1897MB. Device memory is insufficient to use tactic.
|
194 |
+
[12/28/2023-10:05:06] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3551 detected for tactic 0x000000000000003c.
|
195 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
196 |
+
[12/28/2023-10:15:43] [W] [TRT] Tactic Device request: 2359MB Available: 1749MB. Device memory is insufficient to use tactic.
|
197 |
+
[12/28/2023-10:15:43] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000004.
|
198 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
199 |
+
[12/28/2023-10:15:43] [W] [TRT] Tactic Device request: 2359MB Available: 1749MB. Device memory is insufficient to use tactic.
|
200 |
+
[12/28/2023-10:15:43] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2359 detected for tactic 0x000000000000003c.
|
201 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
202 |
+
[12/28/2023-10:15:43] [W] [TRT] Tactic Device request: 2359MB Available: 1749MB. Device memory is insufficient to use tactic.
|
203 |
+
[12/28/2023-10:15:43] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000074.
|
204 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
205 |
+
[12/28/2023-10:15:44] [W] [TRT] Tactic Device request: 2355MB Available: 1749MB. Device memory is insufficient to use tactic.
|
206 |
+
[12/28/2023-10:15:44] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2355 detected for tactic 0x0000000000000004.
|
207 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
208 |
+
[12/28/2023-10:15:44] [W] [TRT] Tactic Device request: 2355MB Available: 1749MB. Device memory is insufficient to use tactic.
|
209 |
+
[12/28/2023-10:15:44] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2355 detected for tactic 0x000000000000003c.
|
210 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
211 |
+
[12/28/2023-10:15:51] [W] [TRT] Tactic Device request: 2362MB Available: 1754MB. Device memory is insufficient to use tactic.
|
212 |
+
[12/28/2023-10:15:51] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2362 detected for tactic 0x0000000000000004.
|
213 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
214 |
+
[12/28/2023-10:15:51] [W] [TRT] Tactic Device request: 2362MB Available: 1754MB. Device memory is insufficient to use tactic.
|
215 |
+
[12/28/2023-10:15:51] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2362 detected for tactic 0x000000000000003c.
|
216 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
217 |
+
[12/28/2023-10:15:51] [W] [TRT] Tactic Device request: 2362MB Available: 1754MB. Device memory is insufficient to use tactic.
|
218 |
+
[12/28/2023-10:15:51] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2362 detected for tactic 0x0000000000000074.
|
219 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
220 |
+
[12/28/2023-10:15:54] [W] [TRT] Tactic Device request: 2357MB Available: 1752MB. Device memory is insufficient to use tactic.
|
221 |
+
[12/28/2023-10:15:54] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2357 detected for tactic 0x0000000000000004.
|
222 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
223 |
+
[12/28/2023-10:15:54] [W] [TRT] Tactic Device request: 2357MB Available: 1752MB. Device memory is insufficient to use tactic.
|
224 |
+
[12/28/2023-10:15:54] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2357 detected for tactic 0x000000000000003c.
|
225 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
226 |
+
[12/28/2023-10:15:57] [W] [TRT] Tactic Device request: 2359MB Available: 1752MB. Device memory is insufficient to use tactic.
|
227 |
+
[12/28/2023-10:15:57] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000004.
|
228 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
229 |
+
[12/28/2023-10:15:57] [W] [TRT] Tactic Device request: 2359MB Available: 1752MB. Device memory is insufficient to use tactic.
|
230 |
+
[12/28/2023-10:15:57] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2359 detected for tactic 0x000000000000003c.
|
231 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
232 |
+
[12/28/2023-10:15:57] [W] [TRT] Tactic Device request: 2359MB Available: 1752MB. Device memory is insufficient to use tactic.
|
233 |
+
[12/28/2023-10:15:58] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000074.
|
234 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
235 |
+
[12/28/2023-10:16:00] [W] [TRT] Tactic Device request: 2356MB Available: 1752MB. Device memory is insufficient to use tactic.
|
236 |
+
[12/28/2023-10:16:00] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2356 detected for tactic 0x0000000000000004.
|
237 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
238 |
+
[12/28/2023-10:16:00] [W] [TRT] Tactic Device request: 2356MB Available: 1752MB. Device memory is insufficient to use tactic.
|
239 |
+
[12/28/2023-10:16:00] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2356 detected for tactic 0x000000000000003c.
|
240 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
241 |
+
[12/28/2023-10:24:58] [W] [TRT] Tactic Device request: 3575MB Available: 2009MB. Device memory is insufficient to use tactic.
|
242 |
+
[12/28/2023-10:24:58] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3575 detected for tactic 0x0000000000000004.
|
243 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
244 |
+
[12/28/2023-10:24:58] [W] [TRT] Tactic Device request: 3575MB Available: 2009MB. Device memory is insufficient to use tactic.
|
245 |
+
[12/28/2023-10:24:58] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3575 detected for tactic 0x000000000000003c.
|
246 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
247 |
+
[12/28/2023-10:24:58] [W] [TRT] Tactic Device request: 3575MB Available: 2009MB. Device memory is insufficient to use tactic.
|
248 |
+
[12/28/2023-10:24:58] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3575 detected for tactic 0x0000000000000074.
|
249 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
250 |
+
[12/28/2023-10:24:59] [W] [TRT] Tactic Device request: 3572MB Available: 2008MB. Device memory is insufficient to use tactic.
|
251 |
+
[12/28/2023-10:24:59] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3572 detected for tactic 0x0000000000000004.
|
252 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
253 |
+
[12/28/2023-10:24:59] [W] [TRT] Tactic Device request: 3572MB Available: 2008MB. Device memory is insufficient to use tactic.
|
254 |
+
[12/28/2023-10:24:59] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3572 detected for tactic 0x000000000000003c.
|
255 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
256 |
+
[12/28/2023-10:25:08] [W] [TRT] Tactic Device request: 2390MB Available: 1909MB. Device memory is insufficient to use tactic.
|
257 |
+
[12/28/2023-10:25:08] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000004.
|
258 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
259 |
+
[12/28/2023-10:25:08] [W] [TRT] Tactic Device request: 2390MB Available: 1824MB. Device memory is insufficient to use tactic.
|
260 |
+
[12/28/2023-10:25:08] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2390 detected for tactic 0x000000000000003c.
|
261 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
262 |
+
[12/28/2023-10:25:09] [W] [TRT] Tactic Device request: 2390MB Available: 1822MB. Device memory is insufficient to use tactic.
|
263 |
+
[12/28/2023-10:25:09] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000074.
|
264 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
265 |
+
[12/28/2023-10:25:12] [W] [TRT] Tactic Device request: 2387MB Available: 1824MB. Device memory is insufficient to use tactic.
|
266 |
+
[12/28/2023-10:25:12] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2387 detected for tactic 0x0000000000000004.
|
267 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
268 |
+
[12/28/2023-10:25:12] [W] [TRT] Tactic Device request: 2387MB Available: 1800MB. Device memory is insufficient to use tactic.
|
269 |
+
[12/28/2023-10:25:12] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2387 detected for tactic 0x000000000000003c.
|
270 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
271 |
+
[12/28/2023-10:25:15] [W] [TRT] Tactic Device request: 2388MB Available: 1797MB. Device memory is insufficient to use tactic.
|
272 |
+
[12/28/2023-10:25:15] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2388 detected for tactic 0x0000000000000004.
|
273 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
274 |
+
[12/28/2023-10:25:16] [W] [TRT] Tactic Device request: 2388MB Available: 1753MB. Device memory is insufficient to use tactic.
|
275 |
+
[12/28/2023-10:25:16] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2388 detected for tactic 0x000000000000003c.
|
276 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
277 |
+
[12/28/2023-10:25:16] [W] [TRT] Tactic Device request: 2388MB Available: 1749MB. Device memory is insufficient to use tactic.
|
278 |
+
[12/28/2023-10:25:16] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2388 detected for tactic 0x0000000000000074.
|
279 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
280 |
+
[12/28/2023-10:25:19] [W] [TRT] Tactic Device request: 2386MB Available: 1749MB. Device memory is insufficient to use tactic.
|
281 |
+
[12/28/2023-10:25:19] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2386 detected for tactic 0x0000000000000004.
|
282 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
283 |
+
[12/28/2023-10:25:19] [W] [TRT] Tactic Device request: 2386MB Available: 1729MB. Device memory is insufficient to use tactic.
|
284 |
+
[12/28/2023-10:25:19] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2386 detected for tactic 0x000000000000003c.
|
285 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
286 |
+
[12/28/2023-10:25:23] [W] [TRT] Tactic Device request: 4775MB Available: 1722MB. Device memory is insufficient to use tactic.
|
287 |
+
[12/28/2023-10:25:23] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4775 detected for tactic 0x0000000000000004.
|
288 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
289 |
+
[12/28/2023-10:25:24] [W] [TRT] Tactic Device request: 4775MB Available: 1600MB. Device memory is insufficient to use tactic.
|
290 |
+
[12/28/2023-10:25:24] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4775 detected for tactic 0x000000000000003c.
|
291 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
292 |
+
[12/28/2023-10:25:25] [W] [TRT] Tactic Device request: 4775MB Available: 1593MB. Device memory is insufficient to use tactic.
|
293 |
+
[12/28/2023-10:25:25] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4775 detected for tactic 0x0000000000000074.
|
294 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
295 |
+
[12/28/2023-10:25:30] [W] [TRT] Tactic Device request: 4772MB Available: 1593MB. Device memory is insufficient to use tactic.
|
296 |
+
[12/28/2023-10:25:30] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4772 detected for tactic 0x0000000000000004.
|
297 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
298 |
+
[12/28/2023-10:25:31] [W] [TRT] Tactic Device request: 4772MB Available: 1591MB. Device memory is insufficient to use tactic.
|
299 |
+
[12/28/2023-10:25:31] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4772 detected for tactic 0x000000000000003c.
|
300 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
301 |
+
[12/28/2023-10:25:36] [W] [TRT] Tactic Device request: 4774MB Available: 1593MB. Device memory is insufficient to use tactic.
|
302 |
+
[12/28/2023-10:25:36] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4774 detected for tactic 0x0000000000000004.
|
303 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
304 |
+
[12/28/2023-10:25:37] [W] [TRT] Tactic Device request: 4774MB Available: 1592MB. Device memory is insufficient to use tactic.
|
305 |
+
[12/28/2023-10:25:37] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4774 detected for tactic 0x000000000000003c.
|
306 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
307 |
+
[12/28/2023-10:25:38] [W] [TRT] Tactic Device request: 4774MB Available: 1593MB. Device memory is insufficient to use tactic.
|
308 |
+
[12/28/2023-10:25:38] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4774 detected for tactic 0x0000000000000074.
|
309 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
310 |
+
[12/28/2023-10:25:43] [W] [TRT] Tactic Device request: 4771MB Available: 1592MB. Device memory is insufficient to use tactic.
|
311 |
+
[12/28/2023-10:25:43] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4771 detected for tactic 0x0000000000000004.
|
312 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
313 |
+
[12/28/2023-10:25:44] [W] [TRT] Tactic Device request: 4771MB Available: 1592MB. Device memory is insufficient to use tactic.
|
314 |
+
[12/28/2023-10:25:44] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4771 detected for tactic 0x000000000000003c.
|
315 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
316 |
+
[12/28/2023-10:25:48] [W] [TRT] Tactic Device request: 1637MB Available: 1594MB. Device memory is insufficient to use tactic.
|
317 |
+
[12/28/2023-10:25:48] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000004.
|
318 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
319 |
+
[12/28/2023-10:25:49] [W] [TRT] Tactic Device request: 1637MB Available: 1594MB. Device memory is insufficient to use tactic.
|
320 |
+
[12/28/2023-10:25:49] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 1637 detected for tactic 0x000000000000003c.
|
321 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
322 |
+
[12/28/2023-10:25:49] [W] [TRT] Tactic Device request: 1637MB Available: 1594MB. Device memory is insufficient to use tactic.
|
323 |
+
[12/28/2023-10:25:49] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000074.
|
324 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
325 |
+
[12/28/2023-10:25:50] [W] [TRT] Tactic Device request: 1636MB Available: 1592MB. Device memory is insufficient to use tactic.
|
326 |
+
[12/28/2023-10:25:50] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1636 detected for tactic 0x0000000000000004.
|
327 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
328 |
+
[12/28/2023-10:25:50] [W] [TRT] Tactic Device request: 1636MB Available: 1592MB. Device memory is insufficient to use tactic.
|
329 |
+
[12/28/2023-10:25:50] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 1636 detected for tactic 0x000000000000003c.
|
330 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
331 |
+
[12/28/2023-10:26:03] [W] [TRT] Tactic Device request: 4774MB Available: 1593MB. Device memory is insufficient to use tactic.
|
332 |
+
[12/28/2023-10:26:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4774 detected for tactic 0x0000000000000004.
|
333 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
334 |
+
[12/28/2023-10:26:04] [W] [TRT] Tactic Device request: 4774MB Available: 1591MB. Device memory is insufficient to use tactic.
|
335 |
+
[12/28/2023-10:26:04] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4774 detected for tactic 0x000000000000003c.
|
336 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
337 |
+
[12/28/2023-10:26:05] [W] [TRT] Tactic Device request: 4774MB Available: 1589MB. Device memory is insufficient to use tactic.
|
338 |
+
[12/28/2023-10:26:05] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4774 detected for tactic 0x0000000000000074.
|
339 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
340 |
+
[12/28/2023-10:26:10] [W] [TRT] Tactic Device request: 4771MB Available: 1591MB. Device memory is insufficient to use tactic.
|
341 |
+
[12/28/2023-10:26:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4771 detected for tactic 0x0000000000000004.
|
342 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
343 |
+
[12/28/2023-10:26:11] [W] [TRT] Tactic Device request: 4771MB Available: 1588MB. Device memory is insufficient to use tactic.
|
344 |
+
[12/28/2023-10:26:11] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4771 detected for tactic 0x000000000000003c.
|
345 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
346 |
+
[12/28/2023-10:36:30] [W] [TRT] Tactic Device request: 1638MB Available: 1396MB. Device memory is insufficient to use tactic.
|
347 |
+
[12/28/2023-10:36:30] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 1638 detected for tactic 0x000000000000003c.
|
348 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
349 |
+
[12/28/2023-10:36:30] [W] [TRT] Tactic Device request: 1638MB Available: 1396MB. Device memory is insufficient to use tactic.
|
350 |
+
[12/28/2023-10:36:30] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 1638 detected for tactic 0x0000000000000074.
|
351 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
352 |
+
[12/28/2023-10:36:31] [W] [TRT] Tactic Device request: 1637MB Available: 1395MB. Device memory is insufficient to use tactic.
|
353 |
+
[12/28/2023-10:36:31] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 1637 detected for tactic 0x0000000000000004.
|
354 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
355 |
+
[12/28/2023-10:36:31] [W] [TRT] Tactic Device request: 1637MB Available: 1396MB. Device memory is insufficient to use tactic.
|
356 |
+
[12/28/2023-10:36:31] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 1637 detected for tactic 0x000000000000003c.
|
357 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
358 |
+
[12/28/2023-10:36:33] [W] [TRT] Tactic Device request: 2454MB Available: 1396MB. Device memory is insufficient to use tactic.
|
359 |
+
[12/28/2023-10:36:33] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2454 detected for tactic 0x0000000000000004.
|
360 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
361 |
+
[12/28/2023-10:36:33] [W] [TRT] Tactic Device request: 2454MB Available: 1396MB. Device memory is insufficient to use tactic.
|
362 |
+
[12/28/2023-10:36:33] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2454 detected for tactic 0x000000000000003c.
|
363 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
364 |
+
[12/28/2023-10:36:33] [W] [TRT] Tactic Device request: 2454MB Available: 1397MB. Device memory is insufficient to use tactic.
|
365 |
+
[12/28/2023-10:36:33] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2454 detected for tactic 0x0000000000000074.
|
366 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
367 |
+
[12/28/2023-10:36:34] [W] [TRT] Tactic Device request: 2453MB Available: 1397MB. Device memory is insufficient to use tactic.
|
368 |
+
[12/28/2023-10:36:34] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2453 detected for tactic 0x0000000000000004.
|
369 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
370 |
+
[12/28/2023-10:36:34] [W] [TRT] Tactic Device request: 2453MB Available: 1397MB. Device memory is insufficient to use tactic.
|
371 |
+
[12/28/2023-10:36:34] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2453 detected for tactic 0x000000000000003c.
|
372 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
373 |
+
[12/28/2023-10:36:37] [W] [TRT] Tactic Device request: 2463MB Available: 1427MB. Device memory is insufficient to use tactic.
|
374 |
+
[12/28/2023-10:36:37] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000004.
|
375 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
376 |
+
[12/28/2023-10:36:38] [W] [TRT] Tactic Device request: 2463MB Available: 1390MB. Device memory is insufficient to use tactic.
|
377 |
+
[12/28/2023-10:36:38] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2463 detected for tactic 0x000000000000003c.
|
378 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
379 |
+
[12/28/2023-10:36:39] [W] [TRT] Tactic Device request: 2463MB Available: 1388MB. Device memory is insufficient to use tactic.
|
380 |
+
[12/28/2023-10:36:39] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000074.
|
381 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
382 |
+
[12/28/2023-10:36:43] [W] [TRT] Tactic Device request: 2462MB Available: 1596MB. Device memory is insufficient to use tactic.
|
383 |
+
[12/28/2023-10:36:43] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2462 detected for tactic 0x0000000000000004.
|
384 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
385 |
+
[12/28/2023-10:36:44] [W] [TRT] Tactic Device request: 2462MB Available: 1379MB. Device memory is insufficient to use tactic.
|
386 |
+
[12/28/2023-10:36:44] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2462 detected for tactic 0x000000000000003c.
|
387 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
388 |
+
[12/28/2023-10:36:49] [W] [TRT] Tactic Device request: 2463MB Available: 1378MB. Device memory is insufficient to use tactic.
|
389 |
+
[12/28/2023-10:36:49] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000004.
|
390 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
391 |
+
[12/28/2023-10:36:49] [W] [TRT] Tactic Device request: 2463MB Available: 1376MB. Device memory is insufficient to use tactic.
|
392 |
+
[12/28/2023-10:36:49] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2463 detected for tactic 0x000000000000003c.
|
393 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
394 |
+
[12/28/2023-10:36:50] [W] [TRT] Tactic Device request: 2463MB Available: 1376MB. Device memory is insufficient to use tactic.
|
395 |
+
[12/28/2023-10:36:50] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000074.
|
396 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
397 |
+
[12/28/2023-10:36:54] [W] [TRT] Tactic Device request: 2462MB Available: 1375MB. Device memory is insufficient to use tactic.
|
398 |
+
[12/28/2023-10:36:54] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2462 detected for tactic 0x0000000000000004.
|
399 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
400 |
+
[12/28/2023-10:36:55] [W] [TRT] Tactic Device request: 2462MB Available: 1375MB. Device memory is insufficient to use tactic.
|
401 |
+
[12/28/2023-10:36:55] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2462 detected for tactic 0x000000000000003c.
|
402 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
403 |
+
[12/28/2023-10:38:08] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
404 |
+
[12/28/2023-10:38:08] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
405 |
+
[12/28/2023-10:38:08] [W] * GPU compute time is unstable, with coefficient of variance = 7.66665%.
|
406 |
+
[12/28/2023-10:38:08] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_m_fp16.onnx.best.engine.log
ADDED
@@ -0,0 +1,312 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_m_fp16.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_m_fp16.onnx.best.engine
|
2 |
+
[12/28/2023-08:45:20] [I] === Model Options ===
|
3 |
+
[12/28/2023-08:45:20] [I] Format: ONNX
|
4 |
+
[12/28/2023-08:45:20] [I] Model: yolo_nas_pose_m_fp16.onnx
|
5 |
+
[12/28/2023-08:45:20] [I] Output:
|
6 |
+
[12/28/2023-08:45:20] [I] === Build Options ===
|
7 |
+
[12/28/2023-08:45:20] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-08:45:20] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-08:45:20] [I] minTiming: 1
|
10 |
+
[12/28/2023-08:45:20] [I] avgTiming: 8
|
11 |
+
[12/28/2023-08:45:20] [I] Precision: FP32+FP16+INT8
|
12 |
+
[12/28/2023-08:45:20] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-08:45:20] [I] Calibration: Dynamic
|
14 |
+
[12/28/2023-08:45:20] [I] Refit: Disabled
|
15 |
+
[12/28/2023-08:45:20] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-08:45:20] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-08:45:20] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-08:45:20] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-08:45:20] [I] Build only: Disabled
|
20 |
+
[12/28/2023-08:45:20] [I] Save engine: yolo_nas_pose_m_fp16.onnx.best.engine
|
21 |
+
[12/28/2023-08:45:20] [I] Load engine:
|
22 |
+
[12/28/2023-08:45:20] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-08:45:20] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-08:45:20] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-08:45:20] [I] timingCacheFile:
|
26 |
+
[12/28/2023-08:45:20] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-08:45:20] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-08:45:20] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-08:45:20] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-08:45:20] [I] Input build shapes: model
|
31 |
+
[12/28/2023-08:45:20] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-08:45:20] [I] === System Options ===
|
33 |
+
[12/28/2023-08:45:20] [I] Device: 0
|
34 |
+
[12/28/2023-08:45:20] [I] DLACore:
|
35 |
+
[12/28/2023-08:45:20] [I] Plugins:
|
36 |
+
[12/28/2023-08:45:20] [I] === Inference Options ===
|
37 |
+
[12/28/2023-08:45:20] [I] Batch: Explicit
|
38 |
+
[12/28/2023-08:45:20] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-08:45:20] [I] Iterations: 10
|
40 |
+
[12/28/2023-08:45:20] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-08:45:20] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-08:45:20] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-08:45:20] [I] Streams: 1
|
44 |
+
[12/28/2023-08:45:20] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-08:45:20] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-08:45:20] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-08:45:20] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-08:45:20] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-08:45:20] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-08:45:20] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-08:45:20] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-08:45:20] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-08:45:20] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-08:45:20] [I] Inputs:
|
55 |
+
[12/28/2023-08:45:20] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-08:45:20] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-08:45:20] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-08:45:20] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-08:45:20] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-08:45:20] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-08:45:20] [I] Profile: Disabled
|
62 |
+
[12/28/2023-08:45:20] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-08:45:20] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-08:45:20] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-08:45:20] [I]
|
66 |
+
[12/28/2023-08:45:20] [I] === Device Information ===
|
67 |
+
[12/28/2023-08:45:20] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-08:45:20] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-08:45:20] [I] SMs: 8
|
70 |
+
[12/28/2023-08:45:20] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-08:45:20] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-08:45:20] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-08:45:20] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-08:45:20] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-08:45:20] [I]
|
76 |
+
[12/28/2023-08:45:20] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-08:45:24] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 2980 (MiB)
|
78 |
+
[12/28/2023-08:45:29] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +284, now: CPU 574, GPU 3286 (MiB)
|
79 |
+
[12/28/2023-08:45:29] [I] Start parsing network model
|
80 |
+
[12/28/2023-08:45:30] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-08:45:30] [I] [TRT] Input filename: yolo_nas_pose_m_fp16.onnx
|
82 |
+
[12/28/2023-08:45:30] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-08:45:30] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-08:45:30] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-08:45:30] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-08:45:30] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-08:45:30] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-08:45:30] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-08:45:30] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-08:45:30] [I] Finish parsing network model
|
91 |
+
[12/28/2023-08:45:31] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-08:45:31] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 410) [Constant]
|
96 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 411) [Constant]
|
97 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 412) [Constant]
|
98 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
99 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
100 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
101 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
102 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
103 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
104 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
105 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
106 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
107 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
108 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
109 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
110 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
111 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
112 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
113 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
114 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
115 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
116 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
117 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
118 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
119 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
120 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
121 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
122 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
123 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
124 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
125 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
126 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
127 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
128 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
129 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
130 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
131 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
132 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
133 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
134 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
135 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
136 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
137 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
138 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
139 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
140 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
141 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
142 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
143 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
144 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
145 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
146 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
147 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
148 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
149 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
150 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
151 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
152 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
153 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
154 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
155 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
156 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
157 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
158 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
159 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
160 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
161 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
162 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
163 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
164 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
165 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
166 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
167 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
168 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
169 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
170 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
171 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
172 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
173 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
174 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
175 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
176 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
177 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
178 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
179 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
180 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
181 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
182 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
183 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
184 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
185 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
186 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
187 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
188 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
189 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
190 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
191 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 200) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
192 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
193 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
194 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 208) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
195 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
196 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
197 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
198 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
199 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
200 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
201 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
202 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
203 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
204 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
205 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
206 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
207 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
208 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
209 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
210 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
211 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
212 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
213 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 247) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
214 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
215 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
216 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
217 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 270) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
218 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
219 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
220 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
221 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
222 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
223 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
224 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
225 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
226 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
227 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
228 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
229 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
230 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
231 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
232 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
233 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 301) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
234 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
235 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
236 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
237 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 324) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
238 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
239 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
240 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 332) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
241 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
242 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
243 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
244 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
245 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
246 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
247 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
248 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
249 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
250 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
251 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
252 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
253 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
254 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1...cast_boxes_to_fp32]}
|
255 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
256 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 414) [NMS]_1_output[DevicetoShapeHostCopy]
|
257 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
258 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
259 |
+
[12/28/2023-08:45:31] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
260 |
+
[12/28/2023-08:45:44] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +400, now: CPU 1196, GPU 3820 (MiB)
|
261 |
+
[12/28/2023-08:45:46] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +82, GPU +70, now: CPU 1278, GPU 3890 (MiB)
|
262 |
+
[12/28/2023-08:45:46] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
263 |
+
[12/28/2023-10:37:30] [I] [TRT] Total Activation Memory: 7941309952
|
264 |
+
[12/28/2023-10:37:30] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
265 |
+
[12/28/2023-10:37:43] [I] [TRT] Total Host Persistent Memory: 294816
|
266 |
+
[12/28/2023-10:37:43] [I] [TRT] Total Device Persistent Memory: 38912
|
267 |
+
[12/28/2023-10:37:43] [I] [TRT] Total Scratch Memory: 134217728
|
268 |
+
[12/28/2023-10:37:43] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 54 MiB, GPU 2398 MiB
|
269 |
+
[12/28/2023-10:37:43] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 157 steps to complete.
|
270 |
+
[12/28/2023-10:37:43] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 76.003ms to assign 14 blocks to 157 nodes requiring 144914944 bytes.
|
271 |
+
[12/28/2023-10:37:43] [I] [TRT] Total Activation Memory: 144914944
|
272 |
+
[12/28/2023-10:37:50] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU -1, now: CPU 1667, GPU 5526 (MiB)
|
273 |
+
[12/28/2023-10:37:50] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +38, GPU +64, now: CPU 38, GPU 64 (MiB)
|
274 |
+
[12/28/2023-10:37:51] [I] Engine built in 6750.81 sec.
|
275 |
+
[12/28/2023-10:37:52] [I] [TRT] Loaded engine size: 39 MiB
|
276 |
+
[12/28/2023-10:37:52] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1284, GPU 5348 (MiB)
|
277 |
+
[12/28/2023-10:37:52] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +37, now: CPU 0, GPU 37 (MiB)
|
278 |
+
[12/28/2023-10:37:52] [I] Engine deserialized in 0.265686 sec.
|
279 |
+
[12/28/2023-10:37:52] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1284, GPU 5348 (MiB)
|
280 |
+
[12/28/2023-10:37:52] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +138, now: CPU 0, GPU 175 (MiB)
|
281 |
+
[12/28/2023-10:37:52] [I] Setting persistentCacheLimit to 0 bytes.
|
282 |
+
[12/28/2023-10:37:52] [I] Using random values for input onnx::Cast_0
|
283 |
+
[12/28/2023-10:37:52] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
284 |
+
[12/28/2023-10:37:52] [I] Using random values for output graph2_flat_predictions
|
285 |
+
[12/28/2023-10:37:52] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
286 |
+
[12/28/2023-10:37:52] [I] Starting inference
|
287 |
+
[12/28/2023-10:38:08] [I] Warmup completed 2 queries over 200 ms
|
288 |
+
[12/28/2023-10:38:08] [I] Timing trace has 875 queries over 15.0204 s
|
289 |
+
[12/28/2023-10:38:08] [I]
|
290 |
+
[12/28/2023-10:38:08] [I] === Trace details ===
|
291 |
+
[12/28/2023-10:38:08] [I] Trace averages of 100 runs:
|
292 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 17.3015 ms - Host latency: 17.42 ms (enqueue 17.373 ms)
|
293 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 16.7848 ms - Host latency: 16.8974 ms (enqueue 16.8579 ms)
|
294 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 16.7202 ms - Host latency: 16.8311 ms (enqueue 16.7917 ms)
|
295 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 16.7189 ms - Host latency: 16.8301 ms (enqueue 16.7925 ms)
|
296 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 16.8722 ms - Host latency: 16.9814 ms (enqueue 16.939 ms)
|
297 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 17.0499 ms - Host latency: 17.165 ms (enqueue 17.1147 ms)
|
298 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 17.4353 ms - Host latency: 17.5548 ms (enqueue 17.5031 ms)
|
299 |
+
[12/28/2023-10:38:08] [I] Average on 100 runs - GPU latency: 17.2635 ms - Host latency: 17.3821 ms (enqueue 17.328 ms)
|
300 |
+
[12/28/2023-10:38:08] [I]
|
301 |
+
[12/28/2023-10:38:08] [I] === Performance summary ===
|
302 |
+
[12/28/2023-10:38:08] [I] Throughput: 58.254 qps
|
303 |
+
[12/28/2023-10:38:08] [I] Latency: min = 15.8867 ms, max = 26.5801 ms, mean = 17.1335 ms, median = 16.9814 ms, percentile(90%) = 17.8691 ms, percentile(95%) = 18.4963 ms, percentile(99%) = 24.3384 ms
|
304 |
+
[12/28/2023-10:38:08] [I] Enqueue Time: min = 15.8533 ms, max = 26.5361 ms, mean = 17.0885 ms, median = 16.9271 ms, percentile(90%) = 17.8125 ms, percentile(95%) = 18.4688 ms, percentile(99%) = 23.7695 ms
|
305 |
+
[12/28/2023-10:38:08] [I] H2D Latency: min = 0.0800781 ms, max = 0.148483 ms, mean = 0.0972059 ms, median = 0.0976562 ms, percentile(90%) = 0.100464 ms, percentile(95%) = 0.100586 ms, percentile(99%) = 0.110596 ms
|
306 |
+
[12/28/2023-10:38:08] [I] GPU Compute Time: min = 15.7729 ms, max = 26.4624 ms, mean = 17.019 ms, median = 16.8655 ms, percentile(90%) = 17.7568 ms, percentile(95%) = 18.3837 ms, percentile(99%) = 24.2227 ms
|
307 |
+
[12/28/2023-10:38:08] [I] D2H Latency: min = 0.00292969 ms, max = 0.0673828 ms, mean = 0.0172236 ms, median = 0.0146484 ms, percentile(90%) = 0.0263672 ms, percentile(95%) = 0.0283203 ms, percentile(99%) = 0.0407715 ms
|
308 |
+
[12/28/2023-10:38:08] [I] Total Host Walltime: 15.0204 s
|
309 |
+
[12/28/2023-10:38:08] [I] Total GPU Compute Time: 14.8917 s
|
310 |
+
[12/28/2023-10:38:08] [I] Explanations of the performance metrics are printed in the verbose logs.
|
311 |
+
[12/28/2023-10:38:08] [I]
|
312 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_m_fp16.onnx --best --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_m_fp16.onnx.best.engine
|
yolo_nas_pose_m_fp16.onnx.engine.err
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-07:47:56] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-07:47:56] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-07:47:57] [E] Error[4]: [network.cpp::validate::2925] Error Code 4: Internal Error (fp16 precision has been set for a layer or layer output, but fp16 is not configured in the builder)
|
4 |
+
[12/28/2023-07:47:57] [E] Error[2]: [builder.cpp::buildSerializedNetwork::751] Error Code 2: Internal Error (Assertion engine != nullptr failed. )
|
5 |
+
[12/28/2023-07:47:57] [E] Engine could not be created from network
|
6 |
+
[12/28/2023-07:47:57] [E] Building engine failed
|
7 |
+
[12/28/2023-07:47:57] [E] Failed to create engine from model or file.
|
8 |
+
[12/28/2023-07:47:57] [E] Engine set up failed
|
yolo_nas_pose_m_fp16.onnx.engine.log
ADDED
@@ -0,0 +1,91 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_m_fp16.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_m_fp16.onnx.engine
|
2 |
+
[12/28/2023-07:47:46] [I] === Model Options ===
|
3 |
+
[12/28/2023-07:47:46] [I] Format: ONNX
|
4 |
+
[12/28/2023-07:47:46] [I] Model: yolo_nas_pose_m_fp16.onnx
|
5 |
+
[12/28/2023-07:47:46] [I] Output:
|
6 |
+
[12/28/2023-07:47:46] [I] === Build Options ===
|
7 |
+
[12/28/2023-07:47:46] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-07:47:46] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-07:47:46] [I] minTiming: 1
|
10 |
+
[12/28/2023-07:47:46] [I] avgTiming: 8
|
11 |
+
[12/28/2023-07:47:46] [I] Precision: FP32
|
12 |
+
[12/28/2023-07:47:46] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-07:47:46] [I] Calibration:
|
14 |
+
[12/28/2023-07:47:46] [I] Refit: Disabled
|
15 |
+
[12/28/2023-07:47:46] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-07:47:46] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-07:47:46] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-07:47:46] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-07:47:46] [I] Build only: Disabled
|
20 |
+
[12/28/2023-07:47:46] [I] Save engine: yolo_nas_pose_m_fp16.onnx.engine
|
21 |
+
[12/28/2023-07:47:46] [I] Load engine:
|
22 |
+
[12/28/2023-07:47:46] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-07:47:46] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-07:47:46] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-07:47:46] [I] timingCacheFile:
|
26 |
+
[12/28/2023-07:47:46] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-07:47:46] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-07:47:46] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-07:47:46] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-07:47:46] [I] Input build shapes: model
|
31 |
+
[12/28/2023-07:47:46] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-07:47:46] [I] === System Options ===
|
33 |
+
[12/28/2023-07:47:46] [I] Device: 0
|
34 |
+
[12/28/2023-07:47:46] [I] DLACore:
|
35 |
+
[12/28/2023-07:47:46] [I] Plugins:
|
36 |
+
[12/28/2023-07:47:46] [I] === Inference Options ===
|
37 |
+
[12/28/2023-07:47:46] [I] Batch: Explicit
|
38 |
+
[12/28/2023-07:47:46] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-07:47:46] [I] Iterations: 10
|
40 |
+
[12/28/2023-07:47:46] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-07:47:46] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-07:47:46] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-07:47:46] [I] Streams: 1
|
44 |
+
[12/28/2023-07:47:46] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-07:47:46] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-07:47:46] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-07:47:46] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-07:47:46] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-07:47:46] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-07:47:46] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-07:47:46] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-07:47:46] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-07:47:46] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-07:47:46] [I] Inputs:
|
55 |
+
[12/28/2023-07:47:46] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-07:47:46] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-07:47:46] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-07:47:46] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-07:47:46] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-07:47:46] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-07:47:46] [I] Profile: Disabled
|
62 |
+
[12/28/2023-07:47:46] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-07:47:46] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-07:47:46] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-07:47:46] [I]
|
66 |
+
[12/28/2023-07:47:46] [I] === Device Information ===
|
67 |
+
[12/28/2023-07:47:46] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-07:47:46] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-07:47:46] [I] SMs: 8
|
70 |
+
[12/28/2023-07:47:46] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-07:47:46] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-07:47:46] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-07:47:46] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-07:47:46] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-07:47:46] [I]
|
76 |
+
[12/28/2023-07:47:46] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-07:47:51] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 3024 (MiB)
|
78 |
+
[12/28/2023-07:47:55] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +284, now: CPU 574, GPU 3327 (MiB)
|
79 |
+
[12/28/2023-07:47:55] [I] Start parsing network model
|
80 |
+
[12/28/2023-07:47:56] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-07:47:56] [I] [TRT] Input filename: yolo_nas_pose_m_fp16.onnx
|
82 |
+
[12/28/2023-07:47:56] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-07:47:56] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-07:47:56] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-07:47:56] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-07:47:56] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-07:47:56] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-07:47:56] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-07:47:56] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-07:47:57] [I] Finish parsing network model
|
91 |
+
&&&& FAILED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_m_fp16.onnx --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_m_fp16.onnx.engine
|
yolo_nas_pose_m_fp16.onnx.fp16.engine
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88b66cc2f44220a42e474a86ccc143cd0982f5549e47a979486545e1657fbbc8
|
3 |
+
size 79706512
|
yolo_nas_pose_m_fp16.onnx.fp16.engine.err
ADDED
@@ -0,0 +1,348 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-07:48:01] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-07:48:01] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-07:52:40] [W] [TRT] Tactic Device request: 6262MB Available: 3207MB. Device memory is insufficient to use tactic.
|
4 |
+
[12/28/2023-07:52:40] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6262 detected for tactic 0x0000000000000004.
|
5 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
6 |
+
[12/28/2023-07:52:40] [W] [TRT] Tactic Device request: 6262MB Available: 3207MB. Device memory is insufficient to use tactic.
|
7 |
+
[12/28/2023-07:52:40] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6262 detected for tactic 0x000000000000003c.
|
8 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
9 |
+
[12/28/2023-07:52:40] [W] [TRT] Tactic Device request: 6262MB Available: 3207MB. Device memory is insufficient to use tactic.
|
10 |
+
[12/28/2023-07:52:40] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6262 detected for tactic 0x0000000000000074.
|
11 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
12 |
+
[12/28/2023-07:52:42] [W] [TRT] Tactic Device request: 6251MB Available: 3210MB. Device memory is insufficient to use tactic.
|
13 |
+
[12/28/2023-07:52:42] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6251 detected for tactic 0x0000000000000004.
|
14 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
15 |
+
[12/28/2023-07:52:42] [W] [TRT] Tactic Device request: 6251MB Available: 3210MB. Device memory is insufficient to use tactic.
|
16 |
+
[12/28/2023-07:52:43] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6251 detected for tactic 0x000000000000003c.
|
17 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
18 |
+
[12/28/2023-07:57:47] [W] [TRT] Tactic Device request: 4711MB Available: 2426MB. Device memory is insufficient to use tactic.
|
19 |
+
[12/28/2023-07:57:47] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000004.
|
20 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
21 |
+
[12/28/2023-07:57:47] [W] [TRT] Tactic Device request: 4711MB Available: 2426MB. Device memory is insufficient to use tactic.
|
22 |
+
[12/28/2023-07:57:47] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4711 detected for tactic 0x000000000000003c.
|
23 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
24 |
+
[12/28/2023-07:57:47] [W] [TRT] Tactic Device request: 4711MB Available: 2426MB. Device memory is insufficient to use tactic.
|
25 |
+
[12/28/2023-07:57:47] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4711 detected for tactic 0x0000000000000074.
|
26 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
27 |
+
[12/28/2023-07:57:49] [W] [TRT] Tactic Device request: 4701MB Available: 2426MB. Device memory is insufficient to use tactic.
|
28 |
+
[12/28/2023-07:57:49] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4701 detected for tactic 0x0000000000000004.
|
29 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
30 |
+
[12/28/2023-07:57:49] [W] [TRT] Tactic Device request: 4701MB Available: 2426MB. Device memory is insufficient to use tactic.
|
31 |
+
[12/28/2023-07:57:49] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4701 detected for tactic 0x000000000000003c.
|
32 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
33 |
+
[12/28/2023-07:58:04] [W] [TRT] Tactic Device request: 6275MB Available: 2426MB. Device memory is insufficient to use tactic.
|
34 |
+
[12/28/2023-07:58:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000004.
|
35 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
36 |
+
[12/28/2023-07:58:05] [W] [TRT] Tactic Device request: 6275MB Available: 2426MB. Device memory is insufficient to use tactic.
|
37 |
+
[12/28/2023-07:58:05] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6275 detected for tactic 0x000000000000003c.
|
38 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
39 |
+
[12/28/2023-07:58:05] [W] [TRT] Tactic Device request: 6275MB Available: 2426MB. Device memory is insufficient to use tactic.
|
40 |
+
[12/28/2023-07:58:05] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6275 detected for tactic 0x0000000000000074.
|
41 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
42 |
+
[12/28/2023-07:58:06] [W] [TRT] Tactic Device request: 6270MB Available: 2425MB. Device memory is insufficient to use tactic.
|
43 |
+
[12/28/2023-07:58:06] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6270 detected for tactic 0x0000000000000004.
|
44 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
45 |
+
[12/28/2023-07:58:06] [W] [TRT] Tactic Device request: 6270MB Available: 2426MB. Device memory is insufficient to use tactic.
|
46 |
+
[12/28/2023-07:58:06] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6270 detected for tactic 0x000000000000003c.
|
47 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
48 |
+
[12/28/2023-08:04:38] [W] [TRT] Tactic Device request: 7056MB Available: 2305MB. Device memory is insufficient to use tactic.
|
49 |
+
[12/28/2023-08:04:38] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000004.
|
50 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
51 |
+
[12/28/2023-08:04:38] [W] [TRT] Tactic Device request: 7056MB Available: 2305MB. Device memory is insufficient to use tactic.
|
52 |
+
[12/28/2023-08:04:38] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 7056 detected for tactic 0x000000000000003c.
|
53 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
54 |
+
[12/28/2023-08:04:38] [W] [TRT] Tactic Device request: 7056MB Available: 2302MB. Device memory is insufficient to use tactic.
|
55 |
+
[12/28/2023-08:04:38] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 7056 detected for tactic 0x0000000000000074.
|
56 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
57 |
+
[12/28/2023-08:04:40] [W] [TRT] Tactic Device request: 7050MB Available: 2302MB. Device memory is insufficient to use tactic.
|
58 |
+
[12/28/2023-08:04:40] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 7050 detected for tactic 0x0000000000000004.
|
59 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
60 |
+
[12/28/2023-08:04:40] [W] [TRT] Tactic Device request: 7050MB Available: 2302MB. Device memory is insufficient to use tactic.
|
61 |
+
[12/28/2023-08:04:40] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 7050 detected for tactic 0x000000000000003c.
|
62 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
63 |
+
[12/28/2023-08:04:56] [W] [TRT] Tactic Device request: 6354MB Available: 2299MB. Device memory is insufficient to use tactic.
|
64 |
+
[12/28/2023-08:04:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000004.
|
65 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
66 |
+
[12/28/2023-08:04:56] [W] [TRT] Tactic Device request: 6354MB Available: 2299MB. Device memory is insufficient to use tactic.
|
67 |
+
[12/28/2023-08:04:56] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 6354 detected for tactic 0x000000000000003c.
|
68 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
69 |
+
[12/28/2023-08:04:57] [W] [TRT] Tactic Device request: 6354MB Available: 2308MB. Device memory is insufficient to use tactic.
|
70 |
+
[12/28/2023-08:04:57] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 6354 detected for tactic 0x0000000000000074.
|
71 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
72 |
+
[12/28/2023-08:04:58] [W] [TRT] Tactic Device request: 6351MB Available: 2305MB. Device memory is insufficient to use tactic.
|
73 |
+
[12/28/2023-08:04:58] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 6351 detected for tactic 0x0000000000000004.
|
74 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
75 |
+
[12/28/2023-08:04:58] [W] [TRT] Tactic Device request: 6351MB Available: 2306MB. Device memory is insufficient to use tactic.
|
76 |
+
[12/28/2023-08:04:58] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 6351 detected for tactic 0x000000000000003c.
|
77 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
78 |
+
[12/28/2023-08:13:43] [W] [TRT] Tactic Device request: 2394MB Available: 2369MB. Device memory is insufficient to use tactic.
|
79 |
+
[12/28/2023-08:13:43] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2394 detected for tactic 0x000000000000003c.
|
80 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
81 |
+
[12/28/2023-08:13:43] [W] [TRT] Tactic Device request: 2394MB Available: 2369MB. Device memory is insufficient to use tactic.
|
82 |
+
[12/28/2023-08:13:43] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2394 detected for tactic 0x0000000000000074.
|
83 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
84 |
+
[12/28/2023-08:13:44] [W] [TRT] Tactic Device request: 2392MB Available: 2366MB. Device memory is insufficient to use tactic.
|
85 |
+
[12/28/2023-08:13:44] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000004.
|
86 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
87 |
+
[12/28/2023-08:13:44] [W] [TRT] Tactic Device request: 2392MB Available: 2366MB. Device memory is insufficient to use tactic.
|
88 |
+
[12/28/2023-08:13:44] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2392 detected for tactic 0x000000000000003c.
|
89 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
90 |
+
[12/28/2023-08:13:44] [W] [TRT] Tactic Device request: 2392MB Available: 2366MB. Device memory is insufficient to use tactic.
|
91 |
+
[12/28/2023-08:13:44] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2392 detected for tactic 0x0000000000000074.
|
92 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
93 |
+
[12/28/2023-08:13:45] [W] [TRT] Tactic Device request: 2391MB Available: 2367MB. Device memory is insufficient to use tactic.
|
94 |
+
[12/28/2023-08:13:45] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2391 detected for tactic 0x0000000000000004.
|
95 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
96 |
+
[12/28/2023-08:13:45] [W] [TRT] Tactic Device request: 2391MB Available: 2367MB. Device memory is insufficient to use tactic.
|
97 |
+
[12/28/2023-08:13:45] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2391 detected for tactic 0x000000000000003c.
|
98 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
99 |
+
[12/28/2023-08:13:45] [W] [TRT] Tactic Device request: 2390MB Available: 2367MB. Device memory is insufficient to use tactic.
|
100 |
+
[12/28/2023-08:13:45] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000004.
|
101 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
102 |
+
[12/28/2023-08:13:45] [W] [TRT] Tactic Device request: 2390MB Available: 2365MB. Device memory is insufficient to use tactic.
|
103 |
+
[12/28/2023-08:13:45] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2390 detected for tactic 0x000000000000003c.
|
104 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
105 |
+
[12/28/2023-08:13:59] [W] [TRT] Tactic Device request: 4906MB Available: 2349MB. Device memory is insufficient to use tactic.
|
106 |
+
[12/28/2023-08:13:59] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4906 detected for tactic 0x0000000000000004.
|
107 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
108 |
+
[12/28/2023-08:13:59] [W] [TRT] Tactic Device request: 4906MB Available: 2348MB. Device memory is insufficient to use tactic.
|
109 |
+
[12/28/2023-08:13:59] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4906 detected for tactic 0x000000000000003c.
|
110 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
111 |
+
[12/28/2023-08:14:00] [W] [TRT] Tactic Device request: 4906MB Available: 2349MB. Device memory is insufficient to use tactic.
|
112 |
+
[12/28/2023-08:14:00] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 4906 detected for tactic 0x0000000000000074.
|
113 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
114 |
+
[12/28/2023-08:14:01] [W] [TRT] Tactic Device request: 4905MB Available: 2337MB. Device memory is insufficient to use tactic.
|
115 |
+
[12/28/2023-08:14:01] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4905 detected for tactic 0x0000000000000004.
|
116 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
117 |
+
[12/28/2023-08:14:01] [W] [TRT] Tactic Device request: 4905MB Available: 2336MB. Device memory is insufficient to use tactic.
|
118 |
+
[12/28/2023-08:14:01] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 4905 detected for tactic 0x000000000000003c.
|
119 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
120 |
+
[12/28/2023-08:18:56] [W] [TRT] Tactic Device request: 2457MB Available: 2273MB. Device memory is insufficient to use tactic.
|
121 |
+
[12/28/2023-08:18:56] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000004.
|
122 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
123 |
+
[12/28/2023-08:18:56] [W] [TRT] Tactic Device request: 2457MB Available: 2273MB. Device memory is insufficient to use tactic.
|
124 |
+
[12/28/2023-08:18:56] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2457 detected for tactic 0x000000000000003c.
|
125 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
126 |
+
[12/28/2023-08:18:56] [W] [TRT] Tactic Device request: 2457MB Available: 2273MB. Device memory is insufficient to use tactic.
|
127 |
+
[12/28/2023-08:18:56] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2457 detected for tactic 0x0000000000000074.
|
128 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
129 |
+
[12/28/2023-08:18:57] [W] [TRT] Tactic Device request: 2456MB Available: 2272MB. Device memory is insufficient to use tactic.
|
130 |
+
[12/28/2023-08:18:57] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2456 detected for tactic 0x0000000000000004.
|
131 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
132 |
+
[12/28/2023-08:18:57] [W] [TRT] Tactic Device request: 2456MB Available: 2272MB. Device memory is insufficient to use tactic.
|
133 |
+
[12/28/2023-08:18:57] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2456 detected for tactic 0x000000000000003c.
|
134 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
135 |
+
[12/28/2023-08:19:19] [W] [TRT] Tactic Device request: 3587MB Available: 2263MB. Device memory is insufficient to use tactic.
|
136 |
+
[12/28/2023-08:19:19] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000004.
|
137 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
138 |
+
[12/28/2023-08:19:19] [W] [TRT] Tactic Device request: 3587MB Available: 2263MB. Device memory is insufficient to use tactic.
|
139 |
+
[12/28/2023-08:19:19] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3587 detected for tactic 0x000000000000003c.
|
140 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
141 |
+
[12/28/2023-08:19:19] [W] [TRT] Tactic Device request: 3587MB Available: 2263MB. Device memory is insufficient to use tactic.
|
142 |
+
[12/28/2023-08:19:19] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3587 detected for tactic 0x0000000000000074.
|
143 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
144 |
+
[12/28/2023-08:19:20] [W] [TRT] Tactic Device request: 3585MB Available: 2263MB. Device memory is insufficient to use tactic.
|
145 |
+
[12/28/2023-08:19:20] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3585 detected for tactic 0x0000000000000004.
|
146 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
147 |
+
[12/28/2023-08:19:20] [W] [TRT] Tactic Device request: 3585MB Available: 2263MB. Device memory is insufficient to use tactic.
|
148 |
+
[12/28/2023-08:19:20] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3585 detected for tactic 0x000000000000003c.
|
149 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
150 |
+
[12/28/2023-08:19:21] [W] [TRT] Tactic Device request: 2385MB Available: 2264MB. Device memory is insufficient to use tactic.
|
151 |
+
[12/28/2023-08:19:21] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2385 detected for tactic 0x0000000000000004.
|
152 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
153 |
+
[12/28/2023-08:19:21] [W] [TRT] Tactic Device request: 2385MB Available: 2264MB. Device memory is insufficient to use tactic.
|
154 |
+
[12/28/2023-08:19:21] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2385 detected for tactic 0x000000000000003c.
|
155 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
156 |
+
[12/28/2023-08:19:21] [W] [TRT] Tactic Device request: 2385MB Available: 2264MB. Device memory is insufficient to use tactic.
|
157 |
+
[12/28/2023-08:19:21] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2385 detected for tactic 0x0000000000000074.
|
158 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
159 |
+
[12/28/2023-08:19:22] [W] [TRT] Tactic Device request: 2384MB Available: 2262MB. Device memory is insufficient to use tactic.
|
160 |
+
[12/28/2023-08:19:22] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2384 detected for tactic 0x0000000000000004.
|
161 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
162 |
+
[12/28/2023-08:19:22] [W] [TRT] Tactic Device request: 2384MB Available: 2262MB. Device memory is insufficient to use tactic.
|
163 |
+
[12/28/2023-08:19:22] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2384 detected for tactic 0x000000000000003c.
|
164 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
165 |
+
[12/28/2023-08:24:28] [W] [TRT] Tactic Device request: 3556MB Available: 2243MB. Device memory is insufficient to use tactic.
|
166 |
+
[12/28/2023-08:24:28] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000004.
|
167 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
168 |
+
[12/28/2023-08:24:28] [W] [TRT] Tactic Device request: 3556MB Available: 2243MB. Device memory is insufficient to use tactic.
|
169 |
+
[12/28/2023-08:24:28] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3556 detected for tactic 0x000000000000003c.
|
170 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
171 |
+
[12/28/2023-08:24:28] [W] [TRT] Tactic Device request: 3556MB Available: 2243MB. Device memory is insufficient to use tactic.
|
172 |
+
[12/28/2023-08:24:28] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3556 detected for tactic 0x0000000000000074.
|
173 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
174 |
+
[12/28/2023-08:24:29] [W] [TRT] Tactic Device request: 3551MB Available: 2243MB. Device memory is insufficient to use tactic.
|
175 |
+
[12/28/2023-08:24:30] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3551 detected for tactic 0x0000000000000004.
|
176 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
177 |
+
[12/28/2023-08:24:30] [W] [TRT] Tactic Device request: 3551MB Available: 2243MB. Device memory is insufficient to use tactic.
|
178 |
+
[12/28/2023-08:24:30] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3551 detected for tactic 0x000000000000003c.
|
179 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
180 |
+
[12/28/2023-08:31:02] [W] [TRT] Tactic Device request: 2359MB Available: 2128MB. Device memory is insufficient to use tactic.
|
181 |
+
[12/28/2023-08:31:02] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000004.
|
182 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
183 |
+
[12/28/2023-08:31:02] [W] [TRT] Tactic Device request: 2359MB Available: 2128MB. Device memory is insufficient to use tactic.
|
184 |
+
[12/28/2023-08:31:02] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2359 detected for tactic 0x000000000000003c.
|
185 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
186 |
+
[12/28/2023-08:31:02] [W] [TRT] Tactic Device request: 2359MB Available: 2128MB. Device memory is insufficient to use tactic.
|
187 |
+
[12/28/2023-08:31:02] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000074.
|
188 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
189 |
+
[12/28/2023-08:31:03] [W] [TRT] Tactic Device request: 2355MB Available: 2129MB. Device memory is insufficient to use tactic.
|
190 |
+
[12/28/2023-08:31:03] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2355 detected for tactic 0x0000000000000004.
|
191 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
192 |
+
[12/28/2023-08:31:03] [W] [TRT] Tactic Device request: 2355MB Available: 2129MB. Device memory is insufficient to use tactic.
|
193 |
+
[12/28/2023-08:31:03] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2355 detected for tactic 0x000000000000003c.
|
194 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
195 |
+
[12/28/2023-08:31:07] [W] [TRT] Tactic Device request: 2362MB Available: 2128MB. Device memory is insufficient to use tactic.
|
196 |
+
[12/28/2023-08:31:07] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2362 detected for tactic 0x0000000000000004.
|
197 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
198 |
+
[12/28/2023-08:31:08] [W] [TRT] Tactic Device request: 2362MB Available: 2128MB. Device memory is insufficient to use tactic.
|
199 |
+
[12/28/2023-08:31:08] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2362 detected for tactic 0x000000000000003c.
|
200 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
201 |
+
[12/28/2023-08:31:08] [W] [TRT] Tactic Device request: 2362MB Available: 2128MB. Device memory is insufficient to use tactic.
|
202 |
+
[12/28/2023-08:31:08] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2362 detected for tactic 0x0000000000000074.
|
203 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
204 |
+
[12/28/2023-08:31:10] [W] [TRT] Tactic Device request: 2357MB Available: 2129MB. Device memory is insufficient to use tactic.
|
205 |
+
[12/28/2023-08:31:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2357 detected for tactic 0x0000000000000004.
|
206 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
207 |
+
[12/28/2023-08:31:11] [W] [TRT] Tactic Device request: 2357MB Available: 2129MB. Device memory is insufficient to use tactic.
|
208 |
+
[12/28/2023-08:31:11] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2357 detected for tactic 0x000000000000003c.
|
209 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
210 |
+
[12/28/2023-08:31:12] [W] [TRT] Tactic Device request: 2359MB Available: 2129MB. Device memory is insufficient to use tactic.
|
211 |
+
[12/28/2023-08:31:12] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000004.
|
212 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
213 |
+
[12/28/2023-08:31:13] [W] [TRT] Tactic Device request: 2359MB Available: 2128MB. Device memory is insufficient to use tactic.
|
214 |
+
[12/28/2023-08:31:13] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2359 detected for tactic 0x000000000000003c.
|
215 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
216 |
+
[12/28/2023-08:31:13] [W] [TRT] Tactic Device request: 2359MB Available: 2128MB. Device memory is insufficient to use tactic.
|
217 |
+
[12/28/2023-08:31:13] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2359 detected for tactic 0x0000000000000074.
|
218 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
219 |
+
[12/28/2023-08:31:15] [W] [TRT] Tactic Device request: 2356MB Available: 2128MB. Device memory is insufficient to use tactic.
|
220 |
+
[12/28/2023-08:31:16] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2356 detected for tactic 0x0000000000000004.
|
221 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
222 |
+
[12/28/2023-08:31:16] [W] [TRT] Tactic Device request: 2356MB Available: 2128MB. Device memory is insufficient to use tactic.
|
223 |
+
[12/28/2023-08:31:16] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2356 detected for tactic 0x000000000000003c.
|
224 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
225 |
+
[12/28/2023-08:36:53] [W] [TRT] Tactic Device request: 3575MB Available: 2474MB. Device memory is insufficient to use tactic.
|
226 |
+
[12/28/2023-08:36:53] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3575 detected for tactic 0x0000000000000004.
|
227 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
228 |
+
[12/28/2023-08:36:53] [W] [TRT] Tactic Device request: 3575MB Available: 2475MB. Device memory is insufficient to use tactic.
|
229 |
+
[12/28/2023-08:36:53] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 3575 detected for tactic 0x000000000000003c.
|
230 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
231 |
+
[12/28/2023-08:36:53] [W] [TRT] Tactic Device request: 3575MB Available: 2475MB. Device memory is insufficient to use tactic.
|
232 |
+
[12/28/2023-08:36:53] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 3575 detected for tactic 0x0000000000000074.
|
233 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
234 |
+
[12/28/2023-08:36:54] [W] [TRT] Tactic Device request: 3572MB Available: 2475MB. Device memory is insufficient to use tactic.
|
235 |
+
[12/28/2023-08:36:54] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 3572 detected for tactic 0x0000000000000004.
|
236 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
237 |
+
[12/28/2023-08:36:54] [W] [TRT] Tactic Device request: 3572MB Available: 2475MB. Device memory is insufficient to use tactic.
|
238 |
+
[12/28/2023-08:36:54] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 3572 detected for tactic 0x000000000000003c.
|
239 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
240 |
+
[12/28/2023-08:37:00] [W] [TRT] Tactic Device request: 2390MB Available: 2347MB. Device memory is insufficient to use tactic.
|
241 |
+
[12/28/2023-08:37:00] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000004.
|
242 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
243 |
+
[12/28/2023-08:37:00] [W] [TRT] Tactic Device request: 2390MB Available: 2269MB. Device memory is insufficient to use tactic.
|
244 |
+
[12/28/2023-08:37:00] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2390 detected for tactic 0x000000000000003c.
|
245 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
246 |
+
[12/28/2023-08:37:01] [W] [TRT] Tactic Device request: 2390MB Available: 2265MB. Device memory is insufficient to use tactic.
|
247 |
+
[12/28/2023-08:37:01] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2390 detected for tactic 0x0000000000000074.
|
248 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
249 |
+
[12/28/2023-08:37:04] [W] [TRT] Tactic Device request: 2387MB Available: 2263MB. Device memory is insufficient to use tactic.
|
250 |
+
[12/28/2023-08:37:04] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2387 detected for tactic 0x0000000000000004.
|
251 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
252 |
+
[12/28/2023-08:37:04] [W] [TRT] Tactic Device request: 2387MB Available: 2239MB. Device memory is insufficient to use tactic.
|
253 |
+
[12/28/2023-08:37:04] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2387 detected for tactic 0x000000000000003c.
|
254 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
255 |
+
[12/28/2023-08:37:06] [W] [TRT] Tactic Device request: 2388MB Available: 2234MB. Device memory is insufficient to use tactic.
|
256 |
+
[12/28/2023-08:37:06] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2388 detected for tactic 0x0000000000000004.
|
257 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
258 |
+
[12/28/2023-08:37:07] [W] [TRT] Tactic Device request: 2388MB Available: 2205MB. Device memory is insufficient to use tactic.
|
259 |
+
[12/28/2023-08:37:07] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2388 detected for tactic 0x000000000000003c.
|
260 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
261 |
+
[12/28/2023-08:37:07] [W] [TRT] Tactic Device request: 2388MB Available: 2203MB. Device memory is insufficient to use tactic.
|
262 |
+
[12/28/2023-08:37:07] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2388 detected for tactic 0x0000000000000074.
|
263 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
264 |
+
[12/28/2023-08:37:10] [W] [TRT] Tactic Device request: 2386MB Available: 2203MB. Device memory is insufficient to use tactic.
|
265 |
+
[12/28/2023-08:37:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2386 detected for tactic 0x0000000000000004.
|
266 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
267 |
+
[12/28/2023-08:37:10] [W] [TRT] Tactic Device request: 2386MB Available: 2176MB. Device memory is insufficient to use tactic.
|
268 |
+
[12/28/2023-08:37:10] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2386 detected for tactic 0x000000000000003c.
|
269 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
270 |
+
[12/28/2023-08:37:13] [W] [TRT] Tactic Device request: 4775MB Available: 2174MB. Device memory is insufficient to use tactic.
|
271 |
+
[12/28/2023-08:37:13] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4775 detected for tactic 0x0000000000000004.
|
272 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
273 |
+
[12/28/2023-08:37:13] [W] [TRT] Tactic Device request: 4775MB Available: 2034MB. Device memory is insufficient to use tactic.
|
274 |
+
[12/28/2023-08:37:13] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4775 detected for tactic 0x000000000000003c.
|
275 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
276 |
+
[12/28/2023-08:37:14] [W] [TRT] Tactic Device request: 4775MB Available: 2034MB. Device memory is insufficient to use tactic.
|
277 |
+
[12/28/2023-08:37:14] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4775 detected for tactic 0x0000000000000074.
|
278 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
279 |
+
[12/28/2023-08:37:19] [W] [TRT] Tactic Device request: 4772MB Available: 2034MB. Device memory is insufficient to use tactic.
|
280 |
+
[12/28/2023-08:37:19] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4772 detected for tactic 0x0000000000000004.
|
281 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
282 |
+
[12/28/2023-08:37:20] [W] [TRT] Tactic Device request: 4772MB Available: 2034MB. Device memory is insufficient to use tactic.
|
283 |
+
[12/28/2023-08:37:20] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4772 detected for tactic 0x000000000000003c.
|
284 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
285 |
+
[12/28/2023-08:37:24] [W] [TRT] Tactic Device request: 4774MB Available: 2033MB. Device memory is insufficient to use tactic.
|
286 |
+
[12/28/2023-08:37:24] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4774 detected for tactic 0x0000000000000004.
|
287 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
288 |
+
[12/28/2023-08:37:25] [W] [TRT] Tactic Device request: 4774MB Available: 2033MB. Device memory is insufficient to use tactic.
|
289 |
+
[12/28/2023-08:37:25] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 4774 detected for tactic 0x000000000000003c.
|
290 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
291 |
+
[12/28/2023-08:37:26] [W] [TRT] Tactic Device request: 4774MB Available: 2034MB. Device memory is insufficient to use tactic.
|
292 |
+
[12/28/2023-08:37:26] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 4774 detected for tactic 0x0000000000000074.
|
293 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
294 |
+
[12/28/2023-08:37:31] [W] [TRT] Tactic Device request: 4771MB Available: 2034MB. Device memory is insufficient to use tactic.
|
295 |
+
[12/28/2023-08:37:31] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 4771 detected for tactic 0x0000000000000004.
|
296 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
297 |
+
[12/28/2023-08:37:31] [W] [TRT] Tactic Device request: 4771MB Available: 2034MB. Device memory is insufficient to use tactic.
|
298 |
+
[12/28/2023-08:37:32] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 4771 detected for tactic 0x000000000000003c.
|
299 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
300 |
+
[12/28/2023-08:43:58] [W] [TRT] Tactic Device request: 2454MB Available: 1908MB. Device memory is insufficient to use tactic.
|
301 |
+
[12/28/2023-08:43:58] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2454 detected for tactic 0x0000000000000004.
|
302 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
303 |
+
[12/28/2023-08:43:58] [W] [TRT] Tactic Device request: 2454MB Available: 1908MB. Device memory is insufficient to use tactic.
|
304 |
+
[12/28/2023-08:43:58] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2454 detected for tactic 0x000000000000003c.
|
305 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
306 |
+
[12/28/2023-08:43:58] [W] [TRT] Tactic Device request: 2454MB Available: 1907MB. Device memory is insufficient to use tactic.
|
307 |
+
[12/28/2023-08:43:58] [W] [TRT] Skipping tactic 13 due to insufficient memory on requested size of 2454 detected for tactic 0x0000000000000074.
|
308 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
309 |
+
[12/28/2023-08:43:59] [W] [TRT] Tactic Device request: 2453MB Available: 1907MB. Device memory is insufficient to use tactic.
|
310 |
+
[12/28/2023-08:43:59] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2453 detected for tactic 0x0000000000000004.
|
311 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
312 |
+
[12/28/2023-08:43:59] [W] [TRT] Tactic Device request: 2453MB Available: 1906MB. Device memory is insufficient to use tactic.
|
313 |
+
[12/28/2023-08:43:59] [W] [TRT] Skipping tactic 7 due to insufficient memory on requested size of 2453 detected for tactic 0x000000000000003c.
|
314 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
315 |
+
[12/28/2023-08:44:01] [W] [TRT] Tactic Device request: 2463MB Available: 1901MB. Device memory is insufficient to use tactic.
|
316 |
+
[12/28/2023-08:44:01] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000004.
|
317 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
318 |
+
[12/28/2023-08:44:02] [W] [TRT] Tactic Device request: 2463MB Available: 1909MB. Device memory is insufficient to use tactic.
|
319 |
+
[12/28/2023-08:44:02] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2463 detected for tactic 0x000000000000003c.
|
320 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
321 |
+
[12/28/2023-08:44:03] [W] [TRT] Tactic Device request: 2463MB Available: 1910MB. Device memory is insufficient to use tactic.
|
322 |
+
[12/28/2023-08:44:03] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000074.
|
323 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
324 |
+
[12/28/2023-08:44:07] [W] [TRT] Tactic Device request: 2462MB Available: 1898MB. Device memory is insufficient to use tactic.
|
325 |
+
[12/28/2023-08:44:07] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2462 detected for tactic 0x0000000000000004.
|
326 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
327 |
+
[12/28/2023-08:44:07] [W] [TRT] Tactic Device request: 2462MB Available: 1898MB. Device memory is insufficient to use tactic.
|
328 |
+
[12/28/2023-08:44:07] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2462 detected for tactic 0x000000000000003c.
|
329 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
330 |
+
[12/28/2023-08:44:10] [W] [TRT] Tactic Device request: 2463MB Available: 1898MB. Device memory is insufficient to use tactic.
|
331 |
+
[12/28/2023-08:44:10] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000004.
|
332 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
333 |
+
[12/28/2023-08:44:11] [W] [TRT] Tactic Device request: 2463MB Available: 1898MB. Device memory is insufficient to use tactic.
|
334 |
+
[12/28/2023-08:44:11] [W] [TRT] Skipping tactic 9 due to insufficient memory on requested size of 2463 detected for tactic 0x000000000000003c.
|
335 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
336 |
+
[12/28/2023-08:44:12] [W] [TRT] Tactic Device request: 2463MB Available: 1898MB. Device memory is insufficient to use tactic.
|
337 |
+
[12/28/2023-08:44:12] [W] [TRT] Skipping tactic 15 due to insufficient memory on requested size of 2463 detected for tactic 0x0000000000000074.
|
338 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
339 |
+
[12/28/2023-08:44:16] [W] [TRT] Tactic Device request: 2462MB Available: 1899MB. Device memory is insufficient to use tactic.
|
340 |
+
[12/28/2023-08:44:16] [W] [TRT] Skipping tactic 3 due to insufficient memory on requested size of 2462 detected for tactic 0x0000000000000004.
|
341 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
342 |
+
[12/28/2023-08:44:17] [W] [TRT] Tactic Device request: 2462MB Available: 1898MB. Device memory is insufficient to use tactic.
|
343 |
+
[12/28/2023-08:44:17] [W] [TRT] Skipping tactic 8 due to insufficient memory on requested size of 2462 detected for tactic 0x000000000000003c.
|
344 |
+
Try decreasing the workspace size with IBuilderConfig::setMemoryPoolLimit().
|
345 |
+
[12/28/2023-08:45:16] [W] * Throughput may be bound by Enqueue Time rather than GPU Compute and the GPU may be under-utilized.
|
346 |
+
[12/28/2023-08:45:16] [W] If not already in use, --useCudaGraph (utilize CUDA graphs where possible) may increase the throughput.
|
347 |
+
[12/28/2023-08:45:16] [W] * GPU compute time is unstable, with coefficient of variance = 2.78032%.
|
348 |
+
[12/28/2023-08:45:16] [W] If not already in use, locking GPU clock frequency or adding --useSpinWait may improve the stability.
|
yolo_nas_pose_m_fp16.onnx.fp16.engine.log
ADDED
@@ -0,0 +1,309 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
&&&& RUNNING TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_m_fp16.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_m_fp16.onnx.fp16.engine
|
2 |
+
[12/28/2023-07:47:57] [I] === Model Options ===
|
3 |
+
[12/28/2023-07:47:57] [I] Format: ONNX
|
4 |
+
[12/28/2023-07:47:57] [I] Model: yolo_nas_pose_m_fp16.onnx
|
5 |
+
[12/28/2023-07:47:57] [I] Output:
|
6 |
+
[12/28/2023-07:47:57] [I] === Build Options ===
|
7 |
+
[12/28/2023-07:47:57] [I] Max batch: explicit batch
|
8 |
+
[12/28/2023-07:47:57] [I] Memory Pools: workspace: default, dlaSRAM: default, dlaLocalDRAM: default, dlaGlobalDRAM: default
|
9 |
+
[12/28/2023-07:47:57] [I] minTiming: 1
|
10 |
+
[12/28/2023-07:47:57] [I] avgTiming: 8
|
11 |
+
[12/28/2023-07:47:57] [I] Precision: FP32+FP16
|
12 |
+
[12/28/2023-07:47:57] [I] LayerPrecisions:
|
13 |
+
[12/28/2023-07:47:57] [I] Calibration:
|
14 |
+
[12/28/2023-07:47:57] [I] Refit: Disabled
|
15 |
+
[12/28/2023-07:47:57] [I] Sparsity: Disabled
|
16 |
+
[12/28/2023-07:47:57] [I] Safe mode: Disabled
|
17 |
+
[12/28/2023-07:47:57] [I] DirectIO mode: Disabled
|
18 |
+
[12/28/2023-07:47:57] [I] Restricted mode: Disabled
|
19 |
+
[12/28/2023-07:47:57] [I] Build only: Disabled
|
20 |
+
[12/28/2023-07:47:57] [I] Save engine: yolo_nas_pose_m_fp16.onnx.fp16.engine
|
21 |
+
[12/28/2023-07:47:57] [I] Load engine:
|
22 |
+
[12/28/2023-07:47:57] [I] Profiling verbosity: 0
|
23 |
+
[12/28/2023-07:47:57] [I] Tactic sources: Using default tactic sources
|
24 |
+
[12/28/2023-07:47:57] [I] timingCacheMode: local
|
25 |
+
[12/28/2023-07:47:57] [I] timingCacheFile:
|
26 |
+
[12/28/2023-07:47:57] [I] Heuristic: Disabled
|
27 |
+
[12/28/2023-07:47:57] [I] Preview Features: Use default preview flags.
|
28 |
+
[12/28/2023-07:47:57] [I] Input(s)s format: fp32:CHW
|
29 |
+
[12/28/2023-07:47:57] [I] Output(s)s format: fp32:CHW
|
30 |
+
[12/28/2023-07:47:57] [I] Input build shapes: model
|
31 |
+
[12/28/2023-07:47:57] [I] Input calibration shapes: model
|
32 |
+
[12/28/2023-07:47:57] [I] === System Options ===
|
33 |
+
[12/28/2023-07:47:57] [I] Device: 0
|
34 |
+
[12/28/2023-07:47:57] [I] DLACore:
|
35 |
+
[12/28/2023-07:47:57] [I] Plugins:
|
36 |
+
[12/28/2023-07:47:57] [I] === Inference Options ===
|
37 |
+
[12/28/2023-07:47:57] [I] Batch: Explicit
|
38 |
+
[12/28/2023-07:47:57] [I] Input inference shapes: model
|
39 |
+
[12/28/2023-07:47:57] [I] Iterations: 10
|
40 |
+
[12/28/2023-07:47:57] [I] Duration: 15s (+ 200ms warm up)
|
41 |
+
[12/28/2023-07:47:57] [I] Sleep time: 0ms
|
42 |
+
[12/28/2023-07:47:57] [I] Idle time: 0ms
|
43 |
+
[12/28/2023-07:47:57] [I] Streams: 1
|
44 |
+
[12/28/2023-07:47:57] [I] ExposeDMA: Disabled
|
45 |
+
[12/28/2023-07:47:57] [I] Data transfers: Enabled
|
46 |
+
[12/28/2023-07:47:57] [I] Spin-wait: Disabled
|
47 |
+
[12/28/2023-07:47:57] [I] Multithreading: Disabled
|
48 |
+
[12/28/2023-07:47:57] [I] CUDA Graph: Disabled
|
49 |
+
[12/28/2023-07:47:57] [I] Separate profiling: Disabled
|
50 |
+
[12/28/2023-07:47:57] [I] Time Deserialize: Disabled
|
51 |
+
[12/28/2023-07:47:57] [I] Time Refit: Disabled
|
52 |
+
[12/28/2023-07:47:57] [I] NVTX verbosity: 0
|
53 |
+
[12/28/2023-07:47:57] [I] Persistent Cache Ratio: 0
|
54 |
+
[12/28/2023-07:47:57] [I] Inputs:
|
55 |
+
[12/28/2023-07:47:57] [I] === Reporting Options ===
|
56 |
+
[12/28/2023-07:47:57] [I] Verbose: Disabled
|
57 |
+
[12/28/2023-07:47:57] [I] Averages: 100 inferences
|
58 |
+
[12/28/2023-07:47:57] [I] Percentiles: 90,95,99
|
59 |
+
[12/28/2023-07:47:57] [I] Dump refittable layers:Disabled
|
60 |
+
[12/28/2023-07:47:57] [I] Dump output: Disabled
|
61 |
+
[12/28/2023-07:47:57] [I] Profile: Disabled
|
62 |
+
[12/28/2023-07:47:57] [I] Export timing to JSON file:
|
63 |
+
[12/28/2023-07:47:57] [I] Export output to JSON file:
|
64 |
+
[12/28/2023-07:47:57] [I] Export profile to JSON file:
|
65 |
+
[12/28/2023-07:47:57] [I]
|
66 |
+
[12/28/2023-07:47:57] [I] === Device Information ===
|
67 |
+
[12/28/2023-07:47:57] [I] Selected Device: Orin
|
68 |
+
[12/28/2023-07:47:57] [I] Compute Capability: 8.7
|
69 |
+
[12/28/2023-07:47:57] [I] SMs: 8
|
70 |
+
[12/28/2023-07:47:57] [I] Compute Clock Rate: 0.624 GHz
|
71 |
+
[12/28/2023-07:47:57] [I] Device Global Memory: 7471 MiB
|
72 |
+
[12/28/2023-07:47:57] [I] Shared Memory per SM: 164 KiB
|
73 |
+
[12/28/2023-07:47:57] [I] Memory Bus Width: 128 bits (ECC disabled)
|
74 |
+
[12/28/2023-07:47:57] [I] Memory Clock Rate: 0.624 GHz
|
75 |
+
[12/28/2023-07:47:57] [I]
|
76 |
+
[12/28/2023-07:47:57] [I] TensorRT version: 8.5.2
|
77 |
+
[12/28/2023-07:47:58] [I] [TRT] [MemUsageChange] Init CUDA: CPU +220, GPU +0, now: CPU 249, GPU 3022 (MiB)
|
78 |
+
[12/28/2023-07:48:00] [I] [TRT] [MemUsageChange] Init builder kernel library: CPU +302, GPU +284, now: CPU 574, GPU 3325 (MiB)
|
79 |
+
[12/28/2023-07:48:00] [I] Start parsing network model
|
80 |
+
[12/28/2023-07:48:01] [I] [TRT] ----------------------------------------------------------------
|
81 |
+
[12/28/2023-07:48:01] [I] [TRT] Input filename: yolo_nas_pose_m_fp16.onnx
|
82 |
+
[12/28/2023-07:48:01] [I] [TRT] ONNX IR version: 0.0.8
|
83 |
+
[12/28/2023-07:48:01] [I] [TRT] Opset version: 17
|
84 |
+
[12/28/2023-07:48:01] [I] [TRT] Producer name: pytorch
|
85 |
+
[12/28/2023-07:48:01] [I] [TRT] Producer version: 2.1.2
|
86 |
+
[12/28/2023-07:48:01] [I] [TRT] Domain:
|
87 |
+
[12/28/2023-07:48:01] [I] [TRT] Model version: 0
|
88 |
+
[12/28/2023-07:48:01] [I] [TRT] Doc string:
|
89 |
+
[12/28/2023-07:48:01] [I] [TRT] ----------------------------------------------------------------
|
90 |
+
[12/28/2023-07:48:01] [I] Finish parsing network model
|
91 |
+
[12/28/2023-07:48:01] [I] [TRT] ---------- Layers Running on DLA ----------
|
92 |
+
[12/28/2023-07:48:01] [I] [TRT] ---------- Layers Running on GPU ----------
|
93 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation1]
|
94 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/pre_process/pre_process.0/Cast.../pre_process/pre_process.2/Mul]}
|
95 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 410) [Constant]
|
96 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 411) [Constant]
|
97 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONSTANT: (Unnamed Layer* 412) [Constant]
|
98 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stem/conv/rbr_reparam/Conv + /model/backbone/stem/conv/nonlinearity/Relu
|
99 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/downsample/rbr_reparam/Conv + /model/backbone/stage1/downsample/nonlinearity/Relu
|
100 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv2/conv/Conv + /model/backbone/stage1/blocks/conv2/act/Relu || /model/backbone/stage1/blocks/conv1/conv/Conv + /model/backbone/stage1/blocks/conv1/act/Relu
|
101 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
102 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
103 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 15) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add)
|
104 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
105 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
106 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 23) [Shuffle] + /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage1/blocks/bottlenecks/bottlenecks.1/Add)
|
107 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv1/act/Relu_output_0 copy
|
108 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
109 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage1/blocks/conv2/act/Relu_output_0 copy
|
110 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage1/blocks/conv3/conv/Conv + /model/backbone/stage1/blocks/conv3/act/Relu
|
111 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_skip2/conv/Conv + /model/neck/neck2/reduce_skip2/act/Relu
|
112 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/downsample/rbr_reparam/Conv + /model/backbone/stage2/downsample/nonlinearity/Relu
|
113 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/downsample/conv/Conv + /model/neck/neck2/downsample/act/Relu
|
114 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv2/conv/Conv + /model/backbone/stage2/blocks/conv2/act/Relu || /model/backbone/stage2/blocks/conv1/conv/Conv + /model/backbone/stage2/blocks/conv1/act/Relu
|
115 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
116 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
117 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 44) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add)
|
118 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
119 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
120 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 52) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add)
|
121 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
122 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
123 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 60) [Shuffle] + /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage2/blocks/bottlenecks/bottlenecks.2/Add)
|
124 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv1/act/Relu_output_0 copy
|
125 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
126 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
127 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage2/blocks/conv2/act/Relu_output_0 copy
|
128 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage2/blocks/conv3/conv/Conv + /model/backbone/stage2/blocks/conv3/act/Relu
|
129 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip2/conv/Conv + /model/neck/neck1/reduce_skip2/act/Relu || /model/neck/neck2/reduce_skip1/conv/Conv + /model/neck/neck2/reduce_skip1/act/Relu
|
130 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/downsample/rbr_reparam/Conv + /model/backbone/stage3/downsample/nonlinearity/Relu
|
131 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/downsample/conv/Conv + /model/neck/neck1/downsample/act/Relu
|
132 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv2/conv/Conv + /model/backbone/stage3/blocks/conv2/act/Relu || /model/backbone/stage3/blocks/conv1/conv/Conv + /model/backbone/stage3/blocks/conv1/act/Relu
|
133 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
134 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
135 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 83) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add)
|
136 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
137 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
138 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 91) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add)
|
139 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
140 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
141 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.2.alpha + (Unnamed Layer* 99) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add)
|
142 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv1/nonlinearity/Relu
|
143 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/cv2/nonlinearity/Relu
|
144 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.3.alpha + (Unnamed Layer* 107) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add)
|
145 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv1/nonlinearity/Relu
|
146 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/rbr_reparam/Conv + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/cv2/nonlinearity/Relu
|
147 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage3.blocks.bottlenecks.4.alpha + (Unnamed Layer* 115) [Shuffle] + /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Mul, /model/backbone/stage3/blocks/bottlenecks/bottlenecks.4/Add)
|
148 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv1/act/Relu_output_0 copy
|
149 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.0/Add_output_0 copy
|
150 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.1/Add_output_0 copy
|
151 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.2/Add_output_0 copy
|
152 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/bottlenecks/bottlenecks.3/Add_output_0 copy
|
153 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage3/blocks/conv2/act/Relu_output_0 copy
|
154 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage3/blocks/conv3/conv/Conv + /model/backbone/stage3/blocks/conv3/act/Relu
|
155 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_skip1/conv/Conv + /model/neck/neck1/reduce_skip1/act/Relu
|
156 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/downsample/rbr_reparam/Conv + /model/backbone/stage4/downsample/nonlinearity/Relu
|
157 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv2/conv/Conv + /model/backbone/stage4/blocks/conv2/act/Relu || /model/backbone/stage4/blocks/conv1/conv/Conv + /model/backbone/stage4/blocks/conv1/act/Relu
|
158 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
159 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
160 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 134) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.0/Add)
|
161 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
162 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
163 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.backbone.stage4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 142) [Shuffle] + /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Mul, /model/backbone/stage4/blocks/bottlenecks/bottlenecks.1/Add)
|
164 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/stage4/blocks/conv2/act/Relu_output_0 copy
|
165 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/stage4/blocks/conv3/conv/Conv + /model/backbone/stage4/blocks/conv3/act/Relu
|
166 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv1/conv/Conv + /model/backbone/context_module/cv1/act/Relu
|
167 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.2/MaxPool
|
168 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.1/MaxPool
|
169 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POOLING: /model/backbone/context_module/m.0/MaxPool
|
170 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/backbone/context_module/cv1/act/Relu_output_0 copy
|
171 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/backbone/context_module/cv2/conv/Conv + /model/backbone/context_module/cv2/act/Relu
|
172 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/conv/conv/Conv + /model/neck/neck1/conv/act/Relu
|
173 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck1/upsample/ConvTranspose
|
174 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/reduce_after_concat/conv/Conv + /model/neck/neck1/reduce_after_concat/act/Relu
|
175 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv2/conv/Conv + /model/neck/neck1/blocks/conv2/act/Relu || /model/neck/neck1/blocks/conv1/conv/Conv + /model/neck/neck1/blocks/conv1/act/Relu
|
176 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
177 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
178 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.0.alpha + (Unnamed Layer* 171) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.0/Add)
|
179 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
180 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
181 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck1.blocks.bottlenecks.1.alpha + (Unnamed Layer* 179) [Shuffle] + /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck1/blocks/bottlenecks/bottlenecks.1/Add)
|
182 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/neck/neck1/blocks/conv2/act/Relu_output_0 copy
|
183 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck1/blocks/conv3/conv/Conv + /model/neck/neck1/blocks/conv3/act/Relu
|
184 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/conv/conv/Conv + /model/neck/neck2/conv/act/Relu
|
185 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] DECONVOLUTION: /model/neck/neck2/upsample/ConvTranspose
|
186 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/reduce_skip1/act/Relu_output_0 copy
|
187 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/reduce_after_concat/conv/Conv + /model/neck/neck2/reduce_after_concat/act/Relu
|
188 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv2/conv/Conv + /model/neck/neck2/blocks/conv2/act/Relu || /model/neck/neck2/blocks/conv1/conv/Conv + /model/neck/neck2/blocks/conv1/act/Relu
|
189 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv1/nonlinearity/Relu
|
190 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/cv2/nonlinearity/Relu
|
191 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.0.alpha + (Unnamed Layer* 200) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.0/Add)
|
192 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv1/nonlinearity/Relu
|
193 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/cv2/nonlinearity/Relu
|
194 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.1.alpha + (Unnamed Layer* 208) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.1/Add)
|
195 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv1/nonlinearity/Relu
|
196 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/rbr_reparam/Conv + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/cv2/nonlinearity/Relu
|
197 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck2.blocks.bottlenecks.2.alpha + (Unnamed Layer* 216) [Shuffle] + /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck2/blocks/bottlenecks/bottlenecks.2/Add)
|
198 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/neck/neck2/blocks/conv2/act/Relu_output_0 copy
|
199 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck2/blocks/conv3/conv/Conv + /model/neck/neck2/blocks/conv3/act/Relu
|
200 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/bbox_stem/seq/conv/Conv + /model/heads/head1/bbox_stem/seq/act/Relu || /model/heads/head1/pose_stem/seq/conv/Conv + /model/heads/head1/pose_stem/seq/act/Relu
|
201 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/conv/conv/Conv + /model/neck/neck3/conv/act/Relu
|
202 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head1/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head1/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head1/cls_convs/cls_convs.0/seq/act/Relu
|
203 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.0/seq/act/Relu
|
204 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv2/conv/Conv + /model/neck/neck3/blocks/conv2/act/Relu || /model/neck/neck3/blocks/conv1/conv/Conv + /model/neck/neck3/blocks/conv1/act/Relu
|
205 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/cls_pred/Conv
|
206 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/reg_pred/Conv
|
207 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head1/pose_convs/pose_convs.1/seq/act/Relu
|
208 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
209 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape + /model/heads/Transpose
|
210 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head1/pose_pred/Conv
|
211 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
212 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax
|
213 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.0.alpha + (Unnamed Layer* 247) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.0/Add)
|
214 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv
|
215 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
216 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
217 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck3.blocks.bottlenecks.1.alpha + (Unnamed Layer* 270) [Shuffle] + /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck3/blocks/bottlenecks/bottlenecks.1/Add)
|
218 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/neck/neck3/blocks/conv2/act/Relu_output_0 copy
|
219 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck3/blocks/conv3/conv/Conv + /model/neck/neck3/blocks/conv3/act/Relu
|
220 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_stem/seq/conv/Conv + /model/heads/head2/pose_stem/seq/act/Relu || /model/heads/head2/bbox_stem/seq/conv/Conv + /model/heads/head2/bbox_stem/seq/act/Relu
|
221 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/conv/conv/Conv + /model/neck/neck4/conv/act/Relu
|
222 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head2/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head2/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head2/cls_convs/cls_convs.0/seq/act/Relu
|
223 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.0/seq/act/Relu
|
224 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv2/conv/Conv + /model/neck/neck4/blocks/conv2/act/Relu || /model/neck/neck4/blocks/conv1/conv/Conv + /model/neck/neck4/blocks/conv1/act/Relu
|
225 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/cls_pred/Conv
|
226 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/reg_pred/Conv
|
227 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head2/pose_convs/pose_convs.1/seq/act/Relu
|
228 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv1/act/Relu
|
229 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_4 + /model/heads/Transpose_3
|
230 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head2/pose_pred/Conv
|
231 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/cv2/act/Relu
|
232 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_1
|
233 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.0.alpha + (Unnamed Layer* 301) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.0/Add)
|
234 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_1
|
235 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv1/act/Relu
|
236 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/cv2/act/Relu
|
237 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.1.alpha + (Unnamed Layer* 324) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.1/Add)
|
238 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv1/act/Relu
|
239 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/conv/Conv + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/cv2/act/Relu
|
240 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] POINTWISE: PWN(model.neck.neck4.blocks.bottlenecks.2.alpha + (Unnamed Layer* 332) [Shuffle] + /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Mul, /model/neck/neck4/blocks/bottlenecks/bottlenecks.2/Add)
|
241 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] COPY: /model/neck/neck4/blocks/conv2/act/Relu_output_0 copy
|
242 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/neck/neck4/blocks/conv3/conv/Conv + /model/neck/neck4/blocks/conv3/act/Relu
|
243 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/bbox_stem/seq/conv/Conv + /model/heads/head3/bbox_stem/seq/act/Relu || /model/heads/head3/pose_stem/seq/conv/Conv + /model/heads/head3/pose_stem/seq/act/Relu
|
244 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_convs/reg_convs.0/seq/conv/Conv + /model/heads/head3/reg_convs/reg_convs.0/seq/act/Relu || /model/heads/head3/cls_convs/cls_convs.0/seq/conv/Conv + /model/heads/head3/cls_convs/cls_convs.0/seq/act/Relu
|
245 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.0/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.0/seq/act/Relu
|
246 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/cls_pred/Conv
|
247 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/reg_pred/Conv
|
248 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.1/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.1/seq/act/Relu
|
249 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] SHUFFLE: /model/heads/Reshape_8 + /model/heads/Transpose_6
|
250 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_convs/pose_convs.2/seq/conv/Conv + /model/heads/head3/pose_convs/pose_convs.2/seq/act/Relu
|
251 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] SOFTMAX: /model/heads/Softmax_2
|
252 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/head3/pose_pred/Conv
|
253 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] CONVOLUTION: /model/heads/Conv_2
|
254 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice_1...cast_boxes_to_fp32]}
|
255 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] NMS: batched_nms_26
|
256 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] DEVICE_TO_SHAPE_HOST: (Unnamed Layer* 414) [NMS]_1_output[DevicetoShapeHostCopy]
|
257 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation2]
|
258 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] MYELIN: {ForeignNode[/model/heads/head1/Slice...graph2_/Concat_5]}
|
259 |
+
[12/28/2023-07:48:01] [I] [TRT] [GpuLayer] TRAIN_STATION: [trainStation3]
|
260 |
+
[12/28/2023-07:48:12] [I] [TRT] [MemUsageChange] Init cuBLAS/cuBLASLt: CPU +534, GPU +430, now: CPU 1195, GPU 3835 (MiB)
|
261 |
+
[12/28/2023-07:48:14] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +83, GPU +64, now: CPU 1278, GPU 3899 (MiB)
|
262 |
+
[12/28/2023-07:48:14] [I] [TRT] Local timing cache in use. Profiling results in this builder pass will not be stored.
|
263 |
+
[12/28/2023-08:44:43] [I] [TRT] Total Activation Memory: 8017417728
|
264 |
+
[12/28/2023-08:44:44] [I] [TRT] Detected 1 inputs and 1 output network tensors.
|
265 |
+
[12/28/2023-08:44:54] [I] [TRT] Total Host Persistent Memory: 330944
|
266 |
+
[12/28/2023-08:44:54] [I] [TRT] Total Device Persistent Memory: 115712
|
267 |
+
[12/28/2023-08:44:54] [I] [TRT] Total Scratch Memory: 134217728
|
268 |
+
[12/28/2023-08:44:54] [I] [TRT] [MemUsageStats] Peak memory usage of TRT CPU/GPU memory allocators: CPU 40 MiB, GPU 2398 MiB
|
269 |
+
[12/28/2023-08:44:54] [I] [TRT] [BlockAssignment] Started assigning block shifts. This will take 181 steps to complete.
|
270 |
+
[12/28/2023-08:44:54] [I] [TRT] [BlockAssignment] Algorithm ShiftNTopDown took 85.1996ms to assign 14 blocks to 181 nodes requiring 155574784 bytes.
|
271 |
+
[12/28/2023-08:44:54] [I] [TRT] Total Activation Memory: 155574784
|
272 |
+
[12/28/2023-08:44:59] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1625, GPU 5501 (MiB)
|
273 |
+
[12/28/2023-08:44:59] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in building engine: CPU +10, GPU +128, now: CPU 10, GPU 128 (MiB)
|
274 |
+
[12/28/2023-08:45:00] [I] Engine built in 3422.28 sec.
|
275 |
+
[12/28/2023-08:45:00] [I] [TRT] Loaded engine size: 76 MiB
|
276 |
+
[12/28/2023-08:45:00] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1317, GPU 5134 (MiB)
|
277 |
+
[12/28/2023-08:45:00] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in engine deserialization: CPU +0, GPU +74, now: CPU 0, GPU 74 (MiB)
|
278 |
+
[12/28/2023-08:45:00] [I] Engine deserialized in 0.264761 sec.
|
279 |
+
[12/28/2023-08:45:00] [I] [TRT] [MemUsageChange] Init cuDNN: CPU +0, GPU +0, now: CPU 1317, GPU 5134 (MiB)
|
280 |
+
[12/28/2023-08:45:01] [I] [TRT] [MemUsageChange] TensorRT-managed allocation in IExecutionContext creation: CPU +0, GPU +148, now: CPU 0, GPU 222 (MiB)
|
281 |
+
[12/28/2023-08:45:01] [I] Setting persistentCacheLimit to 0 bytes.
|
282 |
+
[12/28/2023-08:45:01] [I] Using random values for input onnx::Cast_0
|
283 |
+
[12/28/2023-08:45:01] [I] Created input binding for onnx::Cast_0 with dimensions 1x3x640x640
|
284 |
+
[12/28/2023-08:45:01] [I] Using random values for output graph2_flat_predictions
|
285 |
+
[12/28/2023-08:45:01] [I] Created output binding for graph2_flat_predictions with dimensions -1x57
|
286 |
+
[12/28/2023-08:45:01] [I] Starting inference
|
287 |
+
[12/28/2023-08:45:16] [I] Warmup completed 2 queries over 200 ms
|
288 |
+
[12/28/2023-08:45:16] [I] Timing trace has 569 queries over 15.0311 s
|
289 |
+
[12/28/2023-08:45:16] [I]
|
290 |
+
[12/28/2023-08:45:16] [I] === Trace details ===
|
291 |
+
[12/28/2023-08:45:16] [I] Trace averages of 100 runs:
|
292 |
+
[12/28/2023-08:45:16] [I] Average on 100 runs - GPU latency: 26.4061 ms - Host latency: 26.5181 ms (enqueue 26.4696 ms)
|
293 |
+
[12/28/2023-08:45:16] [I] Average on 100 runs - GPU latency: 26.2062 ms - Host latency: 26.3239 ms (enqueue 26.2673 ms)
|
294 |
+
[12/28/2023-08:45:16] [I] Average on 100 runs - GPU latency: 26.2202 ms - Host latency: 26.3345 ms (enqueue 26.2829 ms)
|
295 |
+
[12/28/2023-08:45:16] [I] Average on 100 runs - GPU latency: 26.1667 ms - Host latency: 26.2764 ms (enqueue 26.2337 ms)
|
296 |
+
[12/28/2023-08:45:16] [I] Average on 100 runs - GPU latency: 26.4629 ms - Host latency: 26.5727 ms (enqueue 26.5274 ms)
|
297 |
+
[12/28/2023-08:45:16] [I]
|
298 |
+
[12/28/2023-08:45:16] [I] === Performance summary ===
|
299 |
+
[12/28/2023-08:45:16] [I] Throughput: 37.8547 qps
|
300 |
+
[12/28/2023-08:45:16] [I] Latency: min = 25.1152 ms, max = 32.1547 ms, mean = 26.393 ms, median = 26.3442 ms, percentile(90%) = 27.0601 ms, percentile(95%) = 27.4189 ms, percentile(99%) = 29.4863 ms
|
301 |
+
[12/28/2023-08:45:16] [I] Enqueue Time: min = 25.0762 ms, max = 32.1133 ms, mean = 26.3436 ms, median = 26.2896 ms, percentile(90%) = 26.9199 ms, percentile(95%) = 27.0813 ms, percentile(99%) = 29.4521 ms
|
302 |
+
[12/28/2023-08:45:16] [I] H2D Latency: min = 0.0800781 ms, max = 0.117188 ms, mean = 0.0960489 ms, median = 0.097168 ms, percentile(90%) = 0.0996094 ms, percentile(95%) = 0.100098 ms, percentile(99%) = 0.101318 ms
|
303 |
+
[12/28/2023-08:45:16] [I] GPU Compute Time: min = 25.0037 ms, max = 32.0377 ms, mean = 26.281 ms, median = 26.2241 ms, percentile(90%) = 26.9429 ms, percentile(95%) = 27.3164 ms, percentile(99%) = 29.3721 ms
|
304 |
+
[12/28/2023-08:45:16] [I] D2H Latency: min = 0.00292969 ms, max = 0.0490723 ms, mean = 0.0159815 ms, median = 0.0146484 ms, percentile(90%) = 0.0253906 ms, percentile(95%) = 0.0271912 ms, percentile(99%) = 0.0324707 ms
|
305 |
+
[12/28/2023-08:45:16] [I] Total Host Walltime: 15.0311 s
|
306 |
+
[12/28/2023-08:45:16] [I] Total GPU Compute Time: 14.9539 s
|
307 |
+
[12/28/2023-08:45:16] [I] Explanations of the performance metrics are printed in the verbose logs.
|
308 |
+
[12/28/2023-08:45:16] [I]
|
309 |
+
&&&& PASSED TensorRT.trtexec [TensorRT v8502] # /usr/src/tensorrt/bin/trtexec --onnx=yolo_nas_pose_m_fp16.onnx --fp16 --avgRuns=100 --duration=15 --saveEngine=yolo_nas_pose_m_fp16.onnx.fp16.engine
|
yolo_nas_pose_m_fp16.onnx.int8.engine.err
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[12/28/2023-10:38:24] [W] [TRT] onnx2trt_utils.cpp:375: Your ONNX model has been generated with INT64 weights, while TensorRT does not natively support INT64. Attempting to cast down to INT32.
|
2 |
+
[12/28/2023-10:38:24] [W] [TRT] onnx2trt_utils.cpp:403: One or more weights outside the range of INT32 was clamped
|
3 |
+
[12/28/2023-10:38:24] [E] Error[4]: [network.cpp::validate::2925] Error Code 4: Internal Error (fp16 precision has been set for a layer or layer output, but fp16 is not configured in the builder)
|
4 |
+
[12/28/2023-10:38:24] [E] Error[2]: [builder.cpp::buildSerializedNetwork::751] Error Code 2: Internal Error (Assertion engine != nullptr failed. )
|
5 |
+
[12/28/2023-10:38:24] [E] Engine could not be created from network
|
6 |
+
[12/28/2023-10:38:24] [E] Building engine failed
|
7 |
+
[12/28/2023-10:38:24] [E] Failed to create engine from model or file.
|
8 |
+
[12/28/2023-10:38:24] [E] Engine set up failed
|