From 972323f1b60e7532e0487f40012116acecaa1910 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=EC=B5=9C=EC=B0=BD=EC=9C=A4?= <45411281+cyun9601@users.noreply.github.com> Date: Fri, 25 Jul 2025 10:22:03 +0900 Subject: [PATCH 1/4] Fix an error while following tutorial 1 When following the tutorial from the link below: https://docs.nvidia.com/deeplearning/triton-inference-server/user-guide/docs/tutorials/Conceptual_Guide/Part_1-model_deployment/README.html#launching-the-server an error occurs in the config.pbtxt for text_recognition: """ failed to load 'text_recognition' version 1: Invalid argument: unexpected inference output '308', allowed outputs are: 307 """ Update config.pbtxt --- .../model_repository/text_recognition/config.pbtxt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Conceptual_Guide/Part_1-model_deployment/model_repository/text_recognition/config.pbtxt b/Conceptual_Guide/Part_1-model_deployment/model_repository/text_recognition/config.pbtxt index 20671fa1..739c5af8 100644 --- a/Conceptual_Guide/Part_1-model_deployment/model_repository/text_recognition/config.pbtxt +++ b/Conceptual_Guide/Part_1-model_deployment/model_repository/text_recognition/config.pbtxt @@ -36,7 +36,7 @@ input [ ] output [ { - name: "308" + name: "307" data_type: TYPE_FP32 dims: [ 1, 26, 37 ] } From 84daa0ba9514a27a1d1f5ab3092daab8b00bfdb5 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=EC=B5=9C=EC=B0=BD=EC=9C=A4?= <45411281+cyun9601@users.noreply.github.com> Date: Fri, 25 Jul 2025 10:43:46 +0900 Subject: [PATCH 2/4] Update client.py --- Conceptual_Guide/Part_1-model_deployment/client.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Conceptual_Guide/Part_1-model_deployment/client.py b/Conceptual_Guide/Part_1-model_deployment/client.py index 82e8f0a0..b32e9d84 100644 --- a/Conceptual_Guide/Part_1-model_deployment/client.py +++ b/Conceptual_Guide/Part_1-model_deployment/client.py @@ -206,6 +206,6 @@ def recognition_postprocessing(scores: np.ndarray) -> str: ) # 
Process response from recognition model - final_text = recognition_postprocessing(recognition_response.as_numpy("308")) + final_text = recognition_postprocessing(recognition_response.as_numpy("307")) print(final_text) From 2150d06845a72647b91061227bf94f4e30b4a021 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=EC=B5=9C=EC=B0=BD=EC=9C=A4?= <45411281+cyun9601@users.noreply.github.com> Date: Fri, 25 Jul 2025 14:46:52 +0900 Subject: [PATCH 3/4] Update README.md --- .../Part_2-improving_resource_utilization/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Conceptual_Guide/Part_2-improving_resource_utilization/README.md b/Conceptual_Guide/Part_2-improving_resource_utilization/README.md index 8bfe5b7a..0e2197d3 100644 --- a/Conceptual_Guide/Part_2-improving_resource_utilization/README.md +++ b/Conceptual_Guide/Part_2-improving_resource_utilization/README.md @@ -110,7 +110,7 @@ model.load_state_dict(state) # Create ONNX file by tracing model trace_input = torch.randn(1, 1, 32, 100) -torch.onnx.export(model, trace_input, "str.onnx", verbose=True, dynamic_axes={'input.1':[0],'308':[0]}) +torch.onnx.export(model, trace_input, "str.onnx", verbose=True, dynamic_axes={'input.1':[0],'307':[0]}) ``` ### Launching the server From 74b28ee6e83d35f5e87c92d50cb04b10a41241ff Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=EC=B5=9C=EC=B0=BD=EC=9C=A4?= <45411281+cyun9601@users.noreply.github.com> Date: Fri, 25 Jul 2025 14:47:17 +0900 Subject: [PATCH 4/4] Update config.pbtxt --- .../model_repository/text_recognition/config.pbtxt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Conceptual_Guide/Part_2-improving_resource_utilization/model_repository/text_recognition/config.pbtxt b/Conceptual_Guide/Part_2-improving_resource_utilization/model_repository/text_recognition/config.pbtxt index a19bd2c5..2f627c8e 100644 --- a/Conceptual_Guide/Part_2-improving_resource_utilization/model_repository/text_recognition/config.pbtxt +++ 
b/Conceptual_Guide/Part_2-improving_resource_utilization/model_repository/text_recognition/config.pbtxt @@ -36,7 +36,7 @@ input [ ] output [ { - name: "308" + name: "307" data_type: TYPE_FP32 dims: [ 26, 37 ] }