refactor: Refactor string input check #101

Merged (6 commits, Jul 31, 2024)
20 changes: 20 additions & 0 deletions include/triton/backend/backend_common.h
@@ -28,6 +28,7 @@
#include <chrono>
#include <condition_variable>
#include <deque>
#include <functional>
#include <iostream>
#include <mutex>
#include <set>
@@ -671,4 +672,23 @@ TRITONSERVER_Error* BufferAsTypedString(
/// \return a formatted string for logging the request ID.
std::string GetRequestId(TRITONBACKEND_Request* request);

/// Validate that a contiguous string buffer is in the expected format
/// <int32_len><bytes>...<int32_len><bytes>.
/// @param buffer The pointer to the contiguous string buffer.
/// @param buffer_byte_size The size of the buffer in bytes.
/// @param expected_element_cnt The number of expected string elements.
/// @param input_name The name of the input buffer.
/// @param element_idx Returns the number of validated strings.
/// @param set_string_tensor_cb Callback function that sets the string input
/// tensor, depending on the backend platform.
/// @param onnx_backend Whether the backend platform is ONNX Runtime.
/// @return a TRITONSERVER_Error indicating success or failure.
TRITONSERVER_Error* ValidateStringBuffer(
    const char* buffer, size_t buffer_byte_size,
    const size_t expected_element_cnt, const char* input_name,
    size_t* element_idx,
    const std::function<void(size_t, const char*, const uint32_t)>&
        set_string_tensor_cb,
    bool onnx_backend = false);

}} // namespace triton::backend
70 changes: 70 additions & 0 deletions src/backend_common.cc
@@ -1372,4 +1372,74 @@ GetRequestId(TRITONBACKEND_Request* request)
return std::string("[request id: ") + request_id + "] ";
}

TRITONSERVER_Error*
ValidateStringBuffer(
    const char* buffer, size_t buffer_byte_size,
    const size_t expected_element_cnt, const char* input_name,
    size_t* element_idx,
    const std::function<void(size_t, const char*, const uint32_t)>&
        set_string_tensor_cb,
    bool onnx_backend)
{
  *element_idx = 0;
  size_t remaining_bytes = buffer_byte_size;

  // Each string in 'buffer' is a 4-byte length followed by the string itself
  // with no null-terminator.
  while (remaining_bytes >= sizeof(uint32_t)) {
    if (*element_idx >= expected_element_cnt) {
      return TRITONSERVER_ErrorNew(
          TRITONSERVER_ERROR_INVALID_ARG,
          std::string(
              "unexpected number of string elements " +
              std::to_string(*element_idx + 1) + " for inference input '" +
              input_name + "', expecting " +
              std::to_string(expected_element_cnt))
              .c_str());
    }

    const uint32_t len = *(reinterpret_cast<const uint32_t*>(buffer));
    remaining_bytes -= sizeof(uint32_t);
    // Special handling for the ONNX Runtime backend: zero the first byte of
    // the length field (already read into 'len') so that any string data
    // immediately preceding it becomes a valid null-terminated C string.
    if (onnx_backend) {
      *const_cast<char*>(buffer) = 0;
    }
    buffer += sizeof(uint32_t);

    if (remaining_bytes < len) {
      return TRITONSERVER_ErrorNew(
          TRITONSERVER_ERROR_INVALID_ARG,
          std::string(
              "incomplete string data for inference input '" +
              std::string(input_name) + "', expecting string of length " +
              std::to_string(len) + " but only " +
              std::to_string(remaining_bytes) + " bytes available")
              .c_str());
    }

    set_string_tensor_cb(*element_idx, buffer, len);
    buffer += len;
    remaining_bytes -= len;
    (*element_idx)++;
  }

  // Special handling for the ONNX Runtime backend: null-terminate the final
  // string if trailing bytes remain.
  if (onnx_backend && remaining_bytes > 0) {
    *const_cast<char*>(buffer) = 0;
  }

  if (*element_idx != expected_element_cnt) {
Comment from the PR author:
The condition check here differs slightly from the originals in tensorflow.cc and libtorch.cc: the `(*response != nullptr)` guard is removed.

I don't think we want to skip sending this error, or skip `FillStringTensor`, if `RESPOND_AND_SET_NULL_IF_ERROR` is called before `SetStringInputTensor` in tensorflow.cc and libtorch.cc. I believe the guard was a mistake, because the other string-format checks before this line do not require `if (*response != nullptr)` in order to send the error or call `FillStringTensor`. Open to discussion.

// Code from tensorflow.cc and libtorch.cc
if ((*response != nullptr) && (element_idx != request_element_cnt)) {
  RESPOND_AND_SET_NULL_IF_ERROR(
      response, TRITONSERVER_ErrorNew(
                    TRITONSERVER_ERROR_INTERNAL,
                    std::string(
                        "expected " + std::to_string(request_element_cnt) +
                        " strings for inference input '" + name + "', got " +
                        std::to_string(element_idx))
                        .c_str()));
  FillStringTensor(
      tensor, tensor_offset + element_idx, request_element_cnt - element_idx);
}

    return TRITONSERVER_ErrorNew(
        TRITONSERVER_ERROR_INTERNAL,
        std::string(
            "expected " + std::to_string(expected_element_cnt) +
            " strings for inference input '" + input_name + "', got " +
            std::to_string(*element_idx))
            .c_str());
  }
  return nullptr;
}

}} // namespace triton::backend