Index _ | A | B | C | D | F | G | I | K | L | M | N | P | R | S | T | U _ __call__() (tritonclient.grpc.InferenceServerClientPlugin method) (tritonclient.http.InferenceServerClientPlugin method) _abc_impl (tritonclient.grpc.auth.BasicAuth attribute) (tritonclient.grpc.InferenceServerClientPlugin attribute) (tritonclient.http.auth.BasicAuth attribute) (tritonclient.http.InferenceServerClientPlugin attribute) _fix_header() (tritonclient.http.aio.InferenceServerClient method) _get() (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) _get_binary_data() (tritonclient.http.InferInput method) _get_content() (tritonclient.grpc.InferInput method) _get_error() (in module tritonclient.http.aio) _get_metadata() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) _get_or_create_global_cuda_stream() (in module tritonclient.utils.cuda_shared_memory) _get_tensor() (tritonclient.grpc.InferInput method) (tritonclient.grpc.InferRequestedOutput method) (tritonclient.http.InferInput method) (tritonclient.http.InferRequestedOutput method) _is_device_supported() (in module tritonclient.utils.cuda_shared_memory) _post() (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) _raise_if_error() (in module tritonclient.http.aio) _return_response() (tritonclient.grpc.aio.InferenceServerClient method) _support_uva() (in module tritonclient.utils.cuda_shared_memory) _validate_headers() (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) A allocated_shared_memory_regions() (in module tritonclient.utils.cuda_shared_memory) as_numpy() (tritonclient.grpc.InferResult method) (tritonclient.http.InferResult method) as_shared_memory_tensor() (in module tritonclient.utils.cuda_shared_memory) async_infer() (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) async_stream_infer() (tritonclient.grpc.InferenceServerClient method) B BasicAuth (class in tritonclient.grpc.auth) (class in tritonclient.http.auth) C close() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) create_shared_memory_region() (in module tritonclient.utils.cuda_shared_memory) (in module tritonclient.utils.shared_memory) D datatype() (tritonclient.grpc.InferInput method) (tritonclient.http.InferInput method) debug_details() (tritonclient.grpc.InferenceServerException method) (tritonclient.http.InferenceServerException method) (tritonclient.utils.InferenceServerException method) deserialize_bf16_tensor() (in module tritonclient.utils) deserialize_bytes_tensor() (in module tritonclient.utils) destroy_shared_memory_region() (in module tritonclient.utils.cuda_shared_memory) (in module tritonclient.utils.shared_memory) F from_response_body() (tritonclient.http.InferResult class method) G generate_request_body() (tritonclient.http.aio.InferenceServerClient static method) (tritonclient.http.InferenceServerClient static method) get_contents_as_numpy() (in module tritonclient.utils.cuda_shared_memory) (in module tritonclient.utils.shared_memory) get_cuda_shared_memory_status() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_inference_statistics() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_log_settings() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_model_config() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_model_metadata() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_model_repository_index() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_output() (tritonclient.grpc.InferResult method) (tritonclient.http.InferResult method) get_raw_handle() (in module tritonclient.utils.cuda_shared_memory) get_response() (tritonclient.grpc.InferResult method) (tritonclient.http.InferResult method) get_result() (tritonclient.http.InferAsyncRequest method) get_server_metadata() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_system_shared_memory_status() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) get_trace_settings() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) I infer() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) InferAsyncRequest (class in tritonclient.http) InferenceServerClient (class in tritonclient.grpc) (class in tritonclient.grpc.aio) (class in tritonclient.http) (class in tritonclient.http.aio) InferenceServerClientPlugin (class in tritonclient.grpc) (class in tritonclient.http) InferenceServerException, [1], [2] InferInput (class in tritonclient.grpc) (class in tritonclient.http) InferRequestedOutput (class in tritonclient.grpc) (class in tritonclient.http) InferResult (class in tritonclient.grpc) (class in tritonclient.http) is_model_ready() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) is_server_live() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) is_server_ready() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) K KeepAliveOptions (class in tritonclient.grpc) L load_model() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) M mapped_shared_memory_regions() (in module tritonclient.utils.shared_memory) message() (tritonclient.grpc.InferenceServerException method) (tritonclient.http.InferenceServerException method) (tritonclient.utils.InferenceServerException method) module tritonclient tritonclient.grpc tritonclient.grpc.aio tritonclient.grpc.aio.auth tritonclient.grpc.auth tritonclient.http tritonclient.http.aio tritonclient.http.aio.auth tritonclient.http.auth tritonclient.utils tritonclient.utils.cuda_shared_memory tritonclient.utils.shared_memory N name() (tritonclient.grpc.InferInput method) (tritonclient.grpc.InferRequestedOutput method) (tritonclient.http.InferInput method) (tritonclient.http.InferRequestedOutput method) np_to_triton_dtype() (in module tritonclient.utils) P parse_response_body() (tritonclient.http.aio.InferenceServerClient static method) (tritonclient.http.InferenceServerClient static method) R raise_error() (in module tritonclient.utils) register_cuda_shared_memory() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) register_system_shared_memory() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) Request (class in tritonclient.grpc) (class in tritonclient.http) S serialize_bf16_tensor() (in module tritonclient.utils) serialize_byte_tensor() (in module tritonclient.utils) serialized_byte_size() (in module tritonclient.utils) set_data_from_numpy() (tritonclient.grpc.InferInput method) (tritonclient.http.InferInput method) set_shape() (tritonclient.grpc.InferInput method) (tritonclient.http.InferInput method) set_shared_memory() (tritonclient.grpc.InferInput method) (tritonclient.grpc.InferRequestedOutput method) (tritonclient.http.InferInput method) (tritonclient.http.InferRequestedOutput method) set_shared_memory_region() (in module tritonclient.utils.cuda_shared_memory) (in module tritonclient.utils.shared_memory) set_shared_memory_region_from_dlpack() (in module tritonclient.utils.cuda_shared_memory) shape() (tritonclient.grpc.InferInput method) (tritonclient.http.InferInput method) SharedMemoryException SharedMemoryRegion (class in tritonclient.utils.shared_memory) start_stream() (tritonclient.grpc.InferenceServerClient method) status() (tritonclient.grpc.InferenceServerException method) (tritonclient.http.InferenceServerException method) (tritonclient.utils.InferenceServerException method) stop_stream() (tritonclient.grpc.InferenceServerClient method) stream_infer() (tritonclient.grpc.aio.InferenceServerClient method) T triton_to_np_dtype() (in module tritonclient.utils) tritonclient module tritonclient.grpc module tritonclient.grpc.aio module tritonclient.grpc.aio.auth module tritonclient.grpc.auth module tritonclient.http module tritonclient.http.aio module tritonclient.http.aio.auth module tritonclient.http.auth module tritonclient.utils module tritonclient.utils.cuda_shared_memory module tritonclient.utils.shared_memory module U unload_model() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) unregister_cuda_shared_memory() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) unregister_system_shared_memory() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) unset_shared_memory() (tritonclient.grpc.InferRequestedOutput method) (tritonclient.http.InferRequestedOutput method) update_log_settings() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method) update_trace_settings() (tritonclient.grpc.aio.InferenceServerClient method) (tritonclient.grpc.InferenceServerClient method) (tritonclient.http.aio.InferenceServerClient method) (tritonclient.http.InferenceServerClient method)