# -*- coding:utf-8 -*-
# @FileName :OrtInferSession.py
# @Time :2023/4/13 15:13
# @Author :lovemefan
# @Email :[email protected]
import warnings
from pathlib import Path
from typing import List

import numpy as np
from onnxruntime import (GraphOptimizationLevel, InferenceSession,
                         SessionOptions, get_available_providers, get_device)

from paraformer.runtime.python.utils.singleton import singleton


class ONNXRuntimeError(Exception):
    pass


@singleton
class PuncOrtInferRuntimeSession:
    """Singleton ONNX Runtime inference session for the punctuation model."""

    def __init__(self, model_file, device_id=-1, intra_op_num_threads=4):
device_id = str(device_id)
sess_opt = SessionOptions()
sess_opt.intra_op_num_threads = intra_op_num_threads
sess_opt.log_severity_level = 4
sess_opt.enable_cpu_mem_arena = False
sess_opt.graph_optimization_level = GraphOptimizationLevel.ORT_ENABLE_ALL
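
        # Use the CUDA execution provider when a non-negative device id is
        # requested, the build reports a GPU device, and CUDAExecutionProvider
        # is available; the CPU provider is always appended as a fallback.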
cuda_ep = "CUDAExecutionProvider"
cuda_provider_options = {
"device_id": device_id,
"arena_extend_strategy": "kNextPowerOfTwo",
"cudnn_conv_algo_search": "EXHAUSTIVE",
"do_copy_in_default_stream": "true",
}
cpu_ep = "CPUExecutionProvider"
cpu_provider_options = {
"arena_extend_strategy": "kSameAsRequested",
}
EP_list = []
if (
device_id != "-1"
and get_device() == "GPU"
and cuda_ep in get_available_providers()
):
EP_list = [(cuda_ep, cuda_provider_options)]
EP_list.append((cpu_ep, cpu_provider_options))
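
        # A list of model files is treated as a split model: the parts are
        # concatenated in sorted order into a single in-memory ONNX blob.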
if isinstance(model_file, list):
merged_model_file = b""
for file in sorted(model_file):
with open(file, "rb") as onnx_file:
merged_model_file += onnx_file.read()
model_file = merged_model_file
else:
self._verify_model(model_file)
self.session = InferenceSession(
model_file, sess_options=sess_opt, providers=EP_list
)
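
        # Warn when CUDA was requested but onnxruntime silently fell back to
        # the CPU provider (typically a CUDA/cuDNN version mismatch).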
        if device_id != "-1" and cuda_ep not in self.session.get_providers():
            warnings.warn(
                f"{cuda_ep} is not available in the current environment; "
                f"inference will fall back to {cpu_ep}.\n"
                "Please ensure the installed onnxruntime-gpu version matches "
                "your CUDA and cuDNN versions; the compatibility matrix is on "
                "the official site: "
                "https://onnxruntime.ai/docs/execution-providers/CUDA-ExecutionProvider.html",
                RuntimeWarning,
            )

    def __call__(self, input_content: List[np.ndarray]) -> List[np.ndarray]:
        input_dict = dict(zip(self.get_input_names(), input_content))
        try:
            return self.session.run(self.get_output_names(), input_dict)
        except Exception as e:
            raise ONNXRuntimeError("ONNXRuntime inference failed.") from e

    def get_input_names(self) -> List[str]:
        return [v.name for v in self.session.get_inputs()]

    def get_output_names(self) -> List[str]:
        return [v.name for v in self.session.get_outputs()]

    def get_character_list(self, key: str = "character") -> List[str]:
        # Read the model's custom metadata directly so this works even if
        # have_key() has not been called first.
        self.meta_dict = self.session.get_modelmeta().custom_metadata_map
        return self.meta_dict[key].splitlines()

    def have_key(self, key: str = "character") -> bool:
        self.meta_dict = self.session.get_modelmeta().custom_metadata_map
        return key in self.meta_dict

    @staticmethod
    def _verify_model(model_path):
        model_path = Path(model_path)
        if not model_path.exists():
            raise FileNotFoundError(f"{model_path} does not exist.")
        if not model_path.is_file():
            raise FileExistsError(f"{model_path} is not a file.")
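

# Minimal usage sketch (not part of the original module). The model path below
# is a placeholder; a real punctuation model defines its own input names and
# shapes, which this class exposes via get_input_names().
if __name__ == "__main__":
    session = PuncOrtInferRuntimeSession("punc.onnx", device_id=-1)
    print("inputs:", session.get_input_names())
    print("outputs:", session.get_output_names())
    if session.have_key("character"):
        print("vocabulary size:", len(session.get_character_list()))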