Sparrow / sparrow_parse / vllm / inference_factory.py
from sparrow_parse.vllm.huggingface_inference import HuggingFaceInference
from sparrow_parse.vllm.local_gpu_inference import LocalGPUInference
from sparrow_parse.vllm.mlx_inference import MLXInference


class InferenceFactory:
    def __init__(self, config):
        self.config = config

    def get_inference_instance(self):
        if self.config["method"] == "huggingface":
            return HuggingFaceInference(hf_space=self.config["hf_space"], hf_token=self.config["hf_token"])
        elif self.config["method"] == "local_gpu":
            model = self._load_local_model()  # Replace with actual model loading logic
            return LocalGPUInference(model=model, device=self.config.get("device", "cuda"))
        elif self.config["method"] == "mlx":
            return MLXInference(model_name=self.config["model_name"])
        else:
            raise ValueError(f"Unknown method: {self.config['method']}")

    def _load_local_model(self):
        # Example: Load a PyTorch model (replace with actual loading code)
        # model = torch.load('model.pth')
        # return model
        raise NotImplementedError("Model loading logic not implemented")
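

# Minimal sketch of one way the local_gpu branch could load a model, following the
# commented-out torch.load example in _load_local_model above. The checkpoint path
# and the assumption that it deserializes to a full nn.Module are hypothetical.
def _example_load_torch_checkpoint(path="model.pth"):
    import torch  # local import so the sketch does not add a hard torch dependency

    model = torch.load(path, map_location="cpu")  # deserialize the saved model object
    model.eval()  # switch the model to inference mode
    return model


# Usage sketch: the factory is driven by a plain config dict whose "method" key
# selects the backend; the remaining keys are the ones read in
# get_inference_instance(). The model name below is a placeholder, not a value
# prescribed by this module.
if __name__ == "__main__":
    config = {
        "method": "mlx",
        "model_name": "example-mlx-model",  # placeholder identifier
    }
    factory = InferenceFactory(config)
    inference = factory.get_inference_instance()
    print(type(inference).__name__)  # -> MLXInference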