diff --git a/handler.py b/handler.py index 4e010b4..b61289f 100644 --- a/handler.py +++ b/handler.py @@ -6,7 +6,7 @@ class EndpointHandler: def __init__(self, path=""): # load model and processor from path self.tokenizer = AutoTokenizer.from_pretrained(path, trust_remote_code=True) - self.model = AutoModel.from_pretrained(path, trust_remote_code=True).half().cuda() + self.model = AutoModel.from_pretrained(path, trust_remote_code=True).float() def __call__(self, data: Dict[str, Any]) -> Dict[str, str]: """