EnariGmbH
/

surftown-1.0

llava_next_video

Inference Endpoints

Model card Files Files and versions Community

EnariGmbH committed on Sep 5

Commit

a700cdc

•

1 Parent(s): 018de9e

Update handler.py

Files changed (1) hide show

handler.py +20 -5

handler.py CHANGED Viewed

@@ -1,13 +1,28 @@
 from typing import Dict, List, Any
 import torch
-from transformers import LlavaNextVideoForConditionalGeneration, AutoProcessor, AutoConfig
 class EndpointHandler:
-    def __init__(self, path="/app"):
-        self.model = LlavaNextVideoForConditionalGeneration.from_pretrained(path)
-        # Load the processor from the configuration files
-        self.processor = AutoProcessor.from_pretrained(path)
         # Ensure the model is in evaluation mode
         self.model.eval()

 from typing import Dict, List, Any
 import torch
+from transformers import LlavaNextVideoForConditionalGeneration, LlavaNextVideoProcessor
+from peft import PeftModel
 class EndpointHandler:
+    def __init__(self):
+        self.base_model_name = "llava-hf/LLaVA-NeXT-Video-7B-hf"
+        self.adapter_model_name = "EnariGmbH/surftown-1.0"
+        # Load the base model
+        self.model = LlavaNextVideoForConditionalGeneration.from_pretrained(
+            self.base_model_name,
+            torch_dtype=torch.float16,
+            device_map="auto"
+        )
+        # Load the fine-tuned adapter model into the base model
+        self.model = PeftModel.from_pretrained(self.model, self.adapter_model_name)
+        # Merge the adapter weights into the base model and unload the adapter
+        self.model = self.model.merge_and_unload()
+        # Load the processor from the adapter repository
+        self.processor = LlavaNextVideoProcessor.from_pretrained(self.adapter_model_name)
         # Ensure the model is in evaluation mode
         self.model.eval()