fix(grpc): pass by modelpath (#4023)

Pass the model path to the backend explicitly instead of trying to derive it from the model file. In backends that specify a HF URL as the model, deriving the path from the model file results in fragile logic.

Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
2025-06-09 02:31:36 +00:00 · 2024-10-31 12:12:22 +01:00 · 2024-10-31 12:12:22 +01:00 · 61c964dce7
commit 61c964dce7
parent 48d621c64e
3 changed files with 7 additions and 6 deletions
--- a/backend/backend.proto
+++ b/backend/backend.proto
@@ -233,6 +233,8 @@ message ModelOptions {

  bool FlashAttention = 56;
  bool NoKVOffload = 57;
+
+  string ModelPath = 59;
 }

 message Result {
--- a/backend/python/diffusers/backend.py
+++ b/backend/python/diffusers/backend.py
@@ -301,13 +301,11 @@ class BackendServicer(backend_pb2_grpc.BackendServicer):
                self.pipe.controlnet = self.controlnet
            else:
                self.controlnet = None
-            # Assume directory from request.ModelFile.
-            # Only if request.LoraAdapter it's not an absolute path
-            if request.LoraAdapter and request.ModelFile != "" and not os.path.isabs(request.LoraAdapter) and request.LoraAdapter:
-                # get base path of modelFile
-                modelFileBase = os.path.dirname(request.ModelFile)
+
+            if request.LoraAdapter and not os.path.isabs(request.LoraAdapter):
                # modify LoraAdapter to be relative to modelFileBase
-                request.LoraAdapter = os.path.join(modelFileBase, request.LoraAdapter)
+                request.LoraAdapter = os.path.join(request.ModelPath, request.LoraAdapter)
+
            device = "cpu" if not request.CUDA else "cuda"
            self.device = device
            if request.LoraAdapter:
--- a/pkg/model/initializers.go
+++ b/pkg/model/initializers.go
@@ -425,6 +425,7 @@ func (ml *ModelLoader) grpcModel(backend string, autodetect bool, o *Options) fu
 		options := *o.gRPCOptions
 		options.Model = modelName
 		options.ModelFile = modelFile
+		options.ModelPath = ml.ModelPath

 		log.Debug().Msgf("GRPC: Loading model with options: %+v", options)