LPX committed
Commit f725d52 · 1 Parent(s): b971b27

Remove sequential CPU offload from model loading and simplify return value in safe_model_load function
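One likely motivation for the first hunk: in Diffusers, enable_sequential_cpu_offload() and pipe.to("cuda") are competing device-placement strategies, so disabling the offload when the whole pipeline is moved to CUDA avoids mixing the two. A minimal sketch of both options, assuming the diffusers library (the checkpoint name is illustrative, not from this repo):

# Sketch of the two device-placement options (checkpoint name is illustrative):
import torch
from diffusers import DiffusionPipeline

pipe = DiffusionPipeline.from_pretrained(
    "runwayml/stable-diffusion-v1-5", torch_dtype=torch.float16
)
pipe.enable_attention_slicing()

# Option A (what this commit keeps): move the whole pipeline onto the GPU.
pipe.to("cuda")

# Option B (now commented out in the diff): stream each submodule to the
# GPU only while it runs. Lowest VRAM use but slower, and it manages
# device placement itself, so it should not be combined with pipe.to("cuda").
# pipe.enable_sequential_cpu_offload()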

Files changed (1)
  1. model_loader.py +2 -7
model_loader.py CHANGED
@@ -39,7 +39,7 @@ def safe_model_load():
             print(f"XFormers not available: {e}")
 
         pipe.enable_attention_slicing()
-        pipe.enable_sequential_cpu_offload()
+        # pipe.enable_sequential_cpu_offload()
         pipe.to("cuda")
 
         # For memory-sensitive environments
@@ -47,13 +47,8 @@ def safe_model_load():
             torch.multiprocessing.set_sharing_strategy('file_system')
         except Exception as e:
             print(f"Exception raised (torch.multiprocessing): {e}")
-        # Moondream
-        model = vl(api_key=md_api_key)
 
-        return {
-            "pipeline": pipe,
-            "captioner": model
-        }
+        return pipe
 
     except Exception as e:
         print(f"Model loading failed: {e}")