Spaces:

Gamahea
/

lemm-test-100

Running on Zero

Gamahea committed 2 days ago

Commit

33cfbff

verified ·

1 Parent(s): 3faef55

Fix tensor serialization error - disable gradients for ZeroGPU

Files changed (1) hide show

backend/services/diffrhythm_service.py CHANGED Viewed

@@ -125,6 +125,10 @@ class DiffRhythmService:
             # Load weights
             ckpt = load_file(model_ckpt)
             self.model.load_state_dict(ckpt)
             # Note: Model will be moved to device inside GPU-decorated function
             # Load MuLan for style encoding (keep on CPU initially)
@@ -132,6 +136,10 @@ class DiffRhythmService:
                 "OpenMuQ/MuQ-MuLan-large",
                 cache_dir=os.path.join(self.model_path, "mulan")
             )
             # Note: MuLan will be moved to device inside GPU-decorated function
             # Load tokenizer
@@ -176,6 +184,10 @@ class DiffRhythmService:
             # Load decoder (keep on CPU initially)
             self.decoder = Generator(decoder_config, decoder_ckpt)
             # Note: Decoder will be moved to device inside GPU-decorated function
             logger.info("✅ DiffRhythm 2 model loaded successfully")

             # Load weights
             ckpt = load_file(model_ckpt)
             self.model.load_state_dict(ckpt)
+            self.model.eval()  # Set to evaluation mode
+            # Disable gradients for all parameters to allow ZeroGPU serialization
+            for param in self.model.parameters():
+                param.requires_grad = False
             # Note: Model will be moved to device inside GPU-decorated function
             # Load MuLan for style encoding (keep on CPU initially)
                 "OpenMuQ/MuQ-MuLan-large",
                 cache_dir=os.path.join(self.model_path, "mulan")
             )
+            self.mulan.eval()  # Set to evaluation mode
+            # Disable gradients
+            for param in self.mulan.parameters():
+                param.requires_grad = False
             # Note: MuLan will be moved to device inside GPU-decorated function
             # Load tokenizer
             # Load decoder (keep on CPU initially)
             self.decoder = Generator(decoder_config, decoder_ckpt)
+            self.decoder.eval()  # Set to evaluation mode
+            # Disable gradients
+            for param in self.decoder.parameters():
+                param.requires_grad = False
             # Note: Decoder will be moved to device inside GPU-decorated function
             logger.info("✅ DiffRhythm 2 model loaded successfully")