karthik committed on
Commit
965d33a
·
1 Parent(s): 7b3a1b2

update code

Browse files
Files changed (3) hide show
  1. README.md +1 -0
  2. handler.py +6 -8
  3. requirements.txt +1 -2
README.md CHANGED
@@ -3,6 +3,7 @@ inference: false
3
  tags:
4
  - musicgen
5
  license: cc-by-nc-4.0
 
6
  ---
7
 
8
  # MusicGen - Small - 300M
 
3
  tags:
4
  - musicgen
5
  license: cc-by-nc-4.0
6
+ duplicated_from: facebook/musicgen-small
7
  ---
8
 
9
  # MusicGen - Small - 300M
handler.py CHANGED
@@ -3,10 +3,10 @@ from transformers import AutoProcessor, MusicgenForConditionalGeneration
3
  import torch
4
 
5
  class EndpointHandler:
6
- def __init__(self, path="karthik/music_gen_unlimited"):
7
  # load model and processor from path
8
  self.processor = AutoProcessor.from_pretrained(path)
9
- self.model = MusicgenForConditionalGeneration.from_pretrained(path, torch_dtype=torch.float16).to("cuda")
10
 
11
  def __call__(self, data: Dict[str, Any]) -> Dict[str, str]:
12
  """
@@ -26,13 +26,11 @@ class EndpointHandler:
26
 
27
  # pass inputs with all kwargs in data
28
  if parameters is not None:
29
- with torch.autocast("cuda"):
30
- outputs = self.model.generate(**inputs,do_sample=True, guidance_scale=3, max_new_tokens=256, **parameters)
31
  else:
32
- with torch.autocast("cuda"):
33
- outputs = self.model.generate(**inputs,do_sample=True, guidance_scale=3, max_new_tokens=256)
34
 
35
  # postprocess the prediction
36
- prediction = outputs[0].cpu().numpy().tolist()
37
 
38
- return [{"generated_audio": prediction}]
 
3
  import torch
4
 
5
  class EndpointHandler:
6
+ def __init__(self, path=""):
7
  # load model and processor from path
8
  self.processor = AutoProcessor.from_pretrained(path)
9
+ self.model = MusicgenForConditionalGeneration.from_pretrained(path).to("cuda")
10
 
11
  def __call__(self, data: Dict[str, Any]) -> Dict[str, str]:
12
  """
 
26
 
27
  # pass inputs with all kwargs in data
28
  if parameters is not None:
29
+ outputs = self.model.generate(**inputs, max_new_tokens=256, **parameters)
 
30
  else:
31
+ outputs = self.model.generate(**inputs, max_new_tokens=256)
 
32
 
33
  # postprocess the prediction
34
+ prediction = outputs[0].cpu().numpy()
35
 
36
+ return [{"generated_text": prediction}]
requirements.txt CHANGED
@@ -1,3 +1,2 @@
1
  transformers==4.31.0
2
- accelerate>=0.20.3
3
-
 
1
  transformers==4.31.0
2
+ accelerate>=0.20.3