Spaces:

Staticaliza
/

Sense

Running

Staticaliza committed on May 28

Commit

ceea9f7

verified ·

1 Parent(s): e52a62d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -56,23 +56,19 @@ def generate(image, video, audio, instruction=DEFAULT_INPUT, sampling=False, tem
     if image is not None:
         img = Image.fromarray(image.astype("uint8"), "RGB")
         inputs = [{"role": "user", "content": [img, instruction]}]
-        media = img
     elif video is not None:
         vid = encode_video(video)
-        inputs = [{"role": "user", "content": [vid, instruction]}]
-        media = vid
     elif audio is not None:
         if isinstance(audio, str):
             aud, _ = librosa.load(audio, sr=16000, mono=True)
         else:
             aud = audio
         inputs = [{"role": "user", "content": [aud, instruction]}]
-        media = aud
     else:
         return "No input provided."
     params = {
-        "image": media,
         "msgs": inputs,
         "tokenizer": tokenizer,
         #"processor": processor,

     if image is not None:
         img = Image.fromarray(image.astype("uint8"), "RGB")
         inputs = [{"role": "user", "content": [img, instruction]}]
     elif video is not None:
         vid = encode_video(video)
+        inputs = [{"role": "user", "content": vid + [instruction]}]
     elif audio is not None:
         if isinstance(audio, str):
             aud, _ = librosa.load(audio, sr=16000, mono=True)
         else:
             aud = audio
         inputs = [{"role": "user", "content": [aud, instruction]}]
     else:
         return "No input provided."
     params = {
         "msgs": inputs,
         "tokenizer": tokenizer,
         #"processor": processor,