added whisperx (mediasources need some fixes)

2025-11-19 16:16:28 +01:00 · 2023-11-28 16:20:56 +01:00
parent a2433aa70c
commit 261bed427d
22 changed files with 1451 additions and 218 deletions
--- a/utils/mediasource_utils.py
+++ b/utils/mediasource_utils.py
@@ -0,0 +1,330 @@
+import os
+import urllib
+from datetime import time
+from urllib.parse import urlparse
+import ffmpegio
+from decord import AudioReader, cpu
+import requests
+from utils.nostr_utils import get_event_by_id
+
+
+def input_data_file_duration(event, dvm_config, client, start=0, end=0):
+    """Return the trimmed duration of the media referenced by a job event.
+
+    The input value and input type are read from the event's ``i`` tags (the
+    last well-formed one wins). An ``event`` input is resolved through
+    ``get_event_by_id`` and, when it is a NIP94 event carrying a ``url`` tag,
+    replaced by that URL. For ``url`` inputs the media is fetched, measured
+    with ``AudioReader`` and trimmed to the ``start``/``end`` window.
+
+    Args:
+        event: Job event exposing ``tags()``; each tag exposes ``as_vec()``.
+        dvm_config: Configuration forwarded to ``get_event_by_id``.
+        client: Client forwarded to ``get_event_by_id``.
+        start: Requested start offset (0 means "from the beginning").
+        end: Requested end offset (0 means "until the end").
+
+    Returns:
+        The trimmed duration for audio/video URLs, ``0`` when the file could
+        not be fetched or read, and ``1`` for every other kind of input.
+    """
+    input_value = ""
+    input_type = "url"
+    for tag in event.tags():
+        fields = tag.as_vec()
+        # Skip malformed ``i`` tags instead of failing with an IndexError.
+        if len(fields) < 2 or fields[0] != 'i':
+            continue
+        input_value = fields[1]
+        input_type = fields[2] if len(fields) > 2 else "url"
+
+    if input_type == "event":  # NIP94 event
+        evt = get_event_by_id(input_value, client=client, config=dvm_config)
+        if evt is not None:
+            input_value, input_type = check_nip94_event_for_media(evt, input_value, input_type)
+
+    if input_type != "url":
+        return 1
+
+    source_type = check_source_type(input_value)
+    filename, start, end, media_type = get_file_start_end_type(input_value, source_type, start, end)
+    if media_type not in ("audio", "video"):
+        return 1
+    if filename == "" or filename is None:
+        return 0
+    try:
+        file_reader = AudioReader(filename, ctx=cpu(0), mono=False)
+        duration = float(file_reader.duration())
+    except Exception as e:
+        # Best effort: an unreadable file is reported as zero duration.
+        print(e)
+        return 0
+    print("Original Duration of the Media file: " + str(duration))
+    _, _, new_duration = convert_media_length(start, end, duration)
+    print("New Duration of the Media file: " + str(new_duration))
+    return new_duration
+
+
+
+
+def organize_input_data(input_value, input_type, start, end, dvm_config, client, process=True) -> str:
+    """Fetch the referenced media, cut it to the requested window and convert it to mp3.
+
+    An ``event`` input is resolved through ``get_event_by_id`` and, when it is
+    a NIP94 event carrying a ``url`` tag, replaced by that URL. Only ``url``
+    inputs are processed.
+
+    Args:
+        input_value: URL or event id of the media.
+        input_type: ``"url"`` or ``"event"``.
+        start: Requested start offset (0 means "from the beginning").
+        end: Requested end offset (0 means "until the end").
+        dvm_config: Configuration forwarded to ``get_event_by_id``.
+        client: Client forwarded to ``get_event_by_id``.
+        process: Currently unused; kept so existing callers keep working.
+
+    Returns:
+        Path of the converted mp3 file, or ``""`` when the input is not a URL
+        or the media could not be fetched or read.
+    """
+    if input_type == "event":  # NIP94 event
+        evt = get_event_by_id(input_value, client=client, config=dvm_config)
+        if evt is not None:
+            input_value, input_type = check_nip94_event_for_media(evt, input_value, input_type)
+
+    if input_type != "url":
+        # Always honour the ``-> str`` contract instead of falling through to None.
+        return ""
+
+    source_type = check_source_type(input_value)
+    filename, start, end, _ = get_file_start_end_type(input_value, source_type, start, end)
+    if filename == "" or filename is None:
+        return ""
+    try:
+        file_reader = AudioReader(filename, ctx=cpu(0), mono=False)
+        duration = float(file_reader.duration())
+    except Exception as e:
+        # Best effort: an unreadable file yields an empty result.
+        print(e)
+        return ""
+
+    print("Original Duration of the Media file: " + str(duration))
+    start_time, end_time, new_duration = convert_media_length(start, end, duration)
+    print("New Duration of the Media file: " + str(new_duration))
+
+    # TODO if already in a working format and time is 0 0, dont convert
+    print("Converting from " + str(start_time) + " until " + str(end_time))
+    # for now, we cut and convert all files to mp3
+    final_filename = '.\\outputs\\audio.mp3'
+    print(final_filename)
+    fs, x = ffmpegio.audio.read(filename, ss=start_time, to=end_time, sample_fmt='dbl', ac=1)
+    ffmpegio.audio.write(final_filename, fs, x, overwrite=True)
+    return final_filename
+
+def check_nip94_event_for_media(evt, input_value, input_type):
+    """Swap the input for the URL of a NIP94 (kind 1063) event, if it has one.
+
+    Returns the first ``url`` tag's value together with the type ``"url"``;
+    for any other event kind, or when no ``url`` tag exists, the given
+    ``input_value`` and ``input_type`` are returned unchanged.
+    """
+    if evt.kind() != 1063:
+        return input_value, input_type
+
+    for candidate in evt.tags():
+        if candidate.as_vec()[0] != 'url':
+            continue
+        return candidate.as_vec()[1], "url"
+
+    return input_value, input_type
+
+def convert_media_length(start: float, end: float, duration: float):
+    """Clamp a requested ``start``/``end`` window to a media file's duration.
+
+    Args:
+        start: Requested start offset; numeric strings are accepted.
+        end: Requested end offset; zero or a negative value means "until the
+            end of the file". Numeric strings are accepted.
+        duration: Total length of the media file.
+
+    Returns:
+        A ``(start_time, end_time, length)`` tuple of floats where
+        ``0 <= start_time <= end_time <= duration`` and
+        ``length == end_time - start_time``.
+    """
+    # Offsets parsed from links may arrive as strings; normalise them once.
+    start = float(start)
+    end = float(end)
+    duration = float(duration)
+
+    # A missing, negative or too-large end falls back to the full length, so
+    # the resulting length can never become negative.
+    if end <= 0.0 or end > duration:
+        end_time = duration
+    else:
+        end_time = end
+
+    if start <= 0.0 or start > end_time:
+        start_time = 0.0
+    else:
+        start_time = start
+
+    return start_time, end_time, end_time - start_time
+
+
+def get_file_start_end_type(url, source_type, start, end) -> tuple:
+    """Download the media behind ``url`` with the handler for ``source_type``.
+
+    Args:
+        url: Link to the media.
+        source_type: One of the names produced by ``check_source_type``;
+            anything unrecognised is treated as a direct file link.
+        start: Requested start offset; some handlers adjust it from the link.
+        end: Requested end offset; some handlers adjust it from the link.
+
+    Returns:
+        A ``(filename, start, end, media_type)`` tuple. ``media_type`` is
+        ``"audio"``, ``"video"`` or ``"image"`` for the known platforms and
+        whatever ``get_media_link`` reports for direct links.
+    """
+    #  Overcast
+    if source_type == "overcast":
+        name, start, end = get_overcast(url, start, end)
+        return name, start, end, "audio"
+    #  Youtube (audio only)
+    if source_type == "youtube":
+        name, start, end = get_youtube(url, start, end, True)
+        return name, start, end, "audio"
+    #  Xitter
+    if source_type == "xitter":
+        name, start, end = get_Twitter(url, start, end)
+        return name, start, end, "video"
+    #  Tiktok
+    if source_type == "tiktok":
+        name, start, end = get_TikTok(url, start, end)
+        return name, start, end, "video"
+    #  Instagram: posts can be pictures as well as videos
+    if source_type == "instagram":
+        name, start, end = get_Instagram(url, start, end)
+        media_type = "image" if name.endswith("jpg") else "video"
+        return name, start, end, media_type
+    #  A file link
+    filename, filetype = get_media_link(url)
+    return filename, start, end, filetype
+
+
+def media_source(source_type):
+    """Map a source type name to the kind of media that source delivers.
+
+    Returns ``"audio"`` for overcast and youtube, ``"video"`` for xitter,
+    tiktok and instagram, and ``"url"`` for everything else.
+    """
+    kinds_by_source = (
+        (("overcast", "youtube"), "audio"),
+        (("xitter", "tiktok", "instagram"), "video"),
+    )
+    for sources, kind in kinds_by_source:
+        if source_type in sources:
+            return kind
+    return "url"
+
+
+def check_source_type(url):
+    """Classify a link by the platform that hosts it.
+
+    The decision is made on the parsed hostname (case-insensitive, with a
+    leading ``www.`` ignored), so look-alike hosts such as
+    ``x.community.example`` are not mistaken for a known platform. Links
+    without a scheme (``youtube.com/watch?v=...``) are accepted as well.
+
+    Returns:
+        ``"overcast"``, ``"youtube"``, ``"xitter"``, ``"tiktok"``,
+        ``"instagram"``, or ``"url"`` for anything else.
+    """
+    platform_by_host = {
+        "overcast.fm": "overcast",
+        "youtube.com": "youtube",
+        "youtu.be": "youtube",
+        "x.com": "xitter",
+        "twitter.com": "xitter",
+        "tiktok.com": "tiktok",
+        "vm.tiktok.com": "tiktok",
+        "m.tiktok.com": "tiktok",
+        "instagram.com": "instagram",
+    }
+
+    link = str(url)
+    if "://" not in link:
+        # Without a scheme urlparse would treat the host as part of the path.
+        link = "//" + link
+    try:
+        host = (urlparse(link).hostname or "").lower()
+    except ValueError:
+        # Malformed netloc (e.g. a broken IPv6 literal): not a known platform.
+        return "url"
+    if host.startswith("www."):
+        host = host[len("www."):]
+
+    return platform_by_host.get(host, "url")
+
+
+def _overcast_timestamp_seconds(stamp):
+    """Convert ``H:MM:SS``, ``MM:SS`` or ``SS`` to seconds; ``None`` if unparsable."""
+    parts = stamp.split(":")
+    if not 1 <= len(parts) <= 3:
+        return None
+    seconds = 0
+    for part in parts:
+        if not part.isdecimal():
+            return None
+        seconds = seconds * 60 + int(part)
+    return seconds
+
+
+def get_overcast(input_value, start, end):
+    """Download an overcast.fm episode and derive the cut window from the link.
+
+    When no explicit ``start`` is given and the link ends in a timestamp
+    segment (``https://overcast.fm/<id>/<H:MM:SS>``), that timestamp becomes
+    the start offset and a positive ``end`` is shifted by the same amount.
+    A segment that is not a timestamp is ignored.
+
+    Returns:
+        A ``(filename, start_time, end_time)`` tuple.
+    """
+    filename = '.\\outputs\\' + ".originalaudio.mp3"
+    print("Found overcast.fm Link.. downloading")
+    start_time = start
+    end_time = end
+    downloadOvercast(input_value, filename)
+    finaltag = str(input_value).replace("https://overcast.fm/", "").split('/')
+    if start == 0.0 and len(finaltag) > 1:
+        # The module-level ``time`` name is ``datetime.time``, which has no
+        # ``strptime``; the timestamp is therefore parsed by hand.
+        seconds = _overcast_timestamp_seconds(finaltag[1])
+        if seconds is not None:
+            start_time = float(seconds)
+            print("Setting start time automatically to " + str(start_time))
+            if end > 0.0:
+                end_time = float(seconds + end)
+                print("Moving end time automatically to " + str(end_time))
+
+    return filename, start_time, end_time
+
+
+def get_TikTok(input_value, start, end):
+    """Download a TikTok video into the outputs folder.
+
+    Returns ``(filename, start, end)``; ``filename`` is ``""`` when the
+    download raised. ``start`` and ``end`` are passed through unchanged.
+    """
+    target_dir = '.\\outputs\\'
+    try:
+        downloaded = downloadTikTok(input_value, target_dir)
+        print(downloaded)
+        return downloaded, start, end
+    except Exception as err:
+        print(err)
+    return "", start, end
+
+
+def get_Instagram(input_value, start, end):
+    """Download an Instagram post into the outputs folder.
+
+    Returns ``(filename, start, end)``; ``filename`` is ``""`` when the
+    download raised. ``start`` and ``end`` are passed through unchanged.
+    """
+    target_dir = '.\\outputs\\'
+    try:
+        downloaded = downloadInstagram(input_value, target_dir)
+        print(downloaded)
+        return downloaded, start, end
+    except Exception as err:
+        print(err)
+    return "", start, end
+
+
+def get_Twitter(input_value, start, end):
+    """Download a Twitter/X video into the outputs folder.
+
+    ``twitter.com`` in the link is rewritten to ``x.com`` before downloading.
+    Returns ``(filename, start, end)``; ``filename`` is ``""`` when the
+    download raised. ``start`` and ``end`` are passed through unchanged.
+    """
+    target_dir = '.\\outputs\\'
+    x_link = str(input_value).replace("twitter.com", "x.com")
+    try:
+        downloaded = downloadTwitter(x_link, target_dir)
+        print(downloaded)
+        return downloaded, start, end
+    except Exception as err:
+        print(err)
+    return "", start, end
+
+
+def _youtube_offset_seconds(value):
+    """Convert a ``t`` value such as ``90``, ``90s`` or ``1h2m3s`` to seconds; ``None`` if unparsable."""
+    import re
+
+    if value.isdecimal():
+        return float(value)
+    match = re.fullmatch(r"(?:(\d+)h)?(?:(\d+)m)?(?:(\d+)s)?", value)
+    if match is None or not any(match.groups()):
+        return None
+    hours, minutes, seconds = (int(group) if group else 0 for group in match.groups())
+    return float(hours * 3600 + minutes * 60 + seconds)
+
+
+def get_youtube(input_value, start, end, audioonly=True):
+    """Download a YouTube video and derive the cut window from the link.
+
+    When no explicit ``start`` is given and the link carries a ``t`` query
+    parameter, that offset becomes the start and a positive ``end`` is
+    shifted by the same amount.
+
+    Returns:
+        A ``(filename, start, end)`` tuple; ``filename`` is ``""`` when the
+        download raised.
+    """
+    filepath = '.\\outputs\\'
+    filename = ""
+    try:
+        filename = downloadYouTube(input_value, filepath, audioonly)
+    except Exception as e:
+        print("Youtube" + str(e))
+        return filename, start, end
+
+    try:
+        if start == 0.0:
+            # ``urlparse().query`` never contains the leading "?", so look the
+            # parameter up in the parsed query instead of searching for "?t=".
+            query = urllib.parse.parse_qs(urlparse(str(input_value)).query)
+            offset = _youtube_offset_seconds(query['t'][0]) if 't' in query else None
+            if offset is not None:
+                start = offset  # overwrite from link.. why not..
+                print("Setting start time automatically to " + str(start))
+                if end > 0.0:
+                    end = offset + end
+                    print("Moving end time automatically to " + str(end))
+    except (ValueError, TypeError) as e:
+        # Best effort: keep whatever offsets are known when the link is odd.
+        print(e)
+
+    return filename, start, end
+
+
+def get_media_link(url) -> tuple:
+    """Download a direct media link and store it in the outputs folder.
+
+    The format is recognised from the response's Content-Type header
+    (parameters after ``;`` are ignored) or, failing that, from the URL's
+    file extension. Supported formats: wav, mp3, ogg, mp4, avi and mov.
+
+    Returns:
+        ``(path, file_type)`` with ``file_type`` being ``"audio"`` or
+        ``"video"``, or ``(None, None)`` for unsupported content.
+    """
+    known_formats = (
+        ('audio/x-wav', 'wav', 'audio'),
+        ('audio/mpeg', 'mp3', 'audio'),
+        ('audio/ogg', 'ogg', 'audio'),
+        ('video/mp4', 'mp4', 'video'),
+        ('video/avi', 'avi', 'video'),
+        ('video/quicktime', 'mov', 'video'),
+    )
+
+    req = requests.get(url)
+    # The header may be absent or carry parameters such as "; charset=...".
+    content_type = req.headers.get('content-type', '')
+    print(content_type)
+    mime = content_type.split(';')[0].strip().lower()
+    lowered_url = str(url).lower()
+
+    for known_mime, ext, file_type in known_formats:
+        if mime == known_mime or lowered_url.endswith('.' + ext):
+            # Write to exactly the path that is returned to the caller.
+            target = '.\\outputs\\file.' + ext
+            with open(target, 'wb') as fd:
+                fd.write(req.content)
+            return target, file_type
+
+    print(lowered_url)
+    return None, None
+
+
+def downloadOvercast(source_url, target_location):
+    """Forward to ``OvercastDownload`` and return its result.
+
+    The scrapper module is imported on demand, when the function is called.
+    """
+    from utils.scrapper.media_scrapper import OvercastDownload
+    return OvercastDownload(source_url, target_location)
+
+
+def downloadTwitter(videourl, path):
+    """Forward to ``XitterDownload`` with ``path + "x.mp4"`` as target and return its result.
+
+    The scrapper module is imported on demand, when the function is called.
+    """
+    from utils.scrapper.media_scrapper import XitterDownload
+    target_file = path + "x.mp4"
+    return XitterDownload(videourl, target_file)
+
+
+def downloadTikTok(videourl, path):
+    """Forward a single-link list to ``TiktokDownloadAll`` and return its result.
+
+    The scrapper module is imported on demand, when the function is called.
+    """
+    from utils.scrapper.media_scrapper import TiktokDownloadAll
+    links = [videourl]
+    return TiktokDownloadAll(links, path)
+
+
+def downloadInstagram(videourl, path):
+    """Forward to ``InstagramDownload`` with the name ``"insta"`` and return its result.
+
+    The scrapper module is imported on demand, when the function is called.
+    """
+    from utils.scrapper.media_scrapper import InstagramDownload
+    return InstagramDownload(videourl, "insta", path)
+
+
+def downloadYouTube(link, path, audioonly=True):
+    """Forward to ``YouTubeDownload`` and return its result.
+
+    Args:
+        link: Link to the video.
+        path: Folder handed to ``YouTubeDownload``.
+        audioonly: Forwarded as ``audio_only``; previously ignored in favour
+            of a hard-coded ``True``.
+
+    The scrapper module is imported on demand, when the function is called.
+    """
+    from utils.scrapper.media_scrapper import YouTubeDownload
+    return YouTubeDownload(link, path, audio_only=audioonly)