mirror of
https://github.com/believethehype/nostrdvm.git
synced 2025-06-08 01:09:17 +02:00
156 lines
6.3 KiB
Python
156 lines
6.3 KiB
Python
import typing
|
|
|
|
import requests
|
|
from nostr_sdk import Event, Tag
|
|
|
|
from utils.definitions import EventDefinitions
|
|
from utils.mediasource_utils import check_source_type, media_source
|
|
from utils.nostr_utils import get_event_by_id
|
|
|
|
|
|
def _first_tag_value(event, tag_name):
    """Return element 1 of the first tag of *event* whose element 0 equals *tag_name*.

    Returns None when no such tag exists (tags with fewer than two elements
    are skipped).
    """
    for tag in event.tags():
        vec = tag.as_vec()
        if len(vec) > 1 and vec[0] == tag_name:
            return vec[1]
    return None


def _task_for_file_type(file_type):
    """Map a file type reported by check_url_is_readable to a text-extraction task name."""
    if file_type == "pdf":
        return "pdf-to-text"
    if file_type in ("audio", "video"):
        return "speech-to-text"
    return "unknown job"


def get_task(event, client, dvm_config):
    """Determine the task name requested by a job event.

    * KIND_NIP90_GENERIC and KIND_DM events carry the task name in a 'j' tag.
      All tags are scanned (previously only the first tag was inspected, so a
      'j' tag in any other position was never found). Without a 'j' tag the
      result is "unknown job: " followed by the event's JSON.
    * KIND_NIP90_EXTRACT_TEXT events are resolved from their 'i' tag: the
      input is either a url, or an event whose 'url' tag is inspected. The
      file type reported by check_url_is_readable selects "pdf-to-text" or
      "speech-to-text".
    * Any other kind is looked up in dvm_config.SUPPORTED_DVMS by KIND.

    :param event: the job event (must provide kind(), tags() and as_json()).
    :param client: client handed to get_event_by_id for 'event' inputs.
    :param dvm_config: configuration providing SUPPORTED_DVMS; also handed to
        get_event_by_id.
    :return: the task name, or one of the markers "unknown job",
        "unknown job: <json>" or "unknown type" when no task can be derived.
        Exceptions are printed and reported as "unknown type".
    """
    try:
        kind = event.kind()

        # Use the 'j' tag for events that have no dedicated kind yet, and for DMs.
        if kind in (EventDefinitions.KIND_NIP90_GENERIC, EventDefinitions.KIND_DM):
            job = _first_tag_value(event, "j")
            if job is not None:
                return job
            return "unknown job: " + event.as_json()

        # This looks a bit more complicated, but we do several tasks for
        # text-extraction in the future.
        if kind == EventDefinitions.KIND_NIP90_EXTRACT_TEXT:
            for tag in event.tags():
                vec = tag.as_vec()
                if not vec or vec[0] != "i":
                    continue
                if len(vec) < 3:
                    # Malformed input tag: same result the former IndexError
                    # path produced via the except handler.
                    return "unknown type"

                input_value, input_type = vec[1], vec[2]
                if input_type == "url":
                    return _task_for_file_type(check_url_is_readable(input_value))
                if input_type != "event":
                    return "unknown job"

                evt = get_event_by_id(input_value, client=client, config=dvm_config)
                if evt is None:
                    continue  # referenced event not found; try the next tag
                # NOTE(review): 1063 is presumably the file-metadata event kind - confirm.
                if evt.kind() != 1063:
                    return "unknown type"
                url = _first_tag_value(evt, "url")
                if url is not None:
                    return _task_for_file_type(check_url_is_readable(url))

            # TODO if a task can consist of multiple inputs add them here
            return "unknown type"

        # Otherwise, if the kind is supported, simply return the matching task.
        for dvm in dvm_config.SUPPORTED_DVMS:
            if dvm.KIND == kind:
                return dvm.TASK
    except Exception as e:
        # Best-effort boundary: any failure while inspecting the event is
        # reported as an unknown task instead of crashing the caller.
        print("Get task: " + str(e))

    return "unknown type"
|
|
|
|
|
|
def is_input_supported_generic(tags, client, dvm_config) -> bool:
    """Run the task-independent sanity checks on a job event's input tags.

    Every 'i' tag must have at least three elements (name, value, type). For
    inputs of type "event" the referenced event must be retrievable through
    get_event_by_id.

    :param tags: iterable of tags, each providing as_vec().
    :param client: client handed to get_event_by_id.
    :param dvm_config: configuration handed to get_event_by_id.
    :return: True when all 'i' tags pass, False otherwise. An exception during
        the check is printed and also yields False (previously the function
        fell through and returned None despite the bool annotation).
    """
    try:
        for tag in tags:
            vec = tag.as_vec()
            if vec[0] != 'i':
                continue

            if len(vec) < 3:
                print("Job Event missing/malformed i tag, skipping..")
                return False

            input_value, input_type = vec[1], vec[2]
            if input_type == "event":
                evt = get_event_by_id(input_value, client=client, config=dvm_config)
                if evt is None:
                    print("Event not found")
                    return False
            # TODO check_url_is_readable might be more relevant per task in the future
            # (a url readability check used to be sketched here).

        return True
    except Exception as e:
        print("Generic input check: " + str(e))
        return False
|
|
|
|
|
|
def check_task_is_supported(event: "Event", client, config=None):
    """Decide whether this instance can handle the job described by *event*.

    The task is derived with get_task. It must match the TASK of at least one
    entry in config.SUPPORTED_DVMS, the inputs must pass
    is_input_supported_generic, and every DVM with that TASK must accept the
    event's tags through its own is_input_supported.

    :param event: the job event.
    :param client: client forwarded to get_task and the generic input check.
    :param config: DVM configuration providing SUPPORTED_DVMS.
    :return: a tuple (supported, task). task is "" when the generic input
        check fails or when an exception occurs. Exceptions are printed and
        reported as (False, "") so callers can always unpack the result
        (previously the exception path returned None).
    """
    try:
        dvm_config = config
        task = get_task(event, client=client, dvm_config=dvm_config)

        candidates = [dvm for dvm in dvm_config.SUPPORTED_DVMS if dvm.TASK == task]
        if not candidates:
            return False, task

        if not is_input_supported_generic(event.tags(), client, dvm_config):
            return False, ""

        # Each DVM offering this task gets to veto the inputs.
        if not all(dvm.is_input_supported(event.tags()) for dvm in candidates):
            return False, task

        return True, task
    except Exception as e:
        print("Check task: " + str(e))
        return False, ""
|
|
|
|
|
|
def check_url_is_readable(url):
    """Classify the media behind *url* as "audio", "image", "video" or "pdf".

    Only values whose string form starts with "http" are considered, and only
    when media_source(check_source_type(url)) reports "url". The decision uses
    the response's Content-Type header and the url's file extension.

    Changes over the previous version: the request has a timeout and does not
    download the body, a missing Content-Type header no longer raises,
    header parameters (e.g. "; charset=...") and letter case are ignored when
    comparing the content type, and request failures yield None instead of
    propagating.

    :param url: the location to inspect.
    :return: "audio", "image", "video" or "pdf" when recognised; the media
        source type ("url") for any other plain url; None when the job should
        not be offered (non-http value, other source type, request failure).
    """
    url_text = str(url)
    if not url_text.startswith("http"):
        return None

    source = check_source_type(url)
    source_kind = media_source(source)
    if source_kind != "url":
        # Otherwise we will not offer to do the job.
        return None

    try:
        # stream=True defers the body download; only the headers are needed.
        # The timeout keeps an unresponsive host from blocking forever.
        with requests.get(url, stream=True, timeout=10) as response:
            raw_content_type = response.headers.get('content-type', '')
    except requests.RequestException as e:
        print("Check url: " + str(e))
        return None

    # Drop parameters such as "; charset=utf-8" before comparing.
    content_type = raw_content_type.split(";", 1)[0].strip().lower()

    # If the link is compatible with one of these file formats, move on.
    if (content_type in ('audio/x-wav', 'audio/mpeg', 'audio/ogg')
            or url_text.endswith((".wav", ".mp3", ".ogg"))):
        return "audio"
    if (content_type in ('image/png', 'image/jpg', 'image/jpeg')
            or url_text.endswith((".png", ".jpg", ".jpeg"))):
        return "image"
    if (content_type in ('video/mp4', 'video/avi', 'video/mov')
            or url_text.endswith((".mp4", ".avi", ".mov"))):
        return "video"
    if url_text.endswith(".pdf"):
        return "pdf"
    return source_kind
|
|
|
|
|
|
def get_amount_per_task(task, dvm_config, duration=1):
    """Return the price for *task*: FIX_COST + PER_UNIT_COST * duration.

    All entries of dvm_config.SUPPORTED_DVMS are searched for a matching TASK
    (previously the search gave up after the first entry, so only the first
    DVM could ever be priced).

    :param task: task name to price.
    :param dvm_config: configuration providing SUPPORTED_DVMS; each entry
        provides NAME, TASK, FIX_COST and PER_UNIT_COST.
    :param duration: either static 1 (for images etc.) or a length in seconds
        (e.g. audio/video).
    :return: the amount, or None when no configured DVM offers the task (a
        notice is printed in that case).
    """
    supported = dvm_config.SUPPORTED_DVMS
    for dvm in supported:
        if dvm.TASK == task:
            return dvm.FIX_COST + (dvm.PER_UNIT_COST * duration)

    # No match: report under the first DVM's name, as before, when there is one.
    name = supported[0].NAME if supported else "DVM"
    print(f"[{name}] Task {task} is currently not supported by this instance, skipping")
    return None
|