1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
|
from datetime import datetime
from dotenv import load_dotenv
from common import create_database_connection
from catboxpy.catbox import CatboxClient
import os
import time
import openai
import json
from summarizer import generate_headline_and_content_from_images
# Load variables from a .env file (if present) into the process environment at
# import time, so the os.getenv() lookups in this module can see the API keys.
load_dotenv()
def check_is_generation_possible():
    """Report whether the credentials needed for AI generation are configured.

    Returns:
        bool: True only when both ``OPENAI_API_KEY`` and
        ``DISCORD_AUTHORIZATION`` are set to a non-blank value.
    """
    required_variables = ("OPENAI_API_KEY", "DISCORD_AUTHORIZATION")
    # A blank value (e.g. ``OPENAI_API_KEY=`` left in a .env file) is just as
    # unusable as a missing one, so test for content rather than ``is not None``.
    return all((os.getenv(name) or "").strip() for name in required_variables)
def check_is_announcement_image(img_url: str):
    """Ask the OpenAI chat API whether an image is WACCA PLUS news.

    The request forces a call to the ``classify_wacca_plus_image`` function
    tool, so the answer comes back as JSON arguments instead of free text.

    Args:
        img_url: URL of the image, sent to the model as an ``image_url`` part.

    Returns:
        A ``(is_wacca_plus_related, category)`` tuple read from the tool-call
        arguments. Per the schema below, ``category`` is one of
        ``"announcement"``, ``"update"``, ``"info"`` or the string ``"null"``.
    """
    openai.api_key = os.getenv("OPENAI_API_KEY")

    function_name = "classify_wacca_plus_image"

    # JSON schema describing the structured verdict the model must fill in.
    argument_schema = {
        "type": "object",
        "properties": {
            "is_wacca_plus_related": {
                "type": "boolean",
                "description": "Is this image related to WACCA PLUS?",
            },
            "category": {
                "type": "string",
                "enum": ["announcement", "update", "info", "null"],
                "description": "Category of image if related; otherwise null.",
            },
        },
        "required": ["is_wacca_plus_related", "category"],
    }
    classifier_tool = {
        "type": "function",
        "function": {
            "name": function_name,
            "description": "Classify if an image is WACCA PLUS announcement, update, or information",
            "parameters": argument_schema,
        },
    }

    prompt = (
        "Does this image contain official update, event, or announcement "
        "information for the game WACCA PLUS? Ignore unrelated content like "
        "gameplay screenshots, score posts, or arcade cabinet photos. "
        "Classify accordingly."
    )
    user_message = {
        "role": "user",
        "content": [
            {"type": "text", "text": prompt},
            {"type": "image_url", "image_url": {"url": img_url}},
        ],
    }

    completion = openai.chat.completions.create(
        model="gpt-4o",
        messages=[user_message],
        tools=[classifier_tool],
        # Pin the tool so the reply carries a tool call with JSON arguments.
        tool_choice={"type": "function", "function": {"name": function_name}},
    )

    forced_call = completion.choices[0].message.tool_calls[0]
    verdict = json.loads(forced_call.function.arguments)
    return verdict["is_wacca_plus_related"], verdict["category"]
def _upload_image_to_catbox(image_url: str):
    """Upload an image through ``CatboxClient`` and return where it ended up.

    Args:
        image_url: Location of the image, passed to ``CatboxClient.upload``.

    Returns:
        The value returned by the upload, or ``image_url`` unchanged when the
        upload returns nothing usable (``None`` or an empty string).
    """
    uploaded_url = CatboxClient().upload(image_url)
    # No hosted copy came back, so keep pointing at the original location.
    return uploaded_url if uploaded_url else image_url
def _image_attachments(message: dict) -> list:
    """Return the attachments of *message* whose content type mentions "image"."""
    # Both "attachments" and "content_type" may be absent or None, so default
    # them instead of indexing directly.
    return [
        attachment
        for attachment in message.get("attachments") or []
        if "image" in (attachment.get("content_type") or "")
    ]


def parse_announcement_messages(message_json: dict):
    """Turn Discord messages with announcement images into news post dicts.

    For every message that carries image attachments, each image is classified
    (using the cached verdict from the database when one exists, otherwise via
    ``check_is_announcement_image``, whose verdict is then stored). Messages
    with at least one related image get a headline and body generated by
    ``generate_headline_and_content_from_images`` and become one news post.

    Args:
        message_json: Iterable of message dicts (despite the ``dict``
            annotation, it is iterated message by message). Each message is
            read for ``content``, ``attachments`` and ``timestamp``; each
            attachment for ``id``, ``url`` and ``content_type``.

    Returns:
        A list of news post dicts with the keys ``date``, ``identifier``,
        ``type``, ``timestamp``, ``content``, ``headline``, ``url``,
        ``images`` and ``is_ai_summary``. Empty when no message qualifies; in
        that case the database is not opened when no message has an image.
    """
    # Filter first so no database connection is opened for input that has
    # nothing to classify.
    candidates = []
    for message in message_json:
        images = _image_attachments(message)
        if images:
            candidates.append((message, images))
    if not candidates:
        return []

    news_posts = []
    database = create_database_connection()
    try:
        for message, image_attachments in candidates:
            message_content = message.get("content", "")
            post_type = None
            filtered_images = []
            # NOTE(review): every image URL, related or not, is handed to the
            # summarizer, as in the original code - confirm this is intended.
            image_urls = []
            for image in image_attachments:
                image_urls.append(image["url"])
                entry = database.get_wac_entry(image["id"])
                if entry:
                    # Cached verdict: (is related, category).
                    is_related, category = entry[0], entry[1]
                else:
                    is_related, category = check_is_announcement_image(image["url"])
                    database.add_new_wac_entry(
                        key=image["id"], is_news=is_related, post_type=category
                    )
                if not is_related:
                    continue
                # Only related images may decide the post type; previously an
                # unrelated trailing image could overwrite it.
                post_type = category
                filtered_images.append(
                    {"image": _upload_image_to_catbox(image["url"]), "url": None}
                )
            if not filtered_images:
                continue

            date = message["timestamp"].split("T")[0]
            date_obj = datetime.strptime(date, "%Y-%m-%d")
            # NOTE(review): mktime interprets the date as local-time midnight,
            # so the value depends on the host timezone - kept for compatibility.
            unix_time = int(time.mktime(date_obj.timetuple()))
            headline, content = generate_headline_and_content_from_images(
                image_urls, "WACCA PLUS", message_content
            )
            news_posts.append({
                "date": date,
                "identifier": "WACCA_PLUS",
                # A cached entry may have no category; fall back to the
                # classifier's own "null" marker instead of raising.
                "type": (post_type or "null").upper(),
                "timestamp": unix_time,
                "content": content,
                "headline": headline,
                "url": None,
                "images": filtered_images,
                'is_ai_summary': True,
            })
    finally:
        # Release the connection even when a classifier/upload/summary call raises.
        database.close()
    return news_posts
|