aboutsummaryrefslogtreecommitdiffstats
path: root/summarizer.py
blob: d3d66f11453da2d153897bb90352835651102916 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
from dotenv import load_dotenv
import openai
import json
import hashlib
import os

load_dotenv()


def summarization_is_possible() -> bool:
    return os.getenv("OPENAI_API_KEY")


def _load_cache():
    cache_file = "summarization_cache.json"
    if not os.path.exists(cache_file):
        with open(cache_file, "w") as file:
            json.dump({}, file)
    with open(cache_file, "r") as file:
        return json.load(file)


def _save_cache(cache: dict):
    cache_file = "summarization_cache.json"
    with open(cache_file, "w") as file:
        json.dump(cache, file)


def _make_cache_key(game: str, img_urls: list[str]) -> str:
    normalized_game = game.strip().lower()
    img_data = json.dumps(sorted(img_urls), separators=(",", ":"))
    hash_digest = hashlib.sha256(img_data.encode()).hexdigest()[:12]
    return f"{normalized_game}_{hash_digest}"


def generate_headline_and_content_from_images(img_urls: list[str], game: str):
    """
    Uses LLM to generate the headline and content when none provided by source, based on one or more images.
    """
    cache = _load_cache()
    cache_key = _make_cache_key(game, img_urls)
    if cache_key in cache:
        cached = cache[cache_key]
        return cached["headline"], cached["content"]
    tools = [
        {
            "type": "function",
            "function": {
                "name": "generate_update_text",
                "description": "Generates a concise English headline and short description for a rhythm game update image.",
                "parameters": {
                    "type": "object",
                    "properties": {
                        "headline": {
                            "type": "string",
                            "description": "A short English headline summarizing the game update.",
                        },
                        "content": {
                            "type": "string",
                            "description": "A brief English description of the new content shown in the image(s).",
                        },
                    },
                    "required": ["headline", "content"],
                },
            },
        }
    ]

    messages = [
        {
            "role": "user",
            "content": [
                {
                    "type": "text",
                    "text": (
                        f"Given one or more update-related images for the arcade game {game}, return a short, professional English headline and a brief, stern and concise description summarizing the content. No need to repeat game name"
                    ),
                },
                *[{"type": "image_url", "image_url": {"url": url}} for url in img_urls],
            ],
        }
    ]

    response = openai.chat.completions.create(
        model="gpt-4o",
        messages=messages,
        tools=tools,
        tool_choice={
            "type": "function",
            "function": {"name": "generate_update_text"},
        },
    )

    tool_result = response.choices[0].message.tool_calls[0].function.arguments
    parsed_result = json.loads(tool_result)
    headline = parsed_result["headline"]
    content = parsed_result["content"]
    cache[cache_key] = {"headline": headline, "content": content}
    _save_cache(cache)
    return headline, content
send patches to the email below
yukais@pinapelz.com
include the subject [PATCH repo_name]
pinapelz.com
homepage