File size: 14,108 Bytes
b5b4980
 
 
 
fb29fff
 
 
 
b5b4980
025a281
726ed91
b5b4980
fb29fff
025a281
b5b4980
025a281
b5b4980
 
 
025a281
726ed91
 
 
 
b5b4980
fb29fff
 
 
 
 
 
 
 
 
 
 
 
 
b5b4980
 
 
5dd8e5c
b5b4980
 
 
 
 
 
 
 
 
5dd8e5c
b5b4980
5dd8e5c
868c4e3
5dd8e5c
868c4e3
5dd8e5c
868c4e3
5dd8e5c
868c4e3
 
 
 
 
 
 
 
fb29fff
868c4e3
 
5b04683
ac150a8
5b04683
 
67d1e7e
9d92743
 
8433342
b5b4980
67d1e7e
fb29fff
 
 
b5b4980
 
 
 
 
fb29fff
b5b4980
 
 
 
 
 
 
025a281
 
 
 
 
 
 
 
fb29fff
025a281
 
 
 
 
 
 
 
 
 
 
 
fb29fff
025a281
 
 
 
 
 
 
 
 
 
 
 
 
 
fb29fff
025a281
fb29fff
025a281
 
 
 
 
 
 
 
 
 
fb29fff
025a281
 
 
b5b4980
726ed91
 
 
 
 
 
 
 
 
 
 
 
025a281
 
b5b4980
 
 
 
 
 
 
 
fb29fff
b5b4980
 
 
 
fb29fff
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
import os
import re
from datetime import datetime

import anthropic
from groq import Groq
from openai import OpenAI

huggingface_token = os.getenv("HUGGINGFACE_TOKEN")
groq_api_key = os.getenv("GROQ_API_KEY")
sambanova_api_key = os.getenv("SAMBANOVA_API_KEY")


class LLMInferenceNode:
    def __init__(self):
        self.huggingface_client = OpenAI(
            base_url="https://api-inference.huggingface.co/v1/",
            api_key=huggingface_token,
        )
        self.groq_client = Groq(api_key=groq_api_key)
        self.sambanova_client = OpenAI(
            api_key=sambanova_api_key,
            base_url="https://api.sambanova.ai/v1",
        )

    def generate(
        self,
        input_text,
        happy_talk,
        compress,
        compression_level,
        poster,
        prompt_type,
        custom_base_prompt="",
        provider="Hugging Face",
        api_key=None,
        model=None,
    ):
        try:
            default_happy_prompt = """Create a detailed visually descriptive caption of this description, which will be used as a prompt for a text to image AI system (caption only, no instructions like "create an image").Remove any mention of digital artwork or artwork style. Give detailed visual descriptions of the character(s), including ethnicity, skin tone, expression etc. Imagine using keywords for a still for someone who has aphantasia. Describe the image style, e.g. any photographic or art styles / techniques utilized. Make sure to fully describe all aspects of the cinematography, with abundant technical details and visual descriptions. If there is more than one image, combine the elements and characters from all of the images creatively into a single cohesive composition with a single background, inventing an interaction between the characters. Be creative in combining the characters into a single cohesive scene. Focus on two primary characters (or one) and describe an interesting interaction between them, such as a hug, a kiss, a fight, giving an object, an emotional reaction / interaction. If there is more than one background in the images, pick the most appropriate one. Your output is only the caption itself, no comments or extra formatting. The caption is in a single long paragraph. If you feel the images are inappropriate, invent a new scene / characters inspired by these. Additionally, incorporate a specific movie director's visual style and describe the lighting setup in detail, including the type, color, and placement of light sources to create the desired mood and atmosphere. Always frame the scene, including details about the film grain, color grading, and any artifacts or characteristics specific."""

            default_simple_prompt = """Create a brief, straightforward caption for this description, suitable for a text-to-image AI system. Focus on the main elements, key characters, and overall scene without elaborate details. Provide a clear and concise description in one or two sentences. Your output is only the caption itself, no comments or extra formatting. The caption is in a single long paragraph."""

            poster_prompt = """Analyze the provided description and extract key information to create a movie poster style description. Format the output as follows:
Title: A catchy, intriguing title that captures the essence of the scene, place the title in "".
Main character: Give a description of the main character.
Background: Describe the background in detail.
Supporting characters: Describe the supporting characters
Branding type: Describe the branding type
Tagline: Include a tagline that captures the essence of the movie.
Visual style: Ensure that the visual style fits the branding type and tagline.
You are allowed to make up film and branding names, and do them like 80's, 90's or modern movie posters.Your output is only the caption itself, no comments or extra formatting. The caption is in a single long paragraph."""

            only_objects_prompt = """Create a highly detailed and visually rich description focusing solely on inanimate objects, without including any human or animal figures. Describe the objects' shapes, sizes, colors, textures, and materials in great detail. Pay attention to their arrangement, positioning, and how they interact with light and shadow. Include information about the setting or environment these objects are in, such as indoor/outdoor, time of day, weather conditions, and any atmospheric effects. Mention any unique features, patterns, or imperfections on the objects. Describe the overall composition, perspective, and any artistic techniques that might be employed to render these objects (e.g., photorealism, impressionistic style, etc.). Your description should paint a vivid picture that allows someone to imagine the scene without seeing it, focusing on the beauty, complexity, or significance of everyday objects. Your output is only the caption itself, no comments or extra formatting. The caption is in a single long paragraph."""

            no_figure_prompt = """Generate a comprehensive and visually evocative description of a scene or landscape without including any human or animal figures. Focus on the environment, natural elements, and man-made structures if present. Describe the topography, vegetation, weather conditions, and time of day in great detail. Pay attention to colors, textures, and how light interacts with different elements of the scene. If there are buildings or other structures, describe their architecture, condition, and how they fit into the landscape. Include sensory details beyond just visual elements - mention sounds, smells, and the overall atmosphere or mood of the scene. Describe any notable features like bodies of water, geological formations, or sky phenomena. Consider the perspective from which the scene is viewed and how this affects the composition. Your description should transport the reader to this location, allowing them to vividly imagine the scene without any living subjects present. Your output is only the caption itself, no comments or extra formatting. The caption is in a single long paragraph."""

            landscape_prompt = """Create an immersive and detailed description of a landscape, focusing on its natural beauty and geographical features. Begin with the overall topography - is it mountainous, coastal, forested, desert, or a combination? Describe the horizon and how land meets sky. Detail the vegetation, noting types of trees, flowers, or grass, and how they're distributed across the landscape. Include information about any water features - rivers, lakes, oceans - and how they interact with the land. Describe the sky, including cloud formations, color gradients, and any celestial bodies visible. Pay attention to the quality of light, time of day, and season, explaining how these factors affect the colors and shadows in the scene. Include details about weather conditions and how they impact the landscape. Mention any geological features like rock formations, cliffs, or unique land patterns. If there are any distant man-made elements, describe how they integrate with the natural setting. Your description should capture the grandeur and mood of the landscape, allowing the reader to feel as if they're standing within this awe-inspiring natural scene. Your output is only the caption itself, no comments or extra formatting. The caption is in a single long paragraph."""

            fantasy_prompt = """Craft an extraordinarily detailed and imaginative description of a fantasy scene, blending elements of magic, otherworldly creatures, and fantastical environments. Begin by setting the overall tone - is this a dark and foreboding realm, a whimsical fairytale setting, or an epic high-fantasy world? Describe the landscape, including any impossible or magical geographical features like floating islands, crystal forests, or rivers of starlight. Detail the flora and fauna, focusing on fantastical plants and creatures that don't exist in our world. Include descriptions of any structures or ruins, emphasizing their otherworldly architecture and magical properties. Describe the sky and any celestial bodies, considering how they might differ from our reality. Include details about the presence of magic - how it manifests visually, its effects on the environment, and any magical phenomena occurring in the scene. If there are characters present, describe their appearance, focusing on non-human features, magical auras, or fantastical clothing and accessories. Pay attention to colors, textures, and light sources, especially those that couldn't exist in the real world. Your description should transport the reader to a realm of pure imagination, where the laws of physics and nature as we know them don't apply. Your output is only the caption itself, no comments or extra formatting. The caption is in a single long paragraph."""

            prompt_types = {
                "happy": default_happy_prompt,
                "simple": default_simple_prompt,
                "poster": poster_prompt,
                "only_objects": only_objects_prompt,
                "no_figure": no_figure_prompt,
                "landscape": landscape_prompt,
                "fantasy": fantasy_prompt,
            }

            # Update this part to handle the prompt_type correctly
            print(f"Received prompt_type: '{prompt_type}'")  # Debug print
            if prompt_type and prompt_type.strip() and prompt_type in prompt_types:
                base_prompt = prompt_types[prompt_type]
                print(f"Using {prompt_type} prompt")
            elif custom_base_prompt.strip():
                base_prompt = custom_base_prompt
                print("Using custom base prompt")
            else:
                base_prompt = default_happy_prompt
                print(
                    f"Warning: Unknown or empty prompt type '{prompt_type}'. Using default happy prompt."
                )

            if compress and not poster:
                compression_chars = {
                    "soft": 600 if happy_talk else 300,
                    "medium": 400 if happy_talk else 200,
                    "hard": 200 if happy_talk else 100,
                }
                char_limit = compression_chars[compression_level]
                base_prompt += f" Compress the output to be concise while retaining key visual details. MAX OUTPUT SIZE no more than {char_limit} characters."

            system_message = "You are a helpful assistant. Try your best to give the best response possible to the user."
            user_message = f"{base_prompt}\nDescription: {input_text}"

            if provider == "Hugging Face":
                response = self.huggingface_client.chat.completions.create(
                    model=model or "meta-llama/Meta-Llama-3.1-70B-Instruct",
                    max_tokens=1024,
                    temperature=0.7,
                    top_p=0.95,
                    messages=[
                        {"role": "system", "content": system_message},
                        {"role": "user", "content": user_message},
                    ],
                )
                output = response.choices[0].message.content.strip()

            elif provider == "OpenAI":
                openai_client = OpenAI(api_key=api_key)
                response = openai_client.chat.completions.create(
                    model=model or "gpt-4",
                    max_tokens=1024,
                    temperature=0.7,
                    messages=[
                        {"role": "system", "content": system_message},
                        {"role": "user", "content": user_message},
                    ],
                )
                output = response.choices[0].message.content.strip()

            elif provider == "Anthropic":
                anthropic_client = anthropic.Anthropic(api_key=api_key)
                response = anthropic_client.messages.create(
                    model=model or "claude-3-5-sonnet-20240620",
                    max_tokens=1024,
                    temperature=0.7,
                    system=system_message,
                    messages=[
                        {
                            "role": "user",
                            "content": [{"type": "text", "text": user_message}],
                        }
                    ],
                )
                output = response.content[0].text

            elif provider == "Groq":
                response = self.groq_client.chat.completions.create(
                    model=model or "llama-3.1-70b-versatile",
                    max_tokens=1024,
                    temperature=0.7,
                    messages=[
                        {"role": "system", "content": system_message},
                        {"role": "user", "content": user_message},
                    ],
                )
                output = response.choices[0].message.content.strip()

            elif provider == "SambaNova":
                response = self.sambanova_client.chat.completions.create(
                    model=model or "Meta-Llama-3.1-70B-Instruct",
                    max_tokens=1024,
                    temperature=0.7,
                    messages=[
                        {"role": "system", "content": system_message},
                        {"role": "user", "content": user_message},
                    ],
                )
                output = response.choices[0].message.content.strip()

            else:
                raise ValueError(f"Unsupported provider: {provider}")

            # Clean up the output
            if ": " in output:
                output = output.split(": ", 1)[1].strip()
            elif output.lower().startswith("here"):
                sentences = output.split(". ")
                if len(sentences) > 1:
                    output = ". ".join(sentences[1:]).strip()

            return output

        except Exception as e:
            print(f"An error occurred: {e}")
            return f"Error occurred while processing the request: {str(e)}"