File size: 8,387 Bytes
fbb0bdf
327982a
 
2ef37b6
44bab49
2ef37b6
139217d
 
550885e
 
 
 
139217d
 
 
 
550885e
327982a
c995e6d
 
 
ec7a11c
 
 
 
fbb0bdf
 
 
ec7a11c
 
 
 
 
139217d
 
 
 
 
 
 
 
ec7a11c
 
 
 
f065ef3
52ff483
2a25399
e4b918c
ec7a11c
2ef37b6
 
fbb0bdf
ec7a11c
52ff483
ec7a11c
 
 
 
52ff483
ec7a11c
 
 
 
 
52ff483
 
ec7a11c
 
 
 
52ff483
e4b918c
ec7a11c
 
 
e4b918c
ec7a11c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52ff483
ec7a11c
 
 
 
 
 
 
 
 
 
 
fbb0bdf
 
f065ef3
e30b729
52ff483
e30b729
2a25399
e30b729
 
52ff483
e30b729
c995e6d
fbb0bdf
f065ef3
fbb0bdf
2a25399
fbb0bdf
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4901d0f
2a25399
 
 
2ef37b6
 
 
 
 
 
 
fbb0bdf
 
 
 
 
 
 
 
 
 
ec7a11c
68a2a07
ec7a11c
f932ac0
 
ec7a11c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
import argparse
import json
import time
import uuid
from data import log_to_jsonl
from datetime import datetime
from utils import calculate_overall_score, query_ai_prompt
from promptObjects import (
    improve_prompt,
    critique_prompt,
    faith_scorer_prompt,
    spicy_scorer_prompt,
    ImprovedText,
    Critique,
    FaithfulnessScore,
    SpicyScore,
)

# This script uses the large language model to improve a text, it depends on a llama_cpp server being setup with a model loaded.
# There are several different interfaces it can use, see utils.py for more details.
# Here is a bit of a local setup example:
# pip install llama-cpp-python[server] --upgrade
# python3 -m llama_cpp.server --model mixtral-8x7b-instruct-v0.1.Q4_K_M.gguf  --port 5834 --n_ctx 4096 --use_mlock false
# Run this script:
# python3 chill.py
# This should then try and improve the original text below.
# Or you could import the improvement_loop function with a string as an argument to improve a specific text,
# or use it as a command line tool with the -t flag to improve a specific text.

original_text = """Stop chasing dreams instead. Life is not a Hollywood movie. Not everyone is going to get a famous billionaire. Adjust your expectations to reality, and stop thinking so highly of yourself, stop judging others. Assume the responsibility for the things that happen in your life. It is kind of annoying to read your text, it is always some external thing that "happened" to you, and it is always other people who are not up to your standards. At some moment you even declare with despair. And guess what? This is true and false at the same time, in a fundamental level most people are not remarkable, and you probably aren't too. But at the same time, nobody is the same, you have worth just by being, and other people have too. The impression I get is that you must be someone incredibly annoying to work with, and that your performance is not even nearly close to what you think it is, and that you really need to come down to earth. Stop looking outside, work on yourself instead. You'll never be satisfied just by changing jobs. Do therapy if you wish, become acquainted with stoicism, be a volunteer in some poor country, whatever, but do something to regain control of your life, to get some perspective, and to adjust your expectations to reality."""
# From elzbardico on https://news.ycombinator.com/item?id=36119858

"""
Outputs something like this:
 {
    "critique": "The revised text effectively conveys the same message as the original but in a more constructive and diplomatic tone, maintaining the original's intention while promoting a more positive discussion.",
    "faithfulness_score": 0.85,
    "spicy_score": 0.25,
    "overall_score": 0.89,
    "edit": "Consider shifting your focus from chasing dreams to finding fulfillment in reality. Life isn't a Hollywood movie, and becoming a famous billionaire isn't a realistic goal for everyone. It might be helpful to recalibrate your expectations to better align with what's possible. Instead of judging others, try to understand them better. Take responsibility for the events in your life, rather than attributing them to external factors or other people. I understand that it can be frustrating when things don't go as planned, but keep in mind that most people, including yourself, are not inherently exceptional or unremarkable. However, everyone has unique worth that doesn't depend on their achievements or status. It's essential to recognize that you may come across as demanding to work with and that your self-perception might not match others' opinions of your performance. To gain a fresh perspective and adjust your expectations, you could explore personal growth opportunities such as therapy, practicing stoicism, volunteering in underserved communities, or any other activity that helps you develop self-awareness and emotional intelligence."
}
"""

global suggestions
suggestions = []
last_edit = ""
request_count = 0
start_time = None




def improve_text_attempt():
    global suggestions
    global request_count
    replacements = {
        "original_text": json.dumps(original_text),
        "previous_suggestions": json.dumps(suggestions, indent=2),
    }
    request_count += 1
    resp_json = query_ai_prompt(improve_prompt, replacements, ImprovedText)
    return resp_json["text"]


def critique_text(last_edit):
    global suggestions
    global request_count
    replacements = {"original_text": original_text, "last_edit": last_edit}

    # Query the AI for each of the new prompts separately

    request_count += 3
    critique_resp = query_ai_prompt(critique_prompt, replacements, Critique)
    faithfulness_resp = query_ai_prompt(
        faith_scorer_prompt, replacements, FaithfulnessScore
    )
    spiciness_resp = query_ai_prompt(spicy_scorer_prompt, replacements, SpicyScore)

    # Combine the results from the three queries into a single dictionary
    combined_resp = {
        "critique": critique_resp["critique"],
        "faithfulness_score": faithfulness_resp["faithfulness_score"],
        "spicy_score": spiciness_resp["spicy_score"],
    }

    return combined_resp


def should_stop(
    iteration,
    overall_score,
    time_used,
    min_iterations=2,
    min_overall_score=0.85,
    max_seconds=60,
):
    good_attempt = iteration >= min_iterations and overall_score >= min_overall_score
    too_long = time_used > max_seconds and overall_score >= 0.7
    return good_attempt or too_long


def update_suggestions(critique_dict):
    global suggestions
    critique_dict["overall_score"] = round(
        calculate_overall_score(
            critique_dict["faithfulness_score"], critique_dict["spicy_score"]
        ),
        2,
    )
    critique_dict["edit"] = last_edit
    suggestions.append(critique_dict)
    suggestions = sorted(suggestions, key=lambda x: x["overall_score"], reverse=True)[
        :2
    ]
    critique_dict["request_count"] = request_count


def print_iteration_result(iteration, overall_score, time_used):
    global suggestions
    print(
        f"Iteration {iteration}: overall_score={overall_score:.2f}, time_used={time_used:.2f} seconds."
    )
    print("suggestions:")
    print(json.dumps(suggestions, indent=2))


def improvement_loop(input_text):
    global original_text
    global last_edit
    global suggestions
    global request_count
    global start_time
    iteration_count = 0
    suggestions = []
    last_edit = ""
    request_count = 0
    start_time = time.time()
    max_iterations = 6
    original_text = input_text

    for iteration in range(1, max_iterations + 1):
        iteration_count = iteration
        try:
            if iteration % 2 == 1:
                last_edit = improve_text_attempt()
            else:
                critique_dict = critique_text(last_edit)
                update_suggestions(critique_dict)
                overall_score = critique_dict["overall_score"]
                time_used = time.time() - start_time

                print_iteration_result(iteration, overall_score, time_used)

                if should_stop(iteration, overall_score, time_used):
                    print(
                        "Stopping\nTop suggestion:\n",
                        json.dumps(suggestions[0], indent=4),
                    )
                    break
        except ValueError as e:
            print("ValueError:", e)
            continue
    assert len(suggestions) > 0
    suggestions[0]["iteration_count"] = iteration_count
    suggestions[0]["max_allowed_iterations"] = max_iterations
    suggestions[0]["time_used"] = time_used
    log_entry = {
        "uuid": str(uuid.uuid4()),
        "timestamp": datetime.utcnow().isoformat(),
        "input": original_text,
        "output": suggestions[0]
    }
    log_to_jsonl('inputs_and_outputs.jsonl', log_entry)
    return suggestions[0]


if __name__ == "__main__":
    parser = argparse.ArgumentParser(description="Process and improve text.")
    parser.add_argument("-t", "--text", type=str, help="Text to be improved", default=original_text)
    args = parser.parse_args()

    improvement_loop(args.text)


# TODO: Segment the text into sentences for parallel processing, and isolate the most problematic parts for improvement
"""
# import pysbd
# sentences = pysbd.Segmenter(language="en", clean=False).segment(paragraph)
"""