lykeven committed on
Commit
8d00201
·
1 Parent(s): d3049aa
app.py ADDED
@@ -0,0 +1,195 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python
2
+
3
+ import gradio as gr
4
+ import os
5
+ import re
6
+ from PIL import Image
7
+ import base64
8
+ import time
9
+
10
# Page title rendered as a Markdown heading that links to the upstream repo.
DESCRIPTION = '''# <a href="https://github.com/THUDM/CogVLM">VisualGLM</a>'''

# Usage hints shown under the controls. The hints are separated by a blank
# line: a single newline is only a soft break in Markdown, which would render
# both hints as one run-on paragraph.
MAINTENANCE_NOTICE1 = 'Hint 1: If the app report "Something went wrong, connection error out", please turn off your proxy and retry.\n\nHint 2: If you upload a large size of image like 10MB, it may take some time to upload and process. Please be patient and wait.'

# Attribution footer rendered at the bottom of the page.
NOTES = 'This app is adapted from <a href="https://github.com/THUDM/CogVLM">https://github.com/THUDM/CogVLM</a>. It would be recommended to check out the repo if you want to see the detail of our model.'
15
+
16
+ import json
17
+ import requests
18
+ import base64
19
+ import hashlib
20
+
21
# Greeting shown in the chat panel before the user has asked anything. The
# user side of the turn is left empty.
default_chatbox = [("", "Hi, What do you want to know about this image?")]

# Address of the inference backend, taken from the environment; None when the
# "URL" variable is not set.
URL = os.environ.get("URL")
24
+
25
def process_image(image_prompt):
    """Resize an image to 224x224 and return it base64-encoded with a hash.

    The resized image is re-encoded by Pillow in the format implied by the
    extension of ``image_prompt`` and round-tripped through a temporary file.

    Args:
        image_prompt: Filesystem path of the image to load.

    Returns:
        A ``(encoded_img, image_hash)`` tuple: the base64 text of the
        re-encoded image, and the SHA-256 hex digest of that base64 payload.
    """
    import tempfile

    file_ext = os.path.splitext(image_prompt)[1]
    with Image.open(image_prompt) as image:
        print(f"height:{image.height}, width:{image.width}")
        resized_image = image.resize((224, 224))

    # A unique temp file (instead of a name derived from the current second)
    # keeps concurrent requests from overwriting or deleting each other's
    # file. The suffix is kept so Pillow still infers the output format.
    fd, filename = tempfile.mkstemp(suffix=file_ext)
    os.close(fd)
    try:
        resized_image.save(filename)
        print(f"temporal filename {filename}")
        with open(filename, "rb") as image_file:
            encoded_bytes = base64.b64encode(image_file.read())
    finally:
        # Always clean up, even if saving or reading failed.
        os.remove(filename)

    encoded_img = str(encoded_bytes, encoding='utf-8')
    # The hash is taken over the base64 payload, not the raw image bytes.
    image_hash = hashlib.sha256(encoded_bytes).hexdigest()
    return encoded_img, image_hash
40
+
41
+
42
def process_image_without_resize(image_prompt):
    """Re-encode an image at its original size; return base64 text and a hash.

    The image is re-saved by Pillow in the format implied by the extension of
    ``image_prompt`` and round-tripped through a temporary file.

    Args:
        image_prompt: Filesystem path of the image to load.

    Returns:
        A ``(encoded_img, image_hash)`` tuple: the base64 text of the
        re-encoded image, and the SHA-256 hex digest of that base64 payload.
    """
    import tempfile

    file_ext = os.path.splitext(image_prompt)[1]

    # A unique temp file (instead of a name derived from the current second)
    # keeps concurrent requests from overwriting or deleting each other's
    # file. The suffix is kept so Pillow still infers the output format.
    fd, filename = tempfile.mkstemp(suffix=file_ext)
    os.close(fd)
    try:
        with Image.open(image_prompt) as image:
            print(f"height:{image.height}, width:{image.width}")
            image.save(filename)
        print(f"temporal filename {filename}")
        with open(filename, "rb") as image_file:
            encoded_bytes = base64.b64encode(image_file.read())
    finally:
        # Always clean up, even if saving or reading failed.
        os.remove(filename)

    encoded_img = str(encoded_bytes, encoding='utf-8')
    # The hash is taken over the base64 payload, not the raw image bytes.
    image_hash = hashlib.sha256(encoded_bytes).hexdigest()
    return encoded_img, image_hash
56
+
57
+
58
# Compiled once at import time; matches a run of characters in U+4E00..U+9FA5.
_ZH_PATTERN = re.compile(u'[\u4e00-\u9fa5]+')


def is_chinese(text):
    """Find the first run of Chinese characters in ``text``.

    Args:
        text: The string to inspect. ``None`` and non-string values are
            treated as containing no Chinese text instead of raising.

    Returns:
        The ``re.Match`` for the first run of characters in the range
        U+4E00..U+9FA5, or ``None`` when there is none. Callers typically
        use the result only for its truthiness.
    """
    if not isinstance(text, str):
        return None
    return _ZH_PATTERN.search(text)
61
+
62
+
63
def post(
        input_text,
        temperature,
        top_p,
        image_prompt,
        result_previous,
        hidden_image
        ):
    """Send one chat turn (text plus image) to the backend and update history.

    Args:
        input_text: The user's prompt.
        temperature: Sampling temperature forwarded to the backend.
        top_p: Nucleus-sampling value forwarded to the backend.
        image_prompt: Filesystem path of the uploaded image, or ``None``.
        result_previous: Chat history as a sequence of (user, bot) pairs.
        hidden_image: Hash of the image used on the previous turn.

    Returns:
        A ``(text, history, image_hash)`` tuple: the new content of the input
        box, the updated list of (user, bot) tuples, and the hash of the
        image the history belongs to.
    """
    input_text = input_text or ""
    # Drop placeholder turns (empty user text), such as the greeting, so they
    # are not sent to the backend as real history.
    result_text = [
        (ele[0], ele[1]) for ele in (result_previous or []) if ele[0] != ""
    ]
    print(f"history {result_text}")

    is_zh = is_chinese(input_text)

    if image_prompt is None:
        print("Image empty")
        if is_zh:
            result_text.append((input_text, '图片为空!请上传图片并重试。'))
        else:
            result_text.append((input_text, 'Image empty! Please upload a image and retry.'))
        # Keep the typed text so the user can retry after uploading an image.
        return input_text, result_text, hidden_image
    elif input_text == "":
        print("Text empty")
        result_text.append((input_text, 'Text empty! Please enter text and retry.'))
        return "", result_text, hidden_image

    headers = {
        "Content-Type": "application/json; charset=UTF-8",
        "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.87 Safari/537.36",
    }
    if image_prompt:
        encoded_img, image_hash = process_image_without_resize(image_prompt)
        print(f"image_hash:{image_hash}, hidden_image_hash:{hidden_image}")

        # A different image starts a new conversation: discard old history.
        if hidden_image is not None and image_hash != hidden_image:
            print("image has been update")
            result_text = []
            hidden_image = image_hash
    else:
        encoded_img = None

    print('开始请求...')
    data = json.dumps({
        'text': input_text,
        'image': encoded_img,
        'temperature': temperature,
        'top_p': top_p,
        'history': result_text
    })
    try:
        response = requests.request("POST", URL, headers=headers, data=data, timeout=(60, 100))
        # Parsed inside the try so a non-JSON body or a reply without
        # 'result' is reported to the user instead of crashing the handler.
        answer = str(response.json()['result'])
    except requests.exceptions.Timeout as e:
        print("error message", e)
        if is_zh:
            result_text.append((input_text, '超时!请稍等几分钟再重试。'))
        else:
            result_text.append((input_text, 'Timeout! Please wait a few minutes and retry.'))
        return "", result_text, hidden_image
    except Exception as e:
        # UI boundary: any other failure (connection error, missing URL,
        # malformed reply) is logged and shown as a generic failure rather
        # than being mislabelled as a timeout.
        print("error message", e)
        if is_zh:
            result_text.append((input_text, '请求失败!请稍后重试。'))
        else:
            result_text.append((input_text, 'Request failed! Please retry later.'))
        return "", result_text, hidden_image
    print('请求完毕...')

    result_text.append((input_text, answer))
    print(result_text)
    print('finished')
    return "", result_text, hidden_image
131
+
132
+
133
def clear_fn(value):
    """Return the reset values for the text box, chat history and image.

    Args:
        value: Ignored; present only because the event handler passes an input.

    Returns:
        A tuple of an empty string, the default chat history and ``None``.
    """
    cleared_text = ""
    cleared_image = None
    return cleared_text, default_chatbox, cleared_image
135
+
136
def clear_fn2(value):
    """Return the default chat history, discarding the current conversation.

    Args:
        value: Ignored; present only because the event handler passes an input.

    Returns:
        The default chat history.
    """
    fresh_history = default_chatbox
    return fresh_history
138
+
139
+
140
def main():
    """Build the Gradio UI, wire its event handlers and launch the app."""
    gr.close_all()

    # One JSON object per line; blank lines (e.g. a trailing newline at the
    # end of the file) are skipped instead of crashing json.loads.
    with open("./examples/example_inputs.jsonl", encoding="utf-8") as f:
        examples = [json.loads(line) for line in f if line.strip()]

    # NOTE(review): the source this was recovered from had lost its
    # indentation, so the nesting of the layout blocks below is a
    # reconstruction - confirm against the rendered page.
    with gr.Blocks(css='style.css') as demo:

        with gr.Row():
            # Left column: prompt, image and sampling controls.
            with gr.Column(scale=4.5):
                with gr.Group():
                    input_text = gr.Textbox(label='Input Text', placeholder='Please enter text prompt below and press ENTER.')
                    with gr.Row():
                        run_button = gr.Button('Generate')
                        clear_button = gr.Button('Clear')

                    image_prompt = gr.Image(type="filepath", label="Image Prompt", value=None)
                with gr.Row():
                    temperature = gr.Slider(maximum=1, value=0.8, minimum=0, label='Temperature')
                    top_p = gr.Slider(maximum=1, value=0.4, minimum=0, label='Top P')
                with gr.Group():
                    with gr.Row():
                        with gr.Column(scale=7):
                            gr.Markdown(MAINTENANCE_NOTICE1)
                        with gr.Column(scale=2):
                            gr.Button('Change hint to English', visible=False)
            # Right column: conversation history.
            with gr.Column(scale=5.5):
                # NOTE(review): `.style(...)` here and `concurrency_count`
                # below look like Gradio 3.x-era APIs - confirm the pinned
                # Gradio version before upgrading.
                result_text = gr.components.Chatbot(
                    label='Multi-round conversation History',
                    value=list(default_chatbox),
                ).style(height=550)
                # Invisible field carrying the image hash between turns.
                hidden_image_hash = gr.Textbox(visible=False)

        gr.Examples(
            examples=[[example["text"], example["image"]] for example in examples],
            inputs=[input_text, image_prompt],
            label="Example Inputs (Click to insert an example into the input box)",
            examples_per_page=3,
        )

        gr.Markdown(NOTES)

        print(gr.__version__)

        # Both the button and pressing ENTER in the text box submit a turn.
        post_inputs = [input_text, temperature, top_p, image_prompt, result_text, hidden_image_hash]
        post_outputs = [input_text, result_text, hidden_image_hash]
        run_button.click(fn=post, inputs=post_inputs, outputs=post_outputs)
        input_text.submit(fn=post, inputs=post_inputs, outputs=post_outputs)

        clear_button.click(fn=clear_fn, inputs=clear_button, outputs=[input_text, result_text, image_prompt])
        # Uploading or removing an image resets the chat to the greeting.
        image_prompt.upload(fn=clear_fn2, inputs=clear_button, outputs=[result_text])
        image_prompt.clear(fn=clear_fn2, inputs=clear_button, outputs=[result_text])

    demo.queue(concurrency_count=10)
    demo.launch()
193
+
194
# Launch the app only when this file is executed as a script.
if __name__ == "__main__":
    main()
examples/1.jpeg ADDED
examples/1.png ADDED
examples/2.jpeg ADDED
examples/2.jpg ADDED
examples/3.jpeg ADDED
examples/3.jpg ADDED
examples/example_inputs.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {"id":1, "text": "Describe this image", "image": "examples/1.png"}
2
+ {"id":2, "text": "What is written in the image?", "image": "examples/2.jpg"}
3
+ {"id":3, "text": "How many houses are there in this cartoon?", "image": "examples/3.jpg"}
style.css ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ h1 {
2
+ text-align: center;
3
+ }
4
+ img#visitor-badge {
5
+ display: block;
6
+ margin: auto;
7
+ }