mistral_chat / app.py
ndurner's picture
Mistral adaptation
575c087
import gradio as gr
import base64
import os
from mistralai import Mistral
import json
import fitz
from PIL import Image
import io
from settings_mgr import generate_download_settings_js, generate_upload_settings_js
from doc2json import process_docx
dump_controls = False
log_to_console = False
temp_files = []
def encode_image(image_data):
"""Generates a prefix for image base64 data in the required format for the
four known image formats: png, jpeg, gif, and webp.
Args:
image_data: The image data, encoded in base64.
Returns:
A string containing the prefix.
"""
# Get the first few bytes of the image data.
magic_number = image_data[:4]
# Check the magic number to determine the image type.
if magic_number.startswith(b'\x89PNG'):
image_type = 'png'
elif magic_number.startswith(b'\xFF\xD8'):
image_type = 'jpeg'
elif magic_number.startswith(b'GIF89a'):
image_type = 'gif'
elif magic_number.startswith(b'RIFF'):
if image_data[8:12] == b'WEBP':
image_type = 'webp'
else:
# Unknown image type.
raise Exception("Unknown image type")
else:
# Unknown image type.
raise Exception("Unknown image type")
return f"data:image/{image_type};base64,{base64.b64encode(image_data).decode('utf-8')}"
def process_pdf_img(pdf_fn: str):
pdf = fitz.open(pdf_fn)
message_parts = []
for page in pdf.pages():
# Create a transformation matrix for rendering at the calculated scale
mat = fitz.Matrix(0.6, 0.6)
# Render the page to a pixmap
pix = page.get_pixmap(matrix=mat, alpha=False)
# Convert pixmap to PIL Image
img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
# Convert PIL Image to bytes
img_byte_arr = io.BytesIO()
img.save(img_byte_arr, format='PNG')
img_byte_arr = img_byte_arr.getvalue()
# Encode image to base64
base64_encoded = base64.b64encode(img_byte_arr).decode('utf-8')
# Construct the data URL
image_url = f"data:image/png;base64,{base64_encoded}"
# Append the message part
message_parts.append({
"type": "text",
"text": f"Page {page.number} of file '{pdf_fn}'"
})
message_parts.append({
"type": "image_url",
"image_url": image_url
})
pdf.close()
return message_parts
def encode_file(fn: str) -> list:
user_msg_parts = []
if fn.endswith(".docx"):
user_msg_parts.append({"type": "text", "text": process_docx(fn)})
elif fn.endswith(".pdf"):
user_msg_parts.extend(process_pdf_img(fn))
else:
with open(fn, mode="rb") as f:
content = f.read()
isImage = False
if isinstance(content, bytes):
try:
# try to add as image
content = encode_image(content)
isImage = True
except:
# not an image, try text
content = content.decode('utf-8', 'replace')
else:
content = str(content)
if isImage:
user_msg_parts.append({"type": "image_url", "image_url": content})
else:
user_msg_parts.append({"type": "text", "text": content})
return user_msg_parts
def bot(message, history, mistral_key, system_prompt, seed, temperature, max_tokens, model):
try:
client = Mistral(
api_key=mistral_key
)
history_mistral_format = []
user_msg_parts = []
if system_prompt:
history_mistral_format.append({"role": "system", "content": system_prompt})
for human, assi in history:
if human is not None:
if type(human) is tuple:
user_msg_parts.extend(encode_file(human[0]))
else:
user_msg_parts.append({"type": "text", "text": human})
if assi is not None:
if user_msg_parts:
history_mistral_format.append({"role": "user", "content": user_msg_parts})
user_msg_parts = []
history_mistral_format.append({"role": "assistant", "content": assi})
if message["text"]:
user_msg_parts.append({"type": "text", "text": message["text"]})
if message["files"]:
for file in message["files"]:
user_msg_parts.extend(encode_file(file))
history_mistral_format.append({"role": "user", "content": user_msg_parts})
if log_to_console:
print(f"br_prompt: {str(history_mistral_format)}")
response = client.chat.stream(
model=model,
messages=history_mistral_format,
temperature=temperature,
max_tokens=max_tokens
)
partial_response = ""
for chunk in response:
if chunk.data.choices:
txt = chunk.data.choices[0].delta.content
if txt:
partial_response += txt
yield partial_response
if log_to_console:
print(f"br_result: {str(history)}")
except Exception as e:
raise gr.Error(f"Error: {str(e)}")
def undo(history):
history.pop()
return history
def dump(history):
return str(history)
def load_settings():
# Dummy Python function, actual loading is done in JS
pass
def save_settings(acc, sec, prompt, temp, tokens, model):
# Dummy Python function, actual saving is done in JS
pass
def import_history(history, file):
with open(file.name, mode="rb") as f:
content = f.read()
if isinstance(content, bytes):
content = content.decode('utf-8', 'replace')
else:
content = str(content)
os.remove(file.name)
# Deserialize the JSON content
import_data = json.loads(content)
# Check if 'history' key exists for backward compatibility
if 'history' in import_data:
history = import_data['history']
system_prompt.value = import_data.get('system_prompt', '') # Set default if not present
else:
# Assume it's an old format with only history data
history = import_data
return history, system_prompt.value
with gr.Blocks(delete_cache=(86400, 86400)) as demo:
gr.Markdown("# Mistral Chat")
with gr.Accordion("Startup"):
gr.Markdown("""Use of this interface permitted under the terms and conditions of the
[MIT license](https://github.com/ndurner/mistral_chat/blob/main/LICENSE).
Third party terms and conditions apply. This app and the AI models may make mistakes, so verify any outputs.""")
mistral_key = gr.Textbox(label="Mistral API Key", elem_id="mistral_key")
model = gr.Dropdown(label="Model", value="pixtral-large-latest", allow_custom_value=True, elem_id="model",
choices=["pixtral-large-latest", "mistral-large-latest", "pixtral-12b-2409"])
system_prompt = gr.TextArea("You are a helpful yet diligent AI assistant. Answer faithfully and factually correct. Respond with 'I do not know' if uncertain.",
label="System Prompt", lines=3, max_lines=250, elem_id="system_prompt")
seed = gr.Textbox(label="Seed", elem_id="seed")
temp = gr.Slider(0, 1, label="Temperature", elem_id="temp", value=0.7)
max_tokens = gr.Slider(1, 4096, label="Max. Tokens", elem_id="max_tokens", value=800)
save_button = gr.Button("Save Settings")
load_button = gr.Button("Load Settings")
dl_settings_button = gr.Button("Download Settings")
ul_settings_button = gr.Button("Upload Settings")
load_button.click(load_settings, js="""
() => {
let elems = ['#mistral_key textarea', '#system_prompt textarea', '#seed textarea', '#temp input', '#max_tokens input', '#model'];
elems.forEach(elem => {
let item = document.querySelector(elem);
let event = new InputEvent('input', { bubbles: true });
item.value = localStorage.getItem(elem.split(" ")[0].slice(1)) || '';
item.dispatchEvent(event);
});
}
""")
save_button.click(save_settings, [mistral_key, system_prompt, seed, temp, max_tokens, model], js="""
(key, sys, seed, temp, ntok, model) => {
localStorage.setItem('mistral_key', key);
localStorage.setItem('system_prompt', sys);
localStorage.setItem('seed', seed);
localStorage.setItem('temp', document.querySelector('#temp input').value);
localStorage.setItem('max_tokens', document.querySelector('#max_tokens input').value);
localStorage.setItem('model', model);
}
""")
control_ids = [('mistral_key', '#mistral_key textarea'),
('system_prompt', '#system_prompt textarea'),
('seed', '#seed textarea'),
('temp', '#temp input'),
('max_tokens', '#max_tokens input'),
('model', '#model')]
controls = [mistral_key, system_prompt, seed, temp, max_tokens, model]
dl_settings_button.click(None, controls, js=generate_download_settings_js("mistral_chat_settings.bin", control_ids))
ul_settings_button.click(None, None, None, js=generate_upload_settings_js(control_ids))
chat = gr.ChatInterface(fn=bot, multimodal=True, additional_inputs=controls, autofocus=False)
chat.textbox.file_count = "multiple"
chatbot = chat.chatbot
chatbot.show_copy_button = True
chatbot.height = 450
if dump_controls:
with gr.Row():
dmp_btn = gr.Button("Dump")
txt_dmp = gr.Textbox("Dump")
dmp_btn.click(dump, inputs=[chatbot], outputs=[txt_dmp])
with gr.Accordion("Import/Export", open=False):
import_button = gr.UploadButton("History Import")
export_button = gr.Button("History Export")
export_button.click(lambda: None, [chatbot, system_prompt], js="""
(chat_history, system_prompt) => {
const export_data = {
history: chat_history,
system_prompt: system_prompt
};
const history_json = JSON.stringify(export_data);
const blob = new Blob([history_json], {type: 'application/json'});
const url = URL.createObjectURL(blob);
const a = document.createElement('a');
a.href = url;
a.download = 'chat_history.json';
document.body.appendChild(a);
a.click();
document.body.removeChild(a);
URL.revokeObjectURL(url);
}
""")
dl_button = gr.Button("File download")
dl_button.click(lambda: None, [chatbot], js="""
(chat_history) => {
const languageToExt = {
'python': 'py',
'javascript': 'js',
'typescript': 'ts',
'csharp': 'cs',
'ruby': 'rb',
'shell': 'sh',
'bash': 'sh',
'markdown': 'md',
'yaml': 'yml',
'rust': 'rs',
'golang': 'go',
'kotlin': 'kt'
};
const contentRegex = /```(?:([^\\n]+)?\\n)?([\\s\\S]*?)```/;
const match = contentRegex.exec(chat_history[chat_history.length - 1][1]);
if (match && match[2]) {
const specifier = match[1] ? match[1].trim() : '';
const content = match[2];
let filename = 'download';
let fileExtension = 'txt'; // default
if (specifier) {
if (specifier.includes('.')) {
// If specifier contains a dot, treat it as a filename
const parts = specifier.split('.');
filename = parts[0];
fileExtension = parts[1];
} else {
// Use mapping if exists, otherwise use specifier itself
const langLower = specifier.toLowerCase();
fileExtension = languageToExt[langLower] || langLower;
filename = 'code';
}
}
const blob = new Blob([content], {type: 'text/plain'});
const url = URL.createObjectURL(blob);
const a = document.createElement('a');
a.href = url;
a.download = `${filename}.${fileExtension}`;
document.body.appendChild(a);
a.click();
document.body.removeChild(a);
URL.revokeObjectURL(url);
}
}
""")
import_button.upload(import_history, inputs=[chatbot, import_button], outputs=[chatbot, system_prompt])
demo.unload(lambda: [os.remove(file) for file in temp_files])
demo.launch()