TextToImages

Running

App Files Files Community

ArrcttacsrjksX committed on Feb 12

Commit

fbb991c

verified ·

1 Parent(s): dc08df9

Update app.py

Browse files

Files changed (1) hide show

app.py +140 -175

app.py CHANGED Viewed

@@ -1,56 +1,60 @@
-import gradio as gr
-import matplotlib.pyplot as plt
-from io import BytesIO
-from PIL import Image, ImageDraw, ImageFont
-import textwrap
 import os
-import matplotlib
 import math
-import tempfile
-from pathlib import Path
-# A list of common fonts to prioritize
-COMMON_FONTS = [
-    "Times New Roman",
-    "Arial",
-    "Calibri",
-    "Helvetica",
-    "Verdana",
-    "Tahoma",
-    "Georgia",
-    "Roboto",
-    "Open Sans",
-    "Segoe UI"
-]
-def get_system_fonts():
-    fonts = []
-    common_fonts_found = []
-    for font in matplotlib.font_manager.findSystemFonts(fontpaths=None, fontext='ttf'):
-        font_name = os.path.basename(font)
-        actual_name = matplotlib.font_manager.FontProperties(fname=font).get_name()
-        if any(common_font.lower() in actual_name.lower() for common_font in COMMON_FONTS):
-            common_fonts_found.append((font_name, font))
-        fonts.append((font_name, font))
-    sorted_fonts = sorted(common_fonts_found, key=lambda x: COMMON_FONTS.index(
-        next(cf for cf in COMMON_FONTS if cf.lower() in matplotlib.font_manager.FontProperties(fname=x[1]).get_name().lower())
-    ))
-    sorted_fonts.extend([(f[0], f[1]) for f in fonts if f not in common_fonts_found])
-    return [f[0] for f in sorted_fonts], {f[0]: f[1] for f in sorted_fonts}
-def parse_color(color):
-    if isinstance(color, str) and color.startswith('rgba'):
-        color = color.replace('rgba', '').strip('()').split(',')
-        return tuple(int(float(c.strip())) for c in color[:3])
-    return color
 def calculate_text_dimensions(text, font, max_width, margin):
     lines = []
     for line in text.split('\n'):
         lines.extend(textwrap.wrap(line, width=int(max_width / font.size * 1.8)))
     bbox = font.getbbox('Ay')
@@ -60,6 +64,7 @@ def calculate_text_dimensions(text, font, max_width, margin):
     return lines, line_height, total_height
 def create_text_segment(lines, start_idx, max_lines, width, height, bg_color, text_color, font, align, margin):
     img = Image.new("RGB", (width, height), color=bg_color)
     draw = ImageDraw.Draw(img)
@@ -74,11 +79,11 @@ def create_text_segment(lines, start_idx, max_lines, width, height, bg_color, te
         bbox = font.getbbox(line)
         line_width = bbox[2] - bbox[0]
-        if align == 'Left':
             x = margin
-        elif align == 'Center':
             x = (width - line_width) // 2
-        else:  # Right alignment
             x = width - line_width - margin
         draw.text((x, y), line, fill=text_color, font=font)
@@ -86,22 +91,13 @@ def create_text_segment(lines, start_idx, max_lines, width, height, bg_color, te
     return img, end_idx
-def save_image_to_file(img, format="PNG"):
-    temp_dir = Path(tempfile.gettempdir())
-    temp_file = temp_dir / f"text_image.{format.lower()}"
-    img.save(temp_file, format=format)
-    return str(temp_file)
-def render_plain_text_image(text, font_size, width, height, bg_color, text_color, font_name, align):
-    bg_color = parse_color(bg_color)
-    text_color = parse_color(text_color)
     margin = 10
     try:
-        font_path = FONT_PATHS.get(font_name, font_name)
         font = ImageFont.truetype(font_path, font_size)
     except Exception:
         font = ImageFont.load_default()
     max_width = width - 2 * margin
@@ -112,30 +108,27 @@ def render_plain_text_image(text, font_size, width, height, bg_color, text_color
     segments = []
     current_line = 0
-    for i in range(num_segments):
         segment_img, current_line = create_text_segment(
             lines, current_line, max_lines_per_segment,
             width, height, bg_color, text_color, font, align, margin
         )
         segments.append(segment_img)
-    total_height = len(segments) * height
-    final_image = Image.new("RGB", (width, total_height), color=bg_color)
     for i, segment in enumerate(segments):
         final_image.paste(segment, (0, i * height))
     return final_image
 def render_math_image(text, font_size, width, height, bg_color, text_color):
-    bg_color = parse_color(bg_color)
-    text_color = parse_color(text_color)
     fig, ax = plt.subplots(figsize=(width / 100, height / 100), facecolor=bg_color)
     ax.set_facecolor(bg_color)
     ax.axis('off')
     if not (text.startswith(r"$") and text.endswith(r"$")):
         text = rf"${text}$"
@@ -144,116 +137,88 @@ def render_math_image(text, font_size, width, height, bg_color, text_color):
     buf = BytesIO()
     plt.savefig(buf, format='png', bbox_inches='tight', pad_inches=0)
     plt.close(fig)
     buf.seek(0)
     img = Image.open(buf)
     return img
-def text_to_image(input_text, font_size, width, height, bg_color, text_color,
-                  mode, font_name, align, image_format, preview_mode):
-    if mode == "Plain Text":
-        img = render_plain_text_image(input_text, font_size, width, height,
-                                      bg_color, text_color, font_name, align)
-    elif mode == "LaTeX Math":
-        img = render_math_image(input_text, font_size, width, height, bg_color, text_color)
-    else:
-        return "Invalid mode selected!"
-    if preview_mode:
-        return img
-    else:
-        return save_image_to_file(img, image_format)
-def handle_file_upload(file, font_size, width, height, bg_color, text_color,
-                       mode, font_name, align, image_format, preview_mode):
-    if file is not None:
-        file_path = file[0]
-        with open(file_path, "r", encoding="utf-8") as f:
-            text = f.read()
-        return text_to_image(text, font_size, width, height, bg_color, text_color,
-                             mode, font_name, align, image_format, preview_mode)
-    return "No file uploaded!"
-# Retrieve the system fonts and choose a default font.
-font_list, FONT_PATHS = get_system_fonts()
-default_font = next((f for f in font_list if "times" in f.lower() or "arial" in f.lower()), font_list[0])
-with gr.Blocks() as demo:
-    gr.Markdown("# 🖼️ Text to Image Converter")
-    with gr.Row():
-        input_text = gr.Textbox(label="Enter Text", placeholder="Type or paste text here...", lines=5)
-        file_input = gr.File(label="Upload a Text File", type="filepath")
-    with gr.Row():
-        font_size = gr.Slider(10, 100, value=30, label="Font Size")
-        font_name = gr.Dropdown(choices=font_list, value=default_font, label="Font")
-        align = gr.Radio(["Left", "Center", "Right"], label="Text Alignment", value="Center")
-    with gr.Row():
-        width = gr.Slider(200, 2000, value=800, label="Image Width")
-        height = gr.Slider(200, 2000, value=600, label="Base Height")
-    with gr.Row():
-        bg_color = gr.ColorPicker(label="Background Color", value="#FFFFFF")
-        text_color = gr.ColorPicker(label="Text Color", value="#000000")
-    with gr.Row():
-        mode = gr.Radio(["Plain Text", "LaTeX Math"], label="Rendering Mode", value="Plain Text")
-        image_format = gr.Radio(["PNG", "JPEG"], label="Image Format", value="PNG")
-        preview_mode = gr.Checkbox(label="Preview Mode", value=True,
-                                   info="Uncheck to get download link instead of preview")
-    # Replace gr.Variable with gr.State for maintaining state
-    output = gr.State()
-    preview_image = gr.Image(label="Preview", visible=True)
-    download_link = gr.File(label="Download Image", visible=False)
-    # The update function now returns a tuple of two outputs.
-    def update_output(result, preview_mode):
-        if preview_mode:
-            # When in preview mode, show the image preview and hide the download link.
-            return result, gr.update(visible=False)
         else:
-            # Otherwise, hide the preview and show the download link.
-            return gr.update(visible=False), result
-    with gr.Row():
-        convert_button = gr.Button("Convert Text to Image")
-        file_convert_button = gr.Button("Convert File to Image")
-    # When clicking the convert button, first run text_to_image and then update the outputs.
-    convert_button.click(
-        text_to_image,
-        inputs=[
-            input_text, font_size, width, height, bg_color, text_color,
-            mode, font_name, align, image_format, preview_mode
-        ],
-        outputs=[output]
-    ).then(
-        update_output,
-        inputs=[output, preview_mode],
-        outputs=[preview_image, download_link]
-    )
-    # For file upload conversion:
-    file_convert_button.click(
-        handle_file_upload,
-        inputs=[
-            file_input, font_size, width, height, bg_color, text_color,
-            mode, font_name, align, image_format, preview_mode
-        ],
-        outputs=[output]
-    ).then(
-        update_output,
-        inputs=[output, preview_mode],
-        outputs=[preview_image, download_link]
-    )
-    preview_mode.change(
-        update_output,
-        inputs=[output, preview_mode],
-        outputs=[preview_image, download_link]
-    )
-demo.launch()

 import os
 import math
+import textwrap
+from io import BytesIO
+import gradio as gr
+import matplotlib.pyplot as plt
+from PIL import Image, ImageDraw, ImageFont
+from huggingface_hub import hf_hub_download
# --- Download the CLI tool from the Hugging Face Hub ---
# The CLI file in the repo is assumed to be named "Texttoimage" (change it if needed).
CLI_FILENAME = "Texttoimage"
if not os.path.exists(CLI_FILENAME):
    hf_token = os.environ.get("HF_TOKEN")
    if not hf_token:
        print("Biến môi trường HF_TOKEN chưa được thiết lập!")
    else:
        # Local import: shutil is only needed on this one-off download path.
        import shutil

        # Best-effort: a failed download is reported but must not stop the app
        # from starting, so the broad catch is deliberate here.
        try:
            # Fetch the CLI file from the ArrcttacsrjksX/Texttoimage repo.
            cli_local_path = hf_hub_download(
                repo_id="ArrcttacsrjksX/Texttoimage",
                filename=CLI_FILENAME,
                token=hf_token
            )
            # Copy rather than rename: the returned path lives inside the hub
            # cache and is typically a relative symlink into its blob store.
            # Renaming would move the link itself (leaving it dangling and
            # removing it from the cache) and fails across filesystems;
            # copyfile follows the link and writes a real file.
            shutil.copyfile(cli_local_path, CLI_FILENAME)
            # Make the CLI file executable.
            os.chmod(CLI_FILENAME, 0o755)
            print(f"Đã tải về CLI tool: {CLI_FILENAME}")
        except Exception as e:
            print(f"Lỗi khi tải CLI tool: {e}")
+# --- Các hàm hỗ trợ render ảnh text ---
def parse_color(color: str):
    """Convert a colour string into an ``(R, G, B)`` tuple of ints.

    Two formats are accepted (surrounding whitespace is ignored):

    * hex, exactly six digits after a single ``#`` -- e.g. ``"#FFEEEE"``
    * decimal ``"R,G,B"`` -- e.g. ``"255,238,238"``

    Args:
        color: The colour string to parse.

    Returns:
        A 3-tuple of ints, each in the range 0-255.

    Raises:
        ValueError: If the string matches neither format, contains invalid
            hex digits, or has an RGB component outside 0-255.
    """
    color = color.strip()
    if color.startswith('#'):
        # Drop exactly one '#': lstrip('#') would silently accept "##FFEEEE".
        hex_digits = color[1:]
        if len(hex_digits) != 6:
            raise ValueError("Mã hex phải có 6 ký tự.")
        # int(..., 16) tolerates signs and whitespace (e.g. "+F"), so the
        # digits are validated explicitly before conversion.
        if any(ch not in "0123456789abcdefABCDEF" for ch in hex_digits):
            raise ValueError("Mã hex chứa ký tự không hợp lệ.")
        return tuple(int(hex_digits[i:i + 2], 16) for i in (0, 2, 4))

    parts = color.split(',')
    if len(parts) != 3:
        raise ValueError("Màu dạng RGB phải có 3 thành phần cách nhau bởi dấu phẩy.")
    channels = tuple(int(part) for part in parts)
    # Reject values that cannot be an 8-bit colour channel.
    if any(not 0 <= channel <= 255 for channel in channels):
        raise ValueError("Mỗi thành phần RGB phải nằm trong khoảng 0-255.")
    return channels
 def calculate_text_dimensions(text, font, max_width, margin):
+    """Tính toán kích thước text cho việc wrap theo chiều rộng cho trước."""
     lines = []
     for line in text.split('\n'):
+        # Sử dụng độ rộng ước tính dựa trên kích thước font
         lines.extend(textwrap.wrap(line, width=int(max_width / font.size * 1.8)))
     bbox = font.getbbox('Ay')
     return lines, line_height, total_height
 def create_text_segment(lines, start_idx, max_lines, width, height, bg_color, text_color, font, align, margin):
+    """Tạo một đoạn ảnh chứa một phần các dòng text."""
     img = Image.new("RGB", (width, height), color=bg_color)
     draw = ImageDraw.Draw(img)
         bbox = font.getbbox(line)
         line_width = bbox[2] - bbox[0]
+        if align == 'left':
             x = margin
+        elif align == 'center':
             x = (width - line_width) // 2
+        else:  # 'right'
             x = width - line_width - margin
         draw.text((x, y), line, fill=text_color, font=font)
     return img, end_idx
+def render_plain_text_image(text, font_size, width, height, bg_color, text_color, font_path, align):
+    """Render ảnh chứa text dạng thông thường."""
     margin = 10
     try:
         font = ImageFont.truetype(font_path, font_size)
     except Exception:
+        print(f"Cảnh báo: Không tải được font {font_path}. Sử dụng font mặc định.")
         font = ImageFont.load_default()
     max_width = width - 2 * margin
     segments = []
     current_line = 0
+    for _ in range(num_segments):
         segment_img, current_line = create_text_segment(
             lines, current_line, max_lines_per_segment,
             width, height, bg_color, text_color, font, align, margin
         )
         segments.append(segment_img)
+    total_img_height = len(segments) * height
+    final_image = Image.new("RGB", (width, total_img_height), color=bg_color)
     for i, segment in enumerate(segments):
         final_image.paste(segment, (0, i * height))
     return final_image
 def render_math_image(text, font_size, width, height, bg_color, text_color):
+    """Render ảnh chứa biểu thức toán học sử dụng matplotlib."""
     fig, ax = plt.subplots(figsize=(width / 100, height / 100), facecolor=bg_color)
     ax.set_facecolor(bg_color)
     ax.axis('off')
+    # Nếu text chưa được bọc trong dấu $, thêm vào
     if not (text.startswith(r"$") and text.endswith(r"$")):
         text = rf"${text}$"
     buf = BytesIO()
     plt.savefig(buf, format='png', bbox_inches='tight', pad_inches=0)
     plt.close(fig)
     buf.seek(0)
     img = Image.open(buf)
     return img
+# --- Hàm xử lý chính cho giao diện Gradio ---
def generate_image(text: str,
                   font_size: int,
                   width: int,
                   height: int,
                   bg_color: str,
                   text_color: str,
                   align: str,
                   mode: str,
                   font_path: str):
    """Render ``text`` to an image; this is the Gradio callback.

    Args:
        text: The text (or math expression) to render.
        font_size: Font size passed to the renderer.
        width: Image width in pixels.
        height: Image height in pixels.
        bg_color: Background colour string, parsed by ``parse_color``.
        text_color: Text colour string, parsed by ``parse_color``.
        align: Alignment forwarded to the plain-text renderer.
        mode: ``"plain"`` selects ``render_plain_text_image``; any other
            value selects ``render_math_image``.
        font_path: Font file path forwarded to the plain-text renderer.

    Returns:
        The image object produced by the selected renderer.

    Raises:
        gr.Error: If a colour cannot be parsed or rendering fails. Raising
            (rather than returning the message) matters because the output
            component is an image: a returned string would be interpreted
            as image data, not shown as an error.
    """
    try:
        bg_color_tuple = parse_color(bg_color)
        text_color_tuple = parse_color(text_color)
    except Exception as e:
        raise gr.Error(f"Lỗi khi parse màu: {e}") from e

    try:
        # Numeric widgets may deliver floats; pixel sizes must be ints.
        font_size = int(font_size)
        width = int(width)
        height = int(height)

        if mode == "plain":
            img = render_plain_text_image(
                text, font_size, width, height,
                bg_color_tuple, text_color_tuple, font_path, align
            )
        else:
            # Matplotlib interprets RGB tuples as floats in [0, 1], so the
            # 0-255 integer tuples are rescaled before being handed over.
            # NOTE(review): text_color is presumably also consumed by
            # Matplotlib inside render_math_image -- confirm.
            bg_unit = tuple(channel / 255 for channel in bg_color_tuple)
            text_unit = tuple(channel / 255 for channel in text_color_tuple)
            img = render_math_image(
                text, font_size, width, height,
                bg_unit, text_unit
            )
    except Exception as e:
        raise gr.Error(f"Lỗi khi tạo ảnh: {e}") from e
    return img
# --- Build the Gradio interface ---
# Input widgets
text_input = gr.Textbox(label="Text cần chuyển", placeholder="Nhập text của bạn vào đây...", lines=4)
font_size_input = gr.Slider(10, 100, value=40, step=1, label="Cỡ chữ (font size)")
# precision=0 makes the Number widgets round to the nearest integer and
# deliver ints, since image dimensions are whole pixels.
width_input = gr.Number(value=1000, precision=0, label="Chiều rộng ảnh (px)")
height_input = gr.Number(value=800, precision=0, label="Chiều cao ảnh (px)")
bg_color_input = gr.Textbox(value="#FFEEEE", label="Màu nền (hex hoặc R,G,B)")
text_color_input = gr.Textbox(value="#000066", label="Màu chữ (hex hoặc R,G,B)")
align_input = gr.Radio(choices=["left", "center", "right"], value="right", label="Căn chỉnh text")
mode_input = gr.Radio(choices=["plain", "math"], value="plain", label="Chế độ render")
font_path_input = gr.Textbox(value="/usr/share/fonts/truetype/dejavu/DejaVuSans.ttf", label="Đường dẫn font")
# Custom CSS to polish the look of the interface
custom_css = """
body {
    background: linear-gradient(135deg, #f6d365 0%, #fda085 100%);
    font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
}
.gradio-container {
    border-radius: 15px;
    box-shadow: 0 4px 10px rgba(0,0,0,0.2);
    padding: 20px;
    background-color: rgba(255, 255, 255, 0.9);
}
"""
# Assemble the Gradio interface; the input order must match the parameter
# order of generate_image.
demo = gr.Interface(
    fn=generate_image,
    inputs=[text_input, font_size_input, width_input, height_input,
            bg_color_input, text_color_input, align_input, mode_input, font_path_input],
    outputs=gr.Image(type="pil", label="Ảnh được tạo"),
    title="Text to Image - Texttoimage CLI",
    description=("Giao diện demo chuyển text thành ảnh. "
                 "Bạn có thể nhập text, chọn các tham số như kích thước, màu sắc, căn chỉnh, "
                 "và xem ảnh được render theo thời gian thực."),
    css=custom_css,
    allow_flagging="never"
)
if __name__ == "__main__":
    demo.launch()