Spaces:

Trudy
/

gemini-codrawing

Running

App Files Files Community

gemini-codrawing / pages / api / generate.js

Trudy's picture

first commit

eceac5b 14 days ago

3.81 kB

	import { GoogleGenerativeAI } from "@google/generative-ai";
	import fs from 'node:fs';
	import path from 'node:path';

	/**
	 * API route handler that asks Gemini to generate text and/or an image.
	 *
	 * Expects a POST request whose JSON body contains:
	 *   - prompt      {string}  required text instruction
	 *   - drawingData {string}  optional base64-encoded PNG sent along with the prompt
	 *   - saveToFile  {boolean} optional; when truthy the generated image is also
	 *                           written to <cwd>/public/gemini-image-<timestamp>.png
	 *
	 * Responses:
	 *   - 405 { error }                   for non-POST methods
	 *   - 400 { error }                   when prompt is missing or drawingData is not a string
	 *   - 200 { success, message, imageData, fileName?, filePath? } on success
	 *   - 500 { success: false, error }   on configuration or generation failure
	 *
	 * @param {object} req - incoming request (uses `method` and `body`)
	 * @param {object} res - response object (uses `status(code).json(payload)`)
	 * @returns {Promise<*>} whatever `res.status(...).json(...)` returns
	 */
	export default async function handler(req, res) {
	  // Only allow POST requests
	  if (req.method !== 'POST') {
	    return res.status(405).json({ error: 'Method not allowed' });
	  }

	  // req.body may be undefined when no body was parsed; default it so the
	  // destructuring below cannot throw outside the try/catch.
	  const { prompt, drawingData, saveToFile } = req.body ?? {};
	  const drawingIsString = typeof drawingData === 'string';

	  // Log request details (truncating drawingData for brevity)
	  console.log("API Request:", {
	    prompt,
	    hasDrawingData: !!drawingData,
	    drawingDataLength: drawingIsString ? drawingData.length : 0,
	    drawingDataSample: drawingIsString && drawingData
	      ? `${drawingData.substring(0, 50)}... (truncated)`
	      : null,
	    saveToFile
	  });

	  if (!prompt || typeof prompt !== 'string') {
	    return res.status(400).json({ error: 'Prompt is required' });
	  }

	  // A truthy non-string drawing cannot be forwarded as base64 inline data.
	  if (drawingData && !drawingIsString) {
	    return res.status(400).json({ error: 'drawingData must be a base64-encoded string' });
	  }

	  // Fail fast with a clear message instead of an opaque upstream auth error.
	  const apiKey = process.env.GEMINI_API_KEY;
	  if (!apiKey) {
	    console.error("GEMINI_API_KEY is not set");
	    return res.status(500).json({
	      success: false,
	      error: 'GEMINI_API_KEY is not configured'
	    });
	  }

	  try {
	    const genAI = new GoogleGenerativeAI(apiKey);

	    // Set responseModalities to include "Image" so the model can generate an image
	    const model = genAI.getGenerativeModel({
	      model: "gemini-2.0-flash-exp-image-generation",
	      generationConfig: {
	        responseModalities: ['Text', 'Image']
	      },
	    });

	    const generationContent = buildGenerationContent(prompt, drawingData);

	    console.log("Calling Gemini API...");
	    const response = await model.generateContent(generationContent);
	    console.log("Gemini API response received");

	    // The first candidate can be absent; surface that as a readable error
	    // rather than a "cannot read properties of undefined" TypeError.
	    const parts = response?.response?.candidates?.[0]?.content?.parts;
	    if (!Array.isArray(parts)) {
	      throw new Error('Gemini returned no content');
	    }

	    // Initialize response data
	    const result = {
	      success: true,
	      message: '',
	      imageData: null
	    };

	    // Process response parts: each part carries either text or inline image data
	    for (const part of parts) {
	      if (part.text) {
	        result.message = part.text;
	        console.log("Received text response:", part.text);
	      } else if (part.inlineData) {
	        const imageData = part.inlineData.data;
	        console.log("Received image data, length:", imageData.length);

	        // Save the image to the public directory if requested
	        if (saveToFile) {
	          const fileName = await saveImageToPublicDir(imageData);
	          result.fileName = fileName;
	          // Kept as-is for existing callers.
	          // NOTE(review): this is a label, not the on-disk path; confirm
	          // whether clients treat it as a URL.
	          result.filePath = `/public/${fileName}`;
	        }

	        // Always include the base64 data in the response
	        result.imageData = imageData;
	      }
	    }

	    console.log("Sending successful response");
	    return res.status(200).json(result);
	  } catch (error) {
	    console.error("Error generating content:", error);
	    return res.status(500).json({
	      success: false,
	      error: error.message || 'Failed to generate image'
	    });
	  }
	}

	/**
	 * Builds the content argument for `model.generateContent`.
	 *
	 * @param {string} prompt - validated, non-empty text prompt
	 * @param {string} [drawingData] - base64-encoded PNG, if the caller sent one
	 * @returns {string|Array<object>} the bare prompt, or [imagePart, textPart]
	 */
	function buildGenerationContent(prompt, drawingData) {
	  if (!drawingData) {
	    // Use text-only prompt if no drawing is provided
	    console.log("Using text-only prompt");
	    return prompt;
	  }

	  // Content part with the base64-encoded image
	  const imagePart = {
	    inlineData: {
	      data: drawingData,
	      mimeType: "image/png"
	    }
	  };

	  // prompt is guaranteed non-empty by the caller, so no fallback text is needed.
	  const content = [
	    imagePart,
	    { text: `${prompt}. Keep the same minimal line doodle style.` }
	  ];
	  console.log("Using multipart content with drawing data and prompt");
	  return content;
	}

	/**
	 * Writes a base64-encoded image into <cwd>/public under a timestamped name.
	 *
	 * @param {string} imageData - base64-encoded image bytes
	 * @returns {Promise<string>} the generated file name (not the full path)
	 */
	async function saveImageToPublicDir(imageData) {
	  const publicDir = path.join(process.cwd(), 'public');
	  const fileName = `gemini-image-${Date.now()}.png`;
	  const filePath = path.join(publicDir, fileName);

	  // recursive mkdir is a no-op when the directory already exists
	  await fs.promises.mkdir(publicDir, { recursive: true });
	  await fs.promises.writeFile(filePath, Buffer.from(imageData, 'base64'));

	  console.log("Saved image to:", filePath);
	  return fileName;
	}