gemini-3d-drawing / pages /api /generate-thumbnail.js
Trudy's picture
Initial commit with proper LFS tracking
5f07a23
import { GoogleGenerativeAI } from '@google/generative-ai';
import fs from 'fs';
import path from 'path';
// Define a fallback shape in case no reference image is provided and the file doesn't exist
// This is a simple white circle on black background encoded as base64
const DEFAULT_SHAPE_DATA_URL = '';
// Helper function to read the image file
const loadImageData = (filePath) => {
try {
const absolutePath = path.resolve('./public', filePath); // Adjust if your public dir is elsewhere
console.log(`Loading reference image from: ${absolutePath}`);
if (fs.existsSync(absolutePath)) {
const imageBuffer = fs.readFileSync(absolutePath);
return imageBuffer.toString('base64');
} else {
console.error(`Reference image not found at: ${absolutePath}`);
return null;
}
} catch (error) {
console.error('Error loading reference image:', error);
return null;
}
};
export default async function handler(req, res) {
if (req.method !== 'POST') {
return res.status(405).json({ error: 'Method not allowed' });
}
console.log('Starting thumbnail generation request');
try {
const { prompt, referenceImageData } = req.body;
if (!prompt) {
console.error('Missing prompt in request');
return res.status(400).json({ error: 'Prompt is required' });
}
console.log('Received prompt:', prompt.substring(0, 100));
// Initialize the model
const genAI = new GoogleGenerativeAI(process.env.GEMINI_API_KEY);
const model = genAI.getGenerativeModel({
model: "gemini-2.0-flash-exp-image-generation",
generationConfig: {
temperature: 0.8,
topP: 0.9,
topK: 40,
maxOutputTokens: 8192,
}
});
// Get the base image data (either from request or default)
const baseImageData = referenceImageData || DEFAULT_SHAPE_DATA_URL;
console.log('Using reference image:', referenceImageData ? 'Custom' : 'Default');
// Construct the prompt for the image model
const imageGenerationPrompt = `Treat the object shown in the reference image (the white circle) as a simple 3D sphere. Apply the following material description or style directly onto this sphere...`;
console.log('Generated image prompt:', imageGenerationPrompt.substring(0, 100));
// Prepare generation content
const generationContent = [
{ text: imageGenerationPrompt },
{
inlineData: {
data: baseImageData,
mimeType: "image/png"
}
},
];
console.log('Calling Gemini API for image generation...');
// Generate content
const result = await model.generateContent(generationContent);
const response = await result.response;
console.log('Received response from Gemini API');
// Process response
let generatedImageData = null;
// Safely access parts
const parts = response?.candidates?.[0]?.content?.parts;
if (!parts) {
console.error('No parts in response:', JSON.stringify(response));
throw new Error('No parts in response from Gemini API');
}
console.log('Processing response parts:', parts.length);
if (Array.isArray(parts)) {
for (const part of parts) {
if (part.inlineData && part.inlineData.mimeType?.startsWith('image/')) {
generatedImageData = part.inlineData.data;
console.log('Found image data in response');
break;
}
}
}
if (!generatedImageData) {
console.error('No image data in response parts:', JSON.stringify(parts));
throw new Error('No image data found in response parts');
}
console.log('Successfully generated thumbnail');
return res.status(200).json({
success: true,
imageData: generatedImageData
});
} catch (error) {
console.error('Error in thumbnail generation:', error);
return res.status(500).json({
success: false,
error: error.message || 'An error occurred during thumbnail generation'
});
}
}