2025-04-26 04:30:58 -04:00
const axios = require ( 'axios' ) ;
const { v4 } = require ( 'uuid' ) ;
const OpenAI = require ( 'openai' ) ;
const FormData = require ( 'form-data' ) ;
2025-07-28 15:12:29 -04:00
const { ProxyAgent } = require ( 'undici' ) ;
2025-04-26 04:30:58 -04:00
const { tool } = require ( '@langchain/core/tools' ) ;
2025-06-13 15:14:57 -04:00
const { logger } = require ( '@librechat/data-schemas' ) ;
2025-08-26 12:10:18 -04:00
const { logAxiosError , oaiToolkit } = require ( '@librechat/api' ) ;
2025-04-26 04:30:58 -04:00
const { ContentTypes , EImageOutputType } = require ( 'librechat-data-provider' ) ;
const { getStrategyFunctions } = require ( '~/server/services/Files/strategies' ) ;
2025-08-26 12:10:18 -04:00
const extractBaseURL = require ( '~/utils/extractBaseURL' ) ;
2025-04-26 04:30:58 -04:00
const { getFiles } = require ( '~/models/File' ) ;
const displayMessage =
2025-05-30 18:16:34 +02:00
"The tool displayed an image. All generated images are already plainly visible, so don't repeat the descriptions in detail. Do not list download links as they are available in the UI already. The user may download the images by clicking on them, but do not mention anything about downloading to the user." ;
2025-04-26 04:30:58 -04:00
/ * *
* Replaces unwanted characters from the input string
* @ param { string } inputString - The input string to process
* @ returns { string } - The processed string
* /
function replaceUnwantedChars ( inputString ) {
return inputString
. replace ( /\r\n|\r|\n/g , ' ' )
. replace ( /"/g , '' )
. trim ( ) ;
}
function returnValue ( value ) {
if ( typeof value === 'string' ) {
return [ value , { } ] ;
} else if ( typeof value === 'object' ) {
if ( Array . isArray ( value ) ) {
return value ;
}
return [ displayMessage , value ] ;
}
return value ;
}
2025-06-23 19:44:24 -04:00
function createAbortHandler ( ) {
return function ( ) {
logger . debug ( '[ImageGenOAI] Image generation aborted' ) ;
} ;
}
2025-04-26 04:30:58 -04:00
/ * *
* Creates OpenAI Image tools ( generation and editing )
* @ param { Object } fields - Configuration fields
* @ param { ServerRequest } fields . req - Whether the tool is being used in an agent context
* @ param { boolean } fields . isAgent - Whether the tool is being used in an agent context
* @ param { string } fields . IMAGE _GEN _OAI _API _KEY - The OpenAI API key
* @ param { boolean } [ fields . override ] - Whether to override the API key check , necessary for app initialization
* @ param { MongoFile [ ] } [ fields . imageFiles ] - The images to be used for editing
2025-08-26 12:10:18 -04:00
* @ param { string } [ fields . imageOutputType ] - The image output type configuration
* @ param { string } [ fields . fileStrategy ] - The file storage strategy
* @ returns { Array < ReturnType < tool >> } - Array of image tools
2025-04-26 04:30:58 -04:00
* /
function createOpenAIImageTools ( fields = { } ) {
/** @type {boolean} Used to initialize the Tool without necessary variables. */
const override = fields . override ? ? false ;
/** @type {boolean} */
if ( ! override && ! fields . isAgent ) {
throw new Error ( 'This tool is only available for agents.' ) ;
}
const { req } = fields ;
2025-08-26 12:10:18 -04:00
const imageOutputType = fields . imageOutputType || EImageOutputType . PNG ;
const appFileStrategy = fields . fileStrategy ;
2025-04-26 04:30:58 -04:00
const getApiKey = ( ) => {
const apiKey = process . env . IMAGE _GEN _OAI _API _KEY ? ? '' ;
if ( ! apiKey && ! override ) {
throw new Error ( 'Missing IMAGE_GEN_OAI_API_KEY environment variable.' ) ;
}
return apiKey ;
} ;
let apiKey = fields . IMAGE _GEN _OAI _API _KEY ? ? getApiKey ( ) ;
const closureConfig = { apiKey } ;
let baseURL = 'https://api.openai.com/v1/' ;
if ( ! override && process . env . IMAGE _GEN _OAI _BASEURL ) {
baseURL = extractBaseURL ( process . env . IMAGE _GEN _OAI _BASEURL ) ;
closureConfig . baseURL = baseURL ;
}
// Note: Azure may not yet support the latest image generation models
if (
! override &&
process . env . IMAGE _GEN _OAI _AZURE _API _VERSION &&
process . env . IMAGE _GEN _OAI _BASEURL
) {
baseURL = process . env . IMAGE _GEN _OAI _BASEURL ;
closureConfig . baseURL = baseURL ;
closureConfig . defaultQuery = { 'api-version' : process . env . IMAGE _GEN _OAI _AZURE _API _VERSION } ;
closureConfig . defaultHeaders = {
'api-key' : process . env . IMAGE _GEN _OAI _API _KEY ,
'Content-Type' : 'application/json' ,
} ;
closureConfig . apiKey = process . env . IMAGE _GEN _OAI _API _KEY ;
}
const imageFiles = fields . imageFiles ? ? [ ] ;
/ * *
* Image Generation Tool
* /
const imageGenTool = tool (
async (
{
prompt ,
background = 'auto' ,
n = 1 ,
output _compression = 100 ,
quality = 'auto' ,
size = 'auto' ,
} ,
runnableConfig ,
) => {
if ( ! prompt ) {
throw new Error ( 'Missing required field: prompt' ) ;
}
const clientConfig = { ... closureConfig } ;
if ( process . env . PROXY ) {
2025-07-28 15:12:29 -04:00
const proxyAgent = new ProxyAgent ( process . env . PROXY ) ;
clientConfig . fetchOptions = {
dispatcher : proxyAgent ,
} ;
2025-04-26 04:30:58 -04:00
}
/** @type {OpenAI} */
const openai = new OpenAI ( clientConfig ) ;
let output _format = imageOutputType ;
if (
background === 'transparent' &&
output _format !== EImageOutputType . PNG &&
output _format !== EImageOutputType . WEBP
) {
logger . warn (
'[ImageGenOAI] Transparent background requires PNG or WebP format, defaulting to PNG' ,
) ;
output _format = EImageOutputType . PNG ;
}
let resp ;
2025-06-23 19:44:24 -04:00
/** @type {AbortSignal} */
let derivedSignal = null ;
/** @type {() => void} */
let abortHandler = null ;
2025-04-26 04:30:58 -04:00
try {
2025-06-23 19:44:24 -04:00
if ( runnableConfig ? . signal ) {
derivedSignal = AbortSignal . any ( [ runnableConfig . signal ] ) ;
abortHandler = createAbortHandler ( ) ;
derivedSignal . addEventListener ( 'abort' , abortHandler , { once : true } ) ;
}
2025-04-26 04:30:58 -04:00
resp = await openai . images . generate (
{
model : 'gpt-image-1' ,
prompt : replaceUnwantedChars ( prompt ) ,
n : Math . min ( Math . max ( 1 , n ) , 10 ) ,
background ,
output _format ,
output _compression :
output _format === EImageOutputType . WEBP || output _format === EImageOutputType . JPEG
? output _compression
: undefined ,
quality ,
size ,
} ,
{
signal : derivedSignal ,
} ,
) ;
} catch ( error ) {
const message = '[image_gen_oai] Problem generating the image:' ;
logAxiosError ( { error , message } ) ;
return returnValue ( ` Something went wrong when trying to generate the image. The OpenAI API may be unavailable:
Error Message : $ { error . message } ` );
2025-06-23 19:44:24 -04:00
} finally {
if ( abortHandler && derivedSignal ) {
derivedSignal . removeEventListener ( 'abort' , abortHandler ) ;
}
2025-04-26 04:30:58 -04:00
}
if ( ! resp ) {
return returnValue (
'Something went wrong when trying to generate the image. The OpenAI API may be unavailable' ,
) ;
}
// For gpt-image-1, the response contains base64-encoded images
// TODO: handle cost in `resp.usage`
const base64Image = resp . data [ 0 ] . b64 _json ;
if ( ! base64Image ) {
return returnValue (
'No image data returned from OpenAI API. There may be a problem with the API or your configuration.' ,
) ;
}
const content = [
{
type : ContentTypes . IMAGE _URL ,
image _url : {
url : ` data:image/ ${ output _format } ;base64, ${ base64Image } ` ,
} ,
} ,
] ;
const file _ids = [ v4 ( ) ] ;
const response = [
{
type : ContentTypes . TEXT ,
text : displayMessage + ` \n \n generated_image_id: " ${ file _ids [ 0 ] } " ` ,
} ,
] ;
return [ response , { content , file _ids } ] ;
} ,
2025-08-26 12:10:18 -04:00
oaiToolkit . image _gen _oai ,
2025-04-26 04:30:58 -04:00
) ;
/ * *
* Image Editing Tool
* /
const imageEditTool = tool (
async ( { prompt , image _ids , quality = 'auto' , size = 'auto' } , runnableConfig ) => {
if ( ! prompt ) {
throw new Error ( 'Missing required field: prompt' ) ;
}
const clientConfig = { ... closureConfig } ;
if ( process . env . PROXY ) {
2025-07-28 15:12:29 -04:00
const proxyAgent = new ProxyAgent ( process . env . PROXY ) ;
clientConfig . fetchOptions = {
dispatcher : proxyAgent ,
} ;
2025-04-26 04:30:58 -04:00
}
const formData = new FormData ( ) ;
formData . append ( 'model' , 'gpt-image-1' ) ;
formData . append ( 'prompt' , replaceUnwantedChars ( prompt ) ) ;
// TODO: `mask` support
// TODO: more than 1 image support
// formData.append('n', n.toString());
formData . append ( 'quality' , quality ) ;
formData . append ( 'size' , size ) ;
/** @type {Record<FileSources, undefined | NodeStreamDownloader<File>>} */
const streamMethods = { } ;
const requestFilesMap = Object . fromEntries ( imageFiles . map ( ( f ) => [ f . file _id , { ... f } ] ) ) ;
const orderedFiles = new Array ( image _ids . length ) ;
const idsToFetch = [ ] ;
const indexOfMissing = Object . create ( null ) ;
for ( let i = 0 ; i < image _ids . length ; i ++ ) {
const id = image _ids [ i ] ;
const file = requestFilesMap [ id ] ;
if ( file ) {
orderedFiles [ i ] = file ;
} else {
idsToFetch . push ( id ) ;
indexOfMissing [ id ] = i ;
}
}
if ( idsToFetch . length ) {
const fetchedFiles = await getFiles (
{
user : req . user . id ,
file _id : { $in : idsToFetch } ,
height : { $exists : true } ,
width : { $exists : true } ,
} ,
{ } ,
{ } ,
) ;
for ( const file of fetchedFiles ) {
requestFilesMap [ file . file _id ] = file ;
orderedFiles [ indexOfMissing [ file . file _id ] ] = file ;
}
}
for ( const imageFile of orderedFiles ) {
if ( ! imageFile ) {
continue ;
}
/** @type {NodeStream<File>} */
let stream ;
/** @type {NodeStreamDownloader<File>} */
let getDownloadStream ;
const source = imageFile . source || appFileStrategy ;
if ( ! source ) {
throw new Error ( 'No source found for image file' ) ;
}
if ( streamMethods [ source ] ) {
getDownloadStream = streamMethods [ source ] ;
} else {
( { getDownloadStream } = getStrategyFunctions ( source ) ) ;
streamMethods [ source ] = getDownloadStream ;
}
if ( ! getDownloadStream ) {
throw new Error ( ` No download stream method found for source: ${ source } ` ) ;
}
stream = await getDownloadStream ( req , imageFile . filepath ) ;
if ( ! stream ) {
throw new Error ( 'Failed to get download stream for image file' ) ;
}
formData . append ( 'image[]' , stream , {
filename : imageFile . filename ,
contentType : imageFile . type ,
} ) ;
}
/** @type {import('axios').RawAxiosHeaders} */
let headers = {
... formData . getHeaders ( ) ,
} ;
if ( process . env . IMAGE _GEN _OAI _AZURE _API _VERSION && process . env . IMAGE _GEN _OAI _BASEURL ) {
headers [ 'api-key' ] = apiKey ;
} else {
headers [ 'Authorization' ] = ` Bearer ${ apiKey } ` ;
}
2025-06-23 19:44:24 -04:00
/** @type {AbortSignal} */
let derivedSignal = null ;
/** @type {() => void} */
let abortHandler = null ;
2025-04-26 04:30:58 -04:00
try {
2025-06-23 19:44:24 -04:00
if ( runnableConfig ? . signal ) {
derivedSignal = AbortSignal . any ( [ runnableConfig . signal ] ) ;
abortHandler = createAbortHandler ( ) ;
derivedSignal . addEventListener ( 'abort' , abortHandler , { once : true } ) ;
}
2025-04-26 04:30:58 -04:00
/** @type {import('axios').AxiosRequestConfig} */
const axiosConfig = {
headers ,
... clientConfig ,
signal : derivedSignal ,
baseURL ,
} ;
2025-07-28 15:12:29 -04:00
if ( process . env . PROXY ) {
try {
const url = new URL ( process . env . PROXY ) ;
axiosConfig . proxy = {
host : url . hostname . replace ( /^\[|\]$/g , '' ) ,
port : url . port ? parseInt ( url . port , 10 ) : undefined ,
protocol : url . protocol . replace ( ':' , '' ) ,
} ;
} catch ( error ) {
logger . error ( 'Error parsing proxy URL:' , error ) ;
}
}
2025-04-26 04:30:58 -04:00
if ( process . env . IMAGE _GEN _OAI _AZURE _API _VERSION && process . env . IMAGE _GEN _OAI _BASEURL ) {
axiosConfig . params = {
'api-version' : process . env . IMAGE _GEN _OAI _AZURE _API _VERSION ,
... axiosConfig . params ,
} ;
}
const response = await axios . post ( '/images/edits' , formData , axiosConfig ) ;
if ( ! response . data || ! response . data . data || ! response . data . data . length ) {
return returnValue (
'No image data returned from OpenAI API. There may be a problem with the API or your configuration.' ,
) ;
}
const base64Image = response . data . data [ 0 ] . b64 _json ;
if ( ! base64Image ) {
return returnValue (
'No image data returned from OpenAI API. There may be a problem with the API or your configuration.' ,
) ;
}
const content = [
{
type : ContentTypes . IMAGE _URL ,
image _url : {
url : ` data:image/ ${ imageOutputType } ;base64, ${ base64Image } ` ,
} ,
} ,
] ;
const file _ids = [ v4 ( ) ] ;
const textResponse = [
{
type : ContentTypes . TEXT ,
text :
displayMessage +
` \n \n generated_image_id: " ${ file _ids [ 0 ] } " \n referenced_image_ids: [" ${ image _ids . join ( '", "' ) } "] ` ,
} ,
] ;
return [ textResponse , { content , file _ids } ] ;
} catch ( error ) {
const message = '[image_edit_oai] Problem editing the image:' ;
logAxiosError ( { error , message } ) ;
return returnValue ( ` Something went wrong when trying to edit the image. The OpenAI API may be unavailable:
Error Message : $ { error . message || 'Unknown error' } ` );
2025-06-23 19:44:24 -04:00
} finally {
if ( abortHandler && derivedSignal ) {
derivedSignal . removeEventListener ( 'abort' , abortHandler ) ;
}
2025-04-26 04:30:58 -04:00
}
} ,
2025-08-26 12:10:18 -04:00
oaiToolkit . image _edit _oai ,
2025-04-26 04:30:58 -04:00
) ;
return [ imageGenTool , imageEditTool ] ;
}
module . exports = createOpenAIImageTools ;