feat: support dall-e 3

This commit is contained in:
Hk-Gosuto
2023-11-07 17:57:53 +08:00
parent d5566f8c56
commit 8272245f7b
2 changed files with 66 additions and 27 deletions

View File

@@ -1,20 +1,27 @@
import { Tool } from "langchain/tools";
import { StructuredTool } from "langchain/tools";
import { z } from "zod";
import S3FileStorage from "../../utils/r2_file_storage";
export class DallEAPIWrapper extends Tool {
export class DallEAPIWrapper extends StructuredTool {
name = "dalle_image_generator";
n = 1;
size: "256x256" | "512x512" | "1024x1024" | null = "1024x1024";
apiKey: string;
baseURL?: string;
constructor(apiKey?: string | undefined, baseURL?: string | undefined) {
callback?: (data: string) => Promise<void>;
/**
 * Creates the DALL-E tool wrapper and stores its request settings.
 *
 * @param apiKey - OpenAI API key, sent as the `Authorization: Bearer` value
 *   on requests. Typed as optional, but a missing or empty value throws.
 * @param baseURL - Prefix used to build the `/images/generations` request URL.
 *   NOTE(review): when omitted, the URL built in `_call` is interpolated from
 *   `undefined` and would start with the literal text "undefined" — confirm
 *   callers always pass it.
 * @param callback - Optional async hook that `_call` awaits with its result
 *   text (the image markdown, or the upload-failure message).
 * @throws Error when `apiKey` is not provided.
 */
constructor(
apiKey?: string | undefined,
baseURL?: string | undefined,
callback?: (data: string) => Promise<void>,
) {
super();
// Fail fast: every request needs the key for its Authorization header.
if (!apiKey) {
throw new Error("OpenAI API key not set.");
}
this.apiKey = apiKey;
this.baseURL = baseURL;
this.callback = callback;
}
async saveImageFromUrl(url: string) {
@@ -24,23 +31,35 @@ export class DallEAPIWrapper extends Tool {
return await S3FileStorage.put(`${Date.now()}.png`, buffer);
}
/**
 * Structured input accepted by this tool: a text `prompt` and an image
 * `size` restricted to three values, defaulting to "1024x1024".
 *
 * NOTE(review): the prompt description advertises `quality: "hd"`, but this
 * schema declares no `quality` field and the request body built in `_call`
 * sends only model, prompt, n and size — confirm whether a `quality` option
 * is intended.
 */
schema = z.object({
prompt: z
.string()
.describe(
'input must be a english prompt. you can set `quality: "hd"` for enhanced detail.',
),
size: z
.enum(["1024x1024", "1024x1792", "1792x1024"])
.default("1024x1024")
.describe("images size"),
});
/** @ignore */
async _call(prompt: string) {
async _call({ prompt, size }: z.infer<typeof this.schema>) {
let image_url;
const apiUrl = `${this.baseURL}/images/generations`;
try {
const requestOptions = {
method: 'POST',
method: "POST",
headers: {
'Content-Type': 'application/json',
'Authorization': `Bearer ${this.apiKey}`
"Content-Type": "application/json",
Authorization: `Bearer ${this.apiKey}`,
},
body: JSON.stringify({
model: "dall-e-3",
prompt: prompt,
n: this.n,
size: this.size
})
size: size,
}),
};
const response = await fetch(apiUrl, requestOptions);
const json = await response.json();
@@ -50,13 +69,18 @@ export class DallEAPIWrapper extends Tool {
console.error("[DALL-E]", e);
}
if (!image_url) return "No image was generated";
let filePath = await this.saveImageFromUrl(image_url);
console.log(filePath);
return filePath;
try {
let filePath = await this.saveImageFromUrl(image_url);
console.log("[DALL-E]", filePath);
var imageMarkdown = `![img](${filePath})`;
if (this.callback != null) await this.callback(imageMarkdown);
return imageMarkdown;
} catch (e) {
if (this.callback != null)
await this.callback("Image upload to R2 storage failed");
return "Image upload to R2 storage failed";
}
}
description = `openai's dall-e image generator.
input must be a english prompt.
output will be the image link url.
use markdown to display images. like: ![img](/api/file/xxx.png)`;
description = `openai's dall-e 3 image generator.`;
}