@llumiverse/common
Version:
Public types, enums and options used by Llumiverse API.
293 lines • 14.1 kB
JavaScript
"use strict";
Object.defineProperty(exports, "__esModule", { value: true });
exports.ImagenMaskMode = exports.ImagenTaskType = void 0;
exports.getVertexAiOptions = getVertexAiOptions;
const types_js_1 = require("../types.js");
const fallback_js_1 = require("./fallback.js");
/**
 * String enum of Imagen task types. Every member's value is identical to its
 * name. getVertexAiOptions compares the selected `edit_mode` option against
 * these members.
 */
var ImagenTaskType;
(function (members) {
    const memberNames = [
        "TEXT_IMAGE",
        "EDIT_MODE_INPAINT_REMOVAL",
        "EDIT_MODE_INPAINT_INSERTION",
        "EDIT_MODE_BGSWAP",
        "EDIT_MODE_OUTPAINT",
        "CUSTOMIZATION_SUBJECT",
        "CUSTOMIZATION_STYLE",
        "CUSTOMIZATION_CONTROLLED",
        "CUSTOMIZATION_INSTRUCT",
    ];
    // Assign in list order so property enumeration order stays the same.
    for (const memberName of memberNames) {
        members[memberName] = memberName;
    }
})(ImagenTaskType || (exports.ImagenTaskType = ImagenTaskType = {}));
/**
 * String enum of Imagen mask modes. Every member's value is identical to its
 * name. getVertexAiOptions compares the selected `mask_mode` option against
 * MASK_MODE_SEMANTIC.
 */
var ImagenMaskMode;
(function (members) {
    const memberNames = [
        "MASK_MODE_USER_PROVIDED",
        "MASK_MODE_BACKGROUND",
        "MASK_MODE_FOREGROUND",
        "MASK_MODE_SEMANTIC",
    ];
    // Assign in list order so property enumeration order stays the same.
    for (const memberName of memberNames) {
        members[memberName] = memberName;
    }
})(ImagenMaskMode || (exports.ImagenMaskMode = ImagenMaskMode = {}));
/**
 * Returns the option descriptors to expose for a Vertex AI model.
 *
 * The model family is detected by substring match on `model`, checked in this
 * order: "imagen-", "gemini", "claude", "llama". Anything else, including an
 * Imagen model that is neither a "generate" nor a "capability" variant, gets
 * the generic text fallback options.
 *
 * Some descriptors depend on the values currently selected in `option`
 * (for example JPEG quality is only offered when `image_file_type` is
 * "image/jpeg").
 *
 * @param {string} model - Model identifier.
 * @param {object} [option] - Currently selected option values, if any.
 * @returns {object} An object with `_option_id` and an `options` array.
 */
function getVertexAiOptions(model, option) {
    if (model.includes("imagen-")) {
        // Unrecognised Imagen variants keep falling back to the text options.
        return getImagenOptions(model, option) ?? fallback_js_1.textOptionsFallback;
    }
    if (model.includes("gemini")) {
        return getGeminiOptions(model);
    }
    if (model.includes("claude")) {
        return getClaudeOptions(model, option);
    }
    if (model.includes("llama")) {
        return getLlamaOptions(model);
    }
    return fallback_js_1.textOptionsFallback;
}
/** Builds the `max_tokens` descriptor shared by the text model families. */
function buildMaxTokensOption(limit) {
    return {
        name: types_js_1.SharedOptions.max_tokens, type: types_js_1.OptionType.numeric, min: 1, max: limit,
        integer: true, step: 200, description: "The maximum number of tokens to generate",
    };
}
/** Returns the fallback text options whose names are not in `excludedNames`. */
function filterFallbackTextOptions(excludedNames) {
    return fallback_js_1.textOptionsFallback.options.filter((entry) => !excludedNames.includes(entry.name));
}
/** Builds Imagen options; returns undefined for variants that are neither "generate" nor "capability". */
function getImagenOptions(model, option) {
    const commonOptions = [
        {
            name: types_js_1.SharedOptions.number_of_images, type: types_js_1.OptionType.numeric, min: 1, max: 4, default: 1,
            integer: true, description: "Number of Images to generate",
        },
        {
            name: types_js_1.SharedOptions.seed, type: types_js_1.OptionType.numeric, min: 0, max: 4294967295, default: 12,
            integer: true, description: "The seed of the generated image",
        },
        {
            name: "person_generation", type: types_js_1.OptionType.enum, enum: { "Disallow the inclusion of people or faces in images": "dont_allow", "Allow generation of adults only": "allow_adult", "Allow generation of people of all ages": "allow_all" },
            default: "allow_adult", description: "The safety setting for allowing the generation of people in the image",
        },
        {
            name: "safety_setting", type: types_js_1.OptionType.enum, enum: { "Block very few problematic prompts and responses": "block_none", "Block only few problematic prompts and responses": "block_only_high", "Block some problematic prompts and responses": "block_medium_and_above", "Strictest filtering": "block_low_and_above" },
            default: "block_medium_and_above", description: "The overall safety setting",
        },
    ];
    const outputOptions = [
        {
            name: "image_file_type", type: types_js_1.OptionType.enum, enum: { "JPEG": "image/jpeg", "PNG": "image/png" },
            default: "image/png", description: "The file type of the generated image",
            refresh: true,
        },
    ];
    // The compression quality is only meaningful once JPEG output is selected.
    if (option?.image_file_type === "image/jpeg") {
        outputOptions.push({
            name: "jpeg_compression_quality", type: types_js_1.OptionType.numeric, min: 0, max: 100, default: 75,
            integer: true, description: "The compression quality of the JPEG image",
        });
    }
    if (model.includes("generate")) {
        return getImagenGenerateOptions(model, commonOptions, outputOptions);
    }
    if (model.includes("capability")) {
        return getImagenEditOptions(option, commonOptions, outputOptions);
    }
    return undefined;
}
/** Builds the option set for Imagen "generate" models. */
function getImagenGenerateOptions(model, commonOptions, outputOptions) {
    const modeOptions = [
        {
            name: "aspect_ratio", type: types_js_1.OptionType.enum, enum: { "1:1": "1:1", "4:3": "4:3", "3:4": "3:4", "16:9": "16:9", "9:16": "9:16" },
            default: "1:1", description: "The aspect ratio of the generated image",
        },
        {
            name: "add_watermark", type: types_js_1.OptionType.boolean, default: false, description: "Add an invisible watermark to the generated image, useful for detection of AI images",
        },
    ];
    // Prompt enhancement is offered for every generate model except "generate-001".
    const enhanceOptions = model.includes("generate-001") ? [] : [
        {
            name: "enhance_prompt", type: types_js_1.OptionType.boolean, default: true, description: "VertexAI automatically rewrites the prompt to better reflect the prompt's intent.",
        },
    ];
    return {
        _option_id: "vertexai-imagen",
        options: [
            ...commonOptions,
            ...modeOptions,
            ...outputOptions,
            ...enhanceOptions,
        ],
    };
}
/** Builds the option set for Imagen "capability" (edit / customization) models. */
function getImagenEditOptions(option, commonOptions, outputOptions) {
    const editMode = option?.edit_mode;
    const isEditMode = editMode?.includes("EDIT");
    // Inpaint insertion uses a lower default guidance scale than the other modes.
    const guidanceScaleDefault = editMode === ImagenTaskType.EDIT_MODE_INPAINT_INSERTION ? 60 : 75;
    const modeOptions = [
        {
            name: "edit_mode", type: types_js_1.OptionType.enum,
            enum: {
                "EDIT_MODE_INPAINT_REMOVAL": "EDIT_MODE_INPAINT_REMOVAL",
                "EDIT_MODE_INPAINT_INSERTION": "EDIT_MODE_INPAINT_INSERTION",
                "EDIT_MODE_BGSWAP": "EDIT_MODE_BGSWAP",
                "EDIT_MODE_OUTPAINT": "EDIT_MODE_OUTPAINT",
                "CUSTOMIZATION_SUBJECT": "CUSTOMIZATION_SUBJECT",
                "CUSTOMIZATION_STYLE": "CUSTOMIZATION_STYLE",
                "CUSTOMIZATION_CONTROLLED": "CUSTOMIZATION_CONTROLLED",
                "CUSTOMIZATION_INSTRUCT": "CUSTOMIZATION_INSTRUCT",
            },
            description: "The editing mode. CUSTOMIZATION options use few-shot learning to generate images based on a few examples.",
        },
        {
            name: "guidance_scale", type: types_js_1.OptionType.numeric, min: 0, max: 500, default: guidanceScaleDefault,
            integer: true, description: "How closely the generation follows the prompt",
        },
    ];
    const maskOptions = isEditMode ? [
        {
            name: "mask_mode", type: types_js_1.OptionType.enum,
            enum: {
                "MASK_MODE_USER_PROVIDED": "MASK_MODE_USER_PROVIDED",
                "MASK_MODE_BACKGROUND": "MASK_MODE_BACKGROUND",
                "MASK_MODE_FOREGROUND": "MASK_MODE_FOREGROUND",
                "MASK_MODE_SEMANTIC": "MASK_MODE_SEMANTIC",
            },
            default: "MASK_MODE_USER_PROVIDED",
            description: "How should the mask for the generation be provided",
        },
        {
            // Dilation is a fraction of the image width in [0, 1]; marking it as an
            // integer would only allow 0 or 1, so it must accept fractional values.
            name: "mask_dilation", type: types_js_1.OptionType.numeric, min: 0, max: 1,
            integer: false, step: 0.01, description: "The mask dilation, grows the mask by a percentage of image width to compensate for imprecise masks.",
        },
    ] : [];
    const maskClassOptions = option?.mask_mode === ImagenMaskMode.MASK_MODE_SEMANTIC ? [
        {
            name: "mask_class", type: types_js_1.OptionType.string_list, default: [],
            description: "Input Class IDs. Create a mask based on image class, based on https://cloud.google.com/vertex-ai/generative-ai/docs/model-reference/imagen-api-customization#segment-ids",
        },
    ] : [];
    const editOptions = isEditMode ? [
        {
            name: "edit_steps", type: types_js_1.OptionType.numeric, default: 75,
            integer: true, description: "The number of steps for the base image generation, more steps means more time and better quality",
        },
    ] : [];
    const usesControlImage = editMode === ImagenTaskType.CUSTOMIZATION_CONTROLLED
        || editMode === ImagenTaskType.CUSTOMIZATION_SUBJECT;
    const customizationOptions = usesControlImage ? [
        {
            name: "controlType", type: types_js_1.OptionType.enum, enum: { "Face Mesh": "CONTROL_TYPE_FACE_MESH", "Canny": "CONTROL_TYPE_CANNY", "Scribble": "CONTROL_TYPE_SCRIBBLE" },
            default: "CONTROL_TYPE_CANNY", description: "Method used to generate the control image",
        },
        {
            name: "controlImageComputation", type: types_js_1.OptionType.boolean, default: true, description: "Should the control image be computed from the input image, or is it provided",
        },
    ] : [];
    return {
        _option_id: "vertexai-imagen",
        options: [
            ...modeOptions,
            ...commonOptions,
            ...maskOptions,
            ...maskClassOptions,
            ...editOptions,
            ...customizationOptions,
            ...outputOptions,
        ],
    };
}
/** Builds the option set for Gemini models. */
function getGeminiOptions(model) {
    const excludedNames = ["max_tokens", "presence_penalty"];
    // frequency_penalty is additionally hidden for "1.5" models.
    if (model.includes("1.5")) {
        excludedNames.push("frequency_penalty");
    }
    return {
        _option_id: "text-fallback",
        options: [
            buildMaxTokensOption(getGeminiMaxTokensLimit(model)),
            ...filterFallbackTextOptions(excludedNames),
        ],
    };
}
/** Builds the option set for Claude models, adding thinking controls for "-3-7" and "-4" models. */
function getClaudeOptions(model, option) {
    const options = [
        buildMaxTokensOption(getClaudeMaxTokensLimit(model, option)),
        ...filterFallbackTextOptions(["max_tokens", "presence_penalty", "frequency_penalty"]),
    ];
    if (model.includes("-3-7") || model.includes("-4")) {
        options.push({
            name: "thinking_mode",
            type: types_js_1.OptionType.boolean,
            default: false,
            description: "If true, use the extended reasoning mode",
        });
        // The budget is only offered once thinking mode has been switched on.
        if (option?.thinking_mode) {
            options.push({
                name: "thinking_budget_tokens",
                type: types_js_1.OptionType.numeric,
                min: 1024,
                default: 4000,
                integer: true,
                step: 100,
                description: "The target number of tokens to use for reasoning, not a hard limit.",
            });
        }
    }
    return {
        _option_id: "vertexai-claude",
        options,
    };
}
/** Builds the option set for Llama models. */
function getLlamaOptions(model) {
    const excludedNames = ["max_tokens", "presence_penalty", "frequency_penalty", "stop_sequence"];
    // Set max temperature to 1.0 for Llama models; copy the descriptor so the
    // shared fallback definition is not mutated.
    const commonOptions = filterFallbackTextOptions(excludedNames).map((entry) => {
        const isNumericTemperature = entry.name === types_js_1.SharedOptions.temperature
            && entry.type === types_js_1.OptionType.numeric;
        return isNumericTemperature ? { ...entry, max: 1.0 } : entry;
    });
    return {
        _option_id: "text-fallback",
        options: [
            buildMaxTokensOption(getLlamaMaxTokensLimit(model)),
            ...commonOptions,
        ],
    };
}
/**
 * Returns the upper bound offered for `max_tokens` on a Gemini model.
 *
 * The limit is chosen by substring match on the model id, in priority order:
 * "thinking" or "-2.5-" gives 65536, "ultra" or "vision" gives 2048, and
 * everything else gives 8192.
 *
 * @param {string} model - Model identifier.
 * @returns {number} Maximum number of output tokens.
 */
function getGeminiMaxTokensLimit(model) {
    const mentionsAny = (...fragments) => fragments.some((fragment) => model.includes(fragment));
    if (mentionsAny("thinking", "-2.5-")) {
        return 65536;
    }
    return mentionsAny("ultra", "vision") ? 2048 : 8192;
}
/**
 * Returns the upper bound offered for `max_tokens` on a Claude model.
 *
 * Limits by model generation, detected from the model id:
 *  - Claude 4: 32768 for ids containing "opus-", otherwise 65536
 *  - "-3-7-": 131072 when `option.thinking_mode` is truthy, otherwise 8192
 *  - "-3-5-": 8192
 *  - anything else: 4096
 *
 * @param {string} model - Model identifier.
 * @param {object} [option] - Currently selected option values; only
 *   `thinking_mode` is read.
 * @returns {number} Maximum number of output tokens.
 */
function getClaudeMaxTokensLimit(model, option) {
    // Claude 4 ids do not always have a dash after the version, e.g.
    // "claude-sonnet-4@20250514", so matching "-4-" alone drops them to the
    // legacy 4096 limit even though getVertexAiOptions treats "-4" as Claude 4.
    // Match "-4" that is not followed by another digit instead.
    const isClaude4 = /-4(?!\d)/.test(model);
    if (isClaude4) {
        return model.includes("opus-") ? 32768 : 65536;
    }
    if (model.includes("-3-7-")) {
        // Extended thinking raises the output limit for 3.7 models.
        return option?.thinking_mode ? 131072 : 8192;
    }
    if (model.includes("-3-5-")) {
        return 8192;
    }
    return 4096;
}
/**
 * Returns the upper bound offered for `max_tokens` on a Llama model.
 *
 * The same limit is returned for every model; the argument is not read.
 *
 * @param {string} _model - Model identifier (unused).
 * @returns {number} Always 8192.
 */
function getLlamaMaxTokensLimit(_model) {
    const llamaMaxOutputTokens = 8192;
    return llamaMaxOutputTokens;
}
//# sourceMappingURL=vertexai.js.map