@ui-tars/shared
Version:
Shared types for UI-TARS
75 lines • 2.1 kB
TypeScript
/**
 * A single turn of a conversation.
 *
 * `from` identifies the speaker and is limited to the two literals below;
 * `value` is the text of that turn.
 */
export interface Message {
  /** Who produced this turn: the model (`'gpt'`) or the user (`'human'`). */
  from: 'gpt' | 'human';
  /** Text content of the turn. */
  value: string;
}
/**
 * Numeric status codes used as the `status` of a `GUIAgentError`.
 *
 * Every member is a NEGATIVE integer (-100000 … -100099). The per-member
 * notes below state the actual value; the descriptions are inferred from the
 * member names only and should be confirmed where the errors are raised.
 */
export declare enum ErrorStatusEnum {
/** Value: -100000. NOTE(review): name suggests taking a screenshot kept failing after retries — confirm. */
SCREENSHOT_RETRY_ERROR = -100000,
/** Value: -100001. NOTE(review): name suggests invoking the model kept failing after retries — confirm. */
INVOKE_RETRY_ERROR = -100001,
/** Value: -100002. NOTE(review): name suggests executing an action kept failing after retries — confirm. */
EXECUTE_RETRY_ERROR = -100002,
/** Value: -100003. NOTE(review): name suggests a failure reported by the model service — confirm. */
MODEL_SERVICE_ERROR = -100003,
/** Value: -100004. NOTE(review): name suggests the loop limit was reached — confirm. */
REACH_MAXLOOP_ERROR = -100004,
/** Value: -100005. NOTE(review): name suggests a problem with the host environment — confirm. */
ENVIRONMENT_ERROR = -100005,
/** Value: -100099. Catch-all code; note the gap between -100005 and -100099. */
UNKNOWN_ERROR = -100099
}
/**
 * An `Error` subclass that additionally carries an `ErrorStatusEnum` code.
 *
 * This is an ambient declaration: only the shape is described here, the
 * constructor body lives in the compiled JavaScript and is not visible.
 */
export declare class GUIAgentError extends Error {
/** Status code classifying the failure. */
status: ErrorStatusEnum;
/** Description of the failure (re-declares the inherited `Error.message`). */
message: string;
/** Optional stack trace (re-declares the inherited `Error.stack`). */
stack?: string;
/**
 * @param status  Status code to attach to the error.
 * @param message Description of the failure.
 * @param stack   Optional stack trace. NOTE(review): presumably replaces the
 *                automatically captured stack when supplied — confirm in the
 *                implementation.
 */
constructor(status: ErrorStatusEnum, message: string, stack?: string);
}
/**
 * String-literal union of every `StatusEnum` value.
 *
 * Built with a template literal type so the union is derived from the enum
 * rather than listed by hand; it accepts the plain strings (e.g. `"running"`)
 * without requiring an enum member reference.
 */
export type Status = `${StatusEnum}`;
/**
 * Named status values, each backed by a lowercase string literal.
 *
 * NOTE(review): presumably these describe the lifecycle of an agent run; the
 * per-member descriptions are inferred from the names — confirm against the
 * code that sets them.
 */
export declare enum StatusEnum {
/** `"init"` — NOTE(review): presumably the state before a run starts. */
INIT = "init",
/** `"running"` — NOTE(review): presumably a run is in progress. */
RUNNING = "running",
/** `"pause"` — NOTE(review): presumably a run is temporarily suspended. */
PAUSE = "pause",
/** `"end"` — NOTE(review): presumably a run finished normally. */
END = "end",
/** `"call_user"` — NOTE(review): presumably the run is waiting on the user. */
CALL_USER = "call_user",
/**
* `"max_loop"`.
* @deprecated kept for backward compatibility
*/
MAX_LOOP = "max_loop",
/** `"user_stopped"` — NOTE(review): presumably the user ended the run. */
USER_STOPPED = "user_stopped",
/** `"error"` — NOTE(review): presumably the run ended with a failure. */
ERROR = "error"
}
/**
 * Shape of a response holding a list of generation results.
 *
 * NOTE(review): judging by the name this is what the VLM service returns —
 * confirm against the client code.
 */
export interface VlmResponse {
  /** Generation results; each entry pairs an input with its prediction and an id. */
  generate_resp: Array<{
    /** The input associated with this result. */
    input: string;
    /** The prediction text for that input. */
    prediction: string;
    /** Identifier string for this result. */
    uid: string;
  }>;
}
/**
 * A captured screenshot together with the display scale it was taken at.
 */
export interface ScreenshotResult {
  /**
   * Base64-encoded screenshot. The image must keep its size in
   * physical pixels (do not downscale to logical resolution).
   */
  base64: string;
  /**
   * Display scale factor (DPR), where
   * `physical_pixels = logical_resolution * scaleFactor`.
   */
  scaleFactor: number;
}
/**
 * Either a two-number tuple or the empty tuple.
 *
 * NOTE(review): presumably `[x, y]`, with `[]` standing for "no coordinates";
 * element order and units are not shown here — confirm against the code that
 * produces these values.
 */
export type Coords = [number, number] | [];
/**
 * Arguments attached to a parsed action.
 *
 * Every field is optional; which ones are present depends on the action.
 * The `*_box` fields are strings while the `*_coords` fields are `Coords`
 * tuples. NOTE(review): presumably the coords are the numeric form of the
 * corresponding box string — confirm in the parser.
 */
export type ActionInputs = {
  content?: string;
  start_box?: string;
  end_box?: string;
  key?: string;
  hotkey?: string;
  direction?: string;
  start_coords?: Coords;
  end_coords?: Coords;
};
/**
 * Structured form of one model prediction.
 *
 * The field docs describe where each piece sits in the raw prediction text:
 * a `Thought: …` part, a `Reflection: …` part, and an action written as
 * `action_type(action_inputs)`.
 */
export interface PredictionParsed {
  /** The `action_inputs` part of `action_type(action_inputs)`, parsed into fields. */
  action_inputs: ActionInputs;
  /** Text following `Reflection:`; the type also permits `null`. */
  reflection: string | null;
  /** The `action_type` part of `action_type(action_inputs)`. */
  action_type: string;
  /** Text following `Thought:`. */
  thought: string;
}
//# sourceMappingURL=agent.d.ts.map