export type ProjectionMode = 'cartesian' | 'spherical'
export type CacheMode = "use" | "renew" | "ignore"
export interface RenderRequest {
  prompt: string

  // whether to use video segmentation
  // disabled: no segmentation (default)
  // firstframe: we only analyze the first frame
  // allframes: we analyze all the frames
  segmentation: 'disabled' | 'firstframe' | 'allframes'

  // segmentation will only be executed if we have a non-empty list of actionnables
  // actionnables are names of things like "chest", "key", "tree", "chair" etc
  actionnables: string[]

  nbFrames: number
  nbFPS: number
  nbSteps: number // min: 1, max: 50
  seed: number

  width: number // fixed at 1024 for now
  height: number // fixed at 512 for now

  // upscaling factor
  // 0: no upscaling
  // 1: no upscaling
  // 2: 2x larger
  // 3: 3x larger
  // 4: 4x larger, up to 4096x4096 (warning: a PNG this size can be 50 MB!)
  upscalingFactor: number

  projection: ProjectionMode

  /**
   * Use turbo mode
   *
   * At the time of writing this will use SSD-1B + LCM
   * https://huggingface.co/spaces/jbilcke-hf/fast-image-server
   */
  turbo: boolean

  cache: CacheMode

  wait: boolean // wait until the job is completed

  analyze: boolean // analyze the image to generate a caption (optional)

  identityImage: string // reference image for the main entity
}
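
// Illustrative sketch only (the constant and its values are hypothetical, not
// defaults from the app): a minimal RenderRequest for a single still frame with
// segmentation disabled.
export const exampleRenderRequest: RenderRequest = {
  prompt: "a pirate ship at sunset",
  segmentation: "disabled",
  actionnables: [], // segmentation is skipped when this list is empty
  nbFrames: 1, // a single frame, i.e. a still image
  nbFPS: 1,
  nbSteps: 25, // must stay between 1 and 50
  seed: 42,
  width: 1024, // fixed at 1024 for now
  height: 512, // fixed at 512 for now
  upscalingFactor: 1, // 0 or 1 = no upscaling
  projection: "cartesian",
  turbo: false,
  cache: "use",
  wait: true,
  analyze: false,
  identityImage: "",
}
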
export interface ImageSegment {
  id: number
  box: number[]
  color: number[]
  label: string
  score: number
}

export type RenderedSceneStatus =
  | "pregenerated"
  | "pending"
  | "completed"
  | "error"

export interface RenderedScene {
  renderId: string
  status: RenderedSceneStatus
  assetUrl: string
  alt: string
  error: string
  maskUrl: string
  segments: ImageSegment[]
}
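
// Hedged sketch (not part of the original module; the helper name is hypothetical):
// how a caller might narrow RenderedSceneStatus before trusting assetUrl.
export function canDisplayScene(scene: RenderedScene): boolean {
  // "pregenerated" and "completed" are the two states in which the asset should exist
  return scene.status === "completed" || scene.status === "pregenerated"
}
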
export interface ImageAnalysisRequest {
  image: string // in base64
  prompt: string
}

export interface ImageAnalysisResponse {
  result: string
  error?: string
}

export type GeneratedPanel = {
  panel: number
  instructions: string
  speech: string
  caption: string
}

export type GeneratedPanels = GeneratedPanel[]
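
// Illustrative example only (the constant and its content are made up):
// a single generated panel with rendering instructions, speech and a caption.
export const exampleGeneratedPanel: GeneratedPanel = {
  panel: 1,
  instructions: "wide shot of the harbor at dawn, soft morning light",
  speech: "We sail at dawn.",
  caption: "The crew prepares to leave the port.",
}
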
// LLMVendor = what the user configures in the UI (e.g. a dropdown item called "default server")
// LLMEngine = the actual engine to use (e.g. Hugging Face)
export type LLMEngine =
  | "INFERENCE_API"
  | "INFERENCE_ENDPOINT"
  | "OPENAI"
  | "REPLICATE"
  | "GROQ"
  | "ANTHROPIC"
export type RenderingEngine =
  | "VIDEOCHAIN"
  | "OPENAI"
  | "REPLICATE"
  | "INFERENCE_API"
  | "INFERENCE_ENDPOINT"

export type RenderingModelVendor =
  | "SERVER"
  | "OPENAI"
  | "REPLICATE"
  | "HUGGINGFACE"
// LLMVendor = what the user configures in the UI (e.g. a dropdown item called "default server")
// LLMEngine = the actual engine to use (e.g. Hugging Face)
export type LLMVendor =
  | "SERVER"
  | "OPENAI"
  | "GROQ"
  | "ANTHROPIC"
export type LLMVendorConfig = {
  vendor: LLMVendor
  apiKey: string
  modelId: string
}

export type LLMPredictionFunctionParams = {
  systemPrompt: string
  userPrompt: string
  nbMaxNewTokens: number
  llmVendorConfig: LLMVendorConfig
}
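
// Illustrative example only (the constant, prompts and token budget are hypothetical):
// parameters for a prediction call using the "SERVER" vendor, which presumably
// needs no user-provided API key or model id.
export const examplePredictionParams: LLMPredictionFunctionParams = {
  systemPrompt: "You are a comic book author.",
  userPrompt: "Write captions for a 4-panel story about a lighthouse keeper.",
  nbMaxNewTokens: 400,
  llmVendorConfig: {
    vendor: "SERVER",
    apiKey: "",
    modelId: "",
  },
}
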
export type PostVisibility =
  | "featured" // featured by admins
  | "trending" // top trending / received more than 10 upvotes
  | "normal" // default visibility

export type Post = {
  postId: string
  appId: string
  prompt: string
  previewUrl: string
  assetUrl: string
  createdAt: string
  visibility: PostVisibility
  upvotes: number
  downvotes: number
}
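
// Illustrative example only (all values are placeholders): a freshly created post
// starts with "normal" visibility and no votes.
export const examplePost: Post = {
  postId: "0000-0000",
  appId: "example-app",
  prompt: "a detective story set on Mars",
  previewUrl: "https://example.com/preview.webp",
  assetUrl: "https://example.com/page.png",
  createdAt: new Date().toISOString(),
  visibility: "normal",
  upvotes: 0,
  downvotes: 0,
}
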
export type CreatePostResponse = {
  success?: boolean
  error?: string
  post: Post
}

export type GetAppPostsResponse = {
  success?: boolean
  error?: string
  posts: Post[]
}

export type GetAppPostResponse = {
  success?: boolean
  error?: string
  post: Post
}

export type LayoutProps = {
  page: number
  nbPanels: number
}
// TODO: rename the *Model fields to better indicate whether this is an LLM or a RENDER model
export type Settings = {
  renderingModelVendor: RenderingModelVendor
  renderingUseTurbo: boolean
  llmVendor: LLMVendor
  huggingFaceOAuth: string
  huggingfaceApiKey: string
  huggingfaceInferenceApiModel: string
  huggingfaceInferenceApiModelTrigger: string
  huggingfaceInferenceApiFileType: string
  replicateApiKey: string
  replicateApiModel: string
  replicateApiModelVersion: string
  replicateApiModelTrigger: string
  openaiApiKey: string
  openaiApiModel: string
  openaiApiLanguageModel: string
  groqApiKey: string
  groqApiLanguageModel: string
  anthropicApiKey: string
  anthropicApiLanguageModel: string
  hasGeneratedAtLeastOnce: boolean
  userDefinedMaxNumberOfPages: number
}
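
// Hedged sketch (an assumption, not the app's actual defaults): an "empty" Settings
// object relying on the server-side vendors, with no user-provided API keys or models.
export const exampleDefaultSettings: Settings = {
  renderingModelVendor: "SERVER",
  renderingUseTurbo: false,
  llmVendor: "SERVER",
  huggingFaceOAuth: "",
  huggingfaceApiKey: "",
  huggingfaceInferenceApiModel: "",
  huggingfaceInferenceApiModelTrigger: "",
  huggingfaceInferenceApiFileType: "",
  replicateApiKey: "",
  replicateApiModel: "",
  replicateApiModelVersion: "",
  replicateApiModelTrigger: "",
  openaiApiKey: "",
  openaiApiModel: "",
  openaiApiLanguageModel: "",
  groqApiKey: "",
  groqApiLanguageModel: "",
  anthropicApiKey: "",
  anthropicApiLanguageModel: "",
  hasGeneratedAtLeastOnce: false,
  userDefinedMaxNumberOfPages: 1,
}
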
export type DynamicConfig = {
  maxNbPages: number
  nbPanelsPerPage: number
  nbTotalPanelsToGenerate: number
  oauthClientId: string
  oauthRedirectUrl: string
  oauthScopes: string
  enableHuggingFaceOAuth: boolean
  enableHuggingFaceOAuthWall: boolean
}