jbilcke-hf (HF staff) committed
Commit 0f35d4c
1 Parent(s): 534ad64
src/app/config.ts CHANGED
@@ -1,9 +1,12 @@
+import { VideoGenerationModel, VideoOrientation } from "@/types"
+
 export const showBetaFeatures = `${
   process.env.NEXT_PUBLIC_SHOW_BETA_FEATURES || ""
 }`.trim().toLowerCase() === "true"
 
 
-export const defaultVideoModel = "SVD"
+export const defaultVideoModel: VideoGenerationModel = "SVD"
+export const defaultVideoOrientation: VideoOrientation = "landscape"
 export const defaultVoice = "Julian"
 
 export const developerMode = `${
src/app/server/actions/ai-tube-hf/getChannelVideos.ts CHANGED
@@ -6,6 +6,7 @@ import { getVideoRequestsFromChannel } from "./getVideoRequestsFromChannel"
 import { adminApiKey } from "../config"
 import { getVideoIndex } from "./getVideoIndex"
 import { extendVideosWithStats } from "./extendVideosWithStats"
+import { orientationToWidthHeight } from "../utils/orientationToWidthHeight"
 
 // return
 export async function getChannelVideos({
@@ -19,7 +20,7 @@ export async function getChannelVideos({
 }): Promise<VideoInfo[]> {
 
   if (!channel) { return [] }
-
+
   const videos = await getVideoRequestsFromChannel({
     channel,
     apiKey: adminApiKey,
@@ -50,6 +51,9 @@ export async function getChannelVideos({
       updatedAt: v.updatedAt,
       tags: v.tags,
      channel,
+      duration: v.duration || 0,
+      orientation: v.orientation,
+      ...orientationToWidthHeight(v.orientation),
     }
 
     if (queued[v.id]) {
src/app/server/actions/ai-tube-hf/getVideoRequestsFromChannel.ts CHANGED
@@ -7,6 +7,7 @@ import { parsePromptFileName } from "../utils/parsePromptFileName"
 import { downloadFileAsText } from "./downloadFileAsText"
 import { parseDatasetPrompt } from "../utils/parseDatasetPrompt"
 import { parseVideoModelName } from "../utils/parseVideoModelName"
+import { orientationToWidthHeight } from "../utils/orientationToWidthHeight"
 
 /**
  * Return all the videos requests created by a user on their channel
@@ -72,7 +73,19 @@ export async function getVideoRequestsFromChannel({
       continue
     }
 
-    const { title, description, tags, prompt, thumbnail, model, lora, style, music, voice } = parseDatasetPrompt(rawMarkdown, channel)
+    const {
+      title,
+      description,
+      tags,
+      prompt,
+      thumbnail,
+      model,
+      lora,
+      style,
+      music,
+      voice,
+      orientation,
+    } = parseDatasetPrompt(rawMarkdown, channel)
 
     if (!title || !description || !prompt) {
       // console.log("dataset prompt is incomplete or unparseable")
@@ -101,6 +114,9 @@ export async function getVideoRequestsFromChannel({
       updatedAt: file.lastCommit?.date || new Date().toISOString(),
       tags: Array.isArray(tags) && tags.length ? tags : channel.tags,
       channel,
+      orientation,
+      ...orientationToWidthHeight(orientation),
+      duration: 0,
     }
 
     videos[id] = video
src/app/server/actions/ai-tube-hf/parseChannel.ts CHANGED
@@ -2,9 +2,10 @@
 
 import { Credentials, downloadFile, whoAmI } from "@/huggingface/hub/src"
 import { parseDatasetReadme } from "@/app/server/actions/utils/parseDatasetReadme"
-import { ChannelInfo, VideoGenerationModel } from "@/types"
+import { ChannelInfo, VideoGenerationModel, VideoOrientation } from "@/types"
 
 import { adminCredentials } from "../config"
+import { defaultVideoModel, defaultVideoOrientation } from "@/app/config"
 
 export async function parseChannel(options: {
   id: string
@@ -62,7 +63,7 @@ export async function parseChannel(options: {
   // TODO parse the README to get the proper label
   let label = slug.replaceAll("-", " ")
 
-  let model: VideoGenerationModel = "HotshotXL"
+  let model: VideoGenerationModel = defaultVideoModel
   let lora = ""
   let style = ""
   let thumbnail = ""
@@ -71,6 +72,7 @@ export async function parseChannel(options: {
   let voice = ""
   let music = ""
   let tags: string[] = []
+  let orientation: VideoOrientation = defaultVideoOrientation
 
   // console.log(`going to read datasets/${name}`)
   try {
@@ -89,11 +91,12 @@ export async function parseChannel(options: {
     label = parsedDatasetReadme.pretty_name
     description = parsedDatasetReadme.description
     thumbnail = parsedDatasetReadme.thumbnail || "thumbnail.jpg"
-    model = parsedDatasetReadme.model
+    model = parsedDatasetReadme.model || defaultVideoModel
     lora = parsedDatasetReadme.lora || ""
     style = parsedDatasetReadme.style || ""
     voice = parsedDatasetReadme.voice || ""
     music = parsedDatasetReadme.music || ""
+    orientation = parsedDatasetReadme.orientation || defaultVideoOrientation
 
     thumbnail =
       thumbnail.startsWith("http")
@@ -126,7 +129,8 @@ export async function parseChannel(options: {
     prompt,
     likes: options.likes,
     tags,
-    updatedAt: options.updatedAt.toISOString()
+    updatedAt: options.updatedAt.toISOString(),
+    orientation,
   }
 
   return channel
src/app/server/actions/ai-tube-hf/uploadVideoRequestToDataset.ts CHANGED
@@ -3,8 +3,9 @@
 import { Blob } from "buffer"
 
 import { Credentials, uploadFile, whoAmI } from "@/huggingface/hub/src"
-import { ChannelInfo, VideoGenerationModel, VideoInfo, VideoRequest } from "@/types"
+import { ChannelInfo, VideoGenerationModel, VideoInfo, VideoOrientation, VideoRequest } from "@/types"
 import { formatPromptFileName } from "../utils/formatPromptFileName"
+import { orientationToWidthHeight } from "../utils/orientationToWidthHeight"
 
 /**
  * Save the video request to the user's own dataset
@@ -22,6 +23,8 @@ export async function uploadVideoRequestToDataset({
   voice,
   music,
   tags,
+  duration,
+  orientation,
 }: {
   channel: ChannelInfo
   apiKey: string
@@ -34,6 +37,8 @@ export async function uploadVideoRequestToDataset({
   voice: string
   music: string
   tags: string[]
+  duration: number
+  orientation: VideoOrientation
 }): Promise<{
   videoRequest: VideoRequest
   videoInfo: VideoInfo
@@ -81,6 +86,14 @@ ${voice}
 
 ${music}
 
+# Duration
+
+${duration}
+
+# Orientation
+
+${orientation}
+
 # Tags
 
 ${tags.map(tag => `- ${tag}`).join("\n")}
@@ -116,6 +129,8 @@ ${prompt}
     updatedAt: new Date().toISOString(),
     tags,
     channel,
+    duration: 0,
+    orientation,
   }
 
   const newVideo: VideoInfo = {
@@ -136,6 +151,9 @@ ${prompt}
     updatedAt: new Date().toISOString(),
     tags,
     channel,
+    duration,
+    orientation,
+    ...orientationToWidthHeight(orientation),
   }
 
   return {
src/app/server/actions/submitVideoRequest.ts CHANGED
@@ -1,6 +1,6 @@
 "use server"
 
-import { ChannelInfo, VideoGenerationModel, VideoInfo } from "@/types"
+import { ChannelInfo, VideoGenerationModel, VideoInfo, VideoOrientation } from "@/types"
 
 import { uploadVideoRequestToDataset } from "./ai-tube-hf/uploadVideoRequestToDataset"
 
@@ -16,6 +16,8 @@ export async function submitVideoRequest({
   voice,
   music,
   tags,
+  duration,
+  orientation,
 }: {
   channel: ChannelInfo
   apiKey: string
@@ -28,6 +30,8 @@ export async function submitVideoRequest({
   voice: string
   music: string
   tags: string[]
+  duration: number
+  orientation: VideoOrientation
 }): Promise<VideoInfo> {
   if (!apiKey) {
     throw new Error(`the apiKey is required`)
@@ -44,7 +48,9 @@ export async function submitVideoRequest({
     style,
     voice,
     music,
-    tags
+    tags,
+    duration,
+    orientation
   })
 
 
src/app/server/actions/utils/isValidNumber.ts ADDED
@@ -0,0 +1,3 @@
+export function isValidNumber(input?: any) {
+  return typeof input === "number" && !isNaN(input) && isFinite(input)
+}
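Usage sketch (not part of the commit): isValidNumber rejects anything that is not a finite number, which is presumably intended as a guard for user-provided numeric values such as duration.

import { isValidNumber } from "@/app/server/actions/utils/isValidNumber"

isValidNumber(12)        // true
isValidNumber(NaN)       // false
isValidNumber(Infinity)  // false
isValidNumber("12")      // false (strings are rejected, no coercion)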
src/app/server/actions/utils/orientationToWidthHeight.ts ADDED
@@ -0,0 +1,38 @@
+import { VideoOrientation } from "@/types"
+
+export function orientationToWidthHeight(orientation?: VideoOrientation): { width: number; height: number } {
+
+  if (orientation === "square") {
+    return {
+      width: 512,
+      height: 512,
+    }
+  }
+
+  const longResolution = 1024
+  const shortResolution = 576
+
+  if (orientation === "portrait") {
+    return {
+      width: shortResolution,
+      height: longResolution,
+    }
+  }
+
+  /*
+
+  this is already the default, actually
+
+  if (orientation === "landscape") {
+    return {
+      width: longResolution,
+      height: shortResolution,
+    }
+  }
+  */
+
+  return {
+    width: longResolution,
+    height: shortResolution,
+  }
+}
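Usage sketch (not part of the commit): the helper maps an orientation to a fixed width/height pair and falls back to landscape when the orientation is missing.

import { orientationToWidthHeight } from "@/app/server/actions/utils/orientationToWidthHeight"

orientationToWidthHeight("landscape") // { width: 1024, height: 576 }
orientationToWidthHeight("portrait")  // { width: 576, height: 1024 }
orientationToWidthHeight("square")    // { width: 512, height: 512 }
orientationToWidthHeight(undefined)   // { width: 1024, height: 576 } (landscape default)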
src/app/server/actions/utils/parseDatasetPrompt.ts CHANGED
@@ -1,10 +1,27 @@
 
 import { ChannelInfo, ParsedDatasetPrompt } from "@/types"
 import { parseVideoModelName } from "./parseVideoModelName"
+import { parseVideoOrientation } from "./parseVideoOrientation"
+import { defaultVideoModel, defaultVideoOrientation } from "@/app/config"
 
 export function parseDatasetPrompt(markdown: string, channel: ChannelInfo): ParsedDatasetPrompt {
   try {
-    const { title, description, tags, prompt, model, lora, style, thumbnail, voice, music } = parseMarkdown(markdown)
+    const {
+      title,
+      description,
+      tags,
+      prompt,
+      model,
+      lora,
+      style,
+      thumbnail,
+      voice,
+      music,
+      // duration,
+      // width,
+      // height,
+      orientation
+    } = parseMarkdown(markdown)
 
     return {
       title: typeof title === "string" && title ? title : "",
@@ -19,6 +36,7 @@ export function parseDatasetPrompt(markdown: string, channel: ChannelInfo): ParsedDatasetPrompt {
       thumbnail: typeof thumbnail === "string" && thumbnail ? thumbnail : "",
       voice: typeof voice === "string" && voice ? voice : (channel.voice || ""),
       music: typeof music === "string" && music ? music : (channel.music || ""),
+      orientation: parseVideoOrientation(orientation, channel.orientation),
     }
   } catch (err) {
     return {
@@ -26,12 +44,13 @@ export function parseDatasetPrompt(markdown: string, channel: ChannelInfo): ParsedDatasetPrompt {
       description: "",
       tags: channel.tags || [],
       prompt: "",
-      model: channel.model || "HotshotXL",
+      model: channel.model || defaultVideoModel,
       lora: channel.lora || "",
       style: channel.style || "",
       thumbnail: "",
       voice: channel.voice || "",
       music: channel.music || "",
+      orientation: channel.orientation || defaultVideoOrientation,
     }
   }
 }
@@ -52,6 +71,7 @@ function parseMarkdown(markdown: string): {
   thumbnail: string
   voice: string
   music: string
+  orientation: string
 } {
   markdown = `${markdown || ""}`.trim()
 
@@ -77,5 +97,6 @@ function parseMarkdown(markdown: string): {
     thumbnail: sections["thumbnail"] || "",
     voice: sections["voice"] || "",
     music: sections["music"] || "",
+    orientation: sections["orientation"] || "",
   };
 }
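Hypothetical sketch (not part of the commit): how an "# Orientation" section in a dataset prompt file would flow through parseDatasetPrompt, assuming the section parser picks up "# Orientation" headings the same way it does the other sections generated in uploadVideoRequestToDataset. The channel stub is illustrative only; a real ChannelInfo has many more fields.

import { ChannelInfo } from "@/types"
import { parseDatasetPrompt } from "./parseDatasetPrompt"

const rawMarkdown = `
# Title

My video

# Description

A short test clip

# Prompt

a time-lapse of clouds over a city

# Orientation

vertical
`

// illustrative stub, not a valid ChannelInfo
const channel = { tags: [], orientation: "landscape" } as unknown as ChannelInfo

const parsed = parseDatasetPrompt(rawMarkdown, channel)
// parsed.orientation should be "portrait": parseVideoOrientation normalizes "vertical",
// and falls back to channel.orientation when the section is missing or unrecognized.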
src/app/server/actions/utils/parseDatasetReadme.ts CHANGED
@@ -3,6 +3,8 @@ import metadataParser from "markdown-yaml-metadata-parser"
 
 import { ParsedDatasetReadme, ParsedMetadataAndContent } from "@/types"
 import { parseVideoModelName } from "./parseVideoModelName"
+import { parseVideoOrientation } from "./parseVideoOrientation"
+import { defaultVideoModel, defaultVideoOrientation } from "@/app/config"
 
 export function parseDatasetReadme(markdown: string = ""): ParsedDatasetReadme {
   try {
@@ -12,14 +14,14 @@ export function parseDatasetReadme(markdown: string = ""): ParsedDatasetReadme {
 
     // console.log("DEBUG README:", { metadata, content })
 
-    const { model, lora, style, thumbnail, voice, music, description, prompt, tags } = parseMarkdown(content)
+    const { model, lora, style, thumbnail, voice, music, description, prompt, tags, orientation } = parseMarkdown(content)
 
     return {
       license: typeof metadata?.license === "string" ? metadata.license : "",
       pretty_name: typeof metadata?.pretty_name === "string" ? metadata.pretty_name : "",
       hf_tags: Array.isArray(metadata?.tags) ? metadata.tags : [],
       tags: tags && typeof tags === "string" ? tags.split("-").map(x => x.trim()).filter(x => x) : [],
-      model: parseVideoModelName(model, "HotshotXL"),
+      model: parseVideoModelName(model, defaultVideoModel),
       lora,
       style: style && typeof style === "string" ? style.split("- ").map(x => x.trim()).filter(x => x).join(", ") : [].join(", "),
       thumbnail,
@@ -27,6 +29,7 @@ export function parseDatasetReadme(markdown: string = ""): ParsedDatasetReadme {
       music,
       description,
       prompt,
+      orientation: parseVideoOrientation(orientation, defaultVideoOrientation),
     }
   } catch (err) {
     return {
@@ -34,7 +37,7 @@ export function parseDatasetReadme(markdown: string = ""): ParsedDatasetReadme {
       pretty_name: "",
       hf_tags: [], // Hugging Face tags
       tags: [],
-      model: "HotshotXL",
+      model: defaultVideoModel,
       lora: "",
       style: "",
       thumbnail: "",
@@ -42,6 +45,7 @@ export function parseDatasetReadme(markdown: string = ""): ParsedDatasetReadme {
       music: "",
       description: "",
       prompt: "",
+      orientation: defaultVideoOrientation,
     }
   }
 }
@@ -61,6 +65,7 @@ function parseMarkdown(markdown: string): {
   description: string
   prompt: string
   tags: string
+  orientation: string
 } {
   // console.log("markdown:", markdown)
   // Improved regular expression to find markdown sections and accommodate multi-line content.
@@ -84,5 +89,6 @@ function parseMarkdown(markdown: string): {
     music: sections["music"] || "",
     prompt: sections["prompt"] || "",
     tags: sections["tags"] || "",
+    orientation: sections["orientation"] || "",
   };
 }
src/app/server/actions/utils/parseVideoModelName.ts CHANGED
@@ -3,7 +3,7 @@ import { VideoGenerationModel } from "@/types"
 export function parseVideoModelName(text: any, defaultToUse: VideoGenerationModel): VideoGenerationModel {
   const rawModelString = `${text || ""}`.trim().toLowerCase()
 
-  let model: VideoGenerationModel = "HotshotXL"
+  let model: VideoGenerationModel = defaultToUse || "SVD"
 
   if (
     rawModelString === "stable video diffusion" ||
@@ -20,5 +20,5 @@ export function parseVideoModelName(text: any, defaultToUse: VideoGenerationModel): VideoGenerationModel {
     model = "LaVie"
   }
 
-  return defaultToUse
+  return model
 }
src/app/server/actions/utils/parseVideoOrientation.ts ADDED
@@ -0,0 +1,31 @@
+import { defaultVideoOrientation } from "@/app/config"
+import { VideoOrientation } from "@/types"
+
+export function parseVideoOrientation(text: any, defaultToUse?: VideoOrientation): VideoOrientation {
+  const rawOrientationString = `${text || ""}`.trim().toLowerCase()
+
+  let orientation: VideoOrientation = defaultToUse || defaultVideoOrientation
+
+  if (
+    rawOrientationString === "landscape" ||
+    rawOrientationString === "horizontal"
+  ) {
+    orientation = "landscape"
+  }
+
+  if (
+    rawOrientationString === "portrait" ||
+    rawOrientationString === "vertical"
+  ) {
+    orientation = "portrait"
+  }
+
+  if (
+    rawOrientationString === "square"
+  ) {
+    orientation = "square"
+  }
+
+
+  return orientation
+}
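Usage sketch (not part of the commit): the parser normalizes free-form orientation text and falls back to the caller-provided default, or to the global defaultVideoOrientation.

import { parseVideoOrientation } from "@/app/server/actions/utils/parseVideoOrientation"

parseVideoOrientation("Horizontal")   // "landscape"
parseVideoOrientation("vertical")     // "portrait"
parseVideoOrientation("SQUARE")       // "square"
parseVideoOrientation("", "portrait") // "portrait" (caller-provided default)
parseVideoOrientation(undefined)      // "landscape" (defaultVideoOrientation)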
src/app/views/user-channel-view/index.tsx CHANGED
@@ -17,7 +17,8 @@ import { PendingVideoList } from "@/app/interface/pending-video-list"
 import { getChannelVideos } from "@/app/server/actions/ai-tube-hf/getChannelVideos"
 import { parseVideoModelName } from "@/app/server/actions/utils/parseVideoModelName"
 import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from "@/components/ui/select"
-import { defaultVideoModel, defaultVoice } from "@/app/config"
+import { defaultVideoModel, defaultVideoOrientation, defaultVoice } from "@/app/config"
+import { parseVideoOrientation } from "@/app/server/actions/utils/parseVideoOrientation"
 
 export function UserChannelView() {
   const [_isPending, startTransition] = useTransition()
@@ -26,18 +27,20 @@ export function UserChannelView() {
     defaultSettings.huggingfaceApiKey
   )
 
-  const [titleDraft, setTitleDraft] = useState("")
-  const [descriptionDraft, setDescriptionDraft] = useState("")
-  const [tagsDraft, setTagsDraft] = useState("")
-  const [promptDraft, setPromptDraft] = useState("")
-  const [modelDraft, setModelDraft] = useState<VideoGenerationModel>(defaultVideoModel)
-  const [loraDraft, setLoraDraft] = useState("")
-  const [styleDraft, setStyleDraft] = useState("")
-  const [voiceDraft, setVoiceDraft] = useState(defaultVoice)
-  const [musicDraft, setMusicDraft] = useState("")
+  const [title, setTitle] = useState("")
+  const [description, setDescription] = useState("")
+  const [tags, setTags] = useState("")
+  const [prompt, setPrompt] = useState("")
+  const [model, setModel] = useState<VideoGenerationModel>(defaultVideoModel)
+  const [lora, setLora] = useState("")
+  const [style, setStyle] = useState("")
+  const [voice, setVoice] = useState(defaultVoice)
+  const [music, setMusic] = useState("")
+  const [duration, setDuration] = useState(0)
+  const [orientation, setOrientation] = useState(defaultVideoOrientation)
 
   // we do not include the tags in the list of required fields
-  const missingFields = !titleDraft || !descriptionDraft || !promptDraft
+  const missingFields = !title || !description || !prompt
 
   const [isSubmitting, setIsSubmitting] = useState(false)
 
@@ -73,7 +76,7 @@
     if (!userChannel) {
       return
     }
-    if (!titleDraft || !promptDraft) {
+    if (!title || !prompt) {
       console.log("missing title or prompt")
       return
     }
@@ -85,29 +88,31 @@
     const newVideo = await submitVideoRequest({
       channel: userChannel,
       apiKey: huggingfaceApiKey,
-      title: titleDraft,
-      description: descriptionDraft,
-      prompt: promptDraft,
-      model: modelDraft,
-      lora: loraDraft,
-      style: styleDraft,
-      voice: voiceDraft,
-      music: musicDraft,
-      tags: tagsDraft.trim().split(",").map(x => x.trim()).filter(x => x),
+      title,
+      description,
+      prompt,
+      model,
+      lora,
+      style,
+      voice,
+      music,
+      tags: tags.trim().split(",").map(x => x.trim()).filter(x => x),
+      duration,
+      orientation
     })
 
     // in case of success we update the frontend immediately
-    // with our draft video
+    // with our video
     setUserVideos([newVideo, ...userVideos])
-    setPromptDraft("")
-    setDescriptionDraft("")
-    setTagsDraft("")
-    setTitleDraft("")
-    setModelDraft(defaultVideoModel)
-    setVoiceDraft(defaultVoice)
-    setMusicDraft("")
-    setLoraDraft("")
-    setStyleDraft("")
+    setPrompt("")
+    setDescription("")
+    setTags("")
+    setTitle("")
+    setModel(defaultVideoModel)
+    setVoice(defaultVoice)
+    setMusic("")
+    setLora("")
+    setStyle("")
 
     // also renew the cache on Next's side
     /*
@@ -151,9 +156,9 @@
             placeholder="Title"
             className="font-mono"
             onChange={(x) => {
-              setTitleDraft(x.target.value)
+              setTitle(x.target.value)
             }}
-            value={titleDraft}
+            value={title}
           />
         </div>
       </div>
@@ -167,9 +172,9 @@
             className="font-mono"
             rows={2}
             onChange={(x) => {
-              setDescriptionDraft(x.target.value)
+              setDescription(x.target.value)
             }}
-            value={descriptionDraft}
+            value={description}
           />
           <p className="text-neutral-100/70">
             Short description (visible to humans, and used as context by the AI).
@@ -185,9 +190,9 @@
             className="font-mono"
             rows={6}
             onChange={(x) => {
-              setPromptDraft(x.target.value)
+              setPrompt(x.target.value)
             }}
-            value={promptDraft}
+            value={prompt}
           />
           <p className="text-neutral-100/70">
             Describe your video content, in a synthetic way.
@@ -200,20 +205,58 @@
         <div className="flex flex-col space-y-2 flex-grow">
           <Select
             onValueChange={(value: string) => {
-              setModelDraft(parseVideoModelName(value, defaultVideoModel))
+              setModel(parseVideoModelName(value, defaultVideoModel))
             }}
             defaultValue={defaultVideoModel}>
             <SelectTrigger className="">
              <SelectValue placeholder="Video model" />
             </SelectTrigger>
             <SelectContent>
-              <SelectItem value="SVD">SVD</SelectItem>
+              <SelectItem value="SVD">SVD (default)</SelectItem>
               <SelectItem value="HotshotXL">HotshotXL</SelectItem>
               <SelectItem value="LaVie">LaVie</SelectItem>
             </SelectContent>
           </Select>
         </div>
       </div>
+
+      {/*
+
+      <div className="flex flex-row space-x-2 items-start">
+        <label className="flex w-24 pt-1">Video duration:</label>
+        <div className="flex flex-col space-y-2 flex-grow">
+          <Input
+            placeholder="Duration"
+            className="font-mono"
+            onChange={(x) => {
+              // TODO: clamp the value here + on server side
+              setDuration(parseInt(x.target.value))
+            }}
+            value={title}
+          />
+        </div>
+      </div>
+      */}
+
+      <div className="flex flex-row space-x-2 items-start">
+        <label className="flex w-24 pt-1">Video orientation:</label>
+        <div className="flex flex-col space-y-2 flex-grow">
+          <Select
+            onValueChange={(value: string) => {
+              setOrientation(parseVideoOrientation(value, defaultVideoOrientation))
+            }}
+            defaultValue={defaultVideoOrientation}>
+            <SelectTrigger className="">
+              <SelectValue placeholder="Video orientation" />
+            </SelectTrigger>
+            <SelectContent>
+              <SelectItem value="Landscape">Landscape (default)</SelectItem>
+              <SelectItem value="Portrait">Portrait</SelectItem>
+              {/* <SelectItem value="LaVie">Square</SelectItem> */}
+            </SelectContent>
+          </Select>
+        </div>
+      </div>
 
       <div className="flex flex-row space-x-2 items-start">
         <label className="flex w-24 pt-1">Tags (optional):</label>
@@ -222,9 +265,9 @@
             placeholder="Tags"
             className="font-mono"
             onChange={(x) => {
-              setTagsDraft(x.target.value)
+              setTags(x.target.value)
             }}
-            value={tagsDraft}
+            value={tags}
           />
           <p className="text-neutral-100/70">
             Comma-separated tags (eg. &quot;Education, Sports&quot;)
src/types.ts CHANGED
@@ -231,6 +231,11 @@ export type ChannelInfo = {
   tags: string[]
 
   updatedAt: string
+
+  /**
+   * Default video orientation
+   */
+  orientation: VideoOrientation
 }
 
 export type VideoStatus =
@@ -308,8 +313,22 @@ export type VideoRequest = {
   /**
    * ID of the channel
    */
   channel: ChannelInfo
+
+  /**
+   * Video orientation
+   */
+  orientation: VideoOrientation
+
+  /**
+   * Video duration
+   */
+  duration: number
 }
 
+export type VideoOrientation =
+  | "portrait"
+  | "landscape"
+  | "square"
 
 export type VideoInfo = {
   /**
@@ -400,6 +419,26 @@ export type VideoInfo = {
   /**
    * The channel
    */
   channel: ChannelInfo
+
+  /**
+   * Video duration
+   */
+  duration: number
+
+  /**
+   * Video width (eg. 1024)
+   */
+  width: number
+
+  /**
+   * Video height (eg. 576)
+   */
+  height: number
+
+  /**
+   * General video aspect ratio
+   */
+  orientation: VideoOrientation
 }
 
 export type VideoGenerationModel =
@@ -451,6 +490,7 @@ export type ParsedDatasetReadme = {
   hf_tags: string[]
   description: string
   prompt: string
+  orientation: VideoOrientation
 }
 
 export type ParsedMetadataAndContent = {
@@ -473,6 +513,7 @@ export type ParsedDatasetPrompt = {
   thumbnail: string
   voice: string
   music: string
+  orientation: VideoOrientation
}
 
 export type UpdateQueueRequest = {
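Illustrative sketch (not part of the commit): how the new VideoInfo fields fit together, with width and height derived from the orientation via the helper added in this commit. The object literal below is a fragment, not a complete VideoInfo.

import { VideoOrientation } from "@/types"
import { orientationToWidthHeight } from "@/app/server/actions/utils/orientationToWidthHeight"

const orientation: VideoOrientation = "portrait"

const videoDimensionFields = {
  duration: 0, // requests are created with duration 0 until a video is generated
  orientation,
  ...orientationToWidthHeight(orientation), // width: 576, height: 1024
}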