Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Commit
•
3b780fb
1
Parent(s):
8c7d08c
wip
Browse files- Dockerfile +12 -0
- package-lock.json +6 -0
- package.json +1 -0
- src/app/api/generators/search/getNewMediaInfo.ts +5 -5
- src/app/api/providers/huggingface/predictWithHuggingFace.ts +1 -1
- src/app/api/utils/parseRawStringToYAML.ts +3 -2
- src/app/api/v1/create/route.ts +4 -4
- src/app/api/v1/create/systemPrompt.ts +1 -1
- src/app/api/v1/create/userPrompt.ts +0 -0
- src/app/api/v1/edit/dialogues/processShot.ts +10 -8
- src/app/api/v1/edit/storyboards/processShot.ts +6 -6
- src/app/api/v1/edit/storyboards/route.ts +3 -3
- src/app/api/v1/search/index.ts +60 -0
- src/app/api/v1/search/route.ts +72 -0
- src/app/api/v1/search/systemPrompt.ts +92 -0
- src/app/api/v1/search/types.ts +16 -0
- src/app/{dream → latent}/embed/page.tsx +0 -0
- src/app/{dream → latent}/samples.tsx +0 -0
- src/app/{dream/spoiler.tsx → latent/search/page.tsx} +9 -6
- src/app/latent/watch/page.tsx +63 -0
- src/app/main.tsx +7 -3
- src/app/state/useStore.ts +8 -6
- src/app/views/public-latent-search-view/index.tsx +49 -0
- src/components/interface/latent-engine/core/engine.tsx +12 -14
- src/components/interface/latent-search-input/index.tsx +157 -0
- src/components/interface/media-player/index.tsx +2 -1
- src/components/interface/search-input/index.tsx +17 -6
- src/components/interface/top-header/index.tsx +6 -1
- src/types/general.ts +2 -1
Dockerfile
CHANGED
@@ -2,8 +2,20 @@ FROM node:20-alpine AS base
|
|
2 |
|
3 |
# Install dependencies only when needed
|
4 |
FROM base AS deps
|
|
|
5 |
# Check https://github.com/nodejs/docker-node/tree/b4117f9333da4138b03a546ec926ef50a31506c3#nodealpine to understand why libc6-compat might be needed.
|
6 |
RUN apk add --no-cache libc6-compat
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7 |
WORKDIR /app
|
8 |
|
9 |
# Install dependencies based on the preferred package manager
|
|
|
2 |
|
3 |
# Install dependencies only when needed
|
4 |
FROM base AS deps
|
5 |
+
|
6 |
# Check https://github.com/nodejs/docker-node/tree/b4117f9333da4138b03a546ec926ef50a31506c3#nodealpine to understand why libc6-compat might be needed.
|
7 |
RUN apk add --no-cache libc6-compat
|
8 |
+
|
9 |
+
# for dev mode
|
10 |
+
RUN apk add git git-lfs procps htop vim nano
|
11 |
+
|
12 |
+
RUN apk add alpine-sdk pkgconfig
|
13 |
+
|
14 |
+
# For FFMPEG and gl concat
|
15 |
+
RUN apk add curl python3 python3-dev libx11-dev libsm-dev libxrender libxext-dev mesa-dev xvfb libxi-dev glew-dev
|
16 |
+
|
17 |
+
RUN apk add ffmpeg
|
18 |
+
|
19 |
WORKDIR /app
|
20 |
|
21 |
# Install dependencies based on the preferred package manager
|
package-lock.json
CHANGED
@@ -66,6 +66,7 @@
|
|
66 |
"gsplat": "^1.2.4",
|
67 |
"hash-wasm": "^4.11.0",
|
68 |
"jose": "^5.2.4",
|
|
|
69 |
"lodash.debounce": "^4.0.8",
|
70 |
"lucide-react": "^0.260.0",
|
71 |
"markdown-yaml-metadata-parser": "^3.0.0",
|
@@ -6087,6 +6088,11 @@
|
|
6087 |
"url": "https://github.com/sponsors/panva"
|
6088 |
}
|
6089 |
},
|
|
|
|
|
|
|
|
|
|
|
6090 |
"node_modules/js-sha3": {
|
6091 |
"version": "0.8.0",
|
6092 |
"resolved": "https://registry.npmjs.org/js-sha3/-/js-sha3-0.8.0.tgz",
|
|
|
66 |
"gsplat": "^1.2.4",
|
67 |
"hash-wasm": "^4.11.0",
|
68 |
"jose": "^5.2.4",
|
69 |
+
"js-base64": "^3.7.7",
|
70 |
"lodash.debounce": "^4.0.8",
|
71 |
"lucide-react": "^0.260.0",
|
72 |
"markdown-yaml-metadata-parser": "^3.0.0",
|
|
|
6088 |
"url": "https://github.com/sponsors/panva"
|
6089 |
}
|
6090 |
},
|
6091 |
+
"node_modules/js-base64": {
|
6092 |
+
"version": "3.7.7",
|
6093 |
+
"resolved": "https://registry.npmjs.org/js-base64/-/js-base64-3.7.7.tgz",
|
6094 |
+
"integrity": "sha512-7rCnleh0z2CkXhH67J8K1Ytz0b2Y+yxTPL+/KOJoa20hfnVQ/3/T6W/KflYI4bRHRagNeXeU2bkNGI3v1oS/lw=="
|
6095 |
+
},
|
6096 |
"node_modules/js-sha3": {
|
6097 |
"version": "0.8.0",
|
6098 |
"resolved": "https://registry.npmjs.org/js-sha3/-/js-sha3-0.8.0.tgz",
|
package.json
CHANGED
@@ -67,6 +67,7 @@
|
|
67 |
"gsplat": "^1.2.4",
|
68 |
"hash-wasm": "^4.11.0",
|
69 |
"jose": "^5.2.4",
|
|
|
70 |
"lodash.debounce": "^4.0.8",
|
71 |
"lucide-react": "^0.260.0",
|
72 |
"markdown-yaml-metadata-parser": "^3.0.0",
|
|
|
67 |
"gsplat": "^1.2.4",
|
68 |
"hash-wasm": "^4.11.0",
|
69 |
"jose": "^5.2.4",
|
70 |
+
"js-base64": "^3.7.7",
|
71 |
"lodash.debounce": "^4.0.8",
|
72 |
"lucide-react": "^0.260.0",
|
73 |
"markdown-yaml-metadata-parser": "^3.0.0",
|
src/app/api/generators/search/getNewMediaInfo.ts
CHANGED
@@ -80,11 +80,9 @@ export function getNewMediaInfo(params: Partial<MediaInfo> = {}): MediaInfo {
|
|
80 |
updatedAt: new Date().toISOString(),
|
81 |
|
82 |
/**
|
83 |
-
*
|
84 |
*/
|
85 |
-
tags:
|
86 |
-
...params.tags,
|
87 |
-
] : [],
|
88 |
|
89 |
/**
|
90 |
* Model name
|
@@ -139,7 +137,9 @@ export function getNewMediaInfo(params: Partial<MediaInfo> = {}): MediaInfo {
|
|
139 |
/**
|
140 |
* Media projection (cartesian by default)
|
141 |
*/
|
142 |
-
projection: "latent"
|
|
|
|
|
143 |
}
|
144 |
|
145 |
return mediaInfo
|
|
|
80 |
updatedAt: new Date().toISOString(),
|
81 |
|
82 |
/**
|
83 |
+
* Arbitrary string tags to label the content
|
84 |
*/
|
85 |
+
tags: [],
|
|
|
|
|
86 |
|
87 |
/**
|
88 |
* Model name
|
|
|
137 |
/**
|
138 |
* Media projection (cartesian by default)
|
139 |
*/
|
140 |
+
projection: "latent",
|
141 |
+
|
142 |
+
...params,
|
143 |
}
|
144 |
|
145 |
return mediaInfo
|
src/app/api/providers/huggingface/predictWithHuggingFace.ts
CHANGED
@@ -31,7 +31,7 @@ export async function predict({
|
|
31 |
}
|
32 |
})) {
|
33 |
instructions += output.token.text
|
34 |
-
|
35 |
if (
|
36 |
instructions.includes("</s>") ||
|
37 |
instructions.includes("<s>") ||
|
|
|
31 |
}
|
32 |
})) {
|
33 |
instructions += output.token.text
|
34 |
+
process.stdout.write(output.token.text)
|
35 |
if (
|
36 |
instructions.includes("</s>") ||
|
37 |
instructions.includes("<s>") ||
|
src/app/api/utils/parseRawStringToYAML.ts
CHANGED
@@ -8,8 +8,9 @@ export function parseRawStringToYAML<T>(input: any, defaultValue: T) {
|
|
8 |
.replaceAll("```yaml\n", "")
|
9 |
.replaceAll("```yaml", "")
|
10 |
|
11 |
-
// we remove everything after the last ```
|
12 |
-
rawString = rawString.split(
|
|
|
13 |
|
14 |
const something: any = YAML.parse(rawString)
|
15 |
|
|
|
8 |
.replaceAll("```yaml\n", "")
|
9 |
.replaceAll("```yaml", "")
|
10 |
|
11 |
+
// we remove everything after the last ``` (or ``)
|
12 |
+
rawString = rawString.split(/```?/)[0].trim()
|
13 |
+
|
14 |
|
15 |
const something: any = YAML.parse(rawString)
|
16 |
|
src/app/api/v1/create/route.ts
CHANGED
@@ -25,7 +25,7 @@ export async function POST(req: NextRequest) {
|
|
25 |
|
26 |
const prompt = `${request?.prompt || ""}`.trim()
|
27 |
|
28 |
-
console.log("[api/
|
29 |
|
30 |
if (!prompt.length) { throw new Error(`please provide a prompt`) }
|
31 |
|
@@ -46,11 +46,11 @@ export async function POST(req: NextRequest) {
|
|
46 |
prefix: "```yaml\n",
|
47 |
})
|
48 |
|
49 |
-
console.log("[api/
|
50 |
|
51 |
const shots = parseRawStringToYAML<LatentStory[]>(rawString, [])
|
52 |
|
53 |
-
console.log(`[api/
|
54 |
|
55 |
// this is approximate - TTS generation will determine the final duration of each shot
|
56 |
const defaultSegmentDurationInMs = 7000
|
@@ -76,7 +76,7 @@ export async function POST(req: NextRequest) {
|
|
76 |
|
77 |
for (const { title, image, voice } of shots) {
|
78 |
|
79 |
-
console.log(`[api/
|
80 |
|
81 |
// note: it would be nice if we could have a convention saying that
|
82 |
// track 0 is for videos and track 1 storyboards
|
|
|
25 |
|
26 |
const prompt = `${request?.prompt || ""}`.trim()
|
27 |
|
28 |
+
console.log("[api/v1/create] request:", request)
|
29 |
|
30 |
if (!prompt.length) { throw new Error(`please provide a prompt`) }
|
31 |
|
|
|
46 |
prefix: "```yaml\n",
|
47 |
})
|
48 |
|
49 |
+
console.log("[api/v1/create] rawString: ", rawString)
|
50 |
|
51 |
const shots = parseRawStringToYAML<LatentStory[]>(rawString, [])
|
52 |
|
53 |
+
console.log(`[api/v1/create] generated ${shots.length} shots`)
|
54 |
|
55 |
// this is approximate - TTS generation will determine the final duration of each shot
|
56 |
const defaultSegmentDurationInMs = 7000
|
|
|
76 |
|
77 |
for (const { title, image, voice } of shots) {
|
78 |
|
79 |
+
console.log(`[api/v1/create] - ${title}`)
|
80 |
|
81 |
// note: it would be nice if we could have a convention saying that
|
82 |
// track 0 is for videos and track 1 storyboards
|
src/app/api/v1/create/systemPrompt.ts
CHANGED
@@ -35,5 +35,5 @@ but if the user asks for large numbers, it should be ignored (our limit is 32).
|
|
35 |
voice: "Now my dog is eating my birtday cake. Please send help."
|
36 |
\`\`\
|
37 |
|
38 |
-
#
|
39 |
`
|
|
|
35 |
voice: "Now my dog is eating my birtday cake. Please send help."
|
36 |
\`\`\
|
37 |
|
38 |
+
# Your turn:
|
39 |
`
|
src/app/api/v1/create/userPrompt.ts
DELETED
File without changes
|
src/app/api/v1/edit/dialogues/processShot.ts
CHANGED
@@ -40,14 +40,16 @@ export async function processShot({
|
|
40 |
|
41 |
const { durationInMs, durationInSec, hasAudio } = await getMediaInfo(shotDialogueSegment.assetUrl)
|
42 |
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
-
|
48 |
-
|
49 |
-
s
|
50 |
-
|
|
|
|
|
51 |
|
52 |
} catch (err) {
|
53 |
console.log(`[api/generate/dialogues] processShot: failed to generate audio: ${err}`)
|
|
|
40 |
|
41 |
const { durationInMs, durationInSec, hasAudio } = await getMediaInfo(shotDialogueSegment.assetUrl)
|
42 |
|
43 |
+
if (hasAudio && durationInMs > 1000) {
|
44 |
+
shotDialogueSegment.assetDurationInMs = durationInMs
|
45 |
+
shotSegment.assetDurationInMs = durationInMs
|
46 |
+
|
47 |
+
// we update the duration of all the segments for this shot
|
48 |
+
// (it is possible that this makes the two previous lines redundant)
|
49 |
+
clap.segments.filter(s => {
|
50 |
+
s.assetDurationInMs = durationInMs
|
51 |
+
})
|
52 |
+
}
|
53 |
|
54 |
} catch (err) {
|
55 |
console.log(`[api/generate/dialogues] processShot: failed to generate audio: ${err}`)
|
src/app/api/v1/edit/storyboards/processShot.ts
CHANGED
@@ -41,7 +41,7 @@ export async function processShot({
|
|
41 |
clap.segments.push(shotStoryboardSegment)
|
42 |
}
|
43 |
|
44 |
-
console.log(`[api/
|
45 |
}
|
46 |
if (!shotStoryboardSegment) { throw new Error(`failed to generate a newSegment`) }
|
47 |
|
@@ -49,12 +49,12 @@ export async function processShot({
|
|
49 |
if (!shotStoryboardSegment?.prompt) {
|
50 |
// storyboard is missing, let's generate it
|
51 |
shotStoryboardSegment.prompt = getVideoPrompt(shotSegments, clap.entityIndex, ["high quality", "crisp", "detailed"])
|
52 |
-
console.log(`[api/
|
53 |
}
|
54 |
|
55 |
// TASK 3: GENERATE MISSING STORYBOARD BITMAP
|
56 |
if (!shotStoryboardSegment.assetUrl) {
|
57 |
-
// console.log(`[api/
|
58 |
|
59 |
try {
|
60 |
shotStoryboardSegment.assetUrl = await generateStoryboard({
|
@@ -64,13 +64,13 @@ export async function processShot({
|
|
64 |
})
|
65 |
shotStoryboardSegment.assetSourceType = getClapAssetSourceType(shotStoryboardSegment.assetUrl)
|
66 |
} catch (err) {
|
67 |
-
console.log(`[api/
|
68 |
throw err
|
69 |
}
|
70 |
|
71 |
-
console.log(`[api/
|
72 |
} else {
|
73 |
-
console.log(`[api/
|
74 |
}
|
75 |
|
76 |
}
|
|
|
41 |
clap.segments.push(shotStoryboardSegment)
|
42 |
}
|
43 |
|
44 |
+
console.log(`[api/v1/edit/storyboards] processShot: generated storyboard segment [${shotSegment.startTimeInMs}:${shotSegment.endTimeInMs}]`)
|
45 |
}
|
46 |
if (!shotStoryboardSegment) { throw new Error(`failed to generate a newSegment`) }
|
47 |
|
|
|
49 |
if (!shotStoryboardSegment?.prompt) {
|
50 |
// storyboard is missing, let's generate it
|
51 |
shotStoryboardSegment.prompt = getVideoPrompt(shotSegments, clap.entityIndex, ["high quality", "crisp", "detailed"])
|
52 |
+
console.log(`[api/v1/edit/storyboards] processShot: generating storyboard prompt: ${shotStoryboardSegment.prompt}`)
|
53 |
}
|
54 |
|
55 |
// TASK 3: GENERATE MISSING STORYBOARD BITMAP
|
56 |
if (!shotStoryboardSegment.assetUrl) {
|
57 |
+
// console.log(`[api/v1/edit/storyboards] generating image..`)
|
58 |
|
59 |
try {
|
60 |
shotStoryboardSegment.assetUrl = await generateStoryboard({
|
|
|
64 |
})
|
65 |
shotStoryboardSegment.assetSourceType = getClapAssetSourceType(shotStoryboardSegment.assetUrl)
|
66 |
} catch (err) {
|
67 |
+
console.log(`[api/v1/edit/storyboards] processShot: failed to generate an image: ${err}`)
|
68 |
throw err
|
69 |
}
|
70 |
|
71 |
+
console.log(`[api/v1/edit/storyboards] processShot: generated storyboard image: ${shotStoryboardSegment?.assetUrl?.slice?.(0, 50)}...`)
|
72 |
} else {
|
73 |
+
console.log(`[api/v1/edit/storyboards] processShot: there is already a storyboard image: ${shotStoryboardSegment?.assetUrl?.slice?.(0, 50)}...`)
|
74 |
}
|
75 |
|
76 |
}
|
src/app/api/v1/edit/storyboards/route.ts
CHANGED
@@ -23,10 +23,10 @@ export async function POST(req: NextRequest) {
|
|
23 |
|
24 |
if (!clap?.segments) { throw new Error(`no segment found in the provided clap!`) }
|
25 |
|
26 |
-
console.log(`[api/
|
27 |
|
28 |
const shotsSegments: ClapSegment[] = clap.segments.filter(s => s.category === "camera")
|
29 |
-
console.log(`[api/
|
30 |
|
31 |
if (shotsSegments.length > 32) {
|
32 |
throw new Error(`Error, this endpoint being synchronous, it is designed for short stories only (max 32 shots).`)
|
@@ -40,7 +40,7 @@ export async function POST(req: NextRequest) {
|
|
40 |
})
|
41 |
))
|
42 |
|
43 |
-
// console.log(`[api/
|
44 |
|
45 |
return new NextResponse(await serializeClap(clap), {
|
46 |
status: 200,
|
|
|
23 |
|
24 |
if (!clap?.segments) { throw new Error(`no segment found in the provided clap!`) }
|
25 |
|
26 |
+
console.log(`[api/v1/edit/storyboards] detected ${clap.segments.length} segments`)
|
27 |
|
28 |
const shotsSegments: ClapSegment[] = clap.segments.filter(s => s.category === "camera")
|
29 |
+
console.log(`[api/v1/edit/storyboards] detected ${shotsSegments.length} shots`)
|
30 |
|
31 |
if (shotsSegments.length > 32) {
|
32 |
throw new Error(`Error, this endpoint being synchronous, it is designed for short stories only (max 32 shots).`)
|
|
|
40 |
})
|
41 |
))
|
42 |
|
43 |
+
// console.log(`[api/v1/edit/storyboards] returning the clap augmented with storyboards`)
|
44 |
|
45 |
return new NextResponse(await serializeClap(clap), {
|
46 |
status: 200,
|
src/app/api/v1/search/index.ts
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
"use server"
|
2 |
+
|
3 |
+
import YAML from "yaml"
|
4 |
+
|
5 |
+
import { predict } from "@/app/api/providers/huggingface/predictWithHuggingFace"
|
6 |
+
import { parseRawStringToYAML } from "@/app/api/utils/parseRawStringToYAML"
|
7 |
+
|
8 |
+
import { systemPromptForBasicSearchResults, systemPromptForExtendedSearchResults } from "./systemPrompt"
|
9 |
+
import type { BasicSearchResult, ExtendedSearchResult } from "./types"
|
10 |
+
|
11 |
+
export async function search({
|
12 |
+
prompt = "",
|
13 |
+
nbResults = 4
|
14 |
+
}: {
|
15 |
+
prompt: string
|
16 |
+
nbResults: number
|
17 |
+
}): Promise<BasicSearchResult[]> {
|
18 |
+
const userPrompt = `${
|
19 |
+
Math.max(1, Math.min(8, nbResults))
|
20 |
+
} search results about: ${
|
21 |
+
prompt || "various trending genres"
|
22 |
+
}`
|
23 |
+
|
24 |
+
// TODO use streaming for the Hugging Face prediction
|
25 |
+
const rawString = await predict({
|
26 |
+
systemPrompt: systemPromptForBasicSearchResults,
|
27 |
+
userPrompt,
|
28 |
+
nbMaxNewTokens: nbResults * 80,
|
29 |
+
prefix: "```yaml\n",
|
30 |
+
})
|
31 |
+
|
32 |
+
console.log("rawString: ", rawString)
|
33 |
+
|
34 |
+
const results = parseRawStringToYAML<BasicSearchResult[]>(rawString, [])
|
35 |
+
|
36 |
+
return results
|
37 |
+
}
|
38 |
+
|
39 |
+
export async function extend({
|
40 |
+
basicResults = [],
|
41 |
+
}: {
|
42 |
+
basicResults: BasicSearchResult[]
|
43 |
+
}): Promise<ExtendedSearchResult[]> {
|
44 |
+
const userPrompt = YAML.stringify(basicResults)
|
45 |
+
|
46 |
+
|
47 |
+
// TODO use streaming for the Hugging Face prediction
|
48 |
+
const rawString = await predict({
|
49 |
+
systemPrompt: systemPromptForExtendedSearchResults,
|
50 |
+
userPrompt,
|
51 |
+
nbMaxNewTokens: basicResults.length * 200,
|
52 |
+
prefix: "```yaml\n",
|
53 |
+
})
|
54 |
+
|
55 |
+
console.log("rawString: ", rawString)
|
56 |
+
|
57 |
+
const results = parseRawStringToYAML<ExtendedSearchResult[]>(rawString, [])
|
58 |
+
|
59 |
+
return results
|
60 |
+
}
|
src/app/api/v1/search/route.ts
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import { NextResponse, NextRequest } from "next/server"
|
2 |
+
import queryString from "query-string"
|
3 |
+
import { BasicSearchResult, ExtendedSearchResult } from "./types"
|
4 |
+
import { extend, search } from "."
|
5 |
+
|
6 |
+
export type LatentSearchMode =
|
7 |
+
| "basic"
|
8 |
+
| "extended"
|
9 |
+
|
10 |
+
// we hide/wrap the micro-service under a unified AiTube API
|
11 |
+
export async function GET(req: NextRequest, res: NextResponse) {
|
12 |
+
|
13 |
+
const qs = queryString.parseUrl(req.url || "")
|
14 |
+
const query = (qs || {}).query
|
15 |
+
|
16 |
+
let mode: LatentSearchMode = "basic"
|
17 |
+
try {
|
18 |
+
mode = decodeURIComponent(query?.m?.toString() || "basic").trim() as LatentSearchMode
|
19 |
+
} catch (err) {}
|
20 |
+
|
21 |
+
|
22 |
+
if (mode === "basic") {
|
23 |
+
let prompt = ""
|
24 |
+
try {
|
25 |
+
prompt = decodeURIComponent(query?.p?.toString() || "").trim() as string
|
26 |
+
} catch (err) {}
|
27 |
+
|
28 |
+
const basicSearchResults: BasicSearchResult[] = await search({
|
29 |
+
prompt,
|
30 |
+
nbResults: 4
|
31 |
+
})
|
32 |
+
|
33 |
+
console.log(`[api/v1/search] found ${basicSearchResults.length} basic search results`)
|
34 |
+
console.log(`[api/v1/search]`, basicSearchResults)
|
35 |
+
|
36 |
+
return NextResponse.json(basicSearchResults, {
|
37 |
+
status: 200,
|
38 |
+
statusText: "OK",
|
39 |
+
})
|
40 |
+
} else if (mode === "extended") {
|
41 |
+
|
42 |
+
let basicResults: BasicSearchResult[] = []
|
43 |
+
try {
|
44 |
+
const rawString = decodeURIComponent(query?.e?.toString() || "").trim() as string
|
45 |
+
const maybeExistingResults = JSON.parse(rawString)
|
46 |
+
if (Array.isArray(maybeExistingResults)) {
|
47 |
+
basicResults = maybeExistingResults
|
48 |
+
}
|
49 |
+
} catch (err) {}
|
50 |
+
|
51 |
+
const extendedSearchResults: ExtendedSearchResult[] = await extend({
|
52 |
+
basicResults
|
53 |
+
})
|
54 |
+
|
55 |
+
console.log(`[api/v1/search] extended ${extendedSearchResults.length} search results`)
|
56 |
+
|
57 |
+
console.log(`[api/v1/search]`, extendedSearchResults)
|
58 |
+
|
59 |
+
return NextResponse.json(extendedSearchResults, {
|
60 |
+
status: 200,
|
61 |
+
statusText: "OK",
|
62 |
+
})
|
63 |
+
} else {
|
64 |
+
/*
|
65 |
+
return NextResponse.json([], {
|
66 |
+
status: 200,
|
67 |
+
statusText: "OK",
|
68 |
+
})
|
69 |
+
*/
|
70 |
+
throw new Error(`Please specify the mode.`)
|
71 |
+
}
|
72 |
+
}
|
src/app/api/v1/search/systemPrompt.ts
ADDED
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
export const systemPromptForBasicSearchResults: string =
|
2 |
+
`# Context
|
3 |
+
You are a server-side function generating search results from a single text input (a "prompt").
|
4 |
+
You have a database of new, never-seen-before videos, series, tv shows, movies, documentaries, music videos, found footage, news videos, videos created by influencers, game review, trailers of all kind, tutorials, education videos, user-made short videos etc.. anything you could find on both Netflix or YouTube, really.
|
5 |
+
You do not contain any existing IP (intellectual property) content.
|
6 |
+
|
7 |
+
# Task
|
8 |
+
Your mission is to generate a sequence of search results that closely match the demand by the user.
|
9 |
+
|
10 |
+
You will be provided a "prompt" (for the story) and max number of results.
|
11 |
+
|
12 |
+
Each result object is composed of:
|
13 |
+
- title: title of the video
|
14 |
+
- tags: to describe the categories and genres
|
15 |
+
# Examples
|
16 |
+
|
17 |
+
You most reply by writing/completing a YAML list of objects.
|
18 |
+
Here is a short example, the prompt was "4 search results about: cows"
|
19 |
+
Note how we asked for "4 search results" for previty, but it's possible that it will omitted. You should return 5 results by default.
|
20 |
+
but if the user asks for large numbers, it should be ignored (our limit is 8).
|
21 |
+
If the user ask for a specific cateogry eg "<something> recipes" obviously you should only show recipes to cook the thing et.
|
22 |
+
Try to be imaginative!
|
23 |
+
|
24 |
+
\`\`\`
|
25 |
+
- title: "The Cows"
|
26 |
+
tags: ["feature film", "drama", "coming of age"]
|
27 |
+
- title: "Happy cows 🐮 mooing and grazing 🌱"
|
28 |
+
tags: ["short video", "nature", "community"]
|
29 |
+
- title: "Ganja Dog - Got Milk?"
|
30 |
+
tags: ["music", "music video", "hip-hop"]
|
31 |
+
- title: "How Cows Work"
|
32 |
+
tags: ["short video", "education", "influencer"]
|
33 |
+
\`\`\
|
34 |
+
|
35 |
+
# Your turn:
|
36 |
+
`
|
37 |
+
|
38 |
+
export const systemPromptForExtendedSearchResults: string =
|
39 |
+
`# Context
|
40 |
+
You are a server-side function generating search results from partial results.
|
41 |
+
You have a database of new, never-seen-before videos, series, tv shows, movies, documentaries, music videos, found footage, news videos, videos created by influencers, game review, trailers of all kind, tutorials, education videos, user-made short videos etc.. anything you could find on both Netflix or YouTube, really.
|
42 |
+
You do not contain any existing IP (intellectual property) content.
|
43 |
+
|
44 |
+
# Task
|
45 |
+
Your mission is to generate a sequence of search results that best complements and extends the partial results.
|
46 |
+
|
47 |
+
You will be provided those partial results as YAML, and you need to return YAML.
|
48 |
+
|
49 |
+
An extended search result should contain those fields:
|
50 |
+
- title: title of the video
|
51 |
+
- cover: you must describe it using a Stable Diffusion prompt - about ~300 characters - using simple descriptive words and adjectives. Describe facts about characters, location, lights, texture, camera orientation, colors, clothes, movements etc. But don't give your opinion, don't talk about the emotions it evokes etc.
|
52 |
+
- description: in 2 or 3 sentences please describe the genre, category, visual style, synopsis (You must only describe the content, so don't add any info about the director, author, release year.)
|
53 |
+
- tags: to describe the categories and genres
|
54 |
+
# Examples
|
55 |
+
|
56 |
+
You most reply by writing/completing a YAML list of objects.
|
57 |
+
Here is a short example, using this data as input:
|
58 |
+
|
59 |
+
\`\`\`
|
60 |
+
- title: "The Cows"
|
61 |
+
tags: ["feature film", "drama", "coming of age"]
|
62 |
+
- title: "Happy cows 🐮 mooing and grazing 🌱"
|
63 |
+
tags: ["short video", "nature", "community"]
|
64 |
+
- title: "Ganja Dog - Got Milk?"
|
65 |
+
tags: ["music", "music video", "hip-hop"]
|
66 |
+
- title: "How Cows Work"
|
67 |
+
tags: ["short video", "education", "influencer"]
|
68 |
+
\`\`\
|
69 |
+
|
70 |
+
And here is one of the many possibilities:
|
71 |
+
|
72 |
+
\`\`\`
|
73 |
+
- title: "The Cows"
|
74 |
+
description: "a drama about Pete, young man growing up in a farm. His mom died, and his dad (who is sick) expects him to take over the cow farm, but Pete doesn't want to, and dreams of a different life, in the city. He often goes to the city at night, meet girls, but when he comes back late, and unable to work properly in the morning (when he makes mistake, forget to feed the cows etc) his dad grows angrier. Pete doesn't know his dad is sick, though. Near the end, the dad dies, and Pete will have to make some difficult life-changing decisions."
|
75 |
+
cover: "poster of a movie called “The Cows”, mysterious image of a farmer, alone in a grass field, in the morning, cows in the background, sad, angry, mist, award-winning, film poster, movie poster"
|
76 |
+
tags: ["feature film", "drama", "coming of age"]
|
77 |
+
- title: "Happy cows 🐮 mooing and grazing 🌱"
|
78 |
+
description: various 4K footage of cows grazing, walking, mooing, in other words being happy.
|
79 |
+
cover: "well-lit photo of cows, grazing in a field, peaceful, instagram, award winning"
|
80 |
+
tags: ["short video", "nature", "community"]
|
81 |
+
- title: "Ganja Dog - Got Milk?"
|
82 |
+
description: "a music video by Ganja Dog, a dog who is a famous rapper and influencer. The clip is shot in a farm, with Ganja Dog rapping and dancing, showing off its cars, clothes, with various people. There are various dramatic camera effects. The lyrics should be funny eg “Witch, I'm a Cow, I go Moo..”, “I'm In the Mood For Some Milk Yo” etc"
|
83 |
+
cover: "medium-shot of a dog rapper, showing off his dollars, in a cow farm, rapping, rich, cows, dogs, puppies, trending, influencer, dramatic, music video, rapping"
|
84 |
+
tags: ["music", "music video", "hip-hop"]
|
85 |
+
- title: "How Cows Work"
|
86 |
+
description: "a video explaining how cows work, made using cheap stock footage and an AI voice-over. It should show the history of cows, how they evolved, why human use them, how a farm work, how grass gets turned into milk, differences in breeds, the economics etc"
|
87 |
+
cover: "picture of a cow, drawn like a blueprint, cow factory, cow machine, clickbait youtube thumbnail made by an influencer, overly dramatic, unrealistic, fake, dramatic, overplayed, too much"
|
88 |
+
tags: ["short video", "education", "influencer"]
|
89 |
+
\`\`\
|
90 |
+
|
91 |
+
# Your turn:
|
92 |
+
`
|
src/app/api/v1/search/types.ts
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// for latent search we need to get rough results fast
|
3 |
+
export type BasicSearchResult = {
|
4 |
+
// note: the absence of ID means this is a new, latent result
|
5 |
+
id?: string
|
6 |
+
title: string
|
7 |
+
tags: string[]
|
8 |
+
}
|
9 |
+
|
10 |
+
export type ExtendedSearchResult = {
|
11 |
+
id?: string
|
12 |
+
title: string
|
13 |
+
description: string
|
14 |
+
cover: string
|
15 |
+
tags: string[]
|
16 |
+
}
|
src/app/{dream → latent}/embed/page.tsx
RENAMED
File without changes
|
src/app/{dream → latent}/samples.tsx
RENAMED
File without changes
|
src/app/{dream/spoiler.tsx → latent/search/page.tsx}
RENAMED
@@ -1,13 +1,15 @@
|
|
1 |
-
import {
|
2 |
import { clapToDataUri, generateClapFromSimpleStory } from "@aitube/clap"
|
3 |
|
4 |
-
import {
|
5 |
-
|
6 |
-
import {
|
|
|
|
|
7 |
|
8 |
// https://jmswrnr.com/blog/protecting-next-js-api-routes-query-parameters
|
9 |
|
10 |
-
export default async function
|
11 |
searchParams: {
|
12 |
l: latentContent,
|
13 |
},
|
@@ -15,7 +17,8 @@ export default async function DreamPage({
|
|
15 |
}: LatentQueryProps) {
|
16 |
const jwtToken = await getToken({ user: "anonymous" })
|
17 |
|
18 |
-
|
|
|
19 |
|
20 |
// this will hallucinate the thumbnail on the fly - maybe we should cache it
|
21 |
// const latentMedia = await searchResultToMediaInfo(latentSearchResult)
|
|
|
1 |
+
import { encode, decode } from 'js-base64'
|
2 |
import { clapToDataUri, generateClapFromSimpleStory } from "@aitube/clap"
|
3 |
|
4 |
+
import { LatentQueryProps } from "@/types/general"
|
5 |
+
|
6 |
+
import { Main } from "../../main"
|
7 |
+
import { getNewMediaInfo } from "../../api/generators/search/getNewMediaInfo"
|
8 |
+
import { getToken } from "../../api/auth/getToken"
|
9 |
|
10 |
// https://jmswrnr.com/blog/protecting-next-js-api-routes-query-parameters
|
11 |
|
12 |
+
export default async function LatentSearchPage({
|
13 |
searchParams: {
|
14 |
l: latentContent,
|
15 |
},
|
|
|
17 |
}: LatentQueryProps) {
|
18 |
const jwtToken = await getToken({ user: "anonymous" })
|
19 |
|
20 |
+
|
21 |
+
// const latentSearchResult = JSON.parse(decodee(`${latentContent}`)) as LatentSearchResult
|
22 |
|
23 |
// this will hallucinate the thumbnail on the fly - maybe we should cache it
|
24 |
// const latentMedia = await searchResultToMediaInfo(latentSearchResult)
|
src/app/latent/watch/page.tsx
ADDED
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import { encode, decode } from 'js-base64'
|
2 |
+
|
3 |
+
import { LatentQueryProps } from "@/types/general"
|
4 |
+
import { BasicSearchResult, ExtendedSearchResult } from "@/app/api/v1/search/types"
|
5 |
+
|
6 |
+
import { Main } from "../../main"
|
7 |
+
import { getNewMediaInfo } from "../../api/generators/search/getNewMediaInfo"
|
8 |
+
import { getToken } from "../../api/auth/getToken"
|
9 |
+
|
10 |
+
import { extend } from "@/app/api/v1/search"
|
11 |
+
|
12 |
+
// https://jmswrnr.com/blog/protecting-next-js-api-routes-query-parameters
|
13 |
+
|
14 |
+
export default async function DreamPage({
|
15 |
+
searchParams: {
|
16 |
+
p: prompt,
|
17 |
+
},
|
18 |
+
...rest
|
19 |
+
}: LatentQueryProps) {
|
20 |
+
const jwtToken = await getToken({ user: "anonymous" })
|
21 |
+
console.log(`[/latent/watch] prompt =`, prompt)
|
22 |
+
let basicResult = JSON.parse(decode(`${prompt || ""}`)) as BasicSearchResult
|
23 |
+
|
24 |
+
console.log("[/latent/watch] basicResult:", basicResult)
|
25 |
+
|
26 |
+
// note that we should generate a longer synopsis from the autocomplete result
|
27 |
+
//
|
28 |
+
// however that is a slow process, maybe not great for a server-side rendering task,
|
29 |
+
// so idk
|
30 |
+
const extendedResults: ExtendedSearchResult[] = await extend({
|
31 |
+
basicResults: [ basicResult ]
|
32 |
+
})
|
33 |
+
console.log(`[/latent/watch] extendedResults =`, extendedResults)
|
34 |
+
|
35 |
+
const extendedResult = extendedResults.at(0)
|
36 |
+
|
37 |
+
if (!extendedResult || !Array.isArray(extendedResult.tags)) {
|
38 |
+
console.error(`failed to generated an extended result, aborting`)
|
39 |
+
throw new Error(`Server error`)
|
40 |
+
}
|
41 |
+
// const latentSearchResult = JSON.parse(decode(`${latentContent}`)) as LatentSearchResult
|
42 |
+
|
43 |
+
// TODO: we should hallucinate the thumbnail at this stage, and on the fly
|
44 |
+
// this is useful to do it on the server-side so we can share the link on social media etc
|
45 |
+
//
|
46 |
+
// maybe we should cache the image
|
47 |
+
// const latentMedia = await searchResultToMediaInfo(latentSearchResult)
|
48 |
+
|
49 |
+
const latentMedia = getNewMediaInfo({
|
50 |
+
label: extendedResult.title,
|
51 |
+
description: extendedResult.description,
|
52 |
+
prompt: extendedResult.description,
|
53 |
+
tags: [...extendedResult.tags],
|
54 |
+
})
|
55 |
+
|
56 |
+
console.log(`[/latent/watch] generated media: `, latentMedia)
|
57 |
+
// now, generating the .clap is another story, it will be much more intensive
|
58 |
+
// so we will generate it later in async, in the client-side
|
59 |
+
|
60 |
+
return (
|
61 |
+
<Main latentMedia={latentMedia} jwtToken={jwtToken} />
|
62 |
+
)
|
63 |
+
}
|
src/app/main.tsx
CHANGED
@@ -19,6 +19,7 @@ import { PublicMediaEmbedView } from "./views/public-media-embed-view"
|
|
19 |
import { PublicMediaView } from "./views/public-media-view"
|
20 |
import { PublicLatentMediaEmbedView } from "./views/public-latent-media-embed-view"
|
21 |
import { PublicLatentMediaView } from "./views/public-latent-media-view"
|
|
|
22 |
|
23 |
// this is where we transition from the server-side space
|
24 |
// and the client-side space
|
@@ -80,6 +81,8 @@ export function Main({
|
|
80 |
const setPublicTracks = useStore(s => s.setPublicTracks)
|
81 |
const setPublicTrack = useStore(s => s.setPublicTrack)
|
82 |
|
|
|
|
|
83 |
useEffect(() => {
|
84 |
if (typeof jwtToken !== "string" && !jwtToken) { return }
|
85 |
setJwtToken(jwtToken)
|
@@ -153,13 +156,13 @@ export function Main({
|
|
153 |
console.log(latentMedia)
|
154 |
setPublicLatentMedia(latentMedia)
|
155 |
if (!latentMedia || !latentMedia?.id) { return }
|
156 |
-
if (pathname === "/
|
157 |
-
if (pathname !== "/
|
158 |
// console.log("we are on huggingface apparently!")
|
159 |
// router.replace(`/watch?v=${publicMedia.id}`)
|
160 |
|
161 |
// TODO: add params in the URL to represent the latent result
|
162 |
-
router.replace(`/
|
163 |
}
|
164 |
}, [latentMedia?.id])
|
165 |
|
@@ -196,6 +199,7 @@ export function Main({
|
|
196 |
{view === "public_media" && <PublicMediaView />}
|
197 |
|
198 |
{/* latent content is the content that "doesn't exist" (is generated by the AI) */}
|
|
|
199 |
{view === "public_latent_media_embed" && <PublicLatentMediaEmbedView />}
|
200 |
{view === "public_latent_media" && <PublicLatentMediaView />}
|
201 |
|
|
|
19 |
import { PublicMediaView } from "./views/public-media-view"
|
20 |
import { PublicLatentMediaEmbedView } from "./views/public-latent-media-embed-view"
|
21 |
import { PublicLatentMediaView } from "./views/public-latent-media-view"
|
22 |
+
import { PublicLatentSearchView } from "./views/public-latent-search-view"
|
23 |
|
24 |
// this is where we transition from the server-side space
|
25 |
// and the client-side space
|
|
|
81 |
const setPublicTracks = useStore(s => s.setPublicTracks)
|
82 |
const setPublicTrack = useStore(s => s.setPublicTrack)
|
83 |
|
84 |
+
console.log("[main.tsx] latentMedia = ", latentMedia)
|
85 |
+
|
86 |
useEffect(() => {
|
87 |
if (typeof jwtToken !== "string" && !jwtToken) { return }
|
88 |
setJwtToken(jwtToken)
|
|
|
156 |
console.log(latentMedia)
|
157 |
setPublicLatentMedia(latentMedia)
|
158 |
if (!latentMedia || !latentMedia?.id) { return }
|
159 |
+
if (pathname === "/latent/embed") { return }
|
160 |
+
if (pathname !== "/latent/watch") {
|
161 |
// console.log("we are on huggingface apparently!")
|
162 |
// router.replace(`/watch?v=${publicMedia.id}`)
|
163 |
|
164 |
// TODO: add params in the URL to represent the latent result
|
165 |
+
router.replace(`/latent/watch`)
|
166 |
}
|
167 |
}, [latentMedia?.id])
|
168 |
|
|
|
199 |
{view === "public_media" && <PublicMediaView />}
|
200 |
|
201 |
{/* latent content is the content that "doesn't exist" (is generated by the AI) */}
|
202 |
+
{view === "public_latent_search" && <PublicLatentSearchView />}
|
203 |
{view === "public_latent_media_embed" && <PublicLatentMediaEmbedView />}
|
204 |
{view === "public_latent_media" && <PublicLatentMediaView />}
|
205 |
|
src/app/state/useStore.ts
CHANGED
@@ -3,6 +3,7 @@
|
|
3 |
import { create } from "zustand"
|
4 |
|
5 |
import { ChannelInfo, MediaInfo, InterfaceDisplayMode, InterfaceView, InterfaceMenuMode, InterfaceHeaderMode, CommentInfo, UserInfo } from "@/types/general"
|
|
|
6 |
|
7 |
export const useStore = create<{
|
8 |
displayMode: InterfaceDisplayMode
|
@@ -31,8 +32,8 @@ export const useStore = create<{
|
|
31 |
searchAutocompleteQuery: string
|
32 |
setSearchAutocompleteQuery: (searchAutocompleteQuery?: string) => void
|
33 |
|
34 |
-
searchAutocompleteResults:
|
35 |
-
setSearchAutocompleteResults: (searchAutocompleteResults:
|
36 |
|
37 |
searchResults: MediaInfo[]
|
38 |
setSearchResults: (searchResults: MediaInfo[]) => void
|
@@ -118,8 +119,9 @@ export const useStore = create<{
|
|
118 |
"/embed": "public_media_embed",
|
119 |
"/music": "public_music_videos",
|
120 |
"/channels": "public_channels",
|
121 |
-
"/
|
122 |
-
"/
|
|
|
123 |
"/channel": "public_channel",
|
124 |
|
125 |
// those are reserved for future use
|
@@ -149,8 +151,8 @@ export const useStore = create<{
|
|
149 |
set({ showAutocompleteBox })
|
150 |
},
|
151 |
|
152 |
-
searchAutocompleteResults: [] as
|
153 |
-
setSearchAutocompleteResults: (searchAutocompleteResults:
|
154 |
set({ searchAutocompleteResults })
|
155 |
},
|
156 |
|
|
|
3 |
import { create } from "zustand"
|
4 |
|
5 |
import { ChannelInfo, MediaInfo, InterfaceDisplayMode, InterfaceView, InterfaceMenuMode, InterfaceHeaderMode, CommentInfo, UserInfo } from "@/types/general"
|
6 |
+
import { BasicSearchResult } from "../api/v1/search/types"
|
7 |
|
8 |
export const useStore = create<{
|
9 |
displayMode: InterfaceDisplayMode
|
|
|
32 |
searchAutocompleteQuery: string
|
33 |
setSearchAutocompleteQuery: (searchAutocompleteQuery?: string) => void
|
34 |
|
35 |
+
searchAutocompleteResults: BasicSearchResult[]
|
36 |
+
setSearchAutocompleteResults: (searchAutocompleteResults: BasicSearchResult[]) => void
|
37 |
|
38 |
searchResults: MediaInfo[]
|
39 |
setSearchResults: (searchResults: MediaInfo[]) => void
|
|
|
119 |
"/embed": "public_media_embed",
|
120 |
"/music": "public_music_videos",
|
121 |
"/channels": "public_channels",
|
122 |
+
"/latent/search": "public_latent_search",
|
123 |
+
"/latent/watch": "public_latent_media",
|
124 |
+
"/latent/embed": "public_latent_media_embed",
|
125 |
"/channel": "public_channel",
|
126 |
|
127 |
// those are reserved for future use
|
|
|
151 |
set({ showAutocompleteBox })
|
152 |
},
|
153 |
|
154 |
+
searchAutocompleteResults: [] as BasicSearchResult[],
|
155 |
+
setSearchAutocompleteResults: (searchAutocompleteResults: BasicSearchResult[]) => {
|
156 |
set({ searchAutocompleteResults })
|
157 |
},
|
158 |
|
src/app/views/public-latent-search-view/index.tsx
ADDED
@@ -0,0 +1,49 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
"use client"
|
2 |
+
|
3 |
+
import { useEffect, useTransition } from "react"
|
4 |
+
|
5 |
+
import { useStore } from "@/app/state/useStore"
|
6 |
+
import { cn } from "@/lib/utils/cn"
|
7 |
+
import { MediaInfo } from "@/types/general"
|
8 |
+
import { getVideos } from "@/app/api/actions/ai-tube-hf/getVideos"
|
9 |
+
import { VideoList } from "@/components/interface/video-list"
|
10 |
+
|
11 |
+
export function PublicLatentSearchView() {
|
12 |
+
const [_isPending, startTransition] = useTransition()
|
13 |
+
const setView = useStore(s => s.setView)
|
14 |
+
const currentTag = useStore(s => s.currentTag)
|
15 |
+
const setPublicMedias = useStore(s => s.setPublicMedias)
|
16 |
+
const setPublicMedia = useStore(s => s.setPublicMedia)
|
17 |
+
const publicMedias = useStore(s => s.publicMedias)
|
18 |
+
|
19 |
+
useEffect(() => {
|
20 |
+
startTransition(async () => {
|
21 |
+
const medias = await getVideos({
|
22 |
+
sortBy: "date",
|
23 |
+
mandatoryTags: currentTag ? [currentTag] : [],
|
24 |
+
maxNbMedias: 25
|
25 |
+
})
|
26 |
+
|
27 |
+
// due to some caching on the first function.. we update with fresh data!
|
28 |
+
// const updatedVideos = await extendVideosWithStats(medias)
|
29 |
+
|
30 |
+
setPublicMedias(medias)
|
31 |
+
})
|
32 |
+
}, [currentTag])
|
33 |
+
|
34 |
+
const handleSelect = (media: MediaInfo) => {
|
35 |
+
setView("public_latent_media")
|
36 |
+
setPublicMedia(media)
|
37 |
+
}
|
38 |
+
|
39 |
+
return (
|
40 |
+
<div className={cn(
|
41 |
+
`sm:pr-4`
|
42 |
+
)}>
|
43 |
+
<VideoList
|
44 |
+
items={publicMedias}
|
45 |
+
onSelect={handleSelect}
|
46 |
+
/>
|
47 |
+
</div>
|
48 |
+
)
|
49 |
+
}
|
src/components/interface/latent-engine/core/engine.tsx
CHANGED
@@ -14,7 +14,7 @@ import { localStorageKeys } from "@/app/state/localStorageKeys"
|
|
14 |
import { defaultSettings } from "@/app/state/defaultSettings"
|
15 |
import { useStore } from "@/app/state/useStore"
|
16 |
import { ClapProject, generateClapFromSimpleStory, serializeClap } from "@aitube/clap"
|
17 |
-
import { theSimps } from "@/app/
|
18 |
|
19 |
function LatentEngine({
|
20 |
media,
|
@@ -76,29 +76,27 @@ function LatentEngine({
|
|
76 |
const videoLayerRef = useRef<HTMLDivElement>(null)
|
77 |
const segmentationLayerRef = useRef<HTMLDivElement>(null)
|
78 |
|
79 |
-
const mediaUrl = media.clapUrl || media.assetUrlHd || media.assetUrl
|
80 |
-
|
81 |
useEffect(() => {
|
82 |
-
if (!stateRef.current.isInitialized
|
83 |
stateRef.current.isInitialized = true
|
84 |
|
85 |
const fn = async () => {
|
86 |
-
//
|
87 |
-
//
|
|
|
|
|
88 |
|
89 |
-
// open(mediaUrl)
|
90 |
const mockClap: ClapProject = generateClapFromSimpleStory({
|
91 |
-
story: theSimps
|
|
|
|
|
92 |
})
|
93 |
-
|
94 |
-
|
95 |
-
// const mockDataUri = await blobToDataUri(mockArchive, "application/x-gzip")
|
96 |
-
// console.log("mockDataUri:", mockDataUri)
|
97 |
-
open(mockArchive)
|
98 |
}
|
99 |
fn()
|
100 |
}
|
101 |
-
}, [
|
102 |
|
103 |
const isPlayingRef = useRef(isPlaying)
|
104 |
isPlayingRef.current = isPlaying
|
|
|
14 |
import { defaultSettings } from "@/app/state/defaultSettings"
|
15 |
import { useStore } from "@/app/state/useStore"
|
16 |
import { ClapProject, generateClapFromSimpleStory, serializeClap } from "@aitube/clap"
|
17 |
+
import { theSimps } from "@/app/latent/samples"
|
18 |
|
19 |
function LatentEngine({
|
20 |
media,
|
|
|
76 |
const videoLayerRef = useRef<HTMLDivElement>(null)
|
77 |
const segmentationLayerRef = useRef<HTMLDivElement>(null)
|
78 |
|
|
|
|
|
79 |
useEffect(() => {
|
80 |
+
if (!stateRef.current.isInitialized) {
|
81 |
stateRef.current.isInitialized = true
|
82 |
|
83 |
const fn = async () => {
|
84 |
+
// if we have a clapUrl (eg. from the database) then we use that
|
85 |
+
// otherwise we generate it ourselves, chunk by chunk (since we're live)
|
86 |
+
|
87 |
+
// TODO Julian work on the chunk mechanism
|
88 |
|
|
|
89 |
const mockClap: ClapProject = generateClapFromSimpleStory({
|
90 |
+
story: theSimps,
|
91 |
+
showIntroPoweredByEngine: false,
|
92 |
+
showIntroDisclaimerAboutAI: false
|
93 |
})
|
94 |
+
|
95 |
+
open(mockClap)
|
|
|
|
|
|
|
96 |
}
|
97 |
fn()
|
98 |
}
|
99 |
+
}, [media.id])
|
100 |
|
101 |
const isPlayingRef = useRef(isPlaying)
|
102 |
isPlayingRef.current = isPlaying
|
src/components/interface/latent-search-input/index.tsx
ADDED
@@ -0,0 +1,157 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import { useRef, useState, useTransition } from "react"
|
2 |
+
import Link from "next/link"
|
3 |
+
import { encode, decode } from 'js-base64'
|
4 |
+
// import throttle from "@jcoreio/async-throttle"
|
5 |
+
import debounce from "lodash.debounce"
|
6 |
+
import { GoSearch } from "react-icons/go"
|
7 |
+
|
8 |
+
import { useStore } from "@/app/state/useStore"
|
9 |
+
import { cn } from "@/lib/utils/cn"
|
10 |
+
import { Input } from "@/components/ui/input"
|
11 |
+
import { Button } from "@/components/ui/button"
|
12 |
+
import { MediaInfo } from "@/types/general"
|
13 |
+
import { search } from "@/app/api/v1/search"
|
14 |
+
|
15 |
+
export function LatentSearchInput() {
|
16 |
+
const [_pending, startTransition] = useTransition()
|
17 |
+
|
18 |
+
const setSearchAutocompleteQuery = useStore(s => s.setSearchAutocompleteQuery)
|
19 |
+
const showAutocompleteBox = useStore(s => s.showAutocompleteBox)
|
20 |
+
const setShowAutocompleteBox = useStore(s => s.setShowAutocompleteBox)
|
21 |
+
|
22 |
+
const searchAutocompleteResults = useStore(s => s.searchAutocompleteResults)
|
23 |
+
const setSearchAutocompleteResults = useStore(s => s.setSearchAutocompleteResults)
|
24 |
+
|
25 |
+
const setSearchQuery = useStore(s => s.setSearchQuery)
|
26 |
+
|
27 |
+
const [searchDraft, setSearchDraft] = useState("")
|
28 |
+
|
29 |
+
const ref = useRef<HTMLInputElement>(null)
|
30 |
+
|
31 |
+
|
32 |
+
// called when pressing enter or clicking on search
|
33 |
+
const debouncedSearch = debounce((query: string) => {
|
34 |
+
startTransition(async () => {
|
35 |
+
console.log(`searching the latent space for "${query}"..`)
|
36 |
+
|
37 |
+
if (query.length < 2) { console.log("search term is too short") }
|
38 |
+
|
39 |
+
console.log("imaginating medias..")
|
40 |
+
|
41 |
+
const imaginedMedias = await search({
|
42 |
+
prompt: query,
|
43 |
+
nbResults: 4
|
44 |
+
})
|
45 |
+
|
46 |
+
console.log(`imagined ${imaginedMedias.length} results:`, imaginedMedias)
|
47 |
+
|
48 |
+
setSearchAutocompleteResults(imaginedMedias.map(item => ({
|
49 |
+
title: item.title,
|
50 |
+
tags: item.tags,
|
51 |
+
})))
|
52 |
+
|
53 |
+
// TODO: only close the show autocomplete box if we found something
|
54 |
+
// setShowAutocompleteBox(false)
|
55 |
+
})
|
56 |
+
}, 500)
|
57 |
+
|
58 |
+
// called when pressing enter or clicking on search
|
59 |
+
const handleSearch = () => {
|
60 |
+
ref.current?.focus()
|
61 |
+
setSearchQuery(searchDraft)
|
62 |
+
setShowAutocompleteBox(true)
|
63 |
+
debouncedSearch(searchDraft)
|
64 |
+
}
|
65 |
+
|
66 |
+
return (
|
67 |
+
<div className="flex flex-row flex-grow w-[380px] lg:w-[600px]">
|
68 |
+
|
69 |
+
<div className="flex flex-row w-full">
|
70 |
+
<Input
|
71 |
+
ref={ref}
|
72 |
+
placeholder="Search the latent space"
|
73 |
+
className={cn(
|
74 |
+
`bg-neutral-900 text-neutral-200 dark:bg-neutral-900 dark:text-neutral-200`,
|
75 |
+
`rounded-l-full rounded-r-none`,
|
76 |
+
|
77 |
+
// we increase the line height to better catch the clicks
|
78 |
+
`py-0 h-10 leading-7`,
|
79 |
+
|
80 |
+
`border-neutral-700 dark:border-neutral-700 border-r-0`,
|
81 |
+
|
82 |
+
)}
|
83 |
+
onFocus={() => {
|
84 |
+
handleSearch()
|
85 |
+
}}
|
86 |
+
onChange={(e) => {
|
87 |
+
setSearchDraft(e.target.value)
|
88 |
+
setShowAutocompleteBox(true)
|
89 |
+
// handleSearch()
|
90 |
+
}}
|
91 |
+
onKeyDown={({ key }) => {
|
92 |
+
if (key === 'Enter') {
|
93 |
+
handleSearch()
|
94 |
+
}
|
95 |
+
}}
|
96 |
+
value={searchDraft}
|
97 |
+
/>
|
98 |
+
<Button
|
99 |
+
className={cn(
|
100 |
+
`rounded-l-none rounded-r-full border border-neutral-700 dark:border-neutral-700`,
|
101 |
+
`cursor-pointer`,
|
102 |
+
`transition-all duration-200 ease-in-out`,
|
103 |
+
`text-neutral-200 dark:text-neutral-200 bg-neutral-800 dark:bg-neutral-800 hover:bg-neutral-700 disabled:bg-neutral-900`
|
104 |
+
)}
|
105 |
+
onClick={() => {
|
106 |
+
handleSearch()
|
107 |
+
// console.log("submit")
|
108 |
+
// setShowAutocompleteBox(false)
|
109 |
+
// setSearchDraft("")
|
110 |
+
}}
|
111 |
+
disabled={false}
|
112 |
+
>
|
113 |
+
<GoSearch className="w-6 h-6" />
|
114 |
+
</Button>
|
115 |
+
</div>
|
116 |
+
<div
|
117 |
+
className={cn(
|
118 |
+
`absolute z-50 ml-1`,
|
119 |
+
|
120 |
+
// please keep this in sync with the parent
|
121 |
+
`w-[320px] lg:w-[540px]`,
|
122 |
+
|
123 |
+
`text-neutral-200 dark:text-neutral-200 bg-neutral-900 dark:bg-neutral-900`,
|
124 |
+
`border border-neutral-800 dark:border-neutral-800`,
|
125 |
+
`rounded-xl shadow-2xl`,
|
126 |
+
`flex flex-col p-2 space-y-1`,
|
127 |
+
|
128 |
+
`transition-all duration-200 ease-in-out`,
|
129 |
+
showAutocompleteBox
|
130 |
+
? `opacity-100 scale-100 mt-11 pointer-events-auto`
|
131 |
+
: `opacity-0 scale-95 mt-6 pointer-events-none`
|
132 |
+
)}
|
133 |
+
>
|
134 |
+
{searchAutocompleteResults.length === 0 ? <div>Nothing to show, type something and press enter</div> : null}
|
135 |
+
{searchAutocompleteResults.map(item => (
|
136 |
+
<Link key={item.id} href={
|
137 |
+
item.id
|
138 |
+
? `${process.env.NEXT_PUBLIC_DOMAIN}/watch?v=${item.id}`
|
139 |
+
: `${process.env.NEXT_PUBLIC_DOMAIN}/latent/watch?p=${encode(JSON.stringify(item))}`
|
140 |
+
}>
|
141 |
+
<div
|
142 |
+
className={cn(
|
143 |
+
`dark:hover:bg-neutral-800 hover:bg-neutral-800`,
|
144 |
+
`text-sm`,
|
145 |
+
`px-3 py-2`,
|
146 |
+
`rounded-xl`
|
147 |
+
)}
|
148 |
+
|
149 |
+
>
|
150 |
+
{item.title}
|
151 |
+
</div>
|
152 |
+
</Link>
|
153 |
+
))}
|
154 |
+
</div>
|
155 |
+
</div>
|
156 |
+
)
|
157 |
+
}
|
src/components/interface/media-player/index.tsx
CHANGED
@@ -25,7 +25,6 @@ export function MediaPlayer({
|
|
25 |
console.log("MediaPlayer called for \"" + media?.label + "\"")
|
26 |
|
27 |
if (!media) { return null }
|
28 |
-
if (!media?.assetUrl && !media?.clapUrl) { return null }
|
29 |
|
30 |
// uncomment one of those to forcefully test the .clap player from an external .clap file
|
31 |
// media.assetUrlHd = "https://huggingface.co/datasets/jbilcke/ai-tube-cinema/tree/main/404.clap"
|
@@ -48,6 +47,8 @@ export function MediaPlayer({
|
|
48 |
)
|
49 |
}
|
50 |
|
|
|
|
|
51 |
if (projectionType === "gaussian") {
|
52 |
// note: for AutoSizer to work properly it needs to be inside a normal div with no display: "flex"
|
53 |
return (
|
|
|
25 |
console.log("MediaPlayer called for \"" + media?.label + "\"")
|
26 |
|
27 |
if (!media) { return null }
|
|
|
28 |
|
29 |
// uncomment one of those to forcefully test the .clap player from an external .clap file
|
30 |
// media.assetUrlHd = "https://huggingface.co/datasets/jbilcke/ai-tube-cinema/tree/main/404.clap"
|
|
|
47 |
)
|
48 |
}
|
49 |
|
50 |
+
if (!media?.assetUrl && !media?.assetUrlHd) { return null }
|
51 |
+
|
52 |
if (projectionType === "gaussian") {
|
53 |
// note: for AutoSizer to work properly it needs to be inside a normal div with no display: "flex"
|
54 |
return (
|
src/components/interface/search-input/index.tsx
CHANGED
@@ -1,5 +1,6 @@
|
|
1 |
import { useRef, useState, useTransition } from "react"
|
2 |
import Link from "next/link"
|
|
|
3 |
// import throttle from "@jcoreio/async-throttle"
|
4 |
import debounce from "lodash.debounce"
|
5 |
import { GoSearch } from "react-icons/go"
|
@@ -32,7 +33,7 @@ export function SearchInput() {
|
|
32 |
startTransition(async () => {
|
33 |
console.log(`searching for "${query}"..`)
|
34 |
|
35 |
-
const
|
36 |
query,
|
37 |
sortBy: "match",
|
38 |
maxNbMedias: 8,
|
@@ -40,8 +41,14 @@ export function SearchInput() {
|
|
40 |
renewCache: false, // bit of optimization
|
41 |
})
|
42 |
|
43 |
-
console.log(`got ${
|
44 |
-
setSearchAutocompleteResults(
|
|
|
|
|
|
|
|
|
|
|
|
|
45 |
|
46 |
// TODO: only close the show autocomplete box if we found something
|
47 |
// setShowAutocompleteBox(false)
|
@@ -125,8 +132,12 @@ export function SearchInput() {
|
|
125 |
)}
|
126 |
>
|
127 |
{searchAutocompleteResults.length === 0 ? <div>Nothing to show, type something and press enter</div> : null}
|
128 |
-
{searchAutocompleteResults.map(
|
129 |
-
<Link key={
|
|
|
|
|
|
|
|
|
130 |
<div
|
131 |
className={cn(
|
132 |
`dark:hover:bg-neutral-800 hover:bg-neutral-800`,
|
@@ -136,7 +147,7 @@ export function SearchInput() {
|
|
136 |
)}
|
137 |
|
138 |
>
|
139 |
-
{
|
140 |
</div>
|
141 |
</Link>
|
142 |
))}
|
|
|
1 |
import { useRef, useState, useTransition } from "react"
|
2 |
import Link from "next/link"
|
3 |
+
import { encode, decode } from 'js-base64'
|
4 |
// import throttle from "@jcoreio/async-throttle"
|
5 |
import debounce from "lodash.debounce"
|
6 |
import { GoSearch } from "react-icons/go"
|
|
|
33 |
startTransition(async () => {
|
34 |
console.log(`searching for "${query}"..`)
|
35 |
|
36 |
+
const medias = await getVideos({
|
37 |
query,
|
38 |
sortBy: "match",
|
39 |
maxNbMedias: 8,
|
|
|
41 |
renewCache: false, // bit of optimization
|
42 |
})
|
43 |
|
44 |
+
console.log(`got ${medias.length} results!`)
|
45 |
+
setSearchAutocompleteResults(medias.map(item => ({
|
46 |
+
id: item.id,
|
47 |
+
title: item.label,
|
48 |
+
tags: item.tags,
|
49 |
+
})))
|
50 |
+
|
51 |
+
|
52 |
|
53 |
// TODO: only close the show autocomplete box if we found something
|
54 |
// setShowAutocompleteBox(false)
|
|
|
132 |
)}
|
133 |
>
|
134 |
{searchAutocompleteResults.length === 0 ? <div>Nothing to show, type something and press enter</div> : null}
|
135 |
+
{searchAutocompleteResults.map(item => (
|
136 |
+
<Link key={item.id} href={
|
137 |
+
item.id
|
138 |
+
? `${process.env.NEXT_PUBLIC_DOMAIN}/watch?v=${item.id}`
|
139 |
+
: `${process.env.NEXT_PUBLIC_DOMAIN}/latent/watch?p=${encode(JSON.stringify(item))}`
|
140 |
+
}>
|
141 |
<div
|
142 |
className={cn(
|
143 |
`dark:hover:bg-neutral-800 hover:bg-neutral-800`,
|
|
|
147 |
)}
|
148 |
|
149 |
>
|
150 |
+
{item.title}
|
151 |
</div>
|
152 |
</Link>
|
153 |
))}
|
src/components/interface/top-header/index.tsx
CHANGED
@@ -11,6 +11,7 @@ import Link from 'next/link'
|
|
11 |
import { Input } from '@/components/ui/input'
|
12 |
import { Button } from '@/components/ui/button'
|
13 |
import { SearchInput } from '../search-input'
|
|
|
14 |
import { pathway } from '@/lib/fonts'
|
15 |
|
16 |
export function TopHeader() {
|
@@ -122,7 +123,11 @@ export function TopHeader() {
|
|
122 |
`px-4 py-2 w-max-64`,
|
123 |
`text-neutral-400 text-2xs sm:text-xs lg:text-sm italic`
|
124 |
)}>
|
125 |
-
|
|
|
|
|
|
|
|
|
126 |
</div>
|
127 |
<div className={cn("w-32 xl:w-42")}>
|
128 |
<span>
|
|
|
11 |
import { Input } from '@/components/ui/input'
|
12 |
import { Button } from '@/components/ui/button'
|
13 |
import { SearchInput } from '../search-input'
|
14 |
+
import { LatentSearchInput } from '../latent-search-input'
|
15 |
import { pathway } from '@/lib/fonts'
|
16 |
|
17 |
export function TopHeader() {
|
|
|
123 |
`px-4 py-2 w-max-64`,
|
124 |
`text-neutral-400 text-2xs sm:text-xs lg:text-sm italic`
|
125 |
)}>
|
126 |
+
{view === "public_latent_search" ||
|
127 |
+
view === "public_latent_media" ||
|
128 |
+
view === "public_latent_media_embed"
|
129 |
+
? <LatentSearchInput />
|
130 |
+
: <SearchInput />}
|
131 |
</div>
|
132 |
<div className={cn("w-32 xl:w-42")}>
|
133 |
<span>
|
src/types/general.ts
CHANGED
@@ -636,6 +636,7 @@ export type InterfaceView =
|
|
636 |
| "public_media" // public view of an individual media (video, gaussian splat, clap video)
|
637 |
| "public_media_embed" // for integration into twitter etc
|
638 |
| "public_music_videos" // public music videos - it's a special category, because music is *cool*
|
|
|
639 |
| "public_latent_media" // public view of an individual dream (a latent media, so it's not a "real" file)
|
640 |
| "public_latent_media_embed" // for integration into twitter etc (which would be hardcore for our server load.. so maybe not)
|
641 |
| "public_gaming" // for AiTube Gaming
|
@@ -712,7 +713,7 @@ export type AppQueryProps = {
|
|
712 |
export type LatentQueryProps = {
|
713 |
params: { jwtToken: string }
|
714 |
searchParams: {
|
715 |
-
|
716 |
[key: string]: string | string[] | undefined
|
717 |
}
|
718 |
}
|
|
|
636 |
| "public_media" // public view of an individual media (video, gaussian splat, clap video)
|
637 |
| "public_media_embed" // for integration into twitter etc
|
638 |
| "public_music_videos" // public music videos - it's a special category, because music is *cool*
|
639 |
+
| "public_latent_search" // public view of latent search results
|
640 |
| "public_latent_media" // public view of an individual dream (a latent media, so it's not a "real" file)
|
641 |
| "public_latent_media_embed" // for integration into twitter etc (which would be hardcore for our server load.. so maybe not)
|
642 |
| "public_gaming" // for AiTube Gaming
|
|
|
713 |
export type LatentQueryProps = {
|
714 |
params: { jwtToken: string }
|
715 |
searchParams: {
|
716 |
+
p?: string | string[], // search result content (serialized to a base64 json)
|
717 |
[key: string]: string | string[] | undefined
|
718 |
}
|
719 |
}
|