Minor improvements to viz and params

2022-11-25 21:17:29 -08:00 · 2022-11-25 21:17:29 -08:00 · 35a90ec979
parent 5a23032fb8
commit 35a90ec979
4 changed files with 36 additions and 20 deletions
--- a/components/HeightMapImage.tsx
+++ b/components/HeightMapImage.tsx
@@ -38,7 +38,7 @@ export default function HeightMapImage(props: HeightMapImageProps) {
          // Feed the heightmap
          bumpTexture: { value: heightMap },
          // Feed the scaling constant for the heightmap
-          bumpScale: { value: -0.2 },
+          bumpScale: { value: -0.5 },
          // Feed the texture map
          terrainTexture: { value: textureMap },
        }}
--- a/components/SpectrogramViewer.tsx
+++ b/components/SpectrogramViewer.tsx
@@ -39,15 +39,17 @@ export default function SpectrogramViewer({
    playheadRef.current.position.y = camera.position.y;
  });

+  const playbarShift = 3.6; // [m]
+
  return (
    <group>
      {inferenceResults.map((value: InferenceResult, index: number) => {
-        const height = audioLength * (-0.48 - value.counter);
+        const position = audioLength * (-0.53 - value.counter) + playbarShift;
        if (use_height_map) {
          return (
            <HeightMapImage
              url={value.image}
-              position={[0, height, 0]}
+              position={[0, position, 0]}
              rotation={[0, 0, -Math.PI / 2]}
              scale={[audioLength, 5, 1]}
              key={index}
@@ -57,7 +59,7 @@ export default function SpectrogramViewer({
          return (
            <ImagePlane
              url={value.image}
-              height={height}
+              height={position}
              duration={audioLength}
              key={index}
            />
@@ -69,10 +71,10 @@ export default function SpectrogramViewer({
      <group ref={playheadRef}>
        <Box
          args={[5.5, 2.0, 0.15]}
-          rotation={[Math.PI / 2 - 0.4, 0, 0]}
-          position={[0, 0, -0.5]}
+          rotation={[Math.PI / 2 - 0.2, 0, 0]}
+          position={[0, playbarShift, -0.5]}
        >
-          <meshBasicMaterial color="#ee2211" transparent opacity={0.7} />
+          <meshBasicMaterial color="#ee2211" transparent opacity={0.8} />
        </Box>
      </group>
    </group>
--- a/pages/index.tsx
+++ b/pages/index.tsx
@@ -16,7 +16,7 @@ const SERVER_URL = "http://129.146.52.68:3013/run_inference/";
 const defaultPromptInputs = [
  { prompt: "A jazz pianist playing a classical concerto" },
  { prompt: "Country singer and a techno DJ" },
-  { prompt: "A typewriter in they style of K-Pop" },
+  { prompt: "A typewriter in the style of K-Pop" },
  { prompt: "lo-fi beat for the holidays" },
  { prompt: "" },
  { prompt: "" },
@@ -264,15 +264,28 @@ export default function Home() {

    const transitioning = appState == AppState.Transition;

+    const denoising = 0.85;
+    const guidance = 7.0;
+    const numInferenceSteps = 50;
+    const seedImageId = 0;
+    const maskImageId = null;
+
    const inferenceInput = {
      alpha: alpha,
+      num_inference_steps: numInferenceSteps,
+      seed_image_id: seedImageId,
+      mask_image_id: maskImageId,
      start: {
        prompt: startPrompt,
        seed: seed,
+        denoising: denoising,
+        guidance: guidance,
      },
      end: {
        prompt: transitioning ? endPrompt : startPrompt,
        seed: transitioning ? seed : seed + 1,
+        denoising: denoising,
+        guidance: guidance,
      },
    };

@@ -324,6 +337,8 @@ export default function Home() {
    });
  };

+  // Run inference on a timer.
+  // TODO(hayk): Improve the strategy here.
  useInterval(() => {
    console.log(inferenceResults);
    if (inferenceResults.length < maxNumInferenceResults) {
@@ -331,8 +346,6 @@ export default function Home() {
    }
  }, timeout);

-  // Run inference on a timer.
-  // TODO(hayk): Improve the timing here.
  // TODO(hayk): Fix warning about effects.
  useEffect(() => {
    runInference(alpha, seed, appState, promptInputs);
@@ -351,14 +364,14 @@ export default function Home() {

      <div className="bg-[#0A2342] flex flex-row min-h-screen text-white">
        <div className="w-1/3 min-h-screen">
-          {tonePlayer && (
          <ThreeCanvas
            paused={paused}
            getTime={() => Tone.Transport.seconds}
-              audioLength={tonePlayer.sampleTime * tonePlayer.buffer.length}
+            audioLength={
+              tonePlayer ? tonePlayer.sampleTime * tonePlayer.buffer.length : 0
+            }
            inferenceResults={inferenceResults}
          />
-          )}
        </div>

        <PromptPanel
--- a/types.ts
+++ b/types.ts
@@ -7,8 +7,9 @@ export interface PromptInput {

 export interface InferenceInput {
    alpha: number;
-    // num_inference_steps: number;
-    // seed_image_id: number;
+    num_inference_steps?: number;
+    seed_image_id?: number;
+    mask_image_id?: string;

    start: PromptInput;
    end: PromptInput;