Real-Time-Latent-Consistency-Model-Text-To-Image

Runtime error

App Files Files Community

radames committed on Nov 7, 2023

Commit

9b79b03

1 Parent(s): c4a002d

add other params

Browse files

Files changed (2) hide show

app-txt2img.py +9 -7
txt2img/index.html +57 -28

app-txt2img.py CHANGED Viewed

@@ -76,9 +76,9 @@ pipe.unet.to(memory_format=torch.channels_last)
 if psutil.virtual_memory().total < 64 * 1024**3:
     pipe.enable_attention_slicing()
-if not mps_available and not xpu_available:
-    pipe.unet = torch.compile(pipe.unet, mode="reduce-overhead", fullgraph=True)
-    pipe(prompt="warmup", num_inference_steps=1, guidance_scale=8.0)
 compel_proc = Compel(
     tokenizer=pipe.tokenizer,
@@ -89,9 +89,12 @@ user_queue_map = {}
 class InputParams(BaseModel):
-    prompt: str
     seed: int = 2159232
     guidance_scale: float = 8.0
     width: int = WIDTH
     height: int = HEIGHT
@@ -100,15 +103,14 @@ def predict(params: InputParams):
     generator = torch.manual_seed(params.seed)
     prompt_embeds = compel_proc(params.prompt)
     # Can be set to 1~50 steps. LCM support fast inference even <= 4 steps. Recommend: 1~8 steps.
-    num_inference_steps = 4
     results = pipe(
         prompt_embeds=prompt_embeds,
         generator=generator,
-        num_inference_steps=num_inference_steps,
         guidance_scale=params.guidance_scale,
         width=params.width,
         height=params.height,
-        original_inference_steps=50,
         output_type="pil",
     )
     nsfw_content_detected = (

 if psutil.virtual_memory().total < 64 * 1024**3:
     pipe.enable_attention_slicing()
+# if not mps_available and not xpu_available:
+#     pipe.unet = torch.compile(pipe.unet, mode="reduce-overhead", fullgraph=True)
+#     pipe(prompt="warmup", num_inference_steps=1, guidance_scale=8.0)
 compel_proc = Compel(
     tokenizer=pipe.tokenizer,
 class InputParams(BaseModel):
     seed: int = 2159232
+    prompt: str
     guidance_scale: float = 8.0
+    strength: float = 0.5
+    steps: int = 4
+    lcm_steps: int = 50
     width: int = WIDTH
     height: int = HEIGHT
     generator = torch.manual_seed(params.seed)
     prompt_embeds = compel_proc(params.prompt)
     # Can be set to 1~50 steps. LCM support fast inference even <= 4 steps. Recommend: 1~8 steps.
     results = pipe(
         prompt_embeds=prompt_embeds,
         generator=generator,
+        num_inference_steps=params.steps,
         guidance_scale=params.guidance_scale,
         width=params.width,
         height=params.height,
+        original_inference_steps=params.lcm_steps,
         output_type="pil",
     )
     nsfw_content_detected = (

txt2img/index.html CHANGED Viewed

@@ -15,10 +15,12 @@
         }
     </style>
     <script type="module">
-        const seedEl = document.querySelector("#seed");
-        const promptEl = document.querySelector("#prompt");
-        const guidanceEl = document.querySelector("#guidance-scale");
         const startBtn = document.querySelector("#start");
         const stopBtn = document.querySelector("#stop");
         const videoEl = document.querySelector("#webcam");
@@ -26,8 +28,9 @@
         const queueSizeEl = document.querySelector("#queue_size");
         const errorEl = document.querySelector("#error");
         const snapBtn = document.querySelector("#snap");
-        function LCMLive(promptEl, liveImage, seedEl, guidanceEl) {
             let websocket;
             async function start() {
@@ -69,15 +72,17 @@
                 })
             }
-            async function promptUpdateStream() {
-                const prompt = promptEl.value;
-                console.log(prompt);
-                const seed = seedEl.value;
-                const guidance_scale = guidanceEl.value;
                 websocket.send(JSON.stringify({
-                    prompt: prompt,
-                    seed: seed,
-                    guidance_scale: guidance_scale,
                 }));
             }
             function debouceInput(fn, delay) {
@@ -92,16 +97,12 @@
             const debouncedInput = debouceInput(promptUpdateStream, 200);
             function initPromptStream(userId) {
                 liveImage.src = `/stream/${userId}`;
-                promptEl.addEventListener("input", debouncedInput);
-                seedEl.addEventListener("input", debouncedInput);
-                guidanceEl.addEventListener("change", debouncedInput);
             }
             async function stop() {
                 websocket.close();
-                promptEl.removeEventListener("input",  debouncedInput);
-                seedEl.removeEventListener("input", debouncedInput);
-                guidanceEl.removeEventListener("change", debouncedInput);
             }
             return {
                 start,
@@ -131,7 +132,7 @@
                 const exif = {};
                 const gps = {};
                 zeroth[piexif.ImageIFD.Make] = "LCM Text-to-Image";
-                zeroth[piexif.ImageIFD.ImageDescription] = `prompt: ${promptEl.value} | seed: ${seedEl.value} | guidance: ${guidanceEl.value}`;
                 zeroth[piexif.ImageIFD.Software] = "https://github.com/radames/Real-Time-Latent-Consistency-Model";
                 exif[piexif.ExifIFD.DateTimeOriginal] = new Date().toISOString();
@@ -157,7 +158,7 @@
         }
-        const lcmLive = LCMLive(promptEl, imageEl, seedEl, guidanceEl);
         startBtn.addEventListener("click", async () => {
             try {
                 startBtn.disabled = true;
@@ -233,22 +234,50 @@
         <div class="">
             <details>
                 <summary class="font-medium cursor-pointer">Advanced Options</summary>
-                <div class="grid grid-cols-3 max-w-md items-center gap-3 py-3">
                     <label class="text-sm font-medium" for="guidance-scale">Guidance Scale
                     </label>
-                    <input type="range" id="guidance-scale" name="guidance-scale" min="1" max="30" step="0.001"
                         value="8.0" oninput="this.nextElementSibling.value = Number(this.value).toFixed(2)">
                     <output class="text-xs w-[50px] text-center font-light px-1 py-1 border border-gray-700 rounded-md">
                         8.0</output>
                     <label class="text-sm font-medium" for="seed">Seed</label>
                     <input type="number" id="seed" name="seed" value="299792458"
                         class="font-light border border-gray-700 text-right rounded-md p-2 dark:text-black">
-                    <button
-                        onclick="document.querySelector('#seed').value = Math.floor(Math.random() * Number.MAX_SAFE_INTEGER); document.querySelector('#seed').dispatchEvent(new Event('input'));"
-                        class="button">
                         Rand
                     </button>
-                </div>
             </details>
         </div>
         <div class="flex gap-3">

         }
     </style>
     <script type="module">
+        const getValue = (id) => { // Look up one element and return its current value; `id` is handed to querySelector, so callers pass a CSS selector (e.g. "#seed").
+            const el = document.querySelector(`${id}`) // No null check: a selector that matches nothing makes the next line throw.
+            if (el.type === "checkbox") // Checkboxes are read through `checked` rather than `value`.
+                return el.checked;
+            return el.value; // Every other element type: return its `value` property as-is.
+        }
         const startBtn = document.querySelector("#start");
         const stopBtn = document.querySelector("#stop");
         const videoEl = document.querySelector("#webcam");
         const queueSizeEl = document.querySelector("#queue_size");
         const errorEl = document.querySelector("#error");
         const snapBtn = document.querySelector("#snap");
+        const paramsEl = document.querySelector("#params");
+        paramsEl.addEventListener("submit", (e) => e.preventDefault());
+        function LCMLive(paramsEl, liveImage) {
             let websocket;
             async function start() {
                 })
             }
+            async function promptUpdateStream(e) { // Collect the current parameter values and send them over `websocket` as one JSON message; `e` is not read in this body.
+                const dimension = getValue("input[name=dimension]:checked"); // Value of whichever "dimension" radio is checked, e.g. "[512,512]".
+                const [WIDTH, HEIGHT] = JSON.parse(dimension); // The radio value is a JSON array string; destructure it into width and height.
                 websocket.send(JSON.stringify({ // Keys mirror the InputParams field names in app-txt2img.py.
+                    "seed": getValue("#seed"),
+                    "prompt": getValue("#prompt"),
+                    "guidance_scale": getValue("#guidance-scale"),
+                    "steps": getValue("#steps"), // Passed to the pipeline as num_inference_steps on the server side.
+                    "lcm_steps": getValue("#lcm_steps"), // Passed to the pipeline as original_inference_steps on the server side.
+                    "width": WIDTH,
+                    "height": HEIGHT,
                 }));
             }
             function debouceInput(fn, delay) {
             const debouncedInput = debouceInput(promptUpdateStream, 200);
             function initPromptStream(userId) {
                 liveImage.src = `/stream/${userId}`;
+                paramsEl.addEventListener("change", debouncedInput);
             }
             async function stop() {
                 websocket.close();
+                paramsEl.removeEventListener("change", debouncedInput);
             }
             return {
                 start,
                 const exif = {};
                 const gps = {};
                 zeroth[piexif.ImageIFD.Make] = "LCM Text-to-Image";
+                zeroth[piexif.ImageIFD.ImageDescription] = `prompt: ${getValue("#prompt")} | seed: ${getValue("#seed")} | guidance_scale: ${getValue("#guidance-scale")} | lcm_steps: ${getValue("#lcm_steps")} | steps: ${getValue("#steps")}`;
                 zeroth[piexif.ImageIFD.Software] = "https://github.com/radames/Real-Time-Latent-Consistency-Model";
                 exif[piexif.ExifIFD.DateTimeOriginal] = new Date().toISOString();
         }
+        const lcmLive = LCMLive(paramsEl, imageEl);
         startBtn.addEventListener("click", async () => {
             try {
                 startBtn.disabled = true;
         <div class="">
             <details>
                 <summary class="font-medium cursor-pointer">Advanced Options</summary>
+                <form class="grid grid-cols-3 items-center gap-3 py-3" id="params" action="">
+                    <label class="text-sm font-medium" for="dimension">Image Dimensions</label>
+                    <div class="col-span-2 flex gap-2">
+                        <div class="flex gap-1">
+                            <input type="radio" id="dimension512" name="dimension" value="[512,512]" checked
+                                class="cursor-pointer">
+                            <label for="dimension512" class="text-sm cursor-pointer">512x512</label>
+                        </div>
+                        <div class="flex gap-1">
+                            <!-- 768x768 option; the value is a JSON array string that promptUpdateStream parses into width/height -->
+                            <input type="radio" id="dimension768" name="dimension" value="[768,768]"
+                                class="cursor-pointer">
+                            <label for="dimension768" class="text-sm cursor-pointer">768x768</label>
+                        </div>
+                    </div>
+                    <!--  -->
+                    <label class="text-sm font-medium " for="steps">Inference Steps
+                    </label>
+                    <input type="range" id="steps" name="steps" min="1" max="20" value="4"
+                        oninput="this.nextElementSibling.value = Number(this.value)">
+                    <output class="text-xs w-[50px] text-center font-light px-1 py-1 border border-gray-700 rounded-md">
+                        4</output>
+                    <!--  -->
+                    <label class="text-sm font-medium" for="lcm_steps">LCM Inference Steps
+                    </label>
+                    <input type="range" id="lcm_steps" name="lcm_steps" min="2" max="60" value="50"
+                        oninput="this.nextElementSibling.value = Number(this.value)">
+                    <output class="text-xs w-[50px] text-center font-light px-1 py-1 border border-gray-700 rounded-md">
+                        50</output>
+                    <!--  -->
                     <label class="text-sm font-medium" for="guidance-scale">Guidance Scale
                     </label>
+                    <input type="range" id="guidance-scale" name="guidance-scale" min="0" max="30" step="0.001"
                         value="8.0" oninput="this.nextElementSibling.value = Number(this.value).toFixed(2)">
                     <output class="text-xs w-[50px] text-center font-light px-1 py-1 border border-gray-700 rounded-md">
                         8.0</output>
+                    <!--  -->
                     <label class="text-sm font-medium" for="seed">Seed</label>
                     <input type="number" id="seed" name="seed" value="299792458"
                         class="font-light border border-gray-700 text-right rounded-md p-2 dark:text-black">
+                    <button class="button" onclick="document.querySelector('#seed').value = Math.floor(Math.random() * 1000000000); document.querySelector('#params').dispatchEvent(new Event('change'))">
                         Rand
                     </button>
+                    <!--  -->
+                </form>
             </details>
         </div>
         <div class="flex gap-3">