Failed to load versions. Head to the versions page to see all versions for this model.
You're looking at a specific version of this model. Jump to the model overview.
zsxkib /animatediff-illusions:b3ccb010
Input
Run this model in Node.js with one line of code:
npm install replicate
Set the REPLICATE_API_TOKEN environment variable:
export REPLICATE_API_TOKEN=<paste-your-token-here>
Find your API token in your account settings.
import Replicate from "replicate";
import fs from "node:fs";
// Build the API client, authenticating with the token read from the
// REPLICATE_API_TOKEN environment variable.
const { REPLICATE_API_TOKEN: auth } = process.env;
const replicate = new Replicate({ auth });
Run zsxkib/animatediff-illusions using Replicate’s API. Check out the model's schema for an overview of inputs and outputs.
// Run the pinned model version with the example inputs shown on this page.
const output = await replicate.run(
  "zsxkib/animatediff-illusions:b3ccb0101402aafd04bfea042950be606223e2abedbad93cf848bfffa072bb61",
  {
    input: {
      loop: true,
      seed: -1,
      steps: 25,
      width: 384,
      frames: 32,
      height: 256,
      context: 16,
      clip_skip: 2,
      scheduler: "k_dpmpp_sde",
      base_model: "majicmixRealistic_v5Preview",
      prompt_map: "0: black coffee | 10: frothy milky foamy coffee",
      head_prompt: "an artistic cup of coffee",
      tail_prompt: "sat on a table, overhead birdseye shot, bird's-eye view",
      output_format: "mp4",
      guidance_scale: 7.5,
      negative_prompt: "ugly, broken, unrealstic, nsfw, trypophobia",
      controlnet_video: "https://replicate.delivery/pbxt/JlbPomk5xQXYw3Mao6B9eoFJS0moaYjCGSRhFPcMLCXNu0w8/spiral.gif",
      film_interpolation: true,
      prompt_fixed_ratio: 0.5,
      custom_base_model_url: "",
      num_interpolation_steps: 3,
      enable_qr_code_monster_v2: true,
      playback_frames_per_second: 20,
      controlnet_conditioning_scale: 0.3,
      qr_code_monster_v2_guess_mode: false,
      qr_code_monster_v2_preprocessor: true,
    },
  },
);

// To access the file URL:
console.log(output.url()); //=> "http://example.com"

// To write the file to disk:
// The callback-style fs.writeFile() throws when no callback is passed, so use
// the promise-based API and await it. The file extension matches the
// output_format requested above ("mp4").
await fs.promises.writeFile("output.mp4", output);
To learn more, take a look at the guide on getting started with Node.js.
pip install replicate
Set the REPLICATE_API_TOKEN environment variable:
export REPLICATE_API_TOKEN=<paste-your-token-here>
Find your API token in your account settings.
import replicate
Run zsxkib/animatediff-illusions using Replicate’s API. Check out the model's schema for an overview of inputs and outputs.
# Model reference in "owner/name:version" form, pinned to a specific version.
model_ref = "zsxkib/animatediff-illusions:b3ccb0101402aafd04bfea042950be606223e2abedbad93cf848bfffa072bb61"

# Example inputs for the prediction, keyed by the model's input names.
model_input = {
    "loop": True,
    "seed": -1,
    "steps": 25,
    "width": 384,
    "frames": 32,
    "height": 256,
    "context": 16,
    "clip_skip": 2,
    "scheduler": "k_dpmpp_sde",
    "base_model": "majicmixRealistic_v5Preview",
    "prompt_map": "0: black coffee | 10: frothy milky foamy coffee",
    "head_prompt": "an artistic cup of coffee",
    "tail_prompt": "sat on a table, overhead birdseye shot, bird's-eye view",
    "output_format": "mp4",
    "guidance_scale": 7.5,
    "negative_prompt": "ugly, broken, unrealstic, nsfw, trypophobia",
    "controlnet_video": "https://replicate.delivery/pbxt/JlbPomk5xQXYw3Mao6B9eoFJS0moaYjCGSRhFPcMLCXNu0w8/spiral.gif",
    "film_interpolation": True,
    "prompt_fixed_ratio": 0.5,
    "custom_base_model_url": "",
    "num_interpolation_steps": 3,
    "enable_qr_code_monster_v2": True,
    "playback_frames_per_second": 20,
    "controlnet_conditioning_scale": 0.3,
    "qr_code_monster_v2_guess_mode": False,
    "qr_code_monster_v2_preprocessor": True,
}

# Run the model and print whatever the client returns.
output = replicate.run(model_ref, input=model_input)
print(output)
To learn more, take a look at the guide on getting started with Python.
Set the REPLICATE_API_TOKEN environment variable:
export REPLICATE_API_TOKEN=<paste-your-token-here>
Find your API token in your account settings.
Run zsxkib/animatediff-illusions using Replicate’s API. Check out the model's schema for an overview of inputs and outputs.
# POST a JSON body containing the pinned model version and its inputs to the
# predictions endpoint, authenticating with the bearer token taken from
# $REPLICATE_API_TOKEN. The body is written with $'...' (ANSI-C) quoting so
# that \' can embed the apostrophe in "bird's-eye" inside the quoted string.
curl -s -X POST \
-H "Authorization: Bearer $REPLICATE_API_TOKEN" \
-H "Content-Type: application/json" \
-H "Prefer: wait" \
-d $'{
"version": "zsxkib/animatediff-illusions:b3ccb0101402aafd04bfea042950be606223e2abedbad93cf848bfffa072bb61",
"input": {
"loop": true,
"seed": -1,
"steps": 25,
"width": 384,
"frames": 32,
"height": 256,
"context": 16,
"clip_skip": 2,
"scheduler": "k_dpmpp_sde",
"base_model": "majicmixRealistic_v5Preview",
"prompt_map": "0: black coffee | 10: frothy milky foamy coffee",
"head_prompt": "an artistic cup of coffee",
"tail_prompt": "sat on a table, overhead birdseye shot, bird\'s-eye view",
"output_format": "mp4",
"guidance_scale": 7.5,
"negative_prompt": "ugly, broken, unrealstic, nsfw, trypophobia",
"controlnet_video": "https://replicate.delivery/pbxt/JlbPomk5xQXYw3Mao6B9eoFJS0moaYjCGSRhFPcMLCXNu0w8/spiral.gif",
"film_interpolation": true,
"prompt_fixed_ratio": 0.5,
"custom_base_model_url": "",
"num_interpolation_steps": 3,
"enable_qr_code_monster_v2": true,
"playback_frames_per_second": 20,
"controlnet_conditioning_scale": 0.3,
"qr_code_monster_v2_guess_mode": false,
"qr_code_monster_v2_preprocessor": true
}
}' \
https://api.replicate.com/v1/predictions
To learn more, take a look at Replicate’s HTTP API reference docs.
Add a payment method to run this model.
By signing in, you agree to our
terms of service and privacy policy
Output
{
"completed_at": "2023-11-01T10:51:55.032481Z",
"created_at": "2023-11-01T10:49:50.058029Z",
"data_removed": false,
"error": null,
"id": "bd232u3b4exsk7wrgiwq6keb64",
"input": {
"loop": true,
"seed": -1,
"steps": 25,
"width": 384,
"frames": 32,
"height": 256,
"context": 16,
"clip_skip": 2,
"scheduler": "k_dpmpp_sde",
"base_model": "majicmixRealistic_v5Preview",
"prompt_map": "0: black coffee | 10: frothy milky foamy coffee",
"head_prompt": "an artistic cup of coffee",
"tail_prompt": "sat on a table, overhead birdseye shot, bird's-eye view",
"output_format": "mp4",
"guidance_scale": 7.5,
"negative_prompt": "ugly, broken, unrealstic, nsfw, trypophobia",
"controlnet_video": "https://replicate.delivery/pbxt/JlbPomk5xQXYw3Mao6B9eoFJS0moaYjCGSRhFPcMLCXNu0w8/spiral.gif",
"film_interpolation": true,
"prompt_fixed_ratio": 0.5,
"custom_base_model_url": "",
"num_interpolation_steps": 3,
"enable_qr_code_monster_v2": true,
"playback_frames_per_second": 20,
"controlnet_conditioning_scale": 0.3,
"qr_code_monster_v2_guess_mode": false,
"qr_code_monster_v2_preprocessor": true
},
"logs": "Using ControlNet\nffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers\nbuilt with gcc 11 (Ubuntu 11.2.0-19ubuntu1)\nconfiguration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared\nlibavutil 56. 70.100 / 56. 70.100\nlibavcodec 58.134.100 / 58.134.100\nlibavformat 58. 76.100 / 58. 76.100\nlibavdevice 58. 13.100 / 58. 13.100\nlibavfilter 7.110.100 / 7.110.100\nlibswscale 5. 9.100 / 5. 9.100\nlibswresample 3. 9.100 / 3. 9.100\nlibpostproc 55. 9.100 / 55. 9.100\nInput #0, gif, from '/tmp/tmpbmp23h10spiral.gif':\nDuration: 00:00:14.39, start: 0.000000, bitrate: 2292 kb/s\nStream #0:0: Video: gif, bgra, 480x270, 15 fps, 15 tbr, 100 tbn, 100 tbc\nStream mapping:\nStream #0:0 -> #0:0 (gif (native) -> png (native))\nPress [q] to stop, [?] 
for help\nOutput #0, image2, to 'data/controlnet_image/test/qr_code_monster_v2/%04d.png':\nMetadata:\nencoder : Lavf58.76.100\nStream #0:0: Video: png, rgba(pc, gbr/unknown/unknown, progressive), 480x270, q=2-31, 200 kb/s, 15 fps, 15 tbn\nMetadata:\nencoder : Lavc58.134.100 png\nframe= 1 fps=0.0 q=0.0 size=N/A time=00:00:00.00 bitrate=N/A speed=N/A\nframe= 32 fps=0.0 q=-0.0 Lsize=N/A time=00:00:02.13 bitrate=N/A speed=37.1x\nvideo:938kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: unknown\n--------------------------------------------------------------------------------\n{\n\"name\": \"sample\",\n\"path\": \"share/Stable-diffusion/majicmixRealistic_v5Preview.safetensors\",\n\"motion_module\": \"models/motion-module/mm_sd_v15_v2.ckpt\",\n\"compile\": false,\n\"seed\": [\n-1\n],\n\"scheduler\": \"k_dpmpp_sde\",\n\"steps\": 25,\n\"guidance_scale\": 7.5,\n\"clip_skip\": 2,\n\"prompt_fixed_ratio\": 0.5,\n\"head_prompt\": \"an artistic cup of coffee\",\n\"prompt_map\": {\n\"0\": \"black coffee\", \"10\": \"frothy milky foamy coffee\"\n},\n\"tail_prompt\": \"sat on a table, overhead birdseye shot, bird's-eye view\",\n\"n_prompt\": [\n\"ugly, broken, unrealstic, nsfw, trypophobia\"\n],\n\"controlnet_map\": {\n\"input_image_dir\": \"controlnet_image/test\",\n\"max_samples_on_vram\": 200,\n\"max_models_on_vram\": 3,\n\"save_detectmap\": true,\n\"preprocess_on_gpu\": true,\n\"is_loop\": true,\n\"qr_code_monster_v2\": {\n\"enable\": true,\n\"use_preprocessor\": true,\n\"guess_mode\": false,\n\"controlnet_conditioning_scale\": 0.3,\n\"control_guidance_start\": 0.0,\n\"control_guidance_end\": 1.0,\n\"control_scale_list\": [\n0.5,\n0.4,\n0.3,\n0.2,\n0.1\n]\n}\n},\n\"output\":{\n\"format\" : \"mp4\",\n\"fps\" : 20,\n\"encode_param\":{\n\"crf\": 10\n}\n}\n}\n--------------------------------------------------------------------------------\nRunning command: animatediff generate -c config/prompts/custom_prompt_travel.json -W 384 -H 256 -L 32 -C 
16\n10:50:33 INFO Using generation config: cli.py:291\nconfig/prompts/custom_prompt_travel.json\n10:50:34 INFO is_v2=True util.py:361\nINFO Using base model: runwayml/stable-diffusion-v1-5 cli.py:309\nINFO Will save outputs to cli.py:317\n./output/2023-11-01T10-50-34-sample-majicmixrealist\nic_v5preview\nPreprocessing images (qr_code_monster_v2) 81% ━━━ 26/… [ 0:0… < 0:0… , 127 ]\nit/s\nSaving Preprocessed images (qr_code_monster_v2) 94% ━━╸ 29… [ 0:… < 0:… , 26 ]\nit…\n10:50:35 INFO Checking motion module... generate.py:331\nINFO Loading tokenizer... generate.py:345\nINFO Loading text encoder... generate.py:347\n10:50:37 INFO Loading VAE... generate.py:349\nINFO Loading UNet... generate.py:351\n10:50:45 INFO Loaded 453.20928M-parameter motion module unet.py:578\nINFO Using scheduler \"k_dpmpp_sde\" generate.py:363\n(DPMSolverSinglestepScheduler)\nINFO Loading weights from generate.py:368\n/src/data/share/Stable-diffusion/majicmixReali\nstic_v5Preview.safetensors\n10:50:47 INFO Merging weights into UNet... generate.py:385\nINFO Creating AnimationPipeline... generate.py:431\nINFO No TI embeddings found ti.py:102\nINFO loading c='qr_code_monster_v2' model generate.py:460\n10:50:48 INFO Sending pipeline to device \"cuda\" pipeline.py:22\nINFO Selected data types: unet_dtype=torch.float16, device.py:90\ntenc_dtype=torch.float16,\nvae_dtype=torch.bfloat16\nINFO Using channels_last memory format for UNet and device.py:111\nVAE\n10:50:50 INFO Saving prompt config to output directory cli.py:364\nINFO Initialization complete! cli.py:372\nINFO Generating 1 animations cli.py:373\nINFO Running generation 1 of 1 cli.py:383\nINFO Generation seed: 7418695825388302117 cli.py:389\nINFO len( region_condi_list )=1 generate.py:1153\nINFO len( region_list )=1 generate.py:1154\n100% ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 75/75 [ 0:00:37 < 0:00:00 , 2 it/s ]\n10:51:29 INFO Generation complete, saving... generate.py:1185\n10:51:31 INFO Creating ffmpeg encoder... 
generate.py:1084\nINFO Encoding interpolated frames with ffmpeg... generate.py:1094\nINFO Saved sample to generate.py:1189\noutput/2023-11-01T10-50-34-sample-majicmixrea\nlistic_v5preview/00_7418695825388302117_an-ar\ntistic-cup-of-coffee_black-coffee_sat-on-a-ta\nINFO Generation complete! cli.py:429\nINFO Done, exiting... cli.py:435\nError: ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers\nbuilt with gcc 11 (Ubuntu 11.2.0-19ubuntu1)\nconfiguration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared\nlibavutil 56. 70.100 / 56. 70.100\nlibavcodec 58.134.100 / 58.134.100\nlibavformat 58. 76.100 / 58. 76.100\nlibavdevice 58. 13.100 / 58. 13.100\nlibavfilter 7.110.100 / 7.110.100\nlibswscale 5. 9.100 / 5. 9.100\nlibswresample 3. 9.100 / 3. 9.100\nlibpostproc 55. 9.100 / 55. 
9.100\nInput #0, image2, from '/src/output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00-7418695825388302117/%08d.png':\nDuration: 00:00:01.60, start: 0.000000, bitrate: N/A\nStream #0:0: Video: png, rgb24(pc), 384x256, 20 fps, 20 tbr, 20 tbn, 20 tbc\nStream mapping:\nStream #0:0 (png) -> fps\nfps -> Stream #0:0 (libx264)\nPress [q] to stop, [?] for help\n[libx264 @ 0x556f50ea08c0] using cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2\n[libx264 @ 0x556f50ea08c0] profile High, level 1.3, 4:2:0, 8-bit\n[libx264 @ 0x556f50ea08c0] 264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=6 deblock=1:1:1 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=0.40:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=8 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=5 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=20 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=10.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:0.60\nOutput #0, mp4, to '/src/output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00_7418695825388302117_an-artistic-cup-of-coffee_black-coffee_sat-on-a-ta.mp4':\nMetadata:\nencoder : Lavf58.76.100\nStream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 384x256, q=2-31, 20 fps, 10240 tbn\nMetadata:\nencoder : Lavc58.134.100 libx264\nSide data:\ncpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A\nframe= 1 fps=0.0 q=0.0 size= 0kB time=00:00:00.00 bitrate=N/A speed= 0x\nframe= 32 fps=0.0 q=-1.0 Lsize= 504kB time=00:00:01.45 bitrate=2847.4kbits/s speed=9.63x\nvideo:503kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 0.236934%\n[libx264 @ 0x556f50ea08c0] frame I:1 Avg QP:13.18 size: 22097\n[libx264 @ 
0x556f50ea08c0] frame P:7 Avg QP:13.48 size: 21731\n[libx264 @ 0x556f50ea08c0] frame B:24 Avg QP:14.68 size: 14167\n[libx264 @ 0x556f50ea08c0] consecutive B-frames: 3.1% 0.0% 0.0% 50.0% 46.9% 0.0%\n[libx264 @ 0x556f50ea08c0] mb I I16..4: 5.5% 60.2% 34.4%\n[libx264 @ 0x556f50ea08c0] mb P I16..4: 8.9% 47.4% 27.3% P16..4: 3.0% 8.4% 5.0% 0.0% 0.0% skip: 0.0%\n[libx264 @ 0x556f50ea08c0] mb B I16..4: 3.6% 13.3% 6.5% B16..8: 21.6% 28.5% 15.3% direct: 9.8% skip: 1.5% L0:31.0% L1:27.5% BI:41.5%\n[libx264 @ 0x556f50ea08c0] 8x8 transform intra:57.0% inter:64.7%\n[libx264 @ 0x556f50ea08c0] coded y,uvDC,uvAC intra: 90.9% 95.3% 90.2% inter: 79.7% 93.2% 62.9%\n[libx264 @ 0x556f50ea08c0] i16 v,h,dc,p: 13% 11% 23% 54%\n[libx264 @ 0x556f50ea08c0] i8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 19% 13% 16% 8% 9% 10% 8% 10% 8%\n[libx264 @ 0x556f50ea08c0] i4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 20% 11% 10% 7% 15% 14% 9% 10% 5%\n[libx264 @ 0x556f50ea08c0] i8c dc,h,v,p: 43% 17% 27% 13%\n[libx264 @ 0x556f50ea08c0] Weighted P-Frames: Y:28.6% UV:28.6%\n[libx264 @ 0x556f50ea08c0] ref P L0: 44.6% 16.6% 17.6% 9.1% 6.0% 5.8% 0.3%\n[libx264 @ 0x556f50ea08c0] ref B L0: 91.8% 4.8% 2.2% 0.8% 0.5%\n[libx264 @ 0x556f50ea08c0] ref B L1: 98.3% 1.7%\n[libx264 @ 0x556f50ea08c0] kb/s:2571.11\nIdentifying the GIF path from the generated outputs...\nIdentified directory: output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview\nIdentified Media Path: output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00_7418695825388302117_an-artistic-cup-of-coffee_black-coffee_sat-on-a-ta.mp4\nIdentified PNG Folder Path: output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00-7418695825388302117\nInterpolating frames with FILM...\n 0%|\u001b[32m \u001b[0m| 0/217 [00:00<?, ?it/s]\u001b[0m\n 1%|\u001b[32m▌ \u001b[0m| 2/217 [00:00<00:13, 16.29it/s]\u001b[0m\n 2%|\u001b[32m█▏ \u001b[0m| 4/217 [00:00<00:11, 18.16it/s]\u001b[0m\n 3%|\u001b[32m██ \u001b[0m| 7/217 [00:00<00:10, 19.19it/s]\u001b[0m\n 4%|\u001b[32m██▌ \u001b[0m| 
9/217 [00:00<00:10, 19.10it/s]\u001b[0m\n 6%|\u001b[32m███▍ \u001b[0m| 12/217 [00:00<00:10, 19.54it/s]\u001b[0m\n 7%|\u001b[32m████▎ \u001b[0m| 15/217 [00:00<00:10, 19.47it/s]\u001b[0m\n 8%|\u001b[32m█████▏ \u001b[0m| 18/217 [00:00<00:10, 19.66it/s]\u001b[0m\n 10%|\u001b[32m██████ \u001b[0m| 21/217 [00:01<00:09, 19.80it/s]\u001b[0m\n 11%|\u001b[32m██████▌ \u001b[0m| 23/217 [00:01<00:09, 19.57it/s]\u001b[0m\n 12%|\u001b[32m███████▍ \u001b[0m| 26/217 [00:01<00:09, 19.73it/s]\u001b[0m\n 13%|\u001b[32m████████▎ \u001b[0m| 29/217 [00:01<00:09, 19.59it/s]\u001b[0m\n 15%|\u001b[32m█████████▏ \u001b[0m| 32/217 [00:01<00:09, 19.80it/s]\u001b[0m\n 16%|\u001b[32m██████████ \u001b[0m| 35/217 [00:01<00:09, 19.95it/s]\u001b[0m\n 17%|\u001b[32m██████████▌ \u001b[0m| 37/217 [00:01<00:09, 19.71it/s]\u001b[0m\n 18%|\u001b[32m███████████▍ \u001b[0m| 40/217 [00:02<00:08, 19.84it/s]\u001b[0m\n 20%|\u001b[32m████████████▎ \u001b[0m| 43/217 [00:02<00:08, 19.68it/s]\u001b[0m\n 21%|\u001b[32m█████████████▏ \u001b[0m| 46/217 [00:02<00:08, 19.81it/s]\u001b[0m\n 23%|\u001b[32m██████████████ \u001b[0m| 49/217 [00:02<00:08, 20.00it/s]\u001b[0m\n 24%|\u001b[32m██████████████▌ \u001b[0m| 51/217 [00:02<00:08, 19.78it/s]\u001b[0m\n 25%|\u001b[32m███████████████▍ \u001b[0m| 54/217 [00:02<00:08, 19.90it/s]\u001b[0m\n 26%|\u001b[32m████████████████▎ \u001b[0m| 57/217 [00:02<00:08, 19.72it/s]\u001b[0m\n 27%|\u001b[32m████████████████▊ \u001b[0m| 59/217 [00:03<00:08, 19.75it/s]\u001b[0m\n 29%|\u001b[32m█████████████████▋ \u001b[0m| 62/217 [00:03<00:07, 19.86it/s]\u001b[0m\n 29%|\u001b[32m██████████████████▎ \u001b[0m| 64/217 [00:03<00:07, 19.26it/s]\u001b[0m\n 31%|\u001b[32m███████████████████▏ \u001b[0m| 67/217 [00:03<00:07, 19.60it/s]\u001b[0m\n 32%|\u001b[32m████████████████████ \u001b[0m| 70/217 [00:03<00:07, 19.82it/s]\u001b[0m\n 33%|\u001b[32m████████████████████▌ \u001b[0m| 72/217 [00:03<00:07, 19.63it/s]\u001b[0m\n 35%|\u001b[32m█████████████████████▍ \u001b[0m| 75/217 [00:03<00:07, 
19.68it/s]\u001b[0m\n 36%|\u001b[32m██████████████████████▎ \u001b[0m| 78/217 [00:03<00:07, 19.57it/s]\u001b[0m\n 37%|\u001b[32m███████████████████████▏ \u001b[0m| 81/217 [00:04<00:06, 19.79it/s]\u001b[0m\n 38%|\u001b[32m███████████████████████▋ \u001b[0m| 83/217 [00:04<00:06, 19.81it/s]\u001b[0m\n 39%|\u001b[32m████████████████████████▎ \u001b[0m| 85/217 [00:04<00:06, 19.54it/s]\u001b[0m\n 41%|\u001b[32m█████████████████████████▏ \u001b[0m| 88/217 [00:04<00:06, 19.79it/s]\u001b[0m\n 42%|\u001b[32m██████████████████████████ \u001b[0m| 91/217 [00:04<00:06, 19.89it/s]\u001b[0m\n 43%|\u001b[32m██████████████████████████▌ \u001b[0m| 93/217 [00:04<00:06, 19.70it/s]\u001b[0m\n 44%|\u001b[32m███████████████████████████▍ \u001b[0m| 96/217 [00:04<00:06, 19.97it/s]\u001b[0m\n 46%|\u001b[32m████████████████████████████▎ \u001b[0m| 99/217 [00:05<00:05, 19.79it/s]\u001b[0m\n 47%|\u001b[32m████████████████████████████▋ \u001b[0m| 102/217 [00:05<00:05, 19.95it/s]\u001b[0m\n 48%|\u001b[32m█████████████████████████████▌ \u001b[0m| 105/217 [00:05<00:05, 20.03it/s]\u001b[0m\n 50%|\u001b[32m██████████████████████████████▎ \u001b[0m| 108/217 [00:05<00:05, 19.80it/s]\u001b[0m\n 51%|\u001b[32m███████████████████████████████▏ \u001b[0m| 111/217 [00:05<00:05, 19.92it/s]\u001b[0m\n 52%|\u001b[32m███████████████████████████████▊ \u001b[0m| 113/217 [00:05<00:05, 19.66it/s]\u001b[0m\n 53%|\u001b[32m████████████████████████████████▎ \u001b[0m| 115/217 [00:05<00:05, 19.73it/s]\u001b[0m\n 54%|\u001b[32m████████████████████████████████▉ \u001b[0m| 117/217 [00:05<00:05, 19.71it/s]\u001b[0m\n 55%|\u001b[32m█████████████████████████████████▍ \u001b[0m| 119/217 [00:06<00:04, 19.68it/s]\u001b[0m\n 56%|\u001b[32m██████████████████████████████████ \u001b[0m| 121/217 [00:06<00:04, 19.40it/s]\u001b[0m\n 57%|\u001b[32m██████████████████████████████████▊ \u001b[0m| 124/217 [00:06<00:04, 19.66it/s]\u001b[0m\n 59%|\u001b[32m███████████████████████████████████▋ \u001b[0m| 127/217 [00:06<00:04, 
19.53it/s]\u001b[0m\n 60%|\u001b[32m████████████████████████████████████▌ \u001b[0m| 130/217 [00:06<00:04, 19.76it/s]\u001b[0m\n 61%|\u001b[32m█████████████████████████████████████▍ \u001b[0m| 133/217 [00:06<00:04, 19.89it/s]\u001b[0m\n 62%|\u001b[32m█████████████████████████████████████▉ \u001b[0m| 135/217 [00:06<00:04, 19.65it/s]\u001b[0m\n 64%|\u001b[32m██████████████████████████████████████▊ \u001b[0m| 138/217 [00:07<00:03, 19.81it/s]\u001b[0m\n 65%|\u001b[32m███████████████████████████████████████▋ \u001b[0m| 141/217 [00:07<00:03, 19.67it/s]\u001b[0m\n 66%|\u001b[32m████████████████████████████████████████▍ \u001b[0m| 144/217 [00:07<00:03, 19.80it/s]\u001b[0m\n 68%|\u001b[32m█████████████████████████████████████████▎ \u001b[0m| 147/217 [00:07<00:03, 19.90it/s]\u001b[0m\n 69%|\u001b[32m█████████████████████████████████████████▉ \u001b[0m| 149/217 [00:07<00:03, 19.68it/s]\u001b[0m\n 70%|\u001b[32m██████████████████████████████████████████▋ \u001b[0m| 152/217 [00:07<00:03, 19.86it/s]\u001b[0m\n 71%|\u001b[32m███████████████████████████████████████████▌ \u001b[0m| 155/217 [00:07<00:03, 19.64it/s]\u001b[0m\n 72%|\u001b[32m████████████████████████████████████████████▏ \u001b[0m| 157/217 [00:07<00:03, 19.69it/s]\u001b[0m\n 73%|\u001b[32m████████████████████████████████████████████▋ \u001b[0m| 159/217 [00:08<00:02, 19.76it/s]\u001b[0m\n 75%|\u001b[32m█████████████████████████████████████████████▌ \u001b[0m| 162/217 [00:08<00:02, 19.59it/s]\u001b[0m\n 76%|\u001b[32m██████████████████████████████████████████████▍ \u001b[0m| 165/217 [00:08<00:02, 19.83it/s]\u001b[0m\n 77%|\u001b[32m███████████████████████████████████████████████▏ \u001b[0m| 168/217 [00:08<00:02, 20.00it/s]\u001b[0m\n 79%|\u001b[32m████████████████████████████████████████████████ \u001b[0m| 171/217 [00:08<00:02, 19.84it/s]\u001b[0m\n 80%|\u001b[32m████████████████████████████████████████████████▉ \u001b[0m| 174/217 [00:08<00:02, 19.98it/s]\u001b[0m\n 
81%|\u001b[32m█████████████████████████████████████████████████▍ \u001b[0m| 176/217 [00:08<00:02, 19.71it/s]\u001b[0m\n 82%|\u001b[32m██████████████████████████████████████████████████▎ \u001b[0m| 179/217 [00:09<00:01, 19.90it/s]\u001b[0m\n 84%|\u001b[32m███████████████████████████████████████████████████▏ \u001b[0m| 182/217 [00:09<00:01, 20.01it/s]\u001b[0m\n 85%|\u001b[32m███████████████████████████████████████████████████▋ \u001b[0m| 184/217 [00:09<00:01, 19.74it/s]\u001b[0m\n 86%|\u001b[32m████████████████████████████████████████████████████▌ \u001b[0m| 187/217 [00:09<00:01, 19.93it/s]\u001b[0m\n 88%|\u001b[32m█████████████████████████████████████████████████████▍ \u001b[0m| 190/217 [00:09<00:01, 19.76it/s]\u001b[0m\n 89%|\u001b[32m██████████████████████████████████████████████████████▎ \u001b[0m| 193/217 [00:09<00:01, 19.91it/s]\u001b[0m\n 90%|\u001b[32m███████████████████████████████████████████████████████ \u001b[0m| 196/217 [00:09<00:01, 19.99it/s]\u001b[0m\n 91%|\u001b[32m███████████████████████████████████████████████████████▋ \u001b[0m| 198/217 [00:10<00:00, 19.61it/s]\u001b[0m\n 93%|\u001b[32m████████████████████████████████████████████████████████▌ \u001b[0m| 201/217 [00:10<00:00, 19.84it/s]\u001b[0m\n 94%|\u001b[32m█████████████████████████████████████████████████████████▎ \u001b[0m| 204/217 [00:10<00:00, 19.67it/s]\u001b[0m\n 95%|\u001b[32m██████████████████████████████████████████████████████████▏ \u001b[0m| 207/217 [00:10<00:00, 19.89it/s]\u001b[0m\n 97%|\u001b[32m███████████████████████████████████████████████████████████ \u001b[0m| 210/217 [00:10<00:00, 20.01it/s]\u001b[0m\n 98%|\u001b[32m███████████████████████████████████████████████████████████▌ \u001b[0m| 212/217 [00:10<00:00, 19.76it/s]\u001b[0m\n 99%|\u001b[32m████████████████████████████████████████████████████████████▍\u001b[0m| 215/217 [00:10<00:00, 19.89it/s]\u001b[0m\n100%|\u001b[32m█████████████████████████████████████████████████████████████\u001b[0m| 217/217 [00:10<00:00, 
19.74it/s]\u001b[0m\nffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers\nbuilt with gcc 11 (Ubuntu 11.2.0-19ubuntu1)\nconfiguration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared\nlibavutil 56. 70.100 / 56. 70.100\nlibavcodec 58.134.100 / 58.134.100\nlibavformat 58. 76.100 / 58. 76.100\nlibavdevice 58. 13.100 / 58. 13.100\nlibavfilter 7.110.100 / 7.110.100\nlibswscale 5. 9.100 / 5. 9.100\nlibswresample 3. 9.100 / 3. 9.100\nlibpostproc 55. 9.100 / 55. 
9.100\nInput #0, image2, from 'output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/interpolated_frames/%08d.png':\nDuration: 00:00:09.96, start: 0.000000, bitrate: N/A\nStream #0:0: Video: png, rgb24(pc), 384x256, 25 fps, 25 tbr, 25 tbn, 25 tbc\nStream mapping:\nStream #0:0 -> #0:0 (png (native) -> h264 (libx264))\nPress [q] to stop, [?] for help\n[libx264 @ 0x5592e9ec48c0] using cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2\n[libx264 @ 0x5592e9ec48c0] profile High, level 1.3, 4:2:0, 8-bit\n[libx264 @ 0x5592e9ec48c0] 264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=8 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=20 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=1.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\nOutput #0, mp4, to 'output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/output_video.mp4':\nMetadata:\nencoder : Lavf58.76.100\nStream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 384x256, q=2-31, 20 fps, 10240 tbn\nMetadata:\nencoder : Lavc58.134.100 libx264\nSide data:\ncpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A\nframe= 1 fps=0.0 q=0.0 size= 0kB time=00:00:00.00 bitrate=N/A speed= 0x\nframe= 226 fps=0.0 q=6.0 size= 3584kB time=00:00:08.55 bitrate=3433.9kbits/s speed=16.8x\nframe= 249 fps=0.0 q=-1.0 Lsize= 5318kB time=00:00:12.30 bitrate=3542.0kbits/s speed=18.2x\nvideo:5314kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 0.072162%\n[libx264 @ 0x5592e9ec48c0] frame I:1 Avg QP: 2.24 size: 
57980\n[libx264 @ 0x5592e9ec48c0] frame P:64 Avg QP: 2.39 size: 41589\n[libx264 @ 0x5592e9ec48c0] frame B:184 Avg QP: 5.64 size: 14791\n[libx264 @ 0x5592e9ec48c0] consecutive B-frames: 1.2% 0.8% 0.0% 98.0%\n[libx264 @ 0x5592e9ec48c0] mb I I16..4: 10.4% 25.8% 63.8%\n[libx264 @ 0x5592e9ec48c0] mb P I16..4: 4.8% 10.3% 11.5% P16..4: 20.6% 30.7% 21.9% 0.0% 0.0% skip: 0.2%\n[libx264 @ 0x5592e9ec48c0] mb B I16..4: 0.3% 1.3% 0.3% B16..8: 33.0% 10.6% 9.4% direct:31.8% skip:13.3% L0:25.7% L1:23.1% BI:51.2%\n[libx264 @ 0x5592e9ec48c0] 8x8 transform intra:42.5% inter:33.0%\n[libx264 @ 0x5592e9ec48c0] coded y,uvDC,uvAC intra: 98.2% 97.2% 97.1% inter: 80.7% 81.9% 77.9%\n[libx264 @ 0x5592e9ec48c0] i16 v,h,dc,p: 14% 7% 22% 57%\n[libx264 @ 0x5592e9ec48c0] i8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 22% 13% 36% 4% 5% 5% 4% 6% 5%\n[libx264 @ 0x5592e9ec48c0] i4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 22% 14% 20% 7% 10% 9% 7% 7% 4%\n[libx264 @ 0x5592e9ec48c0] i8c dc,h,v,p: 45% 15% 30% 10%\n[libx264 @ 0x5592e9ec48c0] Weighted P-Frames: Y:23.4% UV:18.8%\n[libx264 @ 0x5592e9ec48c0] ref P L0: 60.7% 27.9% 9.8% 1.4% 0.2%\n[libx264 @ 0x5592e9ec48c0] ref B L0: 98.8% 1.0% 0.2%\n[libx264 @ 0x5592e9ec48c0] ref B L1: 99.7% 0.3%\n[libx264 @ 0x5592e9ec48c0] kb/s:3496.38",
"metrics": {
"predict_time": 87.69389,
"total_time": 124.974452
},
"output": "https://replicate.delivery/pbxt/FQlfhM2aly1aS6cjG6DVYwEZJzzfwbpix6nGDGcHkbTJf7njA/output_video.mp4",
"started_at": "2023-11-01T10:50:27.338591Z",
"status": "succeeded",
"urls": {
"get": "https://api.replicate.com/v1/predictions/bd232u3b4exsk7wrgiwq6keb64",
"cancel": "https://api.replicate.com/v1/predictions/bd232u3b4exsk7wrgiwq6keb64/cancel"
},
"version": "b3ccb0101402aafd04bfea042950be606223e2abedbad93cf848bfffa072bb61"
}
Using ControlNet
ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers
built with gcc 11 (Ubuntu 11.2.0-19ubuntu1)
configuration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared
libavutil 56. 70.100 / 56. 70.100
libavcodec 58.134.100 / 58.134.100
libavformat 58. 76.100 / 58. 76.100
libavdevice 58. 13.100 / 58. 13.100
libavfilter 7.110.100 / 7.110.100
libswscale 5. 9.100 / 5. 9.100
libswresample 3. 9.100 / 3. 9.100
libpostproc 55. 9.100 / 55. 9.100
Input #0, gif, from '/tmp/tmpbmp23h10spiral.gif':
Duration: 00:00:14.39, start: 0.000000, bitrate: 2292 kb/s
Stream #0:0: Video: gif, bgra, 480x270, 15 fps, 15 tbr, 100 tbn, 100 tbc
Stream mapping:
Stream #0:0 -> #0:0 (gif (native) -> png (native))
Press [q] to stop, [?] for help
Output #0, image2, to 'data/controlnet_image/test/qr_code_monster_v2/%04d.png':
Metadata:
encoder : Lavf58.76.100
Stream #0:0: Video: png, rgba(pc, gbr/unknown/unknown, progressive), 480x270, q=2-31, 200 kb/s, 15 fps, 15 tbn
Metadata:
encoder : Lavc58.134.100 png
frame= 1 fps=0.0 q=0.0 size=N/A time=00:00:00.00 bitrate=N/A speed=N/A
frame= 32 fps=0.0 q=-0.0 Lsize=N/A time=00:00:02.13 bitrate=N/A speed=37.1x
video:938kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: unknown
--------------------------------------------------------------------------------
{
"name": "sample",
"path": "share/Stable-diffusion/majicmixRealistic_v5Preview.safetensors",
"motion_module": "models/motion-module/mm_sd_v15_v2.ckpt",
"compile": false,
"seed": [
-1
],
"scheduler": "k_dpmpp_sde",
"steps": 25,
"guidance_scale": 7.5,
"clip_skip": 2,
"prompt_fixed_ratio": 0.5,
"head_prompt": "an artistic cup of coffee",
"prompt_map": {
"0": "black coffee", "10": "frothy milky foamy coffee"
},
"tail_prompt": "sat on a table, overhead birdseye shot, bird's-eye view",
"n_prompt": [
"ugly, broken, unrealstic, nsfw, trypophobia"
],
"controlnet_map": {
"input_image_dir": "controlnet_image/test",
"max_samples_on_vram": 200,
"max_models_on_vram": 3,
"save_detectmap": true,
"preprocess_on_gpu": true,
"is_loop": true,
"qr_code_monster_v2": {
"enable": true,
"use_preprocessor": true,
"guess_mode": false,
"controlnet_conditioning_scale": 0.3,
"control_guidance_start": 0.0,
"control_guidance_end": 1.0,
"control_scale_list": [
0.5,
0.4,
0.3,
0.2,
0.1
]
}
},
"output":{
"format" : "mp4",
"fps" : 20,
"encode_param":{
"crf": 10
}
}
}
--------------------------------------------------------------------------------
Running command: animatediff generate -c config/prompts/custom_prompt_travel.json -W 384 -H 256 -L 32 -C 16
10:50:33 INFO Using generation config: cli.py:291
config/prompts/custom_prompt_travel.json
10:50:34 INFO is_v2=True util.py:361
INFO Using base model: runwayml/stable-diffusion-v1-5 cli.py:309
INFO Will save outputs to cli.py:317
./output/2023-11-01T10-50-34-sample-majicmixrealist
ic_v5preview
Preprocessing images (qr_code_monster_v2) 81% ━━━ 26/… [ 0:0… < 0:0… , 127 ]
it/s
Saving Preprocessed images (qr_code_monster_v2) 94% ━━╸ 29… [ 0:… < 0:… , 26 ]
it…
10:50:35 INFO Checking motion module... generate.py:331
INFO Loading tokenizer... generate.py:345
INFO Loading text encoder... generate.py:347
10:50:37 INFO Loading VAE... generate.py:349
INFO Loading UNet... generate.py:351
10:50:45 INFO Loaded 453.20928M-parameter motion module unet.py:578
INFO Using scheduler "k_dpmpp_sde" generate.py:363
(DPMSolverSinglestepScheduler)
INFO Loading weights from generate.py:368
/src/data/share/Stable-diffusion/majicmixReali
stic_v5Preview.safetensors
10:50:47 INFO Merging weights into UNet... generate.py:385
INFO Creating AnimationPipeline... generate.py:431
INFO No TI embeddings found ti.py:102
INFO loading c='qr_code_monster_v2' model generate.py:460
10:50:48 INFO Sending pipeline to device "cuda" pipeline.py:22
INFO Selected data types: unet_dtype=torch.float16, device.py:90
tenc_dtype=torch.float16,
vae_dtype=torch.bfloat16
INFO Using channels_last memory format for UNet and device.py:111
VAE
10:50:50 INFO Saving prompt config to output directory cli.py:364
INFO Initialization complete! cli.py:372
INFO Generating 1 animations cli.py:373
INFO Running generation 1 of 1 cli.py:383
INFO Generation seed: 7418695825388302117 cli.py:389
INFO len( region_condi_list )=1 generate.py:1153
INFO len( region_list )=1 generate.py:1154
100% ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 75/75 [ 0:00:37 < 0:00:00 , 2 it/s ]
10:51:29 INFO Generation complete, saving... generate.py:1185
10:51:31 INFO Creating ffmpeg encoder... generate.py:1084
INFO Encoding interpolated frames with ffmpeg... generate.py:1094
INFO Saved sample to generate.py:1189
output/2023-11-01T10-50-34-sample-majicmixrea
listic_v5preview/00_7418695825388302117_an-ar
tistic-cup-of-coffee_black-coffee_sat-on-a-ta
INFO Generation complete! cli.py:429
INFO Done, exiting... cli.py:435
Error: ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers
built with gcc 11 (Ubuntu 11.2.0-19ubuntu1)
configuration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared
libavutil 56. 70.100 / 56. 70.100
libavcodec 58.134.100 / 58.134.100
libavformat 58. 76.100 / 58. 76.100
libavdevice 58. 13.100 / 58. 13.100
libavfilter 7.110.100 / 7.110.100
libswscale 5. 9.100 / 5. 9.100
libswresample 3. 9.100 / 3. 9.100
libpostproc 55. 9.100 / 55. 9.100
Input #0, image2, from '/src/output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00-7418695825388302117/%08d.png':
Duration: 00:00:01.60, start: 0.000000, bitrate: N/A
Stream #0:0: Video: png, rgb24(pc), 384x256, 20 fps, 20 tbr, 20 tbn, 20 tbc
Stream mapping:
Stream #0:0 (png) -> fps
fps -> Stream #0:0 (libx264)
Press [q] to stop, [?] for help
[libx264 @ 0x556f50ea08c0] using cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2
[libx264 @ 0x556f50ea08c0] profile High, level 1.3, 4:2:0, 8-bit
[libx264 @ 0x556f50ea08c0] 264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=6 deblock=1:1:1 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=0.40:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=8 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=5 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=20 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=10.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:0.60
Output #0, mp4, to '/src/output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00_7418695825388302117_an-artistic-cup-of-coffee_black-coffee_sat-on-a-ta.mp4':
Metadata:
encoder : Lavf58.76.100
Stream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 384x256, q=2-31, 20 fps, 10240 tbn
Metadata:
encoder : Lavc58.134.100 libx264
Side data:
cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A
frame= 1 fps=0.0 q=0.0 size= 0kB time=00:00:00.00 bitrate=N/A speed= 0x
frame= 32 fps=0.0 q=-1.0 Lsize= 504kB time=00:00:01.45 bitrate=2847.4kbits/s speed=9.63x
video:503kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 0.236934%
[libx264 @ 0x556f50ea08c0] frame I:1 Avg QP:13.18 size: 22097
[libx264 @ 0x556f50ea08c0] frame P:7 Avg QP:13.48 size: 21731
[libx264 @ 0x556f50ea08c0] frame B:24 Avg QP:14.68 size: 14167
[libx264 @ 0x556f50ea08c0] consecutive B-frames: 3.1% 0.0% 0.0% 50.0% 46.9% 0.0%
[libx264 @ 0x556f50ea08c0] mb I I16..4: 5.5% 60.2% 34.4%
[libx264 @ 0x556f50ea08c0] mb P I16..4: 8.9% 47.4% 27.3% P16..4: 3.0% 8.4% 5.0% 0.0% 0.0% skip: 0.0%
[libx264 @ 0x556f50ea08c0] mb B I16..4: 3.6% 13.3% 6.5% B16..8: 21.6% 28.5% 15.3% direct: 9.8% skip: 1.5% L0:31.0% L1:27.5% BI:41.5%
[libx264 @ 0x556f50ea08c0] 8x8 transform intra:57.0% inter:64.7%
[libx264 @ 0x556f50ea08c0] coded y,uvDC,uvAC intra: 90.9% 95.3% 90.2% inter: 79.7% 93.2% 62.9%
[libx264 @ 0x556f50ea08c0] i16 v,h,dc,p: 13% 11% 23% 54%
[libx264 @ 0x556f50ea08c0] i8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 19% 13% 16% 8% 9% 10% 8% 10% 8%
[libx264 @ 0x556f50ea08c0] i4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 20% 11% 10% 7% 15% 14% 9% 10% 5%
[libx264 @ 0x556f50ea08c0] i8c dc,h,v,p: 43% 17% 27% 13%
[libx264 @ 0x556f50ea08c0] Weighted P-Frames: Y:28.6% UV:28.6%
[libx264 @ 0x556f50ea08c0] ref P L0: 44.6% 16.6% 17.6% 9.1% 6.0% 5.8% 0.3%
[libx264 @ 0x556f50ea08c0] ref B L0: 91.8% 4.8% 2.2% 0.8% 0.5%
[libx264 @ 0x556f50ea08c0] ref B L1: 98.3% 1.7%
[libx264 @ 0x556f50ea08c0] kb/s:2571.11
Identifying the GIF path from the generated outputs...
Identified directory: output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview
Identified Media Path: output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00_7418695825388302117_an-artistic-cup-of-coffee_black-coffee_sat-on-a-ta.mp4
Identified PNG Folder Path: output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/00-7418695825388302117
Interpolating frames with FILM...
0%| | 0/217 [00:00<?, ?it/s]
1%|▌ | 2/217 [00:00<00:13, 16.29it/s]
2%|█▏ | 4/217 [00:00<00:11, 18.16it/s]
3%|██ | 7/217 [00:00<00:10, 19.19it/s]
4%|██▌ | 9/217 [00:00<00:10, 19.10it/s]
6%|███▍ | 12/217 [00:00<00:10, 19.54it/s]
7%|████▎ | 15/217 [00:00<00:10, 19.47it/s]
8%|█████▏ | 18/217 [00:00<00:10, 19.66it/s]
10%|██████ | 21/217 [00:01<00:09, 19.80it/s]
11%|██████▌ | 23/217 [00:01<00:09, 19.57it/s]
12%|███████▍ | 26/217 [00:01<00:09, 19.73it/s]
13%|████████▎ | 29/217 [00:01<00:09, 19.59it/s]
15%|█████████▏ | 32/217 [00:01<00:09, 19.80it/s]
16%|██████████ | 35/217 [00:01<00:09, 19.95it/s]
17%|██████████▌ | 37/217 [00:01<00:09, 19.71it/s]
18%|███████████▍ | 40/217 [00:02<00:08, 19.84it/s]
20%|████████████▎ | 43/217 [00:02<00:08, 19.68it/s]
21%|█████████████▏ | 46/217 [00:02<00:08, 19.81it/s]
23%|██████████████ | 49/217 [00:02<00:08, 20.00it/s]
24%|██████████████▌ | 51/217 [00:02<00:08, 19.78it/s]
25%|███████████████▍ | 54/217 [00:02<00:08, 19.90it/s]
26%|████████████████▎ | 57/217 [00:02<00:08, 19.72it/s]
27%|████████████████▊ | 59/217 [00:03<00:08, 19.75it/s]
29%|█████████████████▋ | 62/217 [00:03<00:07, 19.86it/s]
29%|██████████████████▎ | 64/217 [00:03<00:07, 19.26it/s]
31%|███████████████████▏ | 67/217 [00:03<00:07, 19.60it/s]
32%|████████████████████ | 70/217 [00:03<00:07, 19.82it/s]
33%|████████████████████▌ | 72/217 [00:03<00:07, 19.63it/s]
35%|█████████████████████▍ | 75/217 [00:03<00:07, 19.68it/s]
36%|██████████████████████▎ | 78/217 [00:03<00:07, 19.57it/s]
37%|███████████████████████▏ | 81/217 [00:04<00:06, 19.79it/s]
38%|███████████████████████▋ | 83/217 [00:04<00:06, 19.81it/s]
39%|████████████████████████▎ | 85/217 [00:04<00:06, 19.54it/s]
41%|█████████████████████████▏ | 88/217 [00:04<00:06, 19.79it/s]
42%|██████████████████████████ | 91/217 [00:04<00:06, 19.89it/s]
43%|██████████████████████████▌ | 93/217 [00:04<00:06, 19.70it/s]
44%|███████████████████████████▍ | 96/217 [00:04<00:06, 19.97it/s]
46%|████████████████████████████▎ | 99/217 [00:05<00:05, 19.79it/s]
47%|████████████████████████████▋ | 102/217 [00:05<00:05, 19.95it/s]
48%|█████████████████████████████▌ | 105/217 [00:05<00:05, 20.03it/s]
50%|██████████████████████████████▎ | 108/217 [00:05<00:05, 19.80it/s]
51%|███████████████████████████████▏ | 111/217 [00:05<00:05, 19.92it/s]
52%|███████████████████████████████▊ | 113/217 [00:05<00:05, 19.66it/s]
53%|████████████████████████████████▎ | 115/217 [00:05<00:05, 19.73it/s]
54%|████████████████████████████████▉ | 117/217 [00:05<00:05, 19.71it/s]
55%|█████████████████████████████████▍ | 119/217 [00:06<00:04, 19.68it/s]
56%|██████████████████████████████████ | 121/217 [00:06<00:04, 19.40it/s]
57%|██████████████████████████████████▊ | 124/217 [00:06<00:04, 19.66it/s]
59%|███████████████████████████████████▋ | 127/217 [00:06<00:04, 19.53it/s]
60%|████████████████████████████████████▌ | 130/217 [00:06<00:04, 19.76it/s]
61%|█████████████████████████████████████▍ | 133/217 [00:06<00:04, 19.89it/s]
62%|█████████████████████████████████████▉ | 135/217 [00:06<00:04, 19.65it/s]
64%|██████████████████████████████████████▊ | 138/217 [00:07<00:03, 19.81it/s]
65%|███████████████████████████████████████▋ | 141/217 [00:07<00:03, 19.67it/s]
66%|████████████████████████████████████████▍ | 144/217 [00:07<00:03, 19.80it/s]
68%|█████████████████████████████████████████▎ | 147/217 [00:07<00:03, 19.90it/s]
69%|█████████████████████████████████████████▉ | 149/217 [00:07<00:03, 19.68it/s]
70%|██████████████████████████████████████████▋ | 152/217 [00:07<00:03, 19.86it/s]
71%|███████████████████████████████████████████▌ | 155/217 [00:07<00:03, 19.64it/s]
72%|████████████████████████████████████████████▏ | 157/217 [00:07<00:03, 19.69it/s]
73%|████████████████████████████████████████████▋ | 159/217 [00:08<00:02, 19.76it/s]
75%|█████████████████████████████████████████████▌ | 162/217 [00:08<00:02, 19.59it/s]
76%|██████████████████████████████████████████████▍ | 165/217 [00:08<00:02, 19.83it/s]
77%|███████████████████████████████████████████████▏ | 168/217 [00:08<00:02, 20.00it/s]
79%|████████████████████████████████████████████████ | 171/217 [00:08<00:02, 19.84it/s]
80%|████████████████████████████████████████████████▉ | 174/217 [00:08<00:02, 19.98it/s]
81%|█████████████████████████████████████████████████▍ | 176/217 [00:08<00:02, 19.71it/s]
82%|██████████████████████████████████████████████████▎ | 179/217 [00:09<00:01, 19.90it/s]
84%|███████████████████████████████████████████████████▏ | 182/217 [00:09<00:01, 20.01it/s]
85%|███████████████████████████████████████████████████▋ | 184/217 [00:09<00:01, 19.74it/s]
86%|████████████████████████████████████████████████████▌ | 187/217 [00:09<00:01, 19.93it/s]
88%|█████████████████████████████████████████████████████▍ | 190/217 [00:09<00:01, 19.76it/s]
89%|██████████████████████████████████████████████████████▎ | 193/217 [00:09<00:01, 19.91it/s]
90%|███████████████████████████████████████████████████████ | 196/217 [00:09<00:01, 19.99it/s]
91%|███████████████████████████████████████████████████████▋ | 198/217 [00:10<00:00, 19.61it/s]
93%|████████████████████████████████████████████████████████▌ | 201/217 [00:10<00:00, 19.84it/s]
94%|█████████████████████████████████████████████████████████▎ | 204/217 [00:10<00:00, 19.67it/s]
95%|██████████████████████████████████████████████████████████▏ | 207/217 [00:10<00:00, 19.89it/s]
97%|███████████████████████████████████████████████████████████ | 210/217 [00:10<00:00, 20.01it/s]
98%|███████████████████████████████████████████████████████████▌ | 212/217 [00:10<00:00, 19.76it/s]
99%|████████████████████████████████████████████████████████████▍| 215/217 [00:10<00:00, 19.89it/s]
100%|█████████████████████████████████████████████████████████████| 217/217 [00:10<00:00, 19.74it/s]
ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers
built with gcc 11 (Ubuntu 11.2.0-19ubuntu1)
configuration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared
libavutil 56. 70.100 / 56. 70.100
libavcodec 58.134.100 / 58.134.100
libavformat 58. 76.100 / 58. 76.100
libavdevice 58. 13.100 / 58. 13.100
libavfilter 7.110.100 / 7.110.100
libswscale 5. 9.100 / 5. 9.100
libswresample 3. 9.100 / 3. 9.100
libpostproc 55. 9.100 / 55. 9.100
Input #0, image2, from 'output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/interpolated_frames/%08d.png':
Duration: 00:00:09.96, start: 0.000000, bitrate: N/A
Stream #0:0: Video: png, rgb24(pc), 384x256, 25 fps, 25 tbr, 25 tbn, 25 tbc
Stream mapping:
Stream #0:0 -> #0:0 (png (native) -> h264 (libx264))
Press [q] to stop, [?] for help
[libx264 @ 0x5592e9ec48c0] using cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2
[libx264 @ 0x5592e9ec48c0] profile High, level 1.3, 4:2:0, 8-bit
[libx264 @ 0x5592e9ec48c0] 264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=8 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=20 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=1.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00
Output #0, mp4, to 'output/2023-11-01T10-50-34-sample-majicmixrealistic_v5preview/output_video.mp4':
Metadata:
encoder : Lavf58.76.100
Stream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 384x256, q=2-31, 20 fps, 10240 tbn
Metadata:
encoder : Lavc58.134.100 libx264
Side data:
cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A
frame= 1 fps=0.0 q=0.0 size= 0kB time=00:00:00.00 bitrate=N/A speed= 0x
frame= 226 fps=0.0 q=6.0 size= 3584kB time=00:00:08.55 bitrate=3433.9kbits/s speed=16.8x
frame= 249 fps=0.0 q=-1.0 Lsize= 5318kB time=00:00:12.30 bitrate=3542.0kbits/s speed=18.2x
video:5314kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 0.072162%
[libx264 @ 0x5592e9ec48c0] frame I:1 Avg QP: 2.24 size: 57980
[libx264 @ 0x5592e9ec48c0] frame P:64 Avg QP: 2.39 size: 41589
[libx264 @ 0x5592e9ec48c0] frame B:184 Avg QP: 5.64 size: 14791
[libx264 @ 0x5592e9ec48c0] consecutive B-frames: 1.2% 0.8% 0.0% 98.0%
[libx264 @ 0x5592e9ec48c0] mb I I16..4: 10.4% 25.8% 63.8%
[libx264 @ 0x5592e9ec48c0] mb P I16..4: 4.8% 10.3% 11.5% P16..4: 20.6% 30.7% 21.9% 0.0% 0.0% skip: 0.2%
[libx264 @ 0x5592e9ec48c0] mb B I16..4: 0.3% 1.3% 0.3% B16..8: 33.0% 10.6% 9.4% direct:31.8% skip:13.3% L0:25.7% L1:23.1% BI:51.2%
[libx264 @ 0x5592e9ec48c0] 8x8 transform intra:42.5% inter:33.0%
[libx264 @ 0x5592e9ec48c0] coded y,uvDC,uvAC intra: 98.2% 97.2% 97.1% inter: 80.7% 81.9% 77.9%
[libx264 @ 0x5592e9ec48c0] i16 v,h,dc,p: 14% 7% 22% 57%
[libx264 @ 0x5592e9ec48c0] i8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 22% 13% 36% 4% 5% 5% 4% 6% 5%
[libx264 @ 0x5592e9ec48c0] i4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 22% 14% 20% 7% 10% 9% 7% 7% 4%
[libx264 @ 0x5592e9ec48c0] i8c dc,h,v,p: 45% 15% 30% 10%
[libx264 @ 0x5592e9ec48c0] Weighted P-Frames: Y:23.4% UV:18.8%
[libx264 @ 0x5592e9ec48c0] ref P L0: 60.7% 27.9% 9.8% 1.4% 0.2%
[libx264 @ 0x5592e9ec48c0] ref B L0: 98.8% 1.0% 0.2%
[libx264 @ 0x5592e9ec48c0] ref B L1: 99.7% 0.3%
[libx264 @ 0x5592e9ec48c0] kb/s:3496.38