ProgramerSalar
/

L1-S

Model card Files Files and versions

L1-S / scripts /extract_vae_latent.sh

ProgramerSalar's picture

changes

524f2f8 10 months ago

762 Bytes

	#!/bin/bash

	# This script is used for batch extract the vae latents for video generation training
	# Since the video latent extract is very slow, pre-extract the video vae latents will save the training time

	GPUS=8 # The gpu number
	MODEL_NAME=pyramid_flux # The model name, `pyramid_flux` or `pyramid_mmdit`
	VAE_MODEL_PATH=/PATH/pyramid-flow-miniflux/causal_video_vae # The VAE CKPT dir.
	ANNO_FILE=annotation/video_text.jsonl # The video annotation file path
	WIDTH=640
	HEIGHT=384
	NUM_FRAMES=121

	torchrun --nproc_per_node $GPUS \
	tools/extract_video_vae_latents.py \
	--batch_size 1 \
	--model_dtype bf16 \
	--model_path $VAE_MODEL_PATH \
	--anno_file $ANNO_FILE \
	--width $WIDTH \
	--height $HEIGHT \
	--num_frames $NUM_FRAMES