#accelerate==0.28.0 #av==11.0.0 diffusers einops==0.7.0 #pydantic==2.10.6 #gradio==4.44.1 imageio imageio-ffmpeg librosa #numpy==1.26.4 omegaconf opencv-python #sk-video==1.1.10 #tqdm==4.65.2 transformers
Use DICE-Talk in ComfyUI. DICE-Talk is a method for "Correlation-Aware Emotional Talking Portrait Generation".
In the ./ComfyUI/custom_nodes directory, run the following:
git clone https://github.com/smthemex/ComfyUI_DICE_Talk.git
pip install -r requirements.txt
-- ComfyUI/models/dice_talk/
|-- audio_linear.pth
|-- emo_model.pth
|-- pose_guider.pth
|-- unet.pth
|-- yoloface_v5m.pt  # the copy from Sonic can be reused; no need to copy it again (可以用sonic的,不需要复制)
|-- whisper-tiny/  # the copy from Sonic can be reused; no need to copy it again (可以用sonic的,不需要复制)
    |-- config.json
    |-- model.safetensors
    |-- preprocessor_config.json
|-- RIFE/  # the copy from Sonic can be reused; no need to copy it again (可以用sonic的,不需要复制)
    |-- flownet.pkl
-- ComfyUI/models/checkpoints
├── svd_xt.safetensors or svd_xt_1_1.safetensors
@misc{tan2025disentangleidentitycooperateemotion,
title={Disentangle Identity, Cooperate Emotion: Correlation-Aware Emotional Talking Portrait Generation},
author={Weipeng Tan and Chuming Lin and Chengming Xu and FeiFan Xu and Xiaobin Hu and Xiaozhong Ji and Junwei Zhu and Chengjie Wang and Yanwei Fu},
year={2025},
eprint={2504.18087},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/2504.18087},
}