AudioLDM
AudioLDM copied to clipboard
模型不能直接放在指定位置吗?
比如放在 ckpt 目录下,目录结构如下:
ckpt
├── ckpt/audioldm2
│   ├── ckpt/audioldm2/configuration.json
│   ├── ckpt/audioldm2/feature_extractor
│   │   └── ckpt/audioldm2/feature_extractor/preprocessor_config.json
│   ├── ckpt/audioldm2/language_model
│   │   ├── ckpt/audioldm2/language_model/config.json
│   │   └── ckpt/audioldm2/language_model/model.safetensors
│   ├── ckpt/audioldm2/model_index.json
│   ├── ckpt/audioldm2/projection_model
│   │   ├── ckpt/audioldm2/projection_model/config.json
│   │   └── ckpt/audioldm2/projection_model/diffusion_pytorch_model.safetensors
│   ├── ckpt/audioldm2/scheduler
│   │   └── ckpt/audioldm2/scheduler/scheduler_config.json
│   ├── ckpt/audioldm2/text_encoder
│   │   ├── ckpt/audioldm2/text_encoder/config.json
│   │   └── ckpt/audioldm2/text_encoder/model.safetensors
│   ├── ckpt/audioldm2/text_encoder_2
│   │   ├── ckpt/audioldm2/text_encoder_2/config.json
│   │   └── ckpt/audioldm2/text_encoder_2/model.safetensors
│   ├── ckpt/audioldm2/tokenizer
│   │   ├── ckpt/audioldm2/tokenizer/merges.txt
│   │   ├── ckpt/audioldm2/tokenizer/special_tokens_map.json
│   │   ├── ckpt/audioldm2/tokenizer/tokenizer_config.json
│   │   ├── ckpt/audioldm2/tokenizer/tokenizer.json
│   │   └── ckpt/audioldm2/tokenizer/vocab.json
│   ├── ckpt/audioldm2/tokenizer_2
│   │   ├── ckpt/audioldm2/tokenizer_2/special_tokens_map.json
│   │   ├── ckpt/audioldm2/tokenizer_2/spiece.model
│   │   ├── ckpt/audioldm2/tokenizer_2/tokenizer_config.json
│   │   └── ckpt/audioldm2/tokenizer_2/tokenizer.json
│   ├── ckpt/audioldm2/unet
│   │   ├── ckpt/audioldm2/unet/config.json
│   │   └── ckpt/audioldm2/unet/diffusion_pytorch_model.safetensors
│   ├── ckpt/audioldm2/vae
│   │   ├── ckpt/audioldm2/vae/config.json
│   │   └── ckpt/audioldm2/vae/diffusion_pytorch_model.safetensors
│   └── ckpt/audioldm2/vocoder
│       ├── ckpt/audioldm2/vocoder/config.json
│       └── ckpt/audioldm2/vocoder/model.safetensors
└── ckpt/audioldm-m-full
    ├── ckpt/audioldm-m-full/model_index.json
    ├── ckpt/audioldm-m-full/README.md
    ├── ckpt/audioldm-m-full/scheduler
    │   └── ckpt/audioldm-m-full/scheduler/scheduler_config.json
    ├── ckpt/audioldm-m-full/text_encoder
    │   ├── ckpt/audioldm-m-full/text_encoder/config.json
    │   ├── ckpt/audioldm-m-full/text_encoder/model.safetensors
    │   └── ckpt/audioldm-m-full/text_encoder/pytorch_model.bin
    ├── ckpt/audioldm-m-full/tokenizer
    │   ├── ckpt/audioldm-m-full/tokenizer/merges.txt
    │   ├── ckpt/audioldm-m-full/tokenizer/special_tokens_map.json
    │   ├── ckpt/audioldm-m-full/tokenizer/tokenizer_config.json
    │   ├── ckpt/audioldm-m-full/tokenizer/tokenizer.json
    │   └── ckpt/audioldm-m-full/tokenizer/vocab.json
    ├── ckpt/audioldm-m-full/unet
    │   ├── ckpt/audioldm-m-full/unet/config.json
    │   ├── ckpt/audioldm-m-full/unet/diffusion_pytorch_model.bin
    │   └── ckpt/audioldm-m-full/unet/diffusion_pytorch_model.safetensors
    ├── ckpt/audioldm-m-full/vae
    │   ├── ckpt/audioldm-m-full/vae/config.json
    │   ├── ckpt/audioldm-m-full/vae/diffusion_pytorch_model.bin
    │   └── ckpt/audioldm-m-full/vae/diffusion_pytorch_model.safetensors
    └── ckpt/audioldm-m-full/vocoder
        ├── ckpt/audioldm-m-full/vocoder/config.json
        ├── ckpt/audioldm-m-full/vocoder/model.safetensors
        └── ckpt/audioldm-m-full/vocoder/pytorch_model.bin