Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .editorconfig +34 -0
- .gitattributes +1 -0
- .gitignore +241 -0
- .pre-commit-config.yaml +28 -0
- .vscode/settings.json +75 -0
- COPYING +13 -0
- LICENSE.md +194 -0
- MANIFEST.in +2 -0
- README.md +596 -0
- config/.gitignore +4 -0
- config/GroundingDINO/GroundingDINO_SwinB_cfg.py +43 -0
- config/GroundingDINO/GroundingDINO_SwinT_OGC.py +43 -0
- config/inference/default.json +27 -0
- config/inference/motion_v2.json +28 -0
- config/inference/sd15-unet.json +89 -0
- config/inference/sd15-unet3d.json +64 -0
- config/prompts/.gitignore +2 -0
- config/prompts/01-ToonYou.json +24 -0
- config/prompts/02-Lyriel.json +25 -0
- config/prompts/03-RcnzCartoon.json +25 -0
- config/prompts/04-MajicMix.json +25 -0
- config/prompts/05-RealisticVision.json +25 -0
- config/prompts/06-Tusun.json +23 -0
- config/prompts/07-FilmVelvia.json +26 -0
- config/prompts/08-GhibliBackground.json +23 -0
- config/prompts/concat_2horizontal.bat +1 -0
- config/prompts/ignore_tokens.txt +4 -0
- config/prompts/prompt_travel.json +248 -0
- config/prompts/prompt_travel_multi_controlnet.json +323 -0
- config/prompts/to_8fps_Frames.bat +1 -0
- data/.gitignore +5 -0
- data/controlnet_image/test/controlnet_canny/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_depth/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_inpaint/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_ip2p/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_lineart/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_lineart_anime/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_mlsd/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_normalbae/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_openpose/0000.png +0 -0
- data/controlnet_image/test/controlnet_openpose/0016.png +0 -0
- data/controlnet_image/test/controlnet_openpose/0032.png +0 -0
- data/controlnet_image/test/controlnet_openpose/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_scribble/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_seg/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_shuffle/put_pngs_here.txt +0 -0
- data/controlnet_image/test/controlnet_softedge/0000.png +0 -0
- data/controlnet_image/test/controlnet_softedge/0016.png +0 -0
- data/controlnet_image/test/controlnet_softedge/0032.png +0 -0
- data/controlnet_image/test/controlnet_softedge/put_pngs_here.txt +0 -0
.editorconfig
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# http://editorconfig.org
|
2 |
+
|
3 |
+
root = true
|
4 |
+
|
5 |
+
[*]
|
6 |
+
indent_style = space
|
7 |
+
indent_size = 4
|
8 |
+
trim_trailing_whitespace = true
|
9 |
+
insert_final_newline = true
|
10 |
+
charset = utf-8
|
11 |
+
end_of_line = lf
|
12 |
+
|
13 |
+
[*.bat]
|
14 |
+
indent_style = tab
|
15 |
+
end_of_line = crlf
|
16 |
+
|
17 |
+
[*.{json,jsonc}]
|
18 |
+
indent_style = space
|
19 |
+
indent_size = 2
|
20 |
+
|
21 |
+
[.vscode/*.{json,jsonc}]
|
22 |
+
indent_style = space
|
23 |
+
indent_size = 4
|
24 |
+
|
25 |
+
[*.{yml,yaml,toml}]
|
26 |
+
indent_style = space
|
27 |
+
indent_size = 2
|
28 |
+
|
29 |
+
[*.md]
|
30 |
+
trim_trailing_whitespace = false
|
31 |
+
|
32 |
+
[Makefile]
|
33 |
+
indent_style = tab
|
34 |
+
indent_size = 8
|
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
data/ref_image/ref_sample.png filter=lfs diff=lfs merge=lfs -text
|
.gitignore
ADDED
@@ -0,0 +1,241 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Created by https://www.toptal.com/developers/gitignore/api/linux,windows,macos,visualstudiocode,python
|
2 |
+
# Edit at https://www.toptal.com/developers/gitignore?templates=linux,windows,macos,visualstudiocode,python
|
3 |
+
|
4 |
+
### Linux ###
|
5 |
+
*~
|
6 |
+
|
7 |
+
# temporary files which can be created if a process still has a handle open of a deleted file
|
8 |
+
.fuse_hidden*
|
9 |
+
|
10 |
+
# KDE directory preferences
|
11 |
+
.directory
|
12 |
+
|
13 |
+
# Linux trash folder which might appear on any partition or disk
|
14 |
+
.Trash-*
|
15 |
+
|
16 |
+
# .nfs files are created when an open file is removed but is still being accessed
|
17 |
+
.nfs*
|
18 |
+
|
19 |
+
### macOS ###
|
20 |
+
# General
|
21 |
+
.DS_Store
|
22 |
+
.AppleDouble
|
23 |
+
.LSOverride
|
24 |
+
|
25 |
+
# Icon must end with two \r
|
26 |
+
Icon
|
27 |
+
|
28 |
+
|
29 |
+
# Thumbnails
|
30 |
+
._*
|
31 |
+
|
32 |
+
# Files that might appear in the root of a volume
|
33 |
+
.DocumentRevisions-V100
|
34 |
+
.fseventsd
|
35 |
+
.Spotlight-V100
|
36 |
+
.TemporaryItems
|
37 |
+
.Trashes
|
38 |
+
.VolumeIcon.icns
|
39 |
+
.com.apple.timemachine.donotpresent
|
40 |
+
|
41 |
+
# Directories potentially created on remote AFP share
|
42 |
+
.AppleDB
|
43 |
+
.AppleDesktop
|
44 |
+
Network Trash Folder
|
45 |
+
Temporary Items
|
46 |
+
.apdisk
|
47 |
+
|
48 |
+
### Python ###
|
49 |
+
# Byte-compiled / optimized / DLL files
|
50 |
+
__pycache__/
|
51 |
+
*.py[cod]
|
52 |
+
*$py.class
|
53 |
+
|
54 |
+
# C extensions
|
55 |
+
*.so
|
56 |
+
|
57 |
+
# Distribution / packaging
|
58 |
+
.Python
|
59 |
+
build/
|
60 |
+
develop-eggs/
|
61 |
+
dist/
|
62 |
+
downloads/
|
63 |
+
eggs/
|
64 |
+
.eggs/
|
65 |
+
lib/
|
66 |
+
lib64/
|
67 |
+
parts/
|
68 |
+
sdist/
|
69 |
+
var/
|
70 |
+
wheels/
|
71 |
+
share/python-wheels/
|
72 |
+
*.egg-info/
|
73 |
+
.installed.cfg
|
74 |
+
*.egg
|
75 |
+
MANIFEST
|
76 |
+
|
77 |
+
# PyInstaller
|
78 |
+
# Usually these files are written by a python script from a template
|
79 |
+
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
80 |
+
*.manifest
|
81 |
+
*.spec
|
82 |
+
|
83 |
+
# Installer logs
|
84 |
+
pip-log.txt
|
85 |
+
pip-delete-this-directory.txt
|
86 |
+
|
87 |
+
# Unit test / coverage reports
|
88 |
+
htmlcov/
|
89 |
+
.tox/
|
90 |
+
.nox/
|
91 |
+
.coverage
|
92 |
+
.coverage.*
|
93 |
+
.cache
|
94 |
+
nosetests.xml
|
95 |
+
coverage.xml
|
96 |
+
*.cover
|
97 |
+
*.py,cover
|
98 |
+
.hypothesis/
|
99 |
+
.pytest_cache/
|
100 |
+
cover/
|
101 |
+
|
102 |
+
# Translations
|
103 |
+
*.mo
|
104 |
+
*.pot
|
105 |
+
|
106 |
+
# Django stuff:
|
107 |
+
*.log
|
108 |
+
local_settings.py
|
109 |
+
db.sqlite3
|
110 |
+
db.sqlite3-journal
|
111 |
+
|
112 |
+
# Flask stuff:
|
113 |
+
instance/
|
114 |
+
.webassets-cache
|
115 |
+
|
116 |
+
# Scrapy stuff:
|
117 |
+
.scrapy
|
118 |
+
|
119 |
+
# Sphinx documentation
|
120 |
+
docs/_build/
|
121 |
+
|
122 |
+
# PyBuilder
|
123 |
+
.pybuilder/
|
124 |
+
target/
|
125 |
+
|
126 |
+
# Jupyter Notebook
|
127 |
+
.ipynb_checkpoints
|
128 |
+
|
129 |
+
# IPython
|
130 |
+
profile_default/
|
131 |
+
ipython_config.py
|
132 |
+
|
133 |
+
# pyenv
|
134 |
+
# For a library or package, you might want to ignore these files since the code is
|
135 |
+
# intended to run in multiple environments; otherwise, check them in:
|
136 |
+
# .python-version
|
137 |
+
|
138 |
+
# pipenv
|
139 |
+
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
140 |
+
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
141 |
+
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
142 |
+
# install all needed dependencies.
|
143 |
+
#Pipfile.lock
|
144 |
+
|
145 |
+
# PEP 582; used by e.g. github.com/David-OConnor/pyflow
|
146 |
+
__pypackages__/
|
147 |
+
|
148 |
+
# Celery stuff
|
149 |
+
celerybeat-schedule
|
150 |
+
celerybeat.pid
|
151 |
+
|
152 |
+
# SageMath parsed files
|
153 |
+
*.sage.py
|
154 |
+
|
155 |
+
# Environments
|
156 |
+
.env
|
157 |
+
.venv
|
158 |
+
env/
|
159 |
+
venv/
|
160 |
+
ENV/
|
161 |
+
env.bak/
|
162 |
+
venv.bak/
|
163 |
+
|
164 |
+
# Spyder project settings
|
165 |
+
.spyderproject
|
166 |
+
.spyproject
|
167 |
+
|
168 |
+
# Rope project settings
|
169 |
+
.ropeproject
|
170 |
+
|
171 |
+
# mkdocs documentation
|
172 |
+
/site
|
173 |
+
|
174 |
+
# mypy
|
175 |
+
.mypy_cache/
|
176 |
+
.dmypy.json
|
177 |
+
dmypy.json
|
178 |
+
|
179 |
+
# Pyre type checker
|
180 |
+
.pyre/
|
181 |
+
|
182 |
+
# pytype static type analyzer
|
183 |
+
.pytype/
|
184 |
+
|
185 |
+
# Cython debug symbols
|
186 |
+
cython_debug/
|
187 |
+
|
188 |
+
### VisualStudioCode ###
|
189 |
+
.vscode/*
|
190 |
+
!.vscode/settings.json
|
191 |
+
!.vscode/tasks.json
|
192 |
+
!.vscode/launch.json
|
193 |
+
!.vscode/extensions.json
|
194 |
+
*.code-workspace
|
195 |
+
|
196 |
+
# Local History for Visual Studio Code
|
197 |
+
.history/
|
198 |
+
|
199 |
+
### VisualStudioCode Patch ###
|
200 |
+
# Ignore all local history of files
|
201 |
+
.history
|
202 |
+
.ionide
|
203 |
+
|
204 |
+
### Windows ###
|
205 |
+
# Windows thumbnail cache files
|
206 |
+
Thumbs.db
|
207 |
+
Thumbs.db:encryptable
|
208 |
+
ehthumbs.db
|
209 |
+
ehthumbs_vista.db
|
210 |
+
|
211 |
+
# Dump file
|
212 |
+
*.stackdump
|
213 |
+
|
214 |
+
# Folder config file
|
215 |
+
[Dd]esktop.ini
|
216 |
+
|
217 |
+
# Recycle Bin used on file shares
|
218 |
+
$RECYCLE.BIN/
|
219 |
+
|
220 |
+
# Windows Installer files
|
221 |
+
*.cab
|
222 |
+
*.msi
|
223 |
+
*.msix
|
224 |
+
*.msm
|
225 |
+
*.msp
|
226 |
+
|
227 |
+
# Windows shortcuts
|
228 |
+
*.lnk
|
229 |
+
|
230 |
+
# End of https://www.toptal.com/developers/gitignore/api/linux,windows,macos,visualstudiocode,python
|
231 |
+
|
232 |
+
# setuptools-scm _version file
|
233 |
+
src/animatediff/_version.py
|
234 |
+
|
235 |
+
# local misc and temp
|
236 |
+
/misc/
|
237 |
+
/temp/
|
238 |
+
|
239 |
+
# envrc
|
240 |
+
.env*
|
241 |
+
!.envrc.example
|
.pre-commit-config.yaml
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# See https://pre-commit.com for more information
|
2 |
+
ci:
|
3 |
+
autofix_prs: true
|
4 |
+
autoupdate_branch: "main"
|
5 |
+
autoupdate_commit_msg: "[pre-commit.ci] pre-commit autoupdate"
|
6 |
+
autoupdate_schedule: weekly
|
7 |
+
|
8 |
+
repos:
|
9 |
+
- repo: https://github.com/astral-sh/ruff-pre-commit
|
10 |
+
rev: "v0.0.281"
|
11 |
+
hooks:
|
12 |
+
- id: ruff
|
13 |
+
args: ["--fix", "--exit-non-zero-on-fix"]
|
14 |
+
|
15 |
+
- repo: https://github.com/psf/black
|
16 |
+
rev: 23.7.0
|
17 |
+
hooks:
|
18 |
+
- id: black
|
19 |
+
args: ["--line-length=110"]
|
20 |
+
|
21 |
+
- repo: https://github.com/pre-commit/pre-commit-hooks
|
22 |
+
rev: v4.4.0
|
23 |
+
hooks:
|
24 |
+
- id: trailing-whitespace
|
25 |
+
args: [--markdown-linebreak-ext=md]
|
26 |
+
- id: end-of-file-fixer
|
27 |
+
- id: check-yaml
|
28 |
+
- id: check-added-large-files
|
.vscode/settings.json
ADDED
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"editor.insertSpaces": true,
|
3 |
+
"editor.tabSize": 4,
|
4 |
+
"files.trimTrailingWhitespace": true,
|
5 |
+
"editor.rulers": [100, 120],
|
6 |
+
|
7 |
+
"files.associations": {
|
8 |
+
"*.yaml": "yaml"
|
9 |
+
},
|
10 |
+
|
11 |
+
"files.exclude": {
|
12 |
+
"**/.git": true,
|
13 |
+
"**/.svn": true,
|
14 |
+
"**/.hg": true,
|
15 |
+
"**/CVS": true,
|
16 |
+
"**/.DS_Store": true,
|
17 |
+
"**/Thumbs.db": true,
|
18 |
+
"**/__pycache__": true
|
19 |
+
},
|
20 |
+
|
21 |
+
"[python]": {
|
22 |
+
"editor.wordBasedSuggestions": false,
|
23 |
+
"editor.formatOnSave": true,
|
24 |
+
"editor.defaultFormatter": "ms-python.black-formatter",
|
25 |
+
"editor.codeActionsOnSave": {
|
26 |
+
"source.organizeImports": true
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"python.analysis.include": ["./src", "./scripts", "./tests"],
|
30 |
+
|
31 |
+
"python.linting.enabled": false,
|
32 |
+
"python.linting.pylintEnabled": false,
|
33 |
+
"python.linting.flake8Enabled": true,
|
34 |
+
"python.linting.flake8Args": ["--config=${workspaceFolder}/setup.cfg"],
|
35 |
+
|
36 |
+
"[json]": {
|
37 |
+
"editor.tabSize": 2,
|
38 |
+
"editor.detectIndentation": false,
|
39 |
+
"editor.formatOnSave": true,
|
40 |
+
"editor.formatOnSaveMode": "file"
|
41 |
+
},
|
42 |
+
|
43 |
+
"[toml]": {
|
44 |
+
"editor.tabSize": 2,
|
45 |
+
"editor.detectIndentation": false,
|
46 |
+
"editor.formatOnSave": true,
|
47 |
+
"editor.formatOnSaveMode": "file",
|
48 |
+
"editor.defaultFormatter": "tamasfe.even-better-toml",
|
49 |
+
"editor.rulers": [80, 100]
|
50 |
+
},
|
51 |
+
"evenBetterToml.formatter.columnWidth": 88,
|
52 |
+
|
53 |
+
"[yaml]": {
|
54 |
+
"editor.detectIndentation": false,
|
55 |
+
"editor.tabSize": 2,
|
56 |
+
"editor.formatOnSave": true,
|
57 |
+
"editor.formatOnSaveMode": "file"
|
58 |
+
},
|
59 |
+
"yaml.format.bracketSpacing": true,
|
60 |
+
"yaml.format.proseWrap": "preserve",
|
61 |
+
"yaml.format.singleQuote": false,
|
62 |
+
"yaml.format.printWidth": 110,
|
63 |
+
|
64 |
+
"[markdown]": {
|
65 |
+
"files.trimTrailingWhitespace": false
|
66 |
+
},
|
67 |
+
|
68 |
+
"css.lint.validProperties": ["dock", "content-align", "content-justify"],
|
69 |
+
"[css]": {
|
70 |
+
"editor.formatOnSave": true
|
71 |
+
},
|
72 |
+
|
73 |
+
"remote.autoForwardPorts": false,
|
74 |
+
"remote.autoForwardPortsSource": "process"
|
75 |
+
}
|
COPYING
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Copyright (c) 2023, Andi Powers-Holmes
|
2 |
+
|
3 |
+
Licensed under the Apache License, Version 2.0 (the "License");
|
4 |
+
you may not use this file except in compliance with the License.
|
5 |
+
You may obtain a copy of the License at
|
6 |
+
|
7 |
+
http://www.apache.org/licenses/LICENSE-2.0
|
8 |
+
|
9 |
+
Unless required by applicable law or agreed to in writing, software
|
10 |
+
distributed under the License is distributed on an "AS IS" BASIS,
|
11 |
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
12 |
+
See the License for the specific language governing permissions and
|
13 |
+
limitations under the License.
|
LICENSE.md
ADDED
@@ -0,0 +1,194 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Apache License
|
2 |
+
==============
|
3 |
+
|
4 |
+
_Version 2.0, January 2004_
|
5 |
+
_<<http://www.apache.org/licenses/>>_
|
6 |
+
|
7 |
+
### Terms and Conditions for use, reproduction, and distribution
|
8 |
+
|
9 |
+
#### 1. Definitions
|
10 |
+
|
11 |
+
“License” shall mean the terms and conditions for use, reproduction, and
|
12 |
+
distribution as defined by Sections 1 through 9 of this document.
|
13 |
+
|
14 |
+
“Licensor” shall mean the copyright owner or entity authorized by the copyright
|
15 |
+
owner that is granting the License.
|
16 |
+
|
17 |
+
“Legal Entity” shall mean the union of the acting entity and all other entities
|
18 |
+
that control, are controlled by, or are under common control with that entity.
|
19 |
+
For the purposes of this definition, “control” means **(i)** the power, direct or
|
20 |
+
indirect, to cause the direction or management of such entity, whether by
|
21 |
+
contract or otherwise, or **(ii)** ownership of fifty percent (50%) or more of the
|
22 |
+
outstanding shares, or **(iii)** beneficial ownership of such entity.
|
23 |
+
|
24 |
+
“You” (or “Your”) shall mean an individual or Legal Entity exercising
|
25 |
+
permissions granted by this License.
|
26 |
+
|
27 |
+
“Source” form shall mean the preferred form for making modifications, including
|
28 |
+
but not limited to software source code, documentation source, and configuration
|
29 |
+
files.
|
30 |
+
|
31 |
+
“Object” form shall mean any form resulting from mechanical transformation or
|
32 |
+
translation of a Source form, including but not limited to compiled object code,
|
33 |
+
generated documentation, and conversions to other media types.
|
34 |
+
|
35 |
+
“Work” shall mean the work of authorship, whether in Source or Object form, made
|
36 |
+
available under the License, as indicated by a copyright notice that is included
|
37 |
+
in or attached to the work (an example is provided in the Appendix below).
|
38 |
+
|
39 |
+
“Derivative Works” shall mean any work, whether in Source or Object form, that
|
40 |
+
is based on (or derived from) the Work and for which the editorial revisions,
|
41 |
+
annotations, elaborations, or other modifications represent, as a whole, an
|
42 |
+
original work of authorship. For the purposes of this License, Derivative Works
|
43 |
+
shall not include works that remain separable from, or merely link (or bind by
|
44 |
+
name) to the interfaces of, the Work and Derivative Works thereof.
|
45 |
+
|
46 |
+
“Contribution” shall mean any work of authorship, including the original version
|
47 |
+
of the Work and any modifications or additions to that Work or Derivative Works
|
48 |
+
thereof, that is intentionally submitted to Licensor for inclusion in the Work
|
49 |
+
by the copyright owner or by an individual or Legal Entity authorized to submit
|
50 |
+
on behalf of the copyright owner. For the purposes of this definition,
|
51 |
+
“submitted” means any form of electronic, verbal, or written communication sent
|
52 |
+
to the Licensor or its representatives, including but not limited to
|
53 |
+
communication on electronic mailing lists, source code control systems, and
|
54 |
+
issue tracking systems that are managed by, or on behalf of, the Licensor for
|
55 |
+
the purpose of discussing and improving the Work, but excluding communication
|
56 |
+
that is conspicuously marked or otherwise designated in writing by the copyright
|
57 |
+
owner as “Not a Contribution.”
|
58 |
+
|
59 |
+
“Contributor” shall mean Licensor and any individual or Legal Entity on behalf
|
60 |
+
of whom a Contribution has been received by Licensor and subsequently
|
61 |
+
incorporated within the Work.
|
62 |
+
|
63 |
+
#### 2. Grant of Copyright License
|
64 |
+
|
65 |
+
Subject to the terms and conditions of this License, each Contributor hereby
|
66 |
+
grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free,
|
67 |
+
irrevocable copyright license to reproduce, prepare Derivative Works of,
|
68 |
+
publicly display, publicly perform, sublicense, and distribute the Work and such
|
69 |
+
Derivative Works in Source or Object form.
|
70 |
+
|
71 |
+
#### 3. Grant of Patent License
|
72 |
+
|
73 |
+
Subject to the terms and conditions of this License, each Contributor hereby
|
74 |
+
grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free,
|
75 |
+
irrevocable (except as stated in this section) patent license to make, have
|
76 |
+
made, use, offer to sell, sell, import, and otherwise transfer the Work, where
|
77 |
+
such license applies only to those patent claims licensable by such Contributor
|
78 |
+
that are necessarily infringed by their Contribution(s) alone or by combination
|
79 |
+
of their Contribution(s) with the Work to which such Contribution(s) was
|
80 |
+
submitted. If You institute patent litigation against any entity (including a
|
81 |
+
cross-claim or counterclaim in a lawsuit) alleging that the Work or a
|
82 |
+
Contribution incorporated within the Work constitutes direct or contributory
|
83 |
+
patent infringement, then any patent licenses granted to You under this License
|
84 |
+
for that Work shall terminate as of the date such litigation is filed.
|
85 |
+
|
86 |
+
#### 4. Redistribution
|
87 |
+
|
88 |
+
You may reproduce and distribute copies of the Work or Derivative Works thereof
|
89 |
+
in any medium, with or without modifications, and in Source or Object form,
|
90 |
+
provided that You meet the following conditions:
|
91 |
+
|
92 |
+
* **(a)** You must give any other recipients of the Work or Derivative Works a copy of
|
93 |
+
this License; and
|
94 |
+
* **(b)** You must cause any modified files to carry prominent notices stating that You
|
95 |
+
changed the files; and
|
96 |
+
* **(c)** You must retain, in the Source form of any Derivative Works that You distribute,
|
97 |
+
all copyright, patent, trademark, and attribution notices from the Source form
|
98 |
+
of the Work, excluding those notices that do not pertain to any part of the
|
99 |
+
Derivative Works; and
|
100 |
+
* **(d)** If the Work includes a “NOTICE” text file as part of its distribution, then any
|
101 |
+
Derivative Works that You distribute must include a readable copy of the
|
102 |
+
attribution notices contained within such NOTICE file, excluding those notices
|
103 |
+
that do not pertain to any part of the Derivative Works, in at least one of the
|
104 |
+
following places: within a NOTICE text file distributed as part of the
|
105 |
+
Derivative Works; within the Source form or documentation, if provided along
|
106 |
+
with the Derivative Works; or, within a display generated by the Derivative
|
107 |
+
Works, if and wherever such third-party notices normally appear. The contents of
|
108 |
+
the NOTICE file are for informational purposes only and do not modify the
|
109 |
+
License. You may add Your own attribution notices within Derivative Works that
|
110 |
+
You distribute, alongside or as an addendum to the NOTICE text from the Work,
|
111 |
+
provided that such additional attribution notices cannot be construed as
|
112 |
+
modifying the License.
|
113 |
+
|
114 |
+
You may add Your own copyright statement to Your modifications and may provide
|
115 |
+
additional or different license terms and conditions for use, reproduction, or
|
116 |
+
distribution of Your modifications, or for any such Derivative Works as a whole,
|
117 |
+
provided Your use, reproduction, and distribution of the Work otherwise complies
|
118 |
+
with the conditions stated in this License.
|
119 |
+
|
120 |
+
#### 5. Submission of Contributions
|
121 |
+
|
122 |
+
Unless You explicitly state otherwise, any Contribution intentionally submitted
|
123 |
+
for inclusion in the Work by You to the Licensor shall be under the terms and
|
124 |
+
conditions of this License, without any additional terms or conditions.
|
125 |
+
Notwithstanding the above, nothing herein shall supersede or modify the terms of
|
126 |
+
any separate license agreement you may have executed with Licensor regarding
|
127 |
+
such Contributions.
|
128 |
+
|
129 |
+
#### 6. Trademarks
|
130 |
+
|
131 |
+
This License does not grant permission to use the trade names, trademarks,
|
132 |
+
service marks, or product names of the Licensor, except as required for
|
133 |
+
reasonable and customary use in describing the origin of the Work and
|
134 |
+
reproducing the content of the NOTICE file.
|
135 |
+
|
136 |
+
#### 7. Disclaimer of Warranty
|
137 |
+
|
138 |
+
Unless required by applicable law or agreed to in writing, Licensor provides the
|
139 |
+
Work (and each Contributor provides its Contributions) on an “AS IS” BASIS,
|
140 |
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied,
|
141 |
+
including, without limitation, any warranties or conditions of TITLE,
|
142 |
+
NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are
|
143 |
+
solely responsible for determining the appropriateness of using or
|
144 |
+
redistributing the Work and assume any risks associated with Your exercise of
|
145 |
+
permissions under this License.
|
146 |
+
|
147 |
+
#### 8. Limitation of Liability
|
148 |
+
|
149 |
+
In no event and under no legal theory, whether in tort (including negligence),
|
150 |
+
contract, or otherwise, unless required by applicable law (such as deliberate
|
151 |
+
and grossly negligent acts) or agreed to in writing, shall any Contributor be
|
152 |
+
liable to You for damages, including any direct, indirect, special, incidental,
|
153 |
+
or consequential damages of any character arising as a result of this License or
|
154 |
+
out of the use or inability to use the Work (including but not limited to
|
155 |
+
damages for loss of goodwill, work stoppage, computer failure or malfunction, or
|
156 |
+
any and all other commercial damages or losses), even if such Contributor has
|
157 |
+
been advised of the possibility of such damages.
|
158 |
+
|
159 |
+
#### 9. Accepting Warranty or Additional Liability
|
160 |
+
|
161 |
+
While redistributing the Work or Derivative Works thereof, You may choose to
|
162 |
+
offer, and charge a fee for, acceptance of support, warranty, indemnity, or
|
163 |
+
other liability obligations and/or rights consistent with this License. However,
|
164 |
+
in accepting such obligations, You may act only on Your own behalf and on Your
|
165 |
+
sole responsibility, not on behalf of any other Contributor, and only if You
|
166 |
+
agree to indemnify, defend, and hold each Contributor harmless for any liability
|
167 |
+
incurred by, or claims asserted against, such Contributor by reason of your
|
168 |
+
accepting any such warranty or additional liability.
|
169 |
+
|
170 |
+
_END OF TERMS AND CONDITIONS_
|
171 |
+
|
172 |
+
### APPENDIX: How to apply the Apache License to your work
|
173 |
+
|
174 |
+
To apply the Apache License to your work, attach the following boilerplate
|
175 |
+
notice, with the fields enclosed by brackets `[]` replaced with your own
|
176 |
+
identifying information. (Don't include the brackets!) The text should be
|
177 |
+
enclosed in the appropriate comment syntax for the file format. We also
|
178 |
+
recommend that a file or class name and description of purpose be included on
|
179 |
+
the same “printed page” as the copyright notice for easier identification within
|
180 |
+
third-party archives.
|
181 |
+
|
182 |
+
Copyright [yyyy] [name of copyright owner]
|
183 |
+
|
184 |
+
Licensed under the Apache License, Version 2.0 (the "License");
|
185 |
+
you may not use this file except in compliance with the License.
|
186 |
+
You may obtain a copy of the License at
|
187 |
+
|
188 |
+
http://www.apache.org/licenses/LICENSE-2.0
|
189 |
+
|
190 |
+
Unless required by applicable law or agreed to in writing, software
|
191 |
+
distributed under the License is distributed on an "AS IS" BASIS,
|
192 |
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
193 |
+
See the License for the specific language governing permissions and
|
194 |
+
limitations under the License.
|
MANIFEST.in
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
# setuptools_scm will grab all tracked files, minus these exclusions
|
2 |
+
prune .vscode
|
README.md
ADDED
@@ -0,0 +1,596 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# AnimateDiff prompt travel
|
2 |
+
|
3 |
+
[AnimateDiff](https://github.com/guoyww/AnimateDiff) with prompt travel + [ControlNet](https://github.com/lllyasviel/ControlNet) + [IP-Adapter](https://github.com/tencent-ailab/IP-Adapter)
|
4 |
+
|
5 |
+
I added an experimental feature to animatediff-cli that changes the prompt partway through the frames.
|
6 |
+
|
7 |
+
It seems to work surprisingly well!
|
8 |
+
|
9 |
+
### Example
|
10 |
+
- [A command for video stylization with a mask has been added](https://github.com/s9roll7/animatediff-cli-prompt-travel#video-stylization-with-mask).
|
11 |
+
|
12 |
+
<div><video controls src="https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/e2ce68b0-f904-4fc3-8d5c-2224b5ffc1d3" muted="false"></video></div>
|
13 |
+
<br>
|
14 |
+
|
15 |
+
- [A command to automate video stylization has been added](https://github.com/s9roll7/animatediff-cli-prompt-travel#video-stylization).
|
16 |
+
- Original / First generation result / Second generation(for upscaling) result
|
17 |
+
- It took 4 minutes to generate the first one and about 5 minutes to generate the second one (on rtx 4090).
|
18 |
+
- more examples [here](https://github.com/s9roll7/animatediff-cli-prompt-travel/issues/29)
|
19 |
+
|
20 |
+
<div><video controls src="https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/2f1965f2-9a50-485e-ac95-e888a3189ba2" muted="false"></video></div>
|
21 |
+
<br>
|
22 |
+
|
23 |
+
- Numbered from left to right.
|
24 |
+
- 1.prompt + lora
|
25 |
+
- 2.prompt + lora + IP-Adapter(scale 0.5)
|
26 |
+
- 3.prompt + lora + IP-Adapter Plus(scale 0.5)
|
27 |
+
- 4.prompt + lora + Controlnet Reference Only(style_fidelity 0)
|
28 |
+
- input image
|
29 |
+
|
30 |
+
![0000](https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/4ae90f13-341d-4965-adfc-174ec2e61cd7)
|
31 |
+
|
32 |
+
|
33 |
+
<div><video controls src="https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/d9d300a9-1107-4a3b-a1f1-3245b49dde10" muted="false"></video></div>
|
34 |
+
<br>
|
35 |
+
|
36 |
+
|
37 |
+
- controlnet_openpose + controlnet_softedge
|
38 |
+
- input frames for controlnet(0,16,32 frames)
|
39 |
+
<img src="https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/4adac698-75a4-4c6d-bf64-a5723d0e3e77" width="512">
|
40 |
+
|
41 |
+
- result
|
42 |
+
<div><video controls src="https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/50aa9d0d-15b6-4c84-a497-8d020d3bdb7c" muted="false"></video></div>
|
43 |
+
<br>
|
44 |
+
|
45 |
+
- In the latest version, generation can now be controlled more precisely through prompts.
|
46 |
+
- sample 1
|
47 |
+
```json
|
48 |
+
"prompt_fixed_ratio": 0.8,
|
49 |
+
"head_prompt": "1girl, wizard, circlet, earrings, jewelry, purple hair,",
|
50 |
+
"prompt_map": {
|
51 |
+
"0": "(standing,full_body),blue_sky, town",
|
52 |
+
"8": "(sitting,full_body),rain, town",
|
53 |
+
"16": "(standing,full_body),blue_sky, woods",
|
54 |
+
"24": "(upper_body), beach",
|
55 |
+
"32": "(upper_body, smile)",
|
56 |
+
"40": "(upper_body, angry)",
|
57 |
+
"48": "(upper_body, smile, from_above)",
|
58 |
+
"56": "(upper_body, angry, from_side)",
|
59 |
+
"64": "(upper_body, smile, from_below)",
|
60 |
+
"72": "(upper_body, angry, from_behind, looking at viewer)",
|
61 |
+
"80": "face,looking at viewer",
|
62 |
+
"88": "face,looking at viewer, closed_eyes",
|
63 |
+
"96": "face,looking at viewer, open eyes, open_mouth",
|
64 |
+
"104": "face,looking at viewer, closed_eyes, closed_mouth",
|
65 |
+
"112": "face,looking at viewer, open eyes,eyes, open_mouth, tongue, smile, laughing",
|
66 |
+
"120": "face,looking at viewer, eating, bowl,chopsticks,holding,food"
|
67 |
+
},
|
68 |
+
```
|
69 |
+
<div><video controls src="https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/c4de4b87-f302-4d61-98c7-9607dece386f" muted="false"></video></div>
|
70 |
+
<br>
|
71 |
+
|
72 |
+
- sample 2
|
73 |
+
```json
|
74 |
+
"prompt_fixed_ratio": 1.0,
|
75 |
+
"head_prompt": "1girl, wizard, circlet, earrings, jewelry, purple hair,",
|
76 |
+
"prompt_map": {
|
77 |
+
"0": "",
|
78 |
+
"8": "((fire magic spell, fire background))",
|
79 |
+
"16": "((ice magic spell, ice background))",
|
80 |
+
"24": "((thunder magic spell, thunder background))",
|
81 |
+
"32": "((skull magic spell, skull background))",
|
82 |
+
"40": "((wind magic spell, wind background))",
|
83 |
+
"48": "((stone magic spell, stone background))",
|
84 |
+
"56": "((holy magic spell, holy background))",
|
85 |
+
"64": "((star magic spell, star background))",
|
86 |
+
"72": "((plant magic spell, plant background))",
|
87 |
+
"80": "((meteor magic spell, meteor background))"
|
88 |
+
},
|
89 |
+
```
|
90 |
+
<div><video controls src="https://github.com/s9roll7/animatediff-cli-prompt-travel/assets/118420657/31a5827d-e551-4937-8b67-51747a92d14c" muted="false"></video></div>
|
91 |
+
<br>
|
92 |
+
|
93 |
+
### Installation(for windows)
|
94 |
+
Same as the original animatediff-cli
|
95 |
+
[Python 3.10](https://www.python.org/) and git client must be installed
|
96 |
+
(A few days ago, PyTorch 2.1 was released, but it is safer to install the older version until things settle down.
|
97 |
+
[#87](https://github.com/s9roll7/animatediff-cli-prompt-travel/issues/87))
|
98 |
+
```sh
|
99 |
+
git clone https://github.com/s9roll7/animatediff-cli-prompt-travel.git
|
100 |
+
cd animatediff-cli-prompt-travel
|
101 |
+
py -3.10 -m venv venv
|
102 |
+
venv\Scripts\activate.bat
|
103 |
+
set PYTHONUTF8=1
|
104 |
+
python -m pip install --upgrade pip
|
105 |
+
# Torch installation must be modified to suit the environment. (https://pytorch.org/get-started/previous-versions/)
|
106 |
+
python -m pip install torch==2.0.1+cu118 torchvision==0.15.2+cu118 torchaudio==2.0.2 --index-url https://download.pytorch.org/whl/cu118
|
107 |
+
python -m pip install -e .
|
108 |
+
python -m pip install xformers
|
109 |
+
|
110 |
+
# If you want to use the 'stylize' command, you will also need
|
111 |
+
python -m pip install -e .[stylize]
|
112 |
+
|
113 |
+
# If you want to use dwpose as a preprocessor for controlnet_openpose, you will also need
|
114 |
+
python -m pip install -e .[dwpose]
|
115 |
+
# (DWPose is a more powerful version of Openpose)
|
116 |
+
|
117 |
+
# If you want to use the 'stylize create-mask' and 'stylize composite' command, you will also need
|
118 |
+
python -m pip install -e .[stylize_mask]
|
119 |
+
```
|
120 |
+
(https://www.reddit.com/r/StableDiffusion/comments/157c0wl/working_animatediff_cli_windows_install/)
|
121 |
+
|
122 |
+
I found a detailed tutorial
|
123 |
+
(https://www.reddit.com/r/StableDiffusion/comments/16vlk9j/guide_to_creating_videos_with/)
|
124 |
+
(https://www.youtube.com/watch?v=7_hh3wOD81s)
|
125 |
+
|
126 |
+
### How To Use
|
127 |
+
Almost the same as the original animatediff-cli, but with a slight change in the config format.
|
128 |
+
```json
|
129 |
+
# prompt_travel.json
|
130 |
+
{
|
131 |
+
"name": "sample",
|
132 |
+
"path": "share/Stable-diffusion/mistoonAnime_v20.safetensors", # Specify Checkpoint as a path relative to /animatediff-cli/data
|
133 |
+
"vae_path":"share/VAE/vae-ft-mse-840000-ema-pruned.ckpt", # Specify vae as a path relative to /animatediff-cli/data
|
134 |
+
"motion_module": "models/motion-module/mm_sd_v14.ckpt", # Specify motion module as a path relative to /animatediff-cli/data
|
135 |
+
"compile": false,
|
136 |
+
"seed": [
|
137 |
+
341774366206100,-1,-1 # -1 means random. If "--repeats 3" is specified with this setting, the first seed will be 341774366206100, and the second and third will be random.
|
138 |
+
],
|
139 |
+
"scheduler": "ddim", # "ddim","euler","euler_a","k_dpmpp_2m", etc...
|
140 |
+
"steps": 40,
|
141 |
+
"guidance_scale": 20, # cfg scale
|
142 |
+
"clip_skip": 2,
|
143 |
+
"head_prompt": "masterpiece, best quality, a beautiful and detailed portriat of muffet, monster girl,((purple body:1.3)),humanoid, arachnid, anthro,((fangs)),pigtails,hair bows,5 eyes,spider girl,6 arms,solo",
|
144 |
+
"prompt_map": { # "FRAME" : "PROMPT" format / ex. prompt for frame 32 is "head_prompt" + prompt_map["32"] + "tail_prompt"
|
145 |
+
"0": "smile standing,((spider webs:1.0))",
|
146 |
+
"32": "(((walking))),((spider webs:1.0))",
|
147 |
+
"64": "(((running))),((spider webs:2.0)),wide angle lens, fish eye effect",
|
148 |
+
"96": "(((sitting))),((spider webs:1.0))"
|
149 |
+
},
|
150 |
+
"tail_prompt": "clothed, open mouth, awesome and detailed background, holding teapot, holding teacup, 6 hands,detailed hands,storefront that sells pastries and tea,bloomers,(red and black clothing),inside,pouring into teacup,muffetwear",
|
151 |
+
"n_prompt": [
|
152 |
+
"(worst quality, low quality:1.4),nudity,simple background,border,mouth closed,text, patreon,bed,bedroom,white background,((monochrome)),sketch,(pink body:1.4),7 arms,8 arms,4 arms"
|
153 |
+
],
|
154 |
+
"lora_map": { # "PATH_TO_LORA" : STRENGTH format
|
155 |
+
"share/Lora/muffet_v2.safetensors" : 1.0, # Specify lora as a path relative to /animatediff-cli/data
|
156 |
+
"share/Lora/add_detail.safetensors" : 1.0 # Lora support is limited. Not all formats can be used!!!
|
157 |
+
},
|
158 |
+
"motion_lora_map": { # "PATH_TO_LORA" : STRENGTH format
|
159 |
+
"models/motion_lora/v2_lora_RollingAnticlockwise.ckpt":0.5, # Currently, the officially distributed lora seems to work only for v2 motion modules (mm_sd_v15_v2.ckpt).
|
160 |
+
"models/motion_lora/v2_lora_ZoomIn.ckpt":0.5
|
161 |
+
},
|
162 |
+
"ip_adapter_map": { # config for ip-adapter
|
163 |
+
# enable/disable (important)
|
164 |
+
"enable": true,
|
165 |
+
# Specify input image directory relative to /animatediff-cli/data (important! No need to specify frames in the config file. The effect on generation is exactly the same logic as the placement of the prompt)
|
166 |
+
"input_image_dir": "ip_adapter_image/test",
|
167 |
+
# save input image or not
|
168 |
+
"save_input_image": true,
|
169 |
+
# Ratio of image prompt vs text prompt (important). Even if you want to emphasize only the image prompt in 1.0, do not leave prompt/neg prompt empty, but specify a general text such as "best quality".
|
170 |
+
"scale": 0.5,
|
171 |
+
# IP-Adapter or IP-Adapter Plus or IP-Adapter Plus Face (important). Each gives a completely different outcome. PLUS does not always give a superior result.
|
172 |
+
"is_plus_face": true,
|
173 |
+
"is_plus": true
|
174 |
+
},
|
175 |
+
"controlnet_map": { # config for controlnet(for generation)
|
176 |
+
"input_image_dir" : "controlnet_image/test", # Specify input image directory relative to /animatediff-cli/data (important! Please refer to the directory structure of sample. No need to specify frames in the config file.)
|
177 |
+
"max_samples_on_vram" : 200, # If you specify a large number of images for controlnet and vram will not be enough, reduce this value. 0 means that everything should be placed in cpu.
|
178 |
+
"max_models_on_vram" : 3, # Number of controlnet models to be placed in vram
|
179 |
+
"save_detectmap" : true, # save preprocessed image or not
|
180 |
+
"preprocess_on_gpu": true, # run preprocess on gpu or not (It probably does not affect vram usage at peak, so it should always be set to true.)
|
181 |
+
"is_loop": true, # Whether controlnet effects consider loop
|
182 |
+
|
183 |
+
"controlnet_tile":{ # config for controlnet_tile
|
184 |
+
"enable": true, # enable/disable (important)
|
185 |
+
"use_preprocessor":true, # Whether to use a preprocessor for each controlnet type
|
186 |
+
"preprocessor":{ # If not specified, the default preprocessor is selected.(Most of the time the default should be fine.)
|
187 |
+
# none/blur/tile_resample/upernet_seg/ or key in controlnet_aux.processor.MODELS
|
188 |
+
# https://github.com/patrickvonplaten/controlnet_aux/blob/2fd027162e7aef8c18d0a9b5a344727d37f4f13d/src/controlnet_aux/processor.py#L20
|
189 |
+
"type" : "tile_resample",
|
190 |
+
"param":{
|
191 |
+
"down_sampling_rate":2.0
|
192 |
+
}
|
193 |
+
},
|
194 |
+
"guess_mode":false,
|
195 |
+
"controlnet_conditioning_scale": 1.0, # control weight (important)
|
196 |
+
"control_guidance_start": 0.0, # starting control step
|
197 |
+
"control_guidance_end": 1.0, # ending control step
|
198 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1] # list of influences on neighboring frames (important)
|
199 |
+
}, # This means that there is an impact of 0.5 on both neighboring frames and 0.4 on the one next to it. Try lengthening, shortening, or changing the values inside.
|
200 |
+
"controlnet_ip2p":{
|
201 |
+
"enable": true,
|
202 |
+
"use_preprocessor":true,
|
203 |
+
"guess_mode":false,
|
204 |
+
"controlnet_conditioning_scale": 1.0,
|
205 |
+
"control_guidance_start": 0.0,
|
206 |
+
"control_guidance_end": 1.0,
|
207 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
208 |
+
},
|
209 |
+
"controlnet_lineart_anime":{
|
210 |
+
"enable": true,
|
211 |
+
"use_preprocessor":true,
|
212 |
+
"guess_mode":false,
|
213 |
+
"controlnet_conditioning_scale": 1.0,
|
214 |
+
"control_guidance_start": 0.0,
|
215 |
+
"control_guidance_end": 1.0,
|
216 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
217 |
+
},
|
218 |
+
"controlnet_openpose":{
|
219 |
+
"enable": true,
|
220 |
+
"use_preprocessor":true,
|
221 |
+
"guess_mode":false,
|
222 |
+
"controlnet_conditioning_scale": 1.0,
|
223 |
+
"control_guidance_start": 0.0,
|
224 |
+
"control_guidance_end": 1.0,
|
225 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
226 |
+
},
|
227 |
+
"controlnet_softedge":{
|
228 |
+
"enable": true,
|
229 |
+
"use_preprocessor":true,
|
230 |
+
"preprocessor":{
|
231 |
+
"type" : "softedge_pidsafe",
|
232 |
+
"param":{
|
233 |
+
}
|
234 |
+
},
|
235 |
+
"guess_mode":false,
|
236 |
+
"controlnet_conditioning_scale": 1.0,
|
237 |
+
"control_guidance_start": 0.0,
|
238 |
+
"control_guidance_end": 1.0,
|
239 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
240 |
+
},
|
241 |
+
"controlnet_ref": {
|
242 |
+
"enable": false, # enable/disable (important)
|
243 |
+
"ref_image": "ref_image/ref_sample.png", # path to reference image.
|
244 |
+
"attention_auto_machine_weight": 1.0,
|
245 |
+
"gn_auto_machine_weight": 1.0,
|
246 |
+
"style_fidelity": 0.5, # control weight-like parameter(important)
|
247 |
+
"reference_attn": true, # [attn=true , adain=false] means "reference_only"
|
248 |
+
"reference_adain": false,
|
249 |
+
"scale_pattern":[0.5] # Pattern for applying controlnet_ref to frames
|
250 |
+
} # ex. [0.5] means [0.5,0.5,0.5,0.5,0.5 .... ]. All frames are affected by 50%
|
251 |
+
# ex. [1, 0] means [1,0,1,0,1,0,1,0,1,0,1 ....]. Only even frames are affected by 100%.
|
252 |
+
},
|
253 |
+
"upscale_config": { # config for tile-upscale
|
254 |
+
"scheduler": "ddim",
|
255 |
+
"steps": 20,
|
256 |
+
"strength": 0.5,
|
257 |
+
"guidance_scale": 10,
|
258 |
+
"controlnet_tile": { # config for controlnet tile
|
259 |
+
"enable": true, # enable/disable (important)
|
260 |
+
"controlnet_conditioning_scale": 1.0, # control weight (important)
|
261 |
+
"guess_mode": false,
|
262 |
+
"control_guidance_start": 0.0, # starting control step
|
263 |
+
"control_guidance_end": 1.0 # ending control step
|
264 |
+
},
|
265 |
+
"controlnet_line_anime": { # config for controlnet line anime
|
266 |
+
"enable": false,
|
267 |
+
"controlnet_conditioning_scale": 1.0,
|
268 |
+
"guess_mode": false,
|
269 |
+
"control_guidance_start": 0.0,
|
270 |
+
"control_guidance_end": 1.0
|
271 |
+
},
|
272 |
+
"controlnet_ip2p": { # config for controlnet ip2p
|
273 |
+
"enable": false,
|
274 |
+
"controlnet_conditioning_scale": 0.5,
|
275 |
+
"guess_mode": false,
|
276 |
+
"control_guidance_start": 0.0,
|
277 |
+
"control_guidance_end": 1.0
|
278 |
+
},
|
279 |
+
"controlnet_ref": { # config for controlnet ref
|
280 |
+
"enable": false, # enable/disable (important)
|
281 |
+
"use_frame_as_ref_image": false, # use original frames as ref_image for each upscale (important)
|
282 |
+
"use_1st_frame_as_ref_image": false, # use 1st original frame as ref_image for all upscale (important)
|
283 |
+
"ref_image": "ref_image/path_to_your_ref_img.jpg", # use specified image file as ref_image for all upscale (important)
|
284 |
+
"attention_auto_machine_weight": 1.0,
|
285 |
+
"gn_auto_machine_weight": 1.0,
|
286 |
+
"style_fidelity": 0.25, # control weight-like parameter(important)
|
287 |
+
"reference_attn": true, # [attn=true , adain=false] means "reference_only"
|
288 |
+
"reference_adain": false
|
289 |
+
}
|
290 |
+
},
|
291 |
+
"output":{ # output format
|
292 |
+
"format" : "gif", # gif/mp4/webm
|
293 |
+
"fps" : 8,
|
294 |
+
"encode_param":{
|
295 |
+
"crf": 10
|
296 |
+
}
|
297 |
+
}
|
298 |
+
}
|
299 |
+
```
|
300 |
+
|
301 |
+
```sh
|
302 |
+
cd animatediff-cli-prompt-travel
|
303 |
+
venv\Scripts\activate.bat
|
304 |
+
|
305 |
+
# with this setup, it took about a minute to generate in my environment(RTX4090). VRAM usage was 6-7 GB
|
306 |
+
# width 256 / height 384 / length 128 frames / context 16 frames
|
307 |
+
animatediff generate -c config/prompts/prompt_travel.json -W 256 -H 384 -L 128 -C 16
|
308 |
+
# 5min / 9-10GB
|
309 |
+
animatediff generate -c config/prompts/prompt_travel.json -W 512 -H 768 -L 128 -C 16
|
310 |
+
|
311 |
+
# upscale using controlnet (tile, line anime, ip2p, ref)
|
312 |
+
# specify the directory of the frame generated in the above step
|
313 |
+
# default config path is 'frames_dir/../prompt.json'
|
314 |
+
# here, width=512 is specified, but even if the original size is 512, it is effective in increasing detail
|
315 |
+
animatediff tile-upscale PATH_TO_TARGET_FRAME_DIRECTORY -c config/prompts/prompt_travel.json -W 512
|
316 |
+
|
317 |
+
# upscale width to 768 (smoother than tile-upscale)
|
318 |
+
animatediff refine PATH_TO_TARGET_FRAME_DIRECTORY -W 768
|
319 |
+
# If generation takes an unusually long time, there is not enough vram.
|
320 |
+
# Give up large size or reduce the size of the context.
|
321 |
+
animatediff refine PATH_TO_TARGET_FRAME_DIRECTORY -W 1024 -C 6
|
322 |
+
|
323 |
+
# change lora and prompt to make minor changes to the video.
|
324 |
+
animatediff refine PATH_TO_TARGET_FRAME_DIRECTORY -c config/prompts/some_minor_changed.json
|
325 |
+
```
|
326 |
+
|
327 |
+
#### Video Stylization
|
328 |
+
```sh
|
329 |
+
cd animatediff-cli-prompt-travel
|
330 |
+
venv\Scripts\activate.bat
|
331 |
+
|
332 |
+
# If you want to use the 'stylize' command, additional installation required
|
333 |
+
python -m pip install -e .[stylize]
|
334 |
+
|
335 |
+
# create config file from src video
|
336 |
+
animatediff stylize create-config YOUR_SRC_MOVIE_FILE.mp4
|
337 |
+
|
338 |
+
# Edit the config file by referring to the hint displayed in the log when the command finishes
|
339 |
+
# It is recommended to specify a short length for the test run
|
340 |
+
|
341 |
+
# generate(test run)
|
342 |
+
# 16 frames
|
343 |
+
animatediff stylize generate STYLYZE_DIR -L 16
|
344 |
+
# 16 frames from the 200th frame
|
345 |
+
animatediff stylize generate STYLYZE_DIR -L 16 -FO 200
|
346 |
+
|
347 |
+
# If generation takes an unusually long time, there is not enough vram.
|
348 |
+
# Give up large size or reduce the size of the context.
|
349 |
+
|
350 |
+
# generate
|
351 |
+
animatediff stylize generate STYLYZE_DIR
|
352 |
+
```
|
353 |
+
|
354 |
+
#### Video Stylization with mask
|
355 |
+
```sh
|
356 |
+
cd animatediff-cli-prompt-travel
|
357 |
+
venv\Scripts\activate.bat
|
358 |
+
|
359 |
+
# If you want to use the 'stylize create-mask' command, additional installation required
|
360 |
+
python -m pip install -e .[stylize_mask]
|
361 |
+
|
362 |
+
# [1] create config file from src video
|
363 |
+
animatediff stylize create-config YOUR_SRC_MOVIE_FILE.mp4
|
364 |
+
```
|
365 |
+
```json
|
366 |
+
# in prompt.json (generated in [1])
|
367 |
+
# [2] write the object you want to mask
|
368 |
+
# ex.) If you want to mask a person
|
369 |
+
"stylize_config": {
|
370 |
+
"create_mask": [
|
371 |
+
"person"
|
372 |
+
],
|
373 |
+
"composite": {
|
374 |
+
```
|
375 |
+
```json
|
376 |
+
# ex.) person, dog, cat
|
377 |
+
"stylize_config": {
|
378 |
+
"create_mask": [
|
379 |
+
"person", "dog", "cat"
|
380 |
+
],
|
381 |
+
"composite": {
|
382 |
+
```
|
383 |
+
```json
|
384 |
+
# ex.) boy, girl
|
385 |
+
"stylize_config": {
|
386 |
+
"create_mask": [
|
387 |
+
"boy", "girl"
|
388 |
+
],
|
389 |
+
"composite": {
|
390 |
+
```
|
391 |
+
```sh
|
392 |
+
# [3] generate mask
|
393 |
+
animatediff stylize create-mask STYLYZE_DIR
|
394 |
+
|
395 |
+
# If you have less than 12GB of vram, specify low vram mode
|
396 |
+
animatediff stylize create-mask STYLYZE_DIR -lo
|
397 |
+
|
398 |
+
# The foreground is output to the following directory (FG_STYLYZE_DIR)
|
399 |
+
# STYLYZE_DIR/fg_00_timestamp_str
|
400 |
+
# The background is output to the following directory (BG_STYLYZE_DIR)
|
401 |
+
# STYLYZE_DIR/bg_timestamp_str
|
402 |
+
|
403 |
+
# [4] generate foreground
|
404 |
+
animatediff stylize generate FG_STYLYZE_DIR
|
405 |
+
|
406 |
+
# Same as normal generate.
|
407 |
+
# The default is controlnet_tile, so if you want to make a big style change,
|
408 |
+
# such as changing the character, change to openpose, etc.
|
409 |
+
|
410 |
+
# Of course, you can also generate the background here.
|
411 |
+
```
|
412 |
+
```json
|
413 |
+
# in prompt.json (generated in [1])
|
414 |
+
# [5] composite setup
|
415 |
+
# enter the directory containing the frames generated in [4] in "fg_list".
|
416 |
+
# In the "mask_prompt" field, write the object you want to extract from the generated foreground frame.
|
417 |
+
# If you prepared the mask yourself, specify it in mask_path. If a valid path is set, use it.
|
418 |
+
# If the shape has not changed when the foreground is generated, FG_STYLYZE_DIR/00_mask can be used
|
419 |
+
# enter the directory containing the background frames separated in [3] in "bg_frame_dir".
|
420 |
+
"composite": {
|
421 |
+
"fg_list": [
|
422 |
+
{
|
423 |
+
"path": "FG_STYLYZE_DIR/time_stamp_str/00-341774366206100",
|
424 |
+
"mask_path": " absolute path to mask dir (this is optional) ",
|
425 |
+
"mask_prompt": "person"
|
426 |
+
},
|
427 |
+
{
|
428 |
+
"path": " absolute path to frame dir ",
|
429 |
+
"mask_path": " absolute path to mask dir (this is optional) ",
|
430 |
+
"mask_prompt": "cat"
|
431 |
+
}
|
432 |
+
],
|
433 |
+
"bg_frame_dir": "BG_STYLYZE_DIR/00_controlnet_image/controlnet_tile",
|
434 |
+
"hint": ""
|
435 |
+
},
|
436 |
+
```
|
437 |
+
```sh
|
438 |
+
# [6] composite
|
439 |
+
animatediff stylize composite STYLYZE_DIR
|
440 |
+
|
441 |
+
# See help for detailed options.
|
442 |
+
```
|
443 |
+
|
444 |
+
|
445 |
+
#### Auto config generation for [Stable-Diffusion-Webui-Civitai-Helper](https://github.com/butaixianran/Stable-Diffusion-Webui-Civitai-Helper) user
|
446 |
+
```sh
|
447 |
+
# This command parses the *.civitai.info files and automatically generates config files
|
448 |
+
# See "animatediff civitai2config -h" for details
|
449 |
+
animatediff civitai2config PATH_TO_YOUR_A111_LORA_DIR
|
450 |
+
```
|
451 |
+
#### Wildcard
|
452 |
+
- You can pick up wildcards at [civitai](https://civitai.com/models/23799/freecards), then put them in /wildcards.
|
453 |
+
- Usage is the same as a1111.( \_\_WILDCARDFILENAME\_\_ format,
|
454 |
+
ex. \_\_animal\_\_ for animal.txt. \_\_background-color\_\_ for background-color.txt.)
|
455 |
+
```json
|
456 |
+
"prompt_map": { # __WILDCARDFILENAME__
|
457 |
+
"0": "__character-posture__, __character-gesture__, __character-emotion__, masterpiece, best quality, a beautiful and detailed portriat of muffet, monster girl,((purple body:1.3)), __background__",
|
458 |
+
```
|
459 |
+
### Recommended setting
|
460 |
+
- checkpoint : [mistoonAnime_v20](https://civitai.com/models/24149/mistoonanime) for anime, [xxmix9realistic_v40](https://civitai.com/models/47274) for photoreal
|
461 |
+
- scheduler : "k_dpmpp_sde"
|
462 |
+
- upscale : Enable controlnet_tile and controlnet_ip2p only. If you can provide a good reference image, controlnet_ref may also be useful.
|
463 |
+
|
464 |
+
### Recommended settings for 8-12 GB of vram
|
465 |
+
- max_samples_on_vram : Set to 0 if vram is insufficient when using controlnet
|
466 |
+
- max_models_on_vram : 1
|
467 |
+
- Generate at lower resolution and upscale to higher resolution
|
468 |
+
```sh
|
469 |
+
animatediff generate -c config/prompts/your_config.json -W 384 -H 576 -L 48 -C 16
|
470 |
+
animatediff tile-upscale output/2023-08-25T20-00-00-sample-mistoonanime_v20/00-341774366206100 -W 512
|
471 |
+
```
|
472 |
+
|
473 |
+
### Limitations
|
474 |
+
- lora support is limited. Not all formats can be used!!!
|
475 |
+
- It is not possible to specify lora in the prompt.
|
476 |
+
|
477 |
+
### Related resources
|
478 |
+
- [AnimateDiff](https://github.com/guoyww/AnimateDiff)
|
479 |
+
- [ControlNet](https://github.com/lllyasviel/ControlNet)
|
480 |
+
- [IP-Adapter](https://github.com/tencent-ailab/IP-Adapter)
|
481 |
+
- [DWPose](https://github.com/IDEA-Research/DWPose)
|
482 |
+
- [softmax-splatting](https://github.com/sniklaus/softmax-splatting)
|
483 |
+
- [sam-hq](https://github.com/SysCV/sam-hq)
|
484 |
+
- [Grounded-Segment-Anything](https://github.com/IDEA-Research/Grounded-Segment-Anything)
|
485 |
+
- [ProPainter](https://github.com/sczhou/ProPainter)
|
486 |
+
|
487 |
+
<br>
|
488 |
+
<br>
|
489 |
+
<br>
|
490 |
+
<br>
|
491 |
+
<br>
|
492 |
+
|
493 |
+
Below is the original readme.
|
494 |
+
|
495 |
+
----------------------------------------------------------
|
496 |
+
|
497 |
+
|
498 |
+
# animatediff
|
499 |
+
[![pre-commit.ci status](https://results.pre-commit.ci/badge/github/neggles/animatediff-cli/main.svg)](https://results.pre-commit.ci/latest/github/neggles/animatediff-cli/main)
|
500 |
+
|
501 |
+
animatediff refactor, ~~because I can.~~ with significantly lower VRAM usage.
|
502 |
+
|
503 |
+
Also, **infinite generation length support!** yay!
|
504 |
+
|
505 |
+
# LoRA loading is ABSOLUTELY NOT IMPLEMENTED YET!
|
506 |
+
|
507 |
+
This can theoretically run on CPU, but it's not recommended. Should work fine on a GPU, nVidia or otherwise,
|
508 |
+
but I haven't tested on non-CUDA hardware. Uses PyTorch 2.0 Scaled-Dot-Product Attention (aka builtin xformers)
|
509 |
+
by default, but you can pass `--xformers` to force using xformers if you *really* want.
|
510 |
+
|
511 |
+
### How To Use
|
512 |
+
|
513 |
+
1. Lie down
|
514 |
+
2. Try not to cry
|
515 |
+
3. Cry a lot
|
516 |
+
|
517 |
+
### but for real?
|
518 |
+
|
519 |
+
Okay, fine. But it's still a little complicated and there's no webUI yet.
|
520 |
+
|
521 |
+
```sh
|
522 |
+
git clone https://github.com/neggles/animatediff-cli
|
523 |
+
cd animatediff-cli
|
524 |
+
python3.10 -m venv .venv
|
525 |
+
source .venv/bin/activate
|
526 |
+
# install Torch. Use whatever your favourite torch version >= 2.0.0 is, but, good luck on non-nVidia...
|
527 |
+
python -m pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118
|
528 |
+
# install the rest of all the things (probably! I may have missed some deps.)
|
529 |
+
python -m pip install -e '.[dev]'
|
530 |
+
# you should now be able to
|
531 |
+
animatediff --help
|
532 |
+
# There's a nice pretty help screen with a bunch of info that'll print here.
|
533 |
+
```
|
534 |
+
|
535 |
+
From here you'll need to put whatever checkpoint you want to use into `data/models/sd`, copy
|
536 |
+
one of the prompt configs in `config/prompts`, edit it with your choices of prompt and model (model
|
537 |
+
paths in prompt .json files are **relative to `data/`**, e.g. `models/sd/vanilla.safetensors`), and
|
538 |
+
off you go.
|
539 |
+
|
540 |
+
Then it's something like (for an 8GB card):
|
541 |
+
```sh
|
542 |
+
animatediff generate -c 'config/prompts/waifu.json' -W 576 -H 576 -L 128 -C 16
|
543 |
+
```
|
544 |
+
You may have to drop `-C` down to 8 on cards with less than 8GB VRAM, and you can raise it to 20-24
|
545 |
+
on cards with more. 24 is max.
|
546 |
+
|
547 |
+
N.B. generating 128 frames is _**slow...**_
|
548 |
+
|
549 |
+
## RiFE!
|
550 |
+
|
551 |
+
I have added experimental support for [rife-ncnn-vulkan](https://github.com/nihui/rife-ncnn-vulkan)
|
552 |
+
using the `animatediff rife interpolate` command. It has fairly self-explanatory help, and it has
|
553 |
+
been tested on Linux, but I've **no idea** if it'll work on Windows.
|
554 |
+
|
555 |
+
Either way, you'll need ffmpeg installed on your system and present in PATH, and you'll need to
|
556 |
+
download the rife-ncnn-vulkan release for your OS of choice from the GitHub repo (above). Unzip it, and
|
557 |
+
place the extracted folder at `data/rife/`. You should have a `data/rife/rife-ncnn-vulkan` executable, or `data\rife\rife-ncnn-vulkan.exe` on Windows.
|
558 |
+
|
559 |
+
You'll also need to reinstall the repo/package with:
|
560 |
+
```sh
|
561 |
+
python -m pip install -e '.[rife]'
|
562 |
+
```
|
563 |
+
or just install `ffmpeg-python` manually yourself.
|
564 |
+
|
565 |
+
Default is to multiply each frame by 8, turning an 8fps animation into a 64fps one, then encode
|
566 |
+
that to a 60fps WebM. (If you pick GIF mode, it'll be 50fps, because GIFs are cursed and encode
|
567 |
+
frame durations as 1/100ths of a second).
|
568 |
+
|
569 |
+
Seems to work pretty well...
|
570 |
+
|
571 |
+
## TODO:
|
572 |
+
|
573 |
+
In no particular order:
|
574 |
+
|
575 |
+
- [x] Infinite generation length support
|
576 |
+
- [x] RIFE support for motion interpolation (`rife-ncnn-vulkan` isn't the greatest implementation)
|
577 |
+
- [x] Export RIFE interpolated frames to a video file (webm, mp4, animated webp, hevc mp4, gif, etc.)
|
578 |
+
- [x] Generate infinite length animations on a 6-8GB card (at 512x512 with 8-frame context, but hey it'll do)
|
579 |
+
- [x] Torch SDP Attention (makes xformers optional)
|
580 |
+
- [x] Support for `clip_skip` in prompt config
|
581 |
+
- [x] Experimental support for `torch.compile()` (upstream Diffusers bugs slow this down a little but it's still zippy)
|
582 |
+
- [x] Batch your generations with `--repeat`! (e.g. `--repeat 10` will repeat all your prompts 10 times)
|
583 |
+
- [x] Call the `animatediff.cli.generate()` function from another Python program without reloading the model every time
|
584 |
+
- [x] Drag remaining old Diffusers code up to latest (mostly)
|
585 |
+
- [ ] Add a webUI (maybe, there are people wrapping this already so maybe not?)
|
586 |
+
- [ ] img2img support (start from an existing image and continue)
|
587 |
+
- [ ] Stop using custom modules where possible (should be able to use Diffusers for almost all of it)
|
588 |
+
- [ ] Automatic generate-then-interpolate-with-RIFE mode
|
589 |
+
|
590 |
+
## Credits:
|
591 |
+
|
592 |
+
see [guoyww/AnimateDiff](https://github.com/guoyww/AnimateDiff) (very little of this is my work)
|
593 |
+
|
594 |
+
n.b. the copyright notice in `COPYING` is missing the original authors' names, solely because
|
595 |
+
the original repo (as of this writing) has no name attached to the license. I have, however,
|
596 |
+
used the same license they did (Apache 2.0).
|
config/.gitignore
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
/*
|
2 |
+
!.gitignore
|
3 |
+
!/inference/
|
4 |
+
!/prompts/
|
config/GroundingDINO/GroundingDINO_SwinB_cfg.py
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
batch_size = 1
|
2 |
+
modelname = "groundingdino"
|
3 |
+
backbone = "swin_B_384_22k"
|
4 |
+
position_embedding = "sine"
|
5 |
+
pe_temperatureH = 20
|
6 |
+
pe_temperatureW = 20
|
7 |
+
return_interm_indices = [1, 2, 3]
|
8 |
+
backbone_freeze_keywords = None
|
9 |
+
enc_layers = 6
|
10 |
+
dec_layers = 6
|
11 |
+
pre_norm = False
|
12 |
+
dim_feedforward = 2048
|
13 |
+
hidden_dim = 256
|
14 |
+
dropout = 0.0
|
15 |
+
nheads = 8
|
16 |
+
num_queries = 900
|
17 |
+
query_dim = 4
|
18 |
+
num_patterns = 0
|
19 |
+
num_feature_levels = 4
|
20 |
+
enc_n_points = 4
|
21 |
+
dec_n_points = 4
|
22 |
+
two_stage_type = "standard"
|
23 |
+
two_stage_bbox_embed_share = False
|
24 |
+
two_stage_class_embed_share = False
|
25 |
+
transformer_activation = "relu"
|
26 |
+
dec_pred_bbox_embed_share = True
|
27 |
+
dn_box_noise_scale = 1.0
|
28 |
+
dn_label_noise_ratio = 0.5
|
29 |
+
dn_label_coef = 1.0
|
30 |
+
dn_bbox_coef = 1.0
|
31 |
+
embed_init_tgt = True
|
32 |
+
dn_labelbook_size = 2000
|
33 |
+
max_text_len = 256
|
34 |
+
text_encoder_type = "bert-base-uncased"
|
35 |
+
use_text_enhancer = True
|
36 |
+
use_fusion_layer = True
|
37 |
+
use_checkpoint = True
|
38 |
+
use_transformer_ckpt = True
|
39 |
+
use_text_cross_attention = True
|
40 |
+
text_dropout = 0.0
|
41 |
+
fusion_dropout = 0.0
|
42 |
+
fusion_droppath = 0.1
|
43 |
+
sub_sentence_present = True
|
config/GroundingDINO/GroundingDINO_SwinT_OGC.py
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
batch_size = 1
|
2 |
+
modelname = "groundingdino"
|
3 |
+
backbone = "swin_T_224_1k"
|
4 |
+
position_embedding = "sine"
|
5 |
+
pe_temperatureH = 20
|
6 |
+
pe_temperatureW = 20
|
7 |
+
return_interm_indices = [1, 2, 3]
|
8 |
+
backbone_freeze_keywords = None
|
9 |
+
enc_layers = 6
|
10 |
+
dec_layers = 6
|
11 |
+
pre_norm = False
|
12 |
+
dim_feedforward = 2048
|
13 |
+
hidden_dim = 256
|
14 |
+
dropout = 0.0
|
15 |
+
nheads = 8
|
16 |
+
num_queries = 900
|
17 |
+
query_dim = 4
|
18 |
+
num_patterns = 0
|
19 |
+
num_feature_levels = 4
|
20 |
+
enc_n_points = 4
|
21 |
+
dec_n_points = 4
|
22 |
+
two_stage_type = "standard"
|
23 |
+
two_stage_bbox_embed_share = False
|
24 |
+
two_stage_class_embed_share = False
|
25 |
+
transformer_activation = "relu"
|
26 |
+
dec_pred_bbox_embed_share = True
|
27 |
+
dn_box_noise_scale = 1.0
|
28 |
+
dn_label_noise_ratio = 0.5
|
29 |
+
dn_label_coef = 1.0
|
30 |
+
dn_bbox_coef = 1.0
|
31 |
+
embed_init_tgt = True
|
32 |
+
dn_labelbook_size = 2000
|
33 |
+
max_text_len = 256
|
34 |
+
text_encoder_type = "bert-base-uncased"
|
35 |
+
use_text_enhancer = True
|
36 |
+
use_fusion_layer = True
|
37 |
+
use_checkpoint = True
|
38 |
+
use_transformer_ckpt = True
|
39 |
+
use_text_cross_attention = True
|
40 |
+
text_dropout = 0.0
|
41 |
+
fusion_dropout = 0.0
|
42 |
+
fusion_droppath = 0.1
|
43 |
+
sub_sentence_present = True
|
config/inference/default.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"unet_additional_kwargs": {
|
3 |
+
"unet_use_cross_frame_attention": false,
|
4 |
+
"unet_use_temporal_attention": false,
|
5 |
+
"use_motion_module": true,
|
6 |
+
"motion_module_resolutions": [1, 2, 4, 8],
|
7 |
+
"motion_module_mid_block": false,
|
8 |
+
"motion_module_decoder_only": false,
|
9 |
+
"motion_module_type": "Vanilla",
|
10 |
+
"motion_module_kwargs": {
|
11 |
+
"num_attention_heads": 8,
|
12 |
+
"num_transformer_block": 1,
|
13 |
+
"attention_block_types": ["Temporal_Self", "Temporal_Self"],
|
14 |
+
"temporal_position_encoding": true,
|
15 |
+
"temporal_position_encoding_max_len": 24,
|
16 |
+
"temporal_attention_dim_div": 1
|
17 |
+
}
|
18 |
+
},
|
19 |
+
"noise_scheduler_kwargs": {
|
20 |
+
"num_train_timesteps": 1000,
|
21 |
+
"beta_start": 0.00085,
|
22 |
+
"beta_end": 0.012,
|
23 |
+
"beta_schedule": "linear",
|
24 |
+
"steps_offset": 1,
|
25 |
+
"clip_sample": false
|
26 |
+
}
|
27 |
+
}
|
config/inference/motion_v2.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"unet_additional_kwargs": {
|
3 |
+
"use_inflated_groupnorm": true,
|
4 |
+
"unet_use_cross_frame_attention": false,
|
5 |
+
"unet_use_temporal_attention": false,
|
6 |
+
"use_motion_module": true,
|
7 |
+
"motion_module_resolutions": [1, 2, 4, 8],
|
8 |
+
"motion_module_mid_block": true,
|
9 |
+
"motion_module_decoder_only": false,
|
10 |
+
"motion_module_type": "Vanilla",
|
11 |
+
"motion_module_kwargs": {
|
12 |
+
"num_attention_heads": 8,
|
13 |
+
"num_transformer_block": 1,
|
14 |
+
"attention_block_types": ["Temporal_Self", "Temporal_Self"],
|
15 |
+
"temporal_position_encoding": true,
|
16 |
+
"temporal_position_encoding_max_len": 32,
|
17 |
+
"temporal_attention_dim_div": 1
|
18 |
+
}
|
19 |
+
},
|
20 |
+
"noise_scheduler_kwargs": {
|
21 |
+
"num_train_timesteps": 1000,
|
22 |
+
"beta_start": 0.00085,
|
23 |
+
"beta_end": 0.012,
|
24 |
+
"beta_schedule": "linear",
|
25 |
+
"steps_offset": 1,
|
26 |
+
"clip_sample": false
|
27 |
+
}
|
28 |
+
}
|
config/inference/sd15-unet.json
ADDED
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"sample_size": 64,
|
3 |
+
"in_channels": 4,
|
4 |
+
"out_channels": 4,
|
5 |
+
"center_input_sample": false,
|
6 |
+
"flip_sin_to_cos": true,
|
7 |
+
"freq_shift": 0,
|
8 |
+
"down_block_types": [
|
9 |
+
"CrossAttnDownBlock2D",
|
10 |
+
"CrossAttnDownBlock2D",
|
11 |
+
"CrossAttnDownBlock2D",
|
12 |
+
"DownBlock2D"
|
13 |
+
],
|
14 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
15 |
+
"up_block_types": [
|
16 |
+
"UpBlock2D",
|
17 |
+
"CrossAttnUpBlock2D",
|
18 |
+
"CrossAttnUpBlock2D",
|
19 |
+
"CrossAttnUpBlock2D"
|
20 |
+
],
|
21 |
+
"only_cross_attention": false,
|
22 |
+
"block_out_channels": [320, 640, 1280, 1280],
|
23 |
+
"layers_per_block": 2,
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"mid_block_scale_factor": 1,
|
26 |
+
"act_fn": "silu",
|
27 |
+
"norm_num_groups": 32,
|
28 |
+
"norm_eps": 1e-5,
|
29 |
+
"cross_attention_dim": 768,
|
30 |
+
"transformer_layers_per_block": 1,
|
31 |
+
"encoder_hid_dim": null,
|
32 |
+
"encoder_hid_dim_type": null,
|
33 |
+
"attention_head_dim": 8,
|
34 |
+
"num_attention_heads": null,
|
35 |
+
"dual_cross_attention": false,
|
36 |
+
"use_linear_projection": false,
|
37 |
+
"class_embed_type": null,
|
38 |
+
"addition_embed_type": null,
|
39 |
+
"addition_time_embed_dim": null,
|
40 |
+
"num_class_embeds": null,
|
41 |
+
"upcast_attention": false,
|
42 |
+
"resnet_time_scale_shift": "default",
|
43 |
+
"resnet_skip_time_act": false,
|
44 |
+
"resnet_out_scale_factor": 1.0,
|
45 |
+
"time_embedding_type": "positional",
|
46 |
+
"time_embedding_dim": null,
|
47 |
+
"time_embedding_act_fn": null,
|
48 |
+
"timestep_post_act": null,
|
49 |
+
"time_cond_proj_dim": null,
|
50 |
+
"conv_in_kernel": 3,
|
51 |
+
"conv_out_kernel": 3,
|
52 |
+
"projection_class_embeddings_input_dim": null,
|
53 |
+
"class_embeddings_concat": false,
|
54 |
+
"mid_block_only_cross_attention": null,
|
55 |
+
"cross_attention_norm": null,
|
56 |
+
"addition_embed_type_num_heads": 64,
|
57 |
+
"_use_default_values": [
|
58 |
+
"transformer_layers_per_block",
|
59 |
+
"use_linear_projection",
|
60 |
+
"num_class_embeds",
|
61 |
+
"addition_embed_type",
|
62 |
+
"cross_attention_norm",
|
63 |
+
"conv_out_kernel",
|
64 |
+
"encoder_hid_dim_type",
|
65 |
+
"projection_class_embeddings_input_dim",
|
66 |
+
"num_attention_heads",
|
67 |
+
"only_cross_attention",
|
68 |
+
"class_embed_type",
|
69 |
+
"resnet_time_scale_shift",
|
70 |
+
"addition_embed_type_num_heads",
|
71 |
+
"timestep_post_act",
|
72 |
+
"mid_block_type",
|
73 |
+
"mid_block_only_cross_attention",
|
74 |
+
"time_embedding_type",
|
75 |
+
"addition_time_embed_dim",
|
76 |
+
"time_embedding_dim",
|
77 |
+
"encoder_hid_dim",
|
78 |
+
"resnet_skip_time_act",
|
79 |
+
"conv_in_kernel",
|
80 |
+
"upcast_attention",
|
81 |
+
"dual_cross_attention",
|
82 |
+
"resnet_out_scale_factor",
|
83 |
+
"time_cond_proj_dim",
|
84 |
+
"class_embeddings_concat",
|
85 |
+
"time_embedding_act_fn"
|
86 |
+
],
|
87 |
+
"_class_name": "UNet2DConditionModel",
|
88 |
+
"_diffusers_version": "0.6.0"
|
89 |
+
}
|
config/inference/sd15-unet3d.json
ADDED
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"sample_size": 64,
|
3 |
+
"in_channels": 4,
|
4 |
+
"out_channels": 4,
|
5 |
+
"center_input_sample": false,
|
6 |
+
"flip_sin_to_cos": true,
|
7 |
+
"freq_shift": 0,
|
8 |
+
"down_block_types": [
|
9 |
+
"CrossAttnDownBlock3D",
|
10 |
+
"CrossAttnDownBlock3D",
|
11 |
+
"CrossAttnDownBlock3D",
|
12 |
+
"DownBlock3D"
|
13 |
+
],
|
14 |
+
"mid_block_type": "UNetMidBlock3DCrossAttn",
|
15 |
+
"up_block_types": [
|
16 |
+
"UpBlock3D",
|
17 |
+
"CrossAttnUpBlock3D",
|
18 |
+
"CrossAttnUpBlock3D",
|
19 |
+
"CrossAttnUpBlock3D"
|
20 |
+
],
|
21 |
+
"only_cross_attention": false,
|
22 |
+
"block_out_channels": [320, 640, 1280, 1280],
|
23 |
+
"layers_per_block": 2,
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"mid_block_scale_factor": 1,
|
26 |
+
"act_fn": "silu",
|
27 |
+
"norm_num_groups": 32,
|
28 |
+
"norm_eps": 1e-5,
|
29 |
+
"cross_attention_dim": 768,
|
30 |
+
"attention_head_dim": 8,
|
31 |
+
"dual_cross_attention": false,
|
32 |
+
"use_linear_projection": false,
|
33 |
+
"class_embed_type": null,
|
34 |
+
"num_class_embeds": null,
|
35 |
+
"upcast_attention": false,
|
36 |
+
"resnet_time_scale_shift": "default",
|
37 |
+
"use_motion_module": true,
|
38 |
+
"motion_module_resolutions": [1, 2, 4, 8],
|
39 |
+
"motion_module_mid_block": false,
|
40 |
+
"motion_module_decoder_only": false,
|
41 |
+
"motion_module_type": "Vanilla",
|
42 |
+
"motion_module_kwargs": {
|
43 |
+
"num_attention_heads": 8,
|
44 |
+
"num_transformer_block": 1,
|
45 |
+
"attention_block_types": ["Temporal_Self", "Temporal_Self"],
|
46 |
+
"temporal_position_encoding": true,
|
47 |
+
"temporal_position_encoding_max_len": 24,
|
48 |
+
"temporal_attention_dim_div": 1
|
49 |
+
},
|
50 |
+
"unet_use_cross_frame_attention": false,
|
51 |
+
"unet_use_temporal_attention": false,
|
52 |
+
"_use_default_values": [
|
53 |
+
"use_linear_projection",
|
54 |
+
"mid_block_type",
|
55 |
+
"upcast_attention",
|
56 |
+
"dual_cross_attention",
|
57 |
+
"num_class_embeds",
|
58 |
+
"only_cross_attention",
|
59 |
+
"class_embed_type",
|
60 |
+
"resnet_time_scale_shift"
|
61 |
+
],
|
62 |
+
"_class_name": "UNet3DConditionModel",
|
63 |
+
"_diffusers_version": "0.6.0"
|
64 |
+
}
|
config/prompts/.gitignore
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
*
|
2 |
+
!.gitignore
|
config/prompts/01-ToonYou.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "ToonYou",
|
3 |
+
"base": "",
|
4 |
+
"path": "models/sd/toonyou_beta3.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"compile": false,
|
7 |
+
"seed": [
|
8 |
+
10788741199826055000, 6520604954829637000, 6519455744612556000,
|
9 |
+
16372571278361864000
|
10 |
+
],
|
11 |
+
"scheduler": "k_dpmpp",
|
12 |
+
"steps": 30,
|
13 |
+
"guidance_scale": 8.5,
|
14 |
+
"clip_skip": 2,
|
15 |
+
"prompt": [
|
16 |
+
"1girl, solo, best quality, masterpiece, looking at viewer, purple hair, orange hair, gradient hair, blurry background, upper body, dress, flower print, spaghetti strap, bare shoulders",
|
17 |
+
"1girl, solo, masterpiece, best quality, cherry blossoms, hanami, pink flower, white flower, spring season, wisteria, petals, flower, plum blossoms, outdoors, falling petals, white hair, black eyes,",
|
18 |
+
"1girl, solo, best quality, masterpiece, looking at viewer, purple hair, orange hair, gradient hair, blurry background, upper body, dress, flower print, spaghetti strap, bare shoulders",
|
19 |
+
"1girl, solo, best quality, masterpiece, cloudy sky, dandelion, contrapposto, alternate hairstyle"
|
20 |
+
],
|
21 |
+
"n_prompt": [
|
22 |
+
"worst quality, low quality, cropped, lowres, text, jpeg artifacts, multiple view"
|
23 |
+
]
|
24 |
+
}
|
config/prompts/02-Lyriel.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "Lyriel",
|
3 |
+
"base": "",
|
4 |
+
"path": "models/sd/lyriel_v16.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"seed": [
|
7 |
+
10917152860782582000, 6399018107401806000, 15875751942533906000,
|
8 |
+
6653196880059937000
|
9 |
+
],
|
10 |
+
"scheduler": "k_dpmpp",
|
11 |
+
"steps": 25,
|
12 |
+
"guidance_scale": 7.5,
|
13 |
+
"prompt": [
|
14 |
+
"dark shot, epic realistic, portrait of halo, sunglasses, blue eyes, tartan scarf, white hair by atey ghailan, by greg rutkowski, by greg tocchini, by james gilleard, by joe fenton, by kaethe butcher, gradient yellow, black, brown and magenta color scheme, grunge aesthetic!!! graffiti tag wall background, art by greg rutkowski and artgerm, soft cinematic light, adobe lightroom, photolab, hdr, intricate, highly detailed, depth of field, faded, neutral colors, hdr, muted colors, hyperdetailed, artstation, cinematic, warm lights, dramatic light, intricate details, complex background, rutkowski, teal and orange",
|
15 |
+
"A forbidden castle high up in the mountains, pixel art, intricate details2, hdr, intricate details, hyperdetailed5, natural skin texture, hyperrealism, soft light, sharp, game art, key visual, surreal",
|
16 |
+
"dark theme, medieval portrait of a man sharp features, grim, cold stare, dark colors, Volumetric lighting, baroque oil painting by Greg Rutkowski, Artgerm, WLOP, Alphonse Mucha dynamic lighting hyperdetailed intricately detailed, hdr, muted colors, complex background, hyperrealism, hyperdetailed, amandine van ray",
|
17 |
+
"As I have gone alone in there and with my treasures bold, I can keep my secret where and hint of riches new and old. Begin it where warm waters halt and take it in a canyon down, not far but too far to walk, put in below the home of brown."
|
18 |
+
],
|
19 |
+
"n_prompt": [
|
20 |
+
"3d, cartoon, lowres, bad anatomy, bad hands, text, error, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality, normal quality, jpeg artifacts, signature, watermark, username, blurry, artist name, young, loli, elf, 3d, illustration",
|
21 |
+
"3d, cartoon, anime, sketches, worst quality, low quality, normal quality, lowres, normal quality, monochrome, grayscale, skin spots, acnes, skin blemishes, bad anatomy, girl, loli, young, large breasts, red eyes, muscular",
|
22 |
+
"dof, grayscale, black and white, bw, 3d, cartoon, anime, sketches, worst quality, low quality, normal quality, lowres, normal quality, monochrome, grayscale, skin spots, acnes, skin blemishes, bad anatomy, girl, loli, young, large breasts, red eyes, muscular,badhandsv5-neg, By bad artist -neg 1, monochrome",
|
23 |
+
"holding an item, cowboy, hat, cartoon, 3d, disfigured, bad art, deformed,extra limbs,close up,b&w, weird colors, blurry, duplicate, morbid, mutilated, [out of frame], extra fingers, mutated hands, poorly drawn hands, poorly drawn face, mutation, deformed, ugly, blurry, bad anatomy, bad proportions, extra limbs, cloned face, disfigured, out of frame, ugly, extra limbs, bad anatomy, gross proportions, malformed limbs, missing arms, missing legs, extra arms, extra legs, mutated hands, fused fingers, too many fingers, long neck, Photoshop, video game, ugly, tiling, poorly drawn hands, poorly drawn feet, poorly drawn face, out of frame, mutation, mutated, extra limbs, extra legs, extra arms, disfigured, deformed, cross-eye, body out of frame, blurry, bad art, bad anatomy, 3d render"
|
24 |
+
]
|
25 |
+
}
|
config/prompts/03-RcnzCartoon.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "RcnzCartoon",
|
3 |
+
"base": "",
|
4 |
+
"path": "models/sd/rcnzCartoon3d_v10.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"seed": [
|
7 |
+
16931037867122268000, 2094308009433392000, 4292543217695451000,
|
8 |
+
15572665120852310000
|
9 |
+
],
|
10 |
+
"scheduler": "k_dpmpp",
|
11 |
+
"steps": 25,
|
12 |
+
"guidance_scale": 7.5,
|
13 |
+
"prompt": [
|
14 |
+
"Jane Eyre with headphones, natural skin texture,4mm,k textures, soft cinematic light, adobe lightroom, photolab, hdr, intricate, elegant, highly detailed, sharp focus, cinematic look, soothing tones, insane details, intricate details, hyperdetailed, low contrast, soft cinematic light, dim colors, exposure blend, hdr, faded",
|
15 |
+
"close up Portrait photo of muscular bearded guy in a worn mech suit, light bokeh, intricate, steel metal [rust], elegant, sharp focus, photo by greg rutkowski, soft lighting, vibrant colors, masterpiece, streets, detailed face",
|
16 |
+
"absurdres, photorealistic, masterpiece, a 30 year old man with gold framed, aviator reading glasses and a black hooded jacket and a beard, professional photo, a character portrait, altermodern, detailed eyes, detailed lips, detailed face, grey eyes",
|
17 |
+
"a golden labrador, warm vibrant colours, natural lighting, dappled lighting, diffused lighting, absurdres, highres,k, uhd, hdr, rtx, unreal, octane render, RAW photo, photorealistic, global illumination, subsurface scattering"
|
18 |
+
],
|
19 |
+
"n_prompt": [
|
20 |
+
"deformed, distorted, disfigured, poorly drawn, bad anatomy, wrong anatomy, extra limb, missing limb, floating limbs, mutated hands and fingers, disconnected limbs, mutation, mutated, ugly, disgusting, blurry, amputation",
|
21 |
+
"nude, cross eyed, tongue, open mouth, inside, 3d, cartoon, anime, sketches, worst quality, low quality, normal quality, lowres, normal quality, monochrome, grayscale, skin spots, acnes, skin blemishes, bad anatomy, red eyes, muscular",
|
22 |
+
"easynegative, cartoon, anime, sketches, necklace, earrings worst quality, low quality, normal quality, bad anatomy, bad hands, shiny skin, error, missing fingers, extra digit, fewer digits, jpeg artifacts, signature, watermark, username, blurry, chubby, anorectic, bad eyes, old, wrinkled skin, red skin, photograph By bad artist -neg, big eyes, muscular face,",
|
23 |
+
"beard, EasyNegative, lowres, chromatic aberration, depth of field, motion blur, blurry, bokeh, bad quality, worst quality, multiple arms, badhand"
|
24 |
+
]
|
25 |
+
}
|
config/prompts/04-MajicMix.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "MajicMix",
|
3 |
+
"base": "",
|
4 |
+
"path": "models/sd/majicmixRealistic_v5Preview.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"seed": [
|
7 |
+
1572448948722921000, 1099474677988590700, 6488833139725636000,
|
8 |
+
18339859844376519000
|
9 |
+
],
|
10 |
+
"scheduler": "k_dpmpp",
|
11 |
+
"steps": 25,
|
12 |
+
"guidance_scale": 7.5,
|
13 |
+
"prompt": [
|
14 |
+
"1girl, offshoulder, light smile, shiny skin best quality, masterpiece, photorealistic",
|
15 |
+
"best quality, masterpiece, photorealistic, 1boy, 50 years old beard, dramatic lighting",
|
16 |
+
"best quality, masterpiece, photorealistic, 1girl, light smile, shirt with collars, waist up, dramatic lighting, from below",
|
17 |
+
"male, man, beard, bodybuilder, skinhead,cold face, tough guy, cowboyshot, tattoo, french windows, luxury hotel masterpiece, best quality, photorealistic"
|
18 |
+
],
|
19 |
+
"n_prompt": [
|
20 |
+
"ng_deepnegative_v1_75t, badhandv4, worst quality, low quality, normal quality, lowres, bad anatomy, bad hands, watermark, moles",
|
21 |
+
"nsfw, ng_deepnegative_v1_75t,badhandv4, worst quality, low quality, normal quality, lowres,watermark, monochrome",
|
22 |
+
"nsfw, ng_deepnegative_v1_75t,badhandv4, worst quality, low quality, normal quality, lowres,watermark, monochrome",
|
23 |
+
"nude, nsfw, ng_deepnegative_v1_75t, badhandv4, worst quality, low quality, normal quality, lowres, bad anatomy, bad hands, monochrome, grayscale watermark, moles, people"
|
24 |
+
]
|
25 |
+
}
|
config/prompts/05-RealisticVision.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "RealisticVision",
|
3 |
+
"base": "",
|
4 |
+
"path": "models/sd/realisticVisionV20_v20.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"seed": [
|
7 |
+
5658137986800322000, 12099779162349365000, 10499524853910854000,
|
8 |
+
16768009035333712000
|
9 |
+
],
|
10 |
+
"scheduler": "k_dpmpp",
|
11 |
+
"steps": 25,
|
12 |
+
"guidance_scale": 7.5,
|
13 |
+
"prompt": [
|
14 |
+
"b&w photo of 42 y.o man in black clothes, bald, face, half body, body, high detailed skin, skin pores, coastline, overcast weather, wind, waves, 8k uhd, dslr, soft lighting, high quality, film grain, Fujifilm XT3",
|
15 |
+
"close up photo of a rabbit, forest, haze, halation, bloom, dramatic atmosphere, centred, rule of thirds, 200mm 1.4f macro shot",
|
16 |
+
"photo of coastline, rocks, storm weather, wind, waves, lightning, 8k uhd, dslr, soft lighting, high quality, film grain, Fujifilm XT3",
|
17 |
+
"night, b&w photo of old house, post apocalypse, forest, storm weather, wind, rocks, 8k uhd, dslr, soft lighting, high quality, film grain"
|
18 |
+
],
|
19 |
+
"n_prompt": [
|
20 |
+
"semi-realistic, cgi, 3d, render, sketch, cartoon, drawing, anime, text, close up, cropped, out of frame, worst quality, low quality, jpeg artifacts, ugly, duplicate, morbid, mutilated, extra fingers, mutated hands, poorly drawn hands, poorly drawn face, mutation, deformed, blurry, dehydrated, bad anatomy, bad proportions, extra limbs, cloned face, disfigured, gross proportions, malformed limbs, missing arms, missing legs, extra arms, extra legs, fused fingers, too many fingers, long neck",
|
21 |
+
"semi-realistic, cgi, 3d, render, sketch, cartoon, drawing, anime, text, close up, cropped, out of frame, worst quality, low quality, jpeg artifacts, ugly, duplicate, morbid, mutilated, extra fingers, mutated hands, poorly drawn hands, poorly drawn face, mutation, deformed, blurry, dehydrated, bad anatomy, bad proportions, extra limbs, cloned face, disfigured, gross proportions, malformed limbs, missing arms, missing legs, extra arms, extra legs, fused fingers, too many fingers, long neck",
|
22 |
+
"blur, haze, deformed iris, deformed pupils, semi-realistic, cgi, 3d, render, sketch, cartoon, drawing, anime, mutated hands and fingers, deformed, distorted, disfigured, poorly drawn, bad anatomy, wrong anatomy, extra limb, missing limb, floating limbs, disconnected limbs, mutation, mutated, ugly, disgusting, amputation",
|
23 |
+
"blur, haze, deformed iris, deformed pupils, semi-realistic, cgi, 3d, render, sketch, cartoon, drawing, anime, art, mutated hands and fingers, deformed, distorted, disfigured, poorly drawn, bad anatomy, wrong anatomy, extra limb, missing limb, floating limbs, disconnected limbs, mutation, mutated, ugly, disgusting, amputation"
|
24 |
+
]
|
25 |
+
}
|
config/prompts/06-Tusun.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "Tusun",
|
3 |
+
"base": "models/sd/moonfilm_reality20.safetensors",
|
4 |
+
"path": "models/sd/TUSUN.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"seed": [
|
7 |
+
10154078483724687000, 2664393535095473700, 4231566096207623000,
|
8 |
+
1713349740448094500
|
9 |
+
],
|
10 |
+
"scheduler": "k_dpmpp",
|
11 |
+
"steps": 25,
|
12 |
+
"guidance_scale": 7.5,
|
13 |
+
"lora_alpha": 0.6,
|
14 |
+
"prompt": [
|
15 |
+
"tusuncub with its mouth open, blurry, open mouth, fangs, photo background, looking at viewer, tongue, full body, solo, cute and lovely, Beautiful and realistic eye details, perfect anatomy, Nonsense, pure background, Centered-Shot, realistic photo, photograph, 4k, hyper detailed, DSLR, 24 Megapixels, 8mm Lens, Full Frame, film grain, Global Illumination, studio Lighting, Award Winning Photography, diffuse reflection, ray tracing",
|
16 |
+
"cute tusun with a blurry background, black background, simple background, signature, face, solo, cute and lovely, Beautiful and realistic eye details, perfect anatomy, Nonsense, pure background, Centered-Shot, realistic photo, photograph, 4k, hyper detailed, DSLR, 24 Megapixels, 8mm Lens, Full Frame, film grain, Global Illumination, studio Lighting, Award Winning Photography, diffuse reflection, ray tracing",
|
17 |
+
"cut tusuncub walking in the snow, blurry, looking at viewer, depth of field, blurry background, full body, solo, cute and lovely, Beautiful and realistic eye details, perfect anatomy, Nonsense, pure background, Centered-Shot, realistic photo, photograph, 4k, hyper detailed, DSLR, 24 Megapixels, 8mm Lens, Full Frame, film grain, Global Illumination, studio Lighting, Award Winning Photography, diffuse reflection, ray tracing",
|
18 |
+
"character design, cyberpunk tusun kitten wearing astronaut suit, sci-fic, realistic eye color and details, fluffy, big head, science fiction, communist ideology, Cyborg, fantasy, intense angle, soft lighting, photograph, 4k, hyper detailed, portrait wallpaper, realistic, photo-realistic, DSLR, 24 Megapixels, Full Frame, vibrant details, octane render, finely detail, best quality, incredibly absurdres, robotic parts, rim light, vibrant details, luxurious cyberpunk, hyperrealistic, cable electric wires, microchip, full body"
|
19 |
+
],
|
20 |
+
"n_prompt": [
|
21 |
+
"worst quality, low quality, deformed, distorted, disfigured, bad eyes, bad anatomy, disconnected limbs, wrong body proportions, low quality, worst quality, text, watermark, signature, logo, illustration, painting, cartoons, ugly, easy_negative"
|
22 |
+
]
|
23 |
+
}
|
config/prompts/07-FilmVelvia.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "FilmVelvia",
|
3 |
+
"base": "models/sd/majicmixRealistic_v4.safetensors",
|
4 |
+
"path": "models/sd/FilmVelvia2.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"seed": [
|
7 |
+
358675358833372800, 3519455280971924000, 11684545350557985000,
|
8 |
+
8696855302100400000
|
9 |
+
],
|
10 |
+
"scheduler": "k_dpmpp",
|
11 |
+
"steps": 25,
|
12 |
+
"guidance_scale": 7.5,
|
13 |
+
"lora_alpha": 0.6,
|
14 |
+
"prompt": [
|
15 |
+
"a woman standing on the side of a road at night,girl, long hair, motor vehicle, car, looking at viewer, ground vehicle, night, hands in pockets, blurry background, coat, black hair, parted lips, bokeh, jacket, brown hair, outdoors, red lips, upper body, artist name",
|
16 |
+
", dark shot,0mm, portrait quality of a arab man worker,boy, wasteland that stands out vividly against the background of the desert, barren landscape, closeup, moles skin, soft light, sharp, exposure blend, medium shot, bokeh, hdr, high contrast, cinematic, teal and orange5, muted colors, dim colors, soothing tones, low saturation, hyperdetailed, noir",
|
17 |
+
"fashion photography portrait of 1girl, offshoulder, fluffy short hair, soft light, rim light, beautiful shadow, low key, photorealistic, raw photo, natural skin texture, realistic eye and face details, hyperrealism, ultra high res, 4K, Best quality, masterpiece, necklace, cleavage, in the dark",
|
18 |
+
"In this lighthearted portrait, a woman is dressed as a fierce warrior, armed with an arsenal of paintbrushes and palette knives. Her war paint is composed of thick, vibrant strokes of color, and her armor is made of paint tubes and paint-splattered canvases. She stands victoriously atop a mountain of conquered blank canvases, with a beautiful, colorful landscape behind her, symbolizing the power of art and creativity. bust Portrait, close-up, Bright and transparent scene lighting, "
|
19 |
+
],
|
20 |
+
"n_prompt": [
|
21 |
+
"cartoon, anime, sketches,worst quality, low quality, deformed, distorted, disfigured, bad eyes, wrong lips, weird mouth, bad teeth, mutated hands and fingers, bad anatomy, wrong anatomy, amputation, extra limb, missing limb, floating limbs, disconnected limbs, mutation, ugly, disgusting, bad_pictures, negative_hand-neg",
|
22 |
+
"cartoon, anime, sketches,worst quality, low quality, deformed, distorted, disfigured, bad eyes, wrong lips, weird mouth, bad teeth, mutated hands and fingers, bad anatomy, wrong anatomy, amputation, extra limb, missing limb, floating limbs, disconnected limbs, mutation, ugly, disgusting, bad_pictures, negative_hand-neg",
|
23 |
+
"wrong white balance, dark, cartoon, anime, sketches,worst quality, low quality, deformed, distorted, disfigured, bad eyes, wrong lips, weird mouth, bad teeth, mutated hands and fingers, bad anatomy, wrong anatomy, amputation, extra limb, missing limb, floating limbs, disconnected limbs, mutation, ugly, disgusting, bad_pictures, negative_hand-neg",
|
24 |
+
"wrong white balance, dark, cartoon, anime, sketches,worst quality, low quality, deformed, distorted, disfigured, bad eyes, wrong lips, weird mouth, bad teeth, mutated hands and fingers, bad anatomy, wrong anatomy, amputation, extra limb, missing limb, floating limbs, disconnected limbs, mutation, ugly, disgusting, bad_pictures, negative_hand-neg"
|
25 |
+
]
|
26 |
+
}
|
config/prompts/08-GhibliBackground.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "GhibliBackground",
|
3 |
+
"base": "models/sd/CounterfeitV30_25.safetensors",
|
4 |
+
"path": "models/sd/lora_Ghibli_n3.safetensors",
|
5 |
+
"motion_module": "models/motion-module/mm_sd_v15.ckpt",
|
6 |
+
"seed": [
|
7 |
+
8775748474469046000, 5893874876080607000, 11911465742147697000,
|
8 |
+
12437784838692000000
|
9 |
+
],
|
10 |
+
"scheduler": "k_dpmpp",
|
11 |
+
"steps": 25,
|
12 |
+
"guidance_scale": 7.5,
|
13 |
+
"lora_alpha": 1,
|
14 |
+
"prompt": [
|
15 |
+
"best quality,single build,architecture, blue_sky, building,cloudy_sky, day, fantasy, fence, field, house, build,architecture,landscape, moss, outdoors, overgrown, path, river, road, rock, scenery, sky, sword, tower, tree, waterfall",
|
16 |
+
"black_border, building, city, day, fantasy, ice, landscape, letterboxed, mountain, ocean, outdoors, planet, scenery, ship, snow, snowing, water, watercraft, waterfall, winter",
|
17 |
+
",mysterious sea area, fantasy,build,concept",
|
18 |
+
"Tomb Raider,Scenography,Old building"
|
19 |
+
],
|
20 |
+
"n_prompt": [
|
21 |
+
"easynegative,bad_construction,bad_structure,bad_wail,bad_windows,blurry,cloned_window,cropped,deformed,disfigured,error,extra_windows,extra_chimney,extra_door,extra_structure,extra_frame,fewer_digits,fused_structure,gross_proportions,jpeg_artifacts,long_roof,low_quality,structure_limbs,missing_windows,missing_doors,missing_roofs,mutated_structure,mutation,normal_quality,out_of_frame,lowres,poorly_drawn_structure,poorly_drawn_house,signature,text,too_many_windows,ugly,username,uta,watermark,worst_quality"
|
22 |
+
]
|
23 |
+
}
|
config/prompts/concat_2horizontal.bat
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
ffmpeg -i %1 -i %2 -filter_complex "[0:v][1:v]hstack=inputs=2[v]" -map "[v]" -crf 15 2horizontal.mp4
|
config/prompts/ignore_tokens.txt
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
motion_blur
|
2 |
+
blurry
|
3 |
+
realistic
|
4 |
+
depth_of_field
|
config/prompts/prompt_travel.json
ADDED
@@ -0,0 +1,248 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "sample",
|
3 |
+
"path": "share/sd_models/Anything.safetensors",
|
4 |
+
"motion_module": "models/motion-module/animatediff/mm_sd_v15_v2.ckpt",
|
5 |
+
"compile": false,
|
6 |
+
"seed": [
|
7 |
+
-1
|
8 |
+
],
|
9 |
+
"scheduler": "k_dpmpp_sde",
|
10 |
+
"steps": 20,
|
11 |
+
"guidance_scale": 10,
|
12 |
+
"clip_skip": 2,
|
13 |
+
"prompt_fixed_ratio": 1.0,
|
14 |
+
"head_prompt": "1girl, wizard, circlet, earrings, jewelry, purple hair,",
|
15 |
+
"prompt_map": {
|
16 |
+
"0": "",
|
17 |
+
"8": "((fire magic spell, fire background))",
|
18 |
+
"16": "((ice magic spell, ice background))",
|
19 |
+
"24": "((thunder magic spell, thunder background))",
|
20 |
+
"32": "((skull magic spell, skull background))",
|
21 |
+
"40": "((wind magic spell, wind background))",
|
22 |
+
"48": "((stone magic spell, stone background))",
|
23 |
+
"56": "((holy magic spell, holy background))",
|
24 |
+
"64": "((star magic spell, star background))",
|
25 |
+
"72": "((plant magic spell, plant background))",
|
26 |
+
"80": "((meteor magic spell, meteor background))"
|
27 |
+
},
|
28 |
+
"tail_prompt": "",
|
29 |
+
"n_prompt": [
|
30 |
+
"(worst quality, low quality:1.4),nudity,simple background,border,mouth closed,text, patreon,bed,bedroom,white background,((monochrome)),sketch,(pink body:1.4),7 arms,8 arms,4 arms"
|
31 |
+
],
|
32 |
+
"lora_map": {
|
33 |
+
"share/lora/more_detail.safetensors" : 1.0,
|
34 |
+
"share/lora/add_detail.safetensors" : 1.0
|
35 |
+
},
|
36 |
+
"motion_lora_map": {
|
37 |
+
"models/motion-module/animatediff/v2_lora_PanLeft.ckpt":1.0
|
38 |
+
},
|
39 |
+
"ip_adapter_map": {
|
40 |
+
"enable": true,
|
41 |
+
"input_image_dir": "ip_adapter_image/test",
|
42 |
+
"save_input_image": true,
|
43 |
+
"resized_to_square": false,
|
44 |
+
"scale": 0.5,
|
45 |
+
"is_plus_face": true,
|
46 |
+
"is_plus": true
|
47 |
+
},
|
48 |
+
"controlnet_map": {
|
49 |
+
"input_image_dir" : "controlnet_image/test",
|
50 |
+
"max_samples_on_vram": 200,
|
51 |
+
"max_models_on_vram" : 3,
|
52 |
+
"save_detectmap": true,
|
53 |
+
"preprocess_on_gpu": true,
|
54 |
+
"is_loop": true,
|
55 |
+
|
56 |
+
"controlnet_tile":{
|
57 |
+
"enable": true,
|
58 |
+
"use_preprocessor":true,
|
59 |
+
"preprocessor":{
|
60 |
+
"type" : "none",
|
61 |
+
"param":{
|
62 |
+
}
|
63 |
+
},
|
64 |
+
"guess_mode":false,
|
65 |
+
"controlnet_conditioning_scale": 1.0,
|
66 |
+
"control_guidance_start": 0.0,
|
67 |
+
"control_guidance_end": 1.0,
|
68 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
69 |
+
},
|
70 |
+
"controlnet_ip2p":{
|
71 |
+
"enable": true,
|
72 |
+
"use_preprocessor":true,
|
73 |
+
"guess_mode":false,
|
74 |
+
"controlnet_conditioning_scale": 1.0,
|
75 |
+
"control_guidance_start": 0.0,
|
76 |
+
"control_guidance_end": 1.0,
|
77 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
78 |
+
},
|
79 |
+
"controlnet_lineart_anime":{
|
80 |
+
"enable": true,
|
81 |
+
"use_preprocessor":true,
|
82 |
+
"guess_mode":false,
|
83 |
+
"controlnet_conditioning_scale": 1.0,
|
84 |
+
"control_guidance_start": 0.0,
|
85 |
+
"control_guidance_end": 1.0,
|
86 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
87 |
+
},
|
88 |
+
"controlnet_openpose":{
|
89 |
+
"enable": true,
|
90 |
+
"use_preprocessor":true,
|
91 |
+
"guess_mode":false,
|
92 |
+
"controlnet_conditioning_scale": 1.0,
|
93 |
+
"control_guidance_start": 0.0,
|
94 |
+
"control_guidance_end": 1.0,
|
95 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
96 |
+
},
|
97 |
+
"controlnet_softedge":{
|
98 |
+
"enable": true,
|
99 |
+
"use_preprocessor":true,
|
100 |
+
"preprocessor":{
|
101 |
+
"type" : "softedge_pidsafe",
|
102 |
+
"param":{
|
103 |
+
}
|
104 |
+
},
|
105 |
+
"guess_mode":false,
|
106 |
+
"controlnet_conditioning_scale": 1.0,
|
107 |
+
"control_guidance_start": 0.0,
|
108 |
+
"control_guidance_end": 1.0,
|
109 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
110 |
+
},
|
111 |
+
"controlnet_shuffle": {
|
112 |
+
"enable": true,
|
113 |
+
"use_preprocessor":true,
|
114 |
+
"guess_mode":false,
|
115 |
+
"controlnet_conditioning_scale": 1.0,
|
116 |
+
"control_guidance_start": 0.0,
|
117 |
+
"control_guidance_end": 1.0,
|
118 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
119 |
+
},
|
120 |
+
"controlnet_depth": {
|
121 |
+
"enable": true,
|
122 |
+
"use_preprocessor":true,
|
123 |
+
"guess_mode":false,
|
124 |
+
"controlnet_conditioning_scale": 1.0,
|
125 |
+
"control_guidance_start": 0.0,
|
126 |
+
"control_guidance_end": 1.0,
|
127 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
128 |
+
},
|
129 |
+
"controlnet_canny": {
|
130 |
+
"enable": true,
|
131 |
+
"use_preprocessor":true,
|
132 |
+
"guess_mode":false,
|
133 |
+
"controlnet_conditioning_scale": 1.0,
|
134 |
+
"control_guidance_start": 0.0,
|
135 |
+
"control_guidance_end": 1.0,
|
136 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
137 |
+
},
|
138 |
+
"controlnet_inpaint": {
|
139 |
+
"enable": true,
|
140 |
+
"use_preprocessor":true,
|
141 |
+
"guess_mode":false,
|
142 |
+
"controlnet_conditioning_scale": 1.0,
|
143 |
+
"control_guidance_start": 0.0,
|
144 |
+
"control_guidance_end": 1.0,
|
145 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
146 |
+
},
|
147 |
+
"controlnet_lineart": {
|
148 |
+
"enable": true,
|
149 |
+
"use_preprocessor":true,
|
150 |
+
"guess_mode":false,
|
151 |
+
"controlnet_conditioning_scale": 1.0,
|
152 |
+
"control_guidance_start": 0.0,
|
153 |
+
"control_guidance_end": 1.0,
|
154 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
155 |
+
},
|
156 |
+
"controlnet_mlsd": {
|
157 |
+
"enable": true,
|
158 |
+
"use_preprocessor":true,
|
159 |
+
"guess_mode":false,
|
160 |
+
"controlnet_conditioning_scale": 1.0,
|
161 |
+
"control_guidance_start": 0.0,
|
162 |
+
"control_guidance_end": 1.0,
|
163 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
164 |
+
},
|
165 |
+
"controlnet_normalbae": {
|
166 |
+
"enable": true,
|
167 |
+
"use_preprocessor":true,
|
168 |
+
"guess_mode":false,
|
169 |
+
"controlnet_conditioning_scale": 1.0,
|
170 |
+
"control_guidance_start": 0.0,
|
171 |
+
"control_guidance_end": 1.0,
|
172 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
173 |
+
},
|
174 |
+
"controlnet_scribble": {
|
175 |
+
"enable": true,
|
176 |
+
"use_preprocessor":true,
|
177 |
+
"guess_mode":false,
|
178 |
+
"controlnet_conditioning_scale": 1.0,
|
179 |
+
"control_guidance_start": 0.0,
|
180 |
+
"control_guidance_end": 1.0,
|
181 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
182 |
+
},
|
183 |
+
"controlnet_seg": {
|
184 |
+
"enable": true,
|
185 |
+
"use_preprocessor":true,
|
186 |
+
"guess_mode":false,
|
187 |
+
"controlnet_conditioning_scale": 1.0,
|
188 |
+
"control_guidance_start": 0.0,
|
189 |
+
"control_guidance_end": 1.0,
|
190 |
+
"control_scale_list":[0.5,0.4,0.3,0.2,0.1]
|
191 |
+
},
|
192 |
+
"controlnet_ref": {
|
193 |
+
"enable": false,
|
194 |
+
"ref_image": "ref_image/ref_sample.png",
|
195 |
+
"attention_auto_machine_weight": 0.3,
|
196 |
+
"gn_auto_machine_weight": 0.3,
|
197 |
+
"style_fidelity": 0.5,
|
198 |
+
"reference_attn": true,
|
199 |
+
"reference_adain": false,
|
200 |
+
"scale_pattern":[1.0]
|
201 |
+
}
|
202 |
+
},
|
203 |
+
"upscale_config": {
|
204 |
+
"scheduler": "k_dpmpp_sde",
|
205 |
+
"steps": 20,
|
206 |
+
"strength": 0.5,
|
207 |
+
"guidance_scale": 10,
|
208 |
+
"controlnet_tile": {
|
209 |
+
"enable": true,
|
210 |
+
"controlnet_conditioning_scale": 1.0,
|
211 |
+
"guess_mode": false,
|
212 |
+
"control_guidance_start": 0.0,
|
213 |
+
"control_guidance_end": 1.0
|
214 |
+
},
|
215 |
+
"controlnet_line_anime": {
|
216 |
+
"enable": false,
|
217 |
+
"controlnet_conditioning_scale": 1.0,
|
218 |
+
"guess_mode": false,
|
219 |
+
"control_guidance_start": 0.0,
|
220 |
+
"control_guidance_end": 1.0
|
221 |
+
},
|
222 |
+
"controlnet_ip2p": {
|
223 |
+
"enable": false,
|
224 |
+
"controlnet_conditioning_scale": 0.5,
|
225 |
+
"guess_mode": false,
|
226 |
+
"control_guidance_start": 0.0,
|
227 |
+
"control_guidance_end": 1.0
|
228 |
+
},
|
229 |
+
"controlnet_ref": {
|
230 |
+
"enable": false,
|
231 |
+
"use_frame_as_ref_image": false,
|
232 |
+
"use_1st_frame_as_ref_image": false,
|
233 |
+
"ref_image": "ref_image/path_to_your_ref_img.jpg",
|
234 |
+
"attention_auto_machine_weight": 1.0,
|
235 |
+
"gn_auto_machine_weight": 1.0,
|
236 |
+
"style_fidelity": 0.25,
|
237 |
+
"reference_attn": true,
|
238 |
+
"reference_adain": false
|
239 |
+
}
|
240 |
+
},
|
241 |
+
"output":{
|
242 |
+
"format" : "gif",
|
243 |
+
"fps" : 8,
|
244 |
+
"encode_param":{
|
245 |
+
"crf": 10
|
246 |
+
}
|
247 |
+
}
|
248 |
+
}
|
config/prompts/prompt_travel_multi_controlnet.json
ADDED
@@ -0,0 +1,323 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "sample",
|
3 |
+
"path": "share/sd_models/mistoonAnime_v20.safetensors",
|
4 |
+
"motion_module": "models/motion-module/animatediff/mm_sd_v15_v2.ckpt",
|
5 |
+
"compile": false,
|
6 |
+
"seed": [
|
7 |
+
-1
|
8 |
+
],
|
9 |
+
"scheduler": "k_dpmpp_sde",
|
10 |
+
"steps": 20,
|
11 |
+
"guidance_scale": 10,
|
12 |
+
"clip_skip": 2,
|
13 |
+
"prompt_fixed_ratio": 1.0,
|
14 |
+
"head_prompt": "little girl, pink hair, tall, confident posture, closed eyes, deep thought, intense anger, powerful roar, red face",
|
15 |
+
"prompt_map": {
|
16 |
+
"0": "",
|
17 |
+
"8": "((contemplation))",
|
18 |
+
"16": "((furrowed brows))",
|
19 |
+
"24": "((anger))",
|
20 |
+
"32": "((wide open mouth))",
|
21 |
+
"40": "((powerful roar))"
|
22 |
+
},
|
23 |
+
"tail_prompt": "",
|
24 |
+
"n_prompt": [
|
25 |
+
"(worst quality, bad quality:1.4), nudity, multiple views, text, logo, extra heads, painting, sketches, cropped, monochrome, grayscale, (ugly, morbid, mutation, disfigured:1.3), out of frame, long neck, age spot, skin blemishes, mole, acnes, cross-eyed, unbalanced eyes, different eyes color, extra fingers, extra arms, mutated hands, bad anatomy, bad proportions, extra limbs, malformed limbs, extra legs, twisted legs, fused legs, watermark, bad composition, (bad and mutated hands:1.3), (blurry:2.0)"
|
26 |
+
],
|
27 |
+
"lora_map": {
|
28 |
+
"share/lora/more_detail.safetensors": 0.5,
|
29 |
+
"share/lora/add_detail.safetensors": 0.5
|
30 |
+
},
|
31 |
+
"ip_adapter_map": {
|
32 |
+
"enable": true,
|
33 |
+
"input_image_dir": "ip_adapter_image/test",
|
34 |
+
"save_input_image": true,
|
35 |
+
"resized_to_square": false,
|
36 |
+
"scale": 0.5,
|
37 |
+
"is_plus_face": true,
|
38 |
+
"is_plus": true
|
39 |
+
},
|
40 |
+
"controlnet_map": {
|
41 |
+
"input_image_dir": "controlnet_image/test",
|
42 |
+
"max_samples_on_vram": 200,
|
43 |
+
"max_models_on_vram": 3,
|
44 |
+
"save_detectmap": true,
|
45 |
+
"preprocess_on_gpu": true,
|
46 |
+
"is_loop": true,
|
47 |
+
"controlnet_tile": {
|
48 |
+
"enable": true,
|
49 |
+
"use_preprocessor": true,
|
50 |
+
"preprocessor": {
|
51 |
+
"type": "none",
|
52 |
+
"param": {}
|
53 |
+
},
|
54 |
+
"guess_mode": false,
|
55 |
+
"controlnet_conditioning_scale": 1.0,
|
56 |
+
"control_guidance_start": 0.0,
|
57 |
+
"control_guidance_end": 1.0,
|
58 |
+
"control_scale_list": [
|
59 |
+
0.5,
|
60 |
+
0.4,
|
61 |
+
0.3,
|
62 |
+
0.2,
|
63 |
+
0.1
|
64 |
+
]
|
65 |
+
},
|
66 |
+
"controlnet_ip2p": {
|
67 |
+
"enable": true,
|
68 |
+
"use_preprocessor": true,
|
69 |
+
"guess_mode": false,
|
70 |
+
"controlnet_conditioning_scale": 1.0,
|
71 |
+
"control_guidance_start": 0.0,
|
72 |
+
"control_guidance_end": 1.0,
|
73 |
+
"control_scale_list": [
|
74 |
+
0.5,
|
75 |
+
0.4,
|
76 |
+
0.3,
|
77 |
+
0.2,
|
78 |
+
0.1
|
79 |
+
]
|
80 |
+
},
|
81 |
+
"controlnet_lineart_anime": {
|
82 |
+
"enable": true,
|
83 |
+
"use_preprocessor": true,
|
84 |
+
"guess_mode": false,
|
85 |
+
"controlnet_conditioning_scale": 1.0,
|
86 |
+
"control_guidance_start": 0.0,
|
87 |
+
"control_guidance_end": 1.0,
|
88 |
+
"control_scale_list": [
|
89 |
+
0.5,
|
90 |
+
0.4,
|
91 |
+
0.3,
|
92 |
+
0.2,
|
93 |
+
0.1
|
94 |
+
]
|
95 |
+
},
|
96 |
+
"controlnet_openpose": {
|
97 |
+
"enable": false,
|
98 |
+
"use_preprocessor": true,
|
99 |
+
"guess_mode": false,
|
100 |
+
"controlnet_conditioning_scale": 1.0,
|
101 |
+
"control_guidance_start": 0.0,
|
102 |
+
"control_guidance_end": 1.0,
|
103 |
+
"control_scale_list": [
|
104 |
+
0.5,
|
105 |
+
0.4,
|
106 |
+
0.3,
|
107 |
+
0.2,
|
108 |
+
0.1
|
109 |
+
]
|
110 |
+
},
|
111 |
+
"controlnet_softedge": {
|
112 |
+
"enable": false,
|
113 |
+
"use_preprocessor": true,
|
114 |
+
"preprocessor": {
|
115 |
+
"type": "softedge_pidsafe",
|
116 |
+
"param": {}
|
117 |
+
},
|
118 |
+
"guess_mode": false,
|
119 |
+
"controlnet_conditioning_scale": 1.0,
|
120 |
+
"control_guidance_start": 0.0,
|
121 |
+
"control_guidance_end": 1.0,
|
122 |
+
"control_scale_list": [
|
123 |
+
0.5,
|
124 |
+
0.4,
|
125 |
+
0.3,
|
126 |
+
0.2,
|
127 |
+
0.1
|
128 |
+
]
|
129 |
+
},
|
130 |
+
"controlnet_shuffle": {
|
131 |
+
"enable": true,
|
132 |
+
"use_preprocessor": true,
|
133 |
+
"guess_mode": false,
|
134 |
+
"controlnet_conditioning_scale": 1.0,
|
135 |
+
"control_guidance_start": 0.0,
|
136 |
+
"control_guidance_end": 1.0,
|
137 |
+
"control_scale_list": [
|
138 |
+
0.5,
|
139 |
+
0.4,
|
140 |
+
0.3,
|
141 |
+
0.2,
|
142 |
+
0.1
|
143 |
+
]
|
144 |
+
},
|
145 |
+
"controlnet_depth": {
|
146 |
+
"enable": true,
|
147 |
+
"use_preprocessor": true,
|
148 |
+
"guess_mode": false,
|
149 |
+
"controlnet_conditioning_scale": 1.0,
|
150 |
+
"control_guidance_start": 0.0,
|
151 |
+
"control_guidance_end": 1.0,
|
152 |
+
"control_scale_list": [
|
153 |
+
0.5,
|
154 |
+
0.4,
|
155 |
+
0.3,
|
156 |
+
0.2,
|
157 |
+
0.1
|
158 |
+
]
|
159 |
+
},
|
160 |
+
"controlnet_canny": {
|
161 |
+
"enable": true,
|
162 |
+
"use_preprocessor": true,
|
163 |
+
"guess_mode": false,
|
164 |
+
"controlnet_conditioning_scale": 1.0,
|
165 |
+
"control_guidance_start": 0.0,
|
166 |
+
"control_guidance_end": 1.0,
|
167 |
+
"control_scale_list": [
|
168 |
+
0.5,
|
169 |
+
0.4,
|
170 |
+
0.3,
|
171 |
+
0.2,
|
172 |
+
0.1
|
173 |
+
]
|
174 |
+
},
|
175 |
+
"controlnet_inpaint": {
|
176 |
+
"enable": true,
|
177 |
+
"use_preprocessor": true,
|
178 |
+
"guess_mode": false,
|
179 |
+
"controlnet_conditioning_scale": 1.0,
|
180 |
+
"control_guidance_start": 0.0,
|
181 |
+
"control_guidance_end": 1.0,
|
182 |
+
"control_scale_list": [
|
183 |
+
0.5,
|
184 |
+
0.4,
|
185 |
+
0.3,
|
186 |
+
0.2,
|
187 |
+
0.1
|
188 |
+
]
|
189 |
+
},
|
190 |
+
"controlnet_lineart": {
|
191 |
+
"enable": true,
|
192 |
+
"use_preprocessor": true,
|
193 |
+
"guess_mode": false,
|
194 |
+
"controlnet_conditioning_scale": 1.0,
|
195 |
+
"control_guidance_start": 0.0,
|
196 |
+
"control_guidance_end": 1.0,
|
197 |
+
"control_scale_list": [
|
198 |
+
0.5,
|
199 |
+
0.4,
|
200 |
+
0.3,
|
201 |
+
0.2,
|
202 |
+
0.1
|
203 |
+
]
|
204 |
+
},
|
205 |
+
"controlnet_mlsd": {
|
206 |
+
"enable": true,
|
207 |
+
"use_preprocessor": true,
|
208 |
+
"guess_mode": false,
|
209 |
+
"controlnet_conditioning_scale": 1.0,
|
210 |
+
"control_guidance_start": 0.0,
|
211 |
+
"control_guidance_end": 1.0,
|
212 |
+
"control_scale_list": [
|
213 |
+
0.5,
|
214 |
+
0.4,
|
215 |
+
0.3,
|
216 |
+
0.2,
|
217 |
+
0.1
|
218 |
+
]
|
219 |
+
},
|
220 |
+
"controlnet_normalbae": {
|
221 |
+
"enable": true,
|
222 |
+
"use_preprocessor": true,
|
223 |
+
"guess_mode": false,
|
224 |
+
"controlnet_conditioning_scale": 1.0,
|
225 |
+
"control_guidance_start": 0.0,
|
226 |
+
"control_guidance_end": 1.0,
|
227 |
+
"control_scale_list": [
|
228 |
+
0.5,
|
229 |
+
0.4,
|
230 |
+
0.3,
|
231 |
+
0.2,
|
232 |
+
0.1
|
233 |
+
]
|
234 |
+
},
|
235 |
+
"controlnet_scribble": {
|
236 |
+
"enable": true,
|
237 |
+
"use_preprocessor": true,
|
238 |
+
"guess_mode": false,
|
239 |
+
"controlnet_conditioning_scale": 1.0,
|
240 |
+
"control_guidance_start": 0.0,
|
241 |
+
"control_guidance_end": 1.0,
|
242 |
+
"control_scale_list": [
|
243 |
+
0.5,
|
244 |
+
0.4,
|
245 |
+
0.3,
|
246 |
+
0.2,
|
247 |
+
0.1
|
248 |
+
]
|
249 |
+
},
|
250 |
+
"controlnet_seg": {
|
251 |
+
"enable": true,
|
252 |
+
"use_preprocessor": true,
|
253 |
+
"guess_mode": false,
|
254 |
+
"controlnet_conditioning_scale": 1.0,
|
255 |
+
"control_guidance_start": 0.0,
|
256 |
+
"control_guidance_end": 1.0,
|
257 |
+
"control_scale_list": [
|
258 |
+
0.5,
|
259 |
+
0.4,
|
260 |
+
0.3,
|
261 |
+
0.2,
|
262 |
+
0.1
|
263 |
+
]
|
264 |
+
},
|
265 |
+
"controlnet_ref": {
|
266 |
+
"enable": false,
|
267 |
+
"ref_image": "ref_image/ref_sample.png",
|
268 |
+
"attention_auto_machine_weight": 0.3,
|
269 |
+
"gn_auto_machine_weight": 0.3,
|
270 |
+
"style_fidelity": 0.5,
|
271 |
+
"reference_attn": true,
|
272 |
+
"reference_adain": false,
|
273 |
+
"scale_pattern": [
|
274 |
+
1.0
|
275 |
+
]
|
276 |
+
}
|
277 |
+
},
|
278 |
+
"upscale_config": {
|
279 |
+
"scheduler": "k_dpmpp_sde",
|
280 |
+
"steps": 20,
|
281 |
+
"strength": 0.5,
|
282 |
+
"guidance_scale": 10,
|
283 |
+
"controlnet_tile": {
|
284 |
+
"enable": true,
|
285 |
+
"controlnet_conditioning_scale": 1.0,
|
286 |
+
"guess_mode": false,
|
287 |
+
"control_guidance_start": 0.0,
|
288 |
+
"control_guidance_end": 1.0
|
289 |
+
},
|
290 |
+
"controlnet_line_anime": {
|
291 |
+
"enable": false,
|
292 |
+
"controlnet_conditioning_scale": 1.0,
|
293 |
+
"guess_mode": false,
|
294 |
+
"control_guidance_start": 0.0,
|
295 |
+
"control_guidance_end": 1.0
|
296 |
+
},
|
297 |
+
"controlnet_ip2p": {
|
298 |
+
"enable": true,
|
299 |
+
"controlnet_conditioning_scale": 0.5,
|
300 |
+
"guess_mode": false,
|
301 |
+
"control_guidance_start": 0.0,
|
302 |
+
"control_guidance_end": 1.0
|
303 |
+
},
|
304 |
+
"controlnet_ref": {
|
305 |
+
"enable": false,
|
306 |
+
"use_frame_as_ref_image": false,
|
307 |
+
"use_1st_frame_as_ref_image": true,
|
308 |
+
"ref_image": "ref_image/path_to_your_ref_img.jpg",
|
309 |
+
"attention_auto_machine_weight": 1.0,
|
310 |
+
"gn_auto_machine_weight": 1.0,
|
311 |
+
"style_fidelity": 0.25,
|
312 |
+
"reference_attn": true,
|
313 |
+
"reference_adain": false
|
314 |
+
}
|
315 |
+
},
|
316 |
+
"output": {
|
317 |
+
"format": "gif",
|
318 |
+
"fps": 8,
|
319 |
+
"encode_param": {
|
320 |
+
"crf": 10
|
321 |
+
}
|
322 |
+
}
|
323 |
+
}
|
config/prompts/to_8fps_Frames.bat
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
ffmpeg -i %1 -start_number 0 -vf "scale=512:768,fps=8" %%04d.png
|
data/.gitignore
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
*
|
2 |
+
!.gitignore
|
3 |
+
!/models/
|
4 |
+
!/embeddings/
|
5 |
+
!/rife/
|
data/controlnet_image/test/controlnet_canny/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_depth/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_inpaint/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_ip2p/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_lineart/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_lineart_anime/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_mlsd/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_normalbae/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_openpose/0000.png
ADDED
data/controlnet_image/test/controlnet_openpose/0016.png
ADDED
data/controlnet_image/test/controlnet_openpose/0032.png
ADDED
data/controlnet_image/test/controlnet_openpose/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_scribble/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_seg/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_shuffle/put_pngs_here.txt
ADDED
File without changes
|
data/controlnet_image/test/controlnet_softedge/0000.png
ADDED
data/controlnet_image/test/controlnet_softedge/0016.png
ADDED
data/controlnet_image/test/controlnet_softedge/0032.png
ADDED
data/controlnet_image/test/controlnet_softedge/put_pngs_here.txt
ADDED
File without changes
|