HiMind committed on
Commit
4e9190a
·
verified ·
1 Parent(s): 4f269c1

Upload config.json

Browse files
Files changed (1) hide show
  1. config.json +175 -0
config.json ADDED
@@ -0,0 +1,175 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "packedavatar",
3
+ "library_name": "packed_avatar",
4
+ "bundle_file": "PackedAvatar.pt",
5
+ "runtime_script": "PackedAvatar.py",
6
+ "version": 1,
7
+ "architecture": {
8
+ "animation_engine": "SadTalker",
9
+ "audio_to_coeff": "Audio2Coeff",
10
+ "face_renderer": "FaceVid2Vid|PIRender (fallback)",
11
+ "wav2lip": "Wav2Lip GAN (optional)",
12
+ "rmbg": "Bria RMBG 2.0",
13
+ "avatar_bank": "AvatarBank",
14
+ "bfm": "BFM face model assets"
15
+ },
16
+ "bundle_layout": {
17
+ "archives": {
18
+ "checkpoints_zip": "checkpoints.zip",
19
+ "sadtalker_zip": "sadtalker.zip"
20
+ },
21
+ "checkpoints": {
22
+ "avatar_bank": "checkpoints/AvatarBank.pt",
23
+ "wav2lip_gan": "checkpoints/wav2lip_gan.pth",
24
+ "bria_rmbg": "checkpoints/briaaiRMBG-2.0/",
25
+ "bfm": "checkpoints/BFM/",
26
+ "face_detectors": "checkpoints/face_detectors/"
27
+ },
28
+ "sadtalker": {
29
+ "source": "SadTalker/",
30
+ "hub_checkpoints": "SadTalker/hub/checkpoints/"
31
+ },
32
+ "manifest": "manifest.json",
33
+ "metadata": "manifest"
34
+ },
35
+ "media": {
36
+ "audio": {
37
+ "sample_rate": 16000,
38
+ "accepted_formats": [
39
+ "wav",
40
+ "mp3",
41
+ "m4a"
42
+ ],
43
+ "auto_convert_to_wav": true
44
+ },
45
+ "video": {
46
+ "output_format": "mp4",
47
+ "preview_supported": true,
48
+ "accepted_reference_formats": [
49
+ "mp4",
50
+ "mov",
51
+ "mkv",
52
+ "webm"
53
+ ]
54
+ },
55
+ "image": {
56
+ "accepted_formats": [
57
+ "png",
58
+ "jpg",
59
+ "jpeg",
60
+ "webp"
61
+ ],
62
+ "auto_composite_alpha": true
63
+ }
64
+ },
65
+ "defaults": {
66
+ "default_avatar": "",
67
+ "device_priority": [
68
+ "cuda",
69
+ "mps",
70
+ "cpu"
71
+ ],
72
+ "use_wav2lip_by_default": false,
73
+ "remove_background_by_default": false,
74
+ "cache_dir": "<system_temp>/PackedAvatarCache",
75
+ "cache_validation": "sha256(checkpoints_zip + sadtalker_zip)"
76
+ },
77
+ "avatar_bank": {
78
+ "included": true,
79
+ "avatar_count": 100,
80
+ "styles": [
81
+ "anime",
82
+ "cyber",
83
+ "drawn",
84
+ "paint",
85
+ "real"
86
+ ],
87
+ "resolution_previews": true,
88
+ "preview_formats": [
89
+ "png",
90
+ "zstd-compressed-png"
91
+ ]
92
+ },
93
+ "conditioning": {
94
+ "avatar_condition_formats": [
95
+ ".pt",
96
+ ".pth",
97
+ ".mat",
98
+ "dict"
99
+ ],
100
+ "motion_condition_formats": [
101
+ ".pt",
102
+ ".pth",
103
+ ".mat",
104
+ "dict"
105
+ ],
106
+ "legacy_normalization": [
107
+ "motion_3dmm",
108
+ "full_3dmm",
109
+ "coeff_3dmm"
110
+ ]
111
+ },
112
+ "runtime_behavior": {
113
+ "lazy_module_loading": true,
114
+ "cache_invalidation_on_bundle_change": true,
115
+ "avatar_resolution_priority": [
116
+ "avatar_condition",
117
+ "source_image",
118
+ "avatar_id",
119
+ "default_avatar"
120
+ ],
121
+ "background_removal_pipeline": "Input Image -> Bria RMBG -> Foreground -> SadTalker -> MP4",
122
+ "post_processing": {
123
+ "wav2lip": "optional post-pass",
124
+ "enhancer": "gfpgan (optional)"
125
+ },
126
+ "memory_cleanup": [
127
+ "del preprocess_model",
128
+ "del audio_to_coeff",
129
+ "del animate_from_coeff",
130
+ "torch.cuda.empty_cache()",
131
+ "gc.collect()"
132
+ ]
133
+ },
134
+ "supported_commands": [
135
+ "generate",
136
+ "extract-embeddings",
137
+ "list-avatars",
138
+ "list-bundle-contents",
139
+ "download-bundle",
140
+ "validate-bundle",
141
+ "cleanup-cache"
142
+ ],
143
+ "cli_examples": {
144
+ "basic": "python PackedAvatar.py --source-image person.jpg --driven-audio speech.wav",
145
+ "avatarbank": "python PackedAvatar.py --avatar-id Rebecca --driven-audio speech.wav",
146
+ "background_removal": "python PackedAvatar.py --source-image portrait.png --driven-audio speech.wav --remove-background",
147
+ "wav2lip": "python PackedAvatar.py --source-image portrait.png --driven-audio speech.wav --use-wav2lip"
148
+ },
149
+ "input_files": [
150
+ "PackedAvatar.pt",
151
+ "PackedAvatar.py",
152
+ "requirements.txt",
153
+ "README.md"
154
+ ],
155
+ "query_file": true,
156
+ "recommended_env": {
157
+ "python": [
158
+ "3.10",
159
+ "3.11"
160
+ ],
161
+ "pytorch": "2.x (CUDA-enabled for GPU)",
162
+ "ffmpeg": "required for reference-video audio extraction"
163
+ },
164
+ "performance_guidance": {
165
+ "256_resolution_vram": "4-6GB (recommended)",
166
+ "512_resolution_vram": "8-12GB (recommended)",
167
+ "high_quality_vram": "12+ GB",
168
+ "notes": "First run slower due to extraction; subsequent runs reuse cache and start faster."
169
+ },
170
+ "security_and_ethics": {
171
+ "bundle_trust": "Bundle is treated as a trusted runtime artifact",
172
+ "ethical_use_note": "Users must obtain consent for generating talking-head videos of real people",
173
+ "license": "apache-2.0 (see repo)"
174
+ }
175
+ }