oKen38461 committed on
Commit
09ceafd
·
1 Parent(s): 1345fdc

モデルマネージャーに補助モデルの情報を追加し、`requirements.txt`にMediaPipeを新たに追加しました。また、NumPyのバージョン制約を設定しました。

Browse files
Files changed (2) hide show
  1. model_manager.py +41 -0
  2. requirements.txt +5 -2
model_manager.py CHANGED
@@ -68,6 +68,47 @@ class ModelManager:
68
  "dest_file": "v0.4_hubert_cfg_pytorch.pkl",
69
  "type": "file",
70
  "size": "31 kB"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
71
  }
72
  ]
73
  else:
 
68
  "dest_file": "v0.4_hubert_cfg_pytorch.pkl",
69
  "type": "file",
70
  "size": "31 kB"
71
+ },
72
+ # 補助モデル (aux_models)
73
+ {
74
+ "name": "2d106det.onnx",
75
+ "url": f"{base_url}/ditto_pytorch/aux_models/2d106det.onnx",
76
+ "dest_dir": "checkpoints/ditto_pytorch/aux_models",
77
+ "dest_file": "2d106det.onnx",
78
+ "type": "file",
79
+ "size": "5.03 MB"
80
+ },
81
+ {
82
+ "name": "det_10g.onnx",
83
+ "url": f"{base_url}/ditto_pytorch/aux_models/det_10g.onnx",
84
+ "dest_dir": "checkpoints/ditto_pytorch/aux_models",
85
+ "dest_file": "det_10g.onnx",
86
+ "type": "file",
87
+ "size": "16.9 MB"
88
+ },
89
+ {
90
+ "name": "face_landmarker.task",
91
+ "url": f"{base_url}/ditto_pytorch/aux_models/face_landmarker.task",
92
+ "dest_dir": "checkpoints/ditto_pytorch/aux_models",
93
+ "dest_file": "face_landmarker.task",
94
+ "type": "file",
95
+ "size": "3.76 MB"
96
+ },
97
+ {
98
+ "name": "hubert_streaming_fix_kv.onnx",
99
+ "url": f"{base_url}/ditto_pytorch/aux_models/hubert_streaming_fix_kv.onnx",
100
+ "dest_dir": "checkpoints/ditto_pytorch/aux_models",
101
+ "dest_file": "hubert_streaming_fix_kv.onnx",
102
+ "type": "file",
103
+ "size": "1.46 GB"
104
+ },
105
+ {
106
+ "name": "landmark203.onnx",
107
+ "url": f"{base_url}/ditto_pytorch/aux_models/landmark203.onnx",
108
+ "dest_dir": "checkpoints/ditto_pytorch/aux_models",
109
+ "dest_file": "landmark203.onnx",
110
+ "type": "file",
111
+ "size": "115 MB"
112
  }
113
  ]
114
  else:
requirements.txt CHANGED
@@ -2,7 +2,7 @@
2
  torch
3
  torchvision
4
  torchaudio
5
- numpy
6
  pillow
7
 
8
  # Audio processing
@@ -48,4 +48,7 @@ typing-extensions
48
  filetype==1.2.0
49
 
50
  # ONNX Runtime for model inference
51
- onnxruntime-gpu # GPU版のみで十分(CPU版も含まれる)
 
 
 
 
2
  torch
3
  torchvision
4
  torchaudio
5
+ numpy<2.0 # NumPy 2.xとの互換性問題を回避
6
  pillow
7
 
8
  # Audio processing
 
48
  filetype==1.2.0
49
 
50
  # ONNX Runtime for model inference
51
+ onnxruntime-gpu # GPU版のみで十分(CPU版も含まれる)
52
+
53
+ # MediaPipe for face detection
54
+ mediapipe