Commit 69532ce by minhho · 1 Parent(s): 75d3319

Deploy FaceSwapLite application with full documentation

.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ demo.gif filter=lfs diff=lfs merge=lfs -text
37
+ *.jpg filter=lfs diff=lfs merge=lfs -text
38
+ *.jpeg filter=lfs diff=lfs merge=lfs -text
39
+ *.png filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1,76 @@
1
+ # Python
2
+ __pycache__/
3
+ *.py[cod]
4
+ *$py.class
5
+ *.so
6
+ .Python
7
+ build/
8
+ develop-eggs/
9
+ dist/
10
+ downloads/
11
+ eggs/
12
+ .eggs/
13
+ lib/
14
+ lib64/
15
+ parts/
16
+ sdist/
17
+ var/
18
+ wheels/
19
+ *.egg-info/
20
+ .installed.cfg
21
+ *.egg
22
+ MANIFEST
23
+
24
+ # Virtual environments
25
+ venv/
26
+ env/
27
+ ENV/
28
+ env.bak/
29
+ venv.bak/
30
+
31
+ # IDE
32
+ .vscode/
33
+ .idea/
34
+ *.swp
35
+ *.swo
36
+ *~
37
+ .DS_Store
38
+
39
+ # Model files (large files)
40
+ *.onnx
41
+ *.pth
42
+ *.pt
43
+ *.bin
44
+
45
+ # InsightFace models cache
46
+ .insightface/
47
+
48
+ # Output files
49
+ out/*
50
+ !out/.gitkeep
51
+ *.mp4
52
+ *.avi
53
+ *.mov
54
+ *.mkv
55
+
56
+ # Test files
57
+ test_*.py
58
+ testsrc.mp4
59
+ *.jpg
60
+ *.png
61
+ *.jpeg
62
+ !demo.gif
63
+ !image.jpg
64
+
65
+ # Logs
66
+ *.log
67
+
68
+ # System
69
+ .DS_Store
70
+ Thumbs.db
71
+
72
+ # Temporary files
73
+ tmp/
74
+ temp/
75
+ *.tmp
76
+ image.jpg
DEPLOYMENT.md ADDED
@@ -0,0 +1,228 @@
1
+ # Deployment Guide for Hugging Face Spaces
2
+
3
+ This guide will help you deploy FaceSwapLite to Hugging Face Spaces.
4
+
5
+ ## Prerequisites
6
+
7
+ 1. A Hugging Face account (create one at https://huggingface.co/join)
8
+ 2. Git installed on your system
9
+ 3. Hugging Face CLI installed: `pip install huggingface_hub`
10
+ 4. An access token with write permissions from https://huggingface.co/settings/tokens
11
+
12
+ ## Method 1: Deploy via Git (Recommended)
13
+
14
+ ### Step 1: Clone Your Space Repository
15
+
16
+ ```bash
17
+ git clone https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
18
+ cd FaceSwapLite-1.0
19
+ ```
20
+
21
+ When prompted for a password, use your Hugging Face access token.
22
+
23
+ ### Step 2: Copy Project Files
24
+
25
+ Copy all the necessary files from your local FaceSwapLite directory to the cloned space directory:
26
+
27
+ ```bash
28
+ # Copy from your local project to the space directory
29
+ cp /path/to/local/FaceSwapLite/app.py .
30
+ cp /path/to/local/FaceSwapLite/refacer.py .
31
+ cp /path/to/local/FaceSwapLite/script.py .
32
+ cp /path/to/local/FaceSwapLite/requirements.txt .
33
+ cp /path/to/local/FaceSwapLite/README.md .
34
+ cp -r /path/to/local/FaceSwapLite/recognition .
35
+ cp /path/to/local/FaceSwapLite/inswapper_128.onnx .
36
+ ```
37
+
38
+ ### Step 3: Create the Output Directory
39
+
40
+ ```bash
41
+ mkdir -p out
42
+ touch out/.gitkeep
43
+ ```
44
+
45
+ ### Step 4: Add and Commit Files
46
+
47
+ ```bash
48
+ git add .
49
+ git commit -m "Initial deployment of FaceSwapLite"
50
+ ```
51
+
52
+ ### Step 5: Push to Hugging Face
53
+
54
+ ```bash
55
+ git push
56
+ ```
57
+
58
+ When prompted for a password, use your Hugging Face access token.
59
+
60
+ ### Step 6: Wait for Build
61
+
62
+ - Go to https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
63
+ - Wait for the space to build (this may take 5-10 minutes)
64
+ - Check the build logs for any errors
65
+
66
+ ## Method 2: Deploy via Hugging Face CLI
67
+
68
+ ### Step 1: Login to Hugging Face
69
+
70
+ ```bash
71
+ huggingface-cli login
72
+ ```
73
+
74
+ Enter your access token when prompted.
75
+
76
+ ### Step 2: Upload Files
77
+
78
+ ```bash
79
+ cd /path/to/your/FaceSwapLite
80
+ huggingface-cli upload minhho/FaceSwapLite-1.0 . . --repo-type=space
81
+ ```
82
+
83
+ ## Method 3: Manual Upload via Web Interface
84
+
85
+ 1. Go to https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
86
+ 2. Click on "Files" tab
87
+ 3. Click "Add file" → "Create a new file" or "Upload files"
88
+ 4. Upload the following files one by one:
89
+ - `app.py`
90
+ - `refacer.py`
91
+ - `script.py`
92
+ - `requirements.txt`
93
+ - `README.md`
94
+ - `inswapper_128.onnx`
95
+ - All files in `recognition/` folder
96
+
97
+ ## Important Notes
98
+
99
+ ### Model File Size
100
+
101
+ The `inswapper_128.onnx` file is quite large (529 MB). You have several options:
102
+
103
+ #### Option 1: Git LFS (Recommended)
104
+ ```bash
105
+ # Install Git LFS if not already installed
106
+ git lfs install
107
+
108
+ # Track the model file
109
+ git lfs track "*.onnx"
110
+ git add .gitattributes
111
+ git add inswapper_128.onnx
112
+ git commit -m "Add model file with LFS"
113
+ git push
114
+ ```
115
+
116
+ #### Option 2: External Storage
117
+ Store the model file externally (e.g., Google Drive, Dropbox) and download it during app initialization. Add this to `refacer.py`:
118
+
119
+ ```python
120
+ import urllib.request
121
+ import os
122
+
123
+ def download_model():
124
+ model_path = 'inswapper_128.onnx'
125
+ if not os.path.exists(model_path):
126
+ print("Downloading model...")
127
+ url = "YOUR_MODEL_URL_HERE"
128
+ urllib.request.urlretrieve(url, model_path)
129
+ print("Model downloaded!")
130
+ ```
131
+
132
+ #### Option 3: Hugging Face Hub
133
+ Upload the model to Hugging Face Model Hub and download it:
134
+
135
+ ```python
136
+ from huggingface_hub import hf_hub_download
137
+
138
+ model_path = hf_hub_download(
139
+ repo_id="YOUR_REPO/model",
140
+ filename="inswapper_128.onnx"
141
+ )
142
+ ```
143
+
144
+ ### System Dependencies
145
+
146
+ If you need FFmpeg or other system packages, create a `packages.txt` file:
147
+
148
+ ```txt
149
+ ffmpeg
150
+ ```
151
+
152
+ ### Environment Variables
153
+
154
+ You can set environment variables in the Space settings:
155
+ - Go to Space Settings → Variables and secrets
156
+ - Add variables like `MAX_NUM_FACES`, `FORCE_CPU`, etc.
157
+
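`app.py` in this commit reads both variables at startup and falls back to defaults, so setting them in the Space is optional:

```python
import os

# Defaults used when the Space variables are not set
MAX_NUM_FACES = int(os.environ.get("MAX_NUM_FACES", "5"))
FORCE_CPU = os.environ.get("FORCE_CPU", "False").lower() == "true"
```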
158
+ ### Hardware Requirements
159
+
160
+ For better performance:
161
+ 1. Go to Space Settings
162
+ 2. Under "Hardware", upgrade to a GPU-enabled instance (requires payment)
163
+ 3. Recommended: T4 small or better for real-time processing
164
+
165
+ ### Free Tier Limitations
166
+
167
+ On the free tier:
168
+ - CPU-only processing (slower)
169
+ - 16GB RAM limit
170
+ - 50GB storage limit
171
+ - May go to sleep after inactivity
172
+
173
+ ## Troubleshooting
174
+
175
+ ### Build Fails
176
+
177
+ Check the build logs at your Space URL. Common issues:
178
+ - Missing dependencies in `requirements.txt`
179
+ - Large files not tracked by Git LFS
180
+ - Incompatible package versions
181
+
182
+ ### App Doesn't Start
183
+
184
+ - Check that `app.py` is in the root directory
185
+ - Verify `sdk: gradio` is in README.md frontmatter
186
+ - Check Python version compatibility
187
+
188
+ ### Model Not Found
189
+
190
+ - Ensure `inswapper_128.onnx` is uploaded
191
+ - Check file permissions and paths
192
+ - Verify Git LFS is tracking large files
193
+
194
+ ### Performance Issues
195
+
196
+ - Upgrade to GPU hardware
197
+ - Reduce video resolution
198
+ - Process shorter clips
199
+ - Optimize batch processing settings
200
+
201
+ ## Post-Deployment
202
+
203
+ After successful deployment:
204
+
205
+ 1. **Test the Space**: Try uploading a video and swapping faces
206
+ 2. **Monitor Logs**: Check for any runtime errors
207
+ 3. **Update Documentation**: Add examples and usage tips
208
+ 4. **Share**: Share your Space URL with others!
209
+
210
+ ## Updating Your Space
211
+
212
+ To update your deployed space:
213
+
214
+ ```bash
215
+ cd FaceSwapLite-1.0
216
+ # Make your changes
217
+ git add .
218
+ git commit -m "Update: description of changes"
219
+ git push
220
+ ```
221
+
222
+ The space will automatically rebuild with your changes.
223
+
224
+ ## Need Help?
225
+
226
+ - Check Hugging Face Spaces documentation: https://huggingface.co/docs/hub/spaces
227
+ - Visit the Hugging Face forums: https://discuss.huggingface.co/
228
+ - Open an issue on your Space repository
DEPLOYMENT_READY.md ADDED
@@ -0,0 +1,178 @@
1
+ # ✅ FaceSwapLite - Ready for Deployment
2
+
3
+ ## Summary of Changes
4
+
5
+ Your FaceSwapLite project has been updated and is now ready for deployment to Hugging Face Spaces!
6
+
7
+ ### 📝 What Was Updated
8
+
9
+ #### 1. **README.md** ✅
10
+ - Added comprehensive project description
11
+ - Included features, installation, and usage instructions
12
+ - Added technical details and architecture information
13
+ - Included disclaimer and acknowledgments
14
+ - Updated emoji from 🚀 to 🎃 for consistency
15
+
16
+ #### 2. **app.py** ✅
17
+ - Removed `argparse` (not needed for Hugging Face Spaces)
18
+ - Removed `ngrok` integration (not compatible with HF Spaces)
19
+ - Simplified configuration using environment variables
20
+ - Fixed for Hugging Face Spaces deployment
21
+ - Clean, production-ready code
22
+
23
+ #### 3. **requirements.txt** ✅
24
+ - Updated Gradio from 3.33.1 to 4.40.0 (matches README.md)
25
+ - Fixed package name: `ffmpeg_python` → `ffmpeg-python`
26
+ - Removed `opencv_python` (keeping only `opencv-python-headless` for server deployment)
27
+ - Removed `ngrok` (not needed for HF Spaces)
28
+ - All packages are now compatible with Hugging Face Spaces
29
+
30
+ #### 4. **New Files Created** ✅
31
+ - `.gitignore` - Excludes unnecessary files from version control
32
+ - `packages.txt` - System dependencies (FFmpeg) for Hugging Face
33
+ - `LICENSE` - MIT License with disclaimer
34
+ - `DEPLOYMENT.md` - Comprehensive deployment guide
35
+ - `QUICKSTART.md` - Quick deployment instructions
36
+ - `deploy.sh` - Automated deployment script
37
+
38
+ ### 📦 Current Project Structure
39
+
40
+ ```
41
+ FaceSwapLite/
42
+ ├── app.py # ✅ Updated - Gradio web interface (HF compatible)
43
+ ├── refacer.py # ✅ Core face swapping logic
44
+ ├── script.py # ✅ Command-line interface
45
+ ├── requirements.txt # ✅ Updated - Python dependencies
46
+ ├── packages.txt # ✨ New - System dependencies (FFmpeg)
47
+ ├── README.md # ✅ Updated - Comprehensive documentation
48
+ ├── LICENSE # ✨ New - MIT License
49
+ ├── DEPLOYMENT.md # ✨ New - Detailed deployment guide
50
+ ├── QUICKSTART.md # ✨ New - Quick start guide
51
+ ├── deploy.sh # ✨ New - Automated deployment script
52
+ ├── .gitignore # ✨ New - Git ignore rules
53
+ ├── .gitattributes # ✅ Already exists - Git LFS config
54
+ ├── inswapper_128.onnx # ✅ Model file (529MB, tracked by LFS)
55
+ ├── demo.gif # ✅ Demo file
56
+ ├── image.jpg # ✅ Sample image
57
+ ├── recognition/ # ✅ Face detection and recognition
58
+ │ ├── arcface_onnx.py
59
+ │ ├── face_align.py
60
+ │ ├── main.py
61
+ │ └── scrfd.py
62
+ └── out/ # ✅ Output directory
63
+ └── .gitkeep
64
+ ```
65
+
66
+ ### 🎯 Ready for Deployment
67
+
68
+ Your project is now ready to deploy! Here's what's been verified:
69
+
70
+ ✅ **No Python errors** in app.py or refacer.py
71
+ ✅ **Model file exists** (inswapper_128.onnx - 529MB)
72
+ ✅ **Git LFS configured** (.gitattributes already has *.onnx)
73
+ ✅ **Dependencies updated** for Hugging Face compatibility
74
+ ✅ **System packages** specified (FFmpeg in packages.txt)
75
+ ✅ **Documentation** complete and comprehensive
76
+ ✅ **Deployment scripts** ready to use
77
+
78
+ ### 🚀 Deploy Now!
79
+
80
+ You have **three options** to deploy:
81
+
82
+ #### Option 1: Automated Script (Easiest)
83
+ ```bash
84
+ cd /Users/hoangminh.ho/Works/research/FaceSwapLite
85
+ ./deploy.sh
86
+ ```
87
+
88
+ #### Option 2: Manual Git Push
89
+ ```bash
90
+ # See QUICKSTART.md for detailed steps
91
+ git clone https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
92
+ # Copy files and push
93
+ ```
94
+
95
+ #### Option 3: Hugging Face CLI
96
+ ```bash
97
+ pip install huggingface_hub
98
+ huggingface-cli login
99
+ huggingface-cli upload minhho/FaceSwapLite-1.0 . . --repo-type=space
100
+ ```
101
+
102
+ ### 📋 Pre-Deployment Checklist
103
+
104
+ Before deploying, make sure you have:
105
+
106
+ - [ ] Hugging Face account created
107
+ - [ ] Access token with write permissions from https://huggingface.co/settings/tokens
108
+ - [ ] Git and Git LFS installed
109
+ - [ ] Git LFS initialized (`git lfs install`)
110
+
111
+ ### 🔍 What Happens After Deployment
112
+
113
+ 1. **Files Upload**: All files will be uploaded to your Space
114
+ 2. **Build Process**: Hugging Face will build your Space (5-10 minutes)
115
+ 3. **Dependencies Install**: Install packages from requirements.txt and packages.txt
116
+ 4. **Model Download**: InsightFace models auto-download on first run
117
+ 5. **App Launch**: Your app will be live at https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
118
+
119
+ ### ⚙️ Configuration Options
120
+
121
+ You can set environment variables in Space Settings:
122
+
123
+ - `MAX_NUM_FACES` - Maximum number of faces (default: 5)
124
+ - `FORCE_CPU` - Force CPU mode (default: False)
125
+
126
+ ### 💡 Performance Tips
127
+
128
+ **Free Tier (CPU):**
129
+ - Processing will be slower
130
+ - Good for testing and demos
131
+ - No additional cost
132
+
133
+ **Paid Tier (GPU):**
134
+ - Much faster processing
135
+ - Recommended for production use
136
+ - Upgrade in Space Settings → Hardware
137
+ - Suggested: T4 small (~$0.60/hour)
138
+
139
+ ### 🐛 Common Issues & Solutions
140
+
141
+ **Issue: "No application file"**
142
+ ✅ Solution: Make sure app.py is in the root directory
143
+
144
+ **Issue: Build fails**
145
+ ✅ Solution: Check logs, verify requirements.txt and packages.txt
146
+
147
+ **Issue: Model file not found**
148
+ ✅ Solution: Ensure Git LFS is tracking *.onnx files
149
+
150
+ **Issue: Out of memory**
151
+ ✅ Solution: Upgrade to GPU instance or reduce video resolution
152
+
153
+ ### 📚 Documentation
154
+
155
+ - **README.md** - Main documentation
156
+ - **QUICKSTART.md** - Fast deployment guide
157
+ - **DEPLOYMENT.md** - Detailed deployment instructions
158
+ - **This file** - Summary and checklist
159
+
160
+ ### 🎉 Next Steps
161
+
162
+ 1. **Deploy** using one of the three methods above
163
+ 2. **Monitor** the build logs at your Space URL
164
+ 3. **Test** with a sample video once deployed
165
+ 4. **Share** your Space with others!
166
+
167
+ ### 📧 Support
168
+
169
+ If you encounter issues:
170
+ - Check DEPLOYMENT.md for troubleshooting
171
+ - Review Hugging Face Spaces docs: https://huggingface.co/docs/hub/spaces
172
+ - Open an issue on your Space repository
173
+
174
+ ---
175
+
176
+ **Your FaceSwapLite is production-ready! 🚀**
177
+
178
+ Deploy now and start swapping faces in the cloud!
LICENSE ADDED
@@ -0,0 +1,29 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2024 FaceSwapLite
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
22
+
23
+ ---
24
+
25
+ DISCLAIMER: This software is provided for educational and research purposes only.
26
+ Users are responsible for ensuring their use complies with all applicable laws
27
+ and regulations. The authors and contributors are not responsible for any misuse
28
+ of this software. Always obtain proper consent before processing anyone's images
29
+ or videos.
QUICKSTART.md ADDED
@@ -0,0 +1,162 @@
1
+ # 🚀 Quick Start - Deploy to Hugging Face
2
+
3
+ This is a quick guide to deploy FaceSwapLite to your Hugging Face Space.
4
+
5
+ ## Prerequisites
6
+
7
+ ✅ Hugging Face account
8
+ ✅ Git installed
9
+ ✅ Git LFS installed (for the 529MB model file)
10
+ ✅ Hugging Face access token with write permissions
11
+
12
+ ## Option 1: Automated Deployment (Recommended)
13
+
14
+ ### Step 1: Prepare Git LFS
15
+
16
+ ```bash
17
+ # Install Git LFS (if not already installed)
18
+ # macOS
19
+ brew install git-lfs
20
+
21
+ # Linux
22
+ sudo apt-get install git-lfs
23
+
24
+ # Initialize Git LFS
25
+ git lfs install
26
+ ```
27
+
28
+ ### Step 2: Run Deployment Script
29
+
30
+ ```bash
31
+ # Make sure you're in the FaceSwapLite directory
32
+ cd /Users/hoangminh.ho/Works/research/FaceSwapLite
33
+
34
+ # Run the deployment script
35
+ ./deploy.sh
36
+ ```
37
+
38
+ The script will:
39
+ 1. Clone your Hugging Face Space
40
+ 2. Copy all necessary files
41
+ 3. Set up Git LFS for the model file
42
+ 4. Commit and push to Hugging Face
43
+
44
+ When prompted, enter your Hugging Face access token.
45
+
46
+ ## Option 2: Manual Deployment
47
+
48
+ ### Step 1: Clone Your Space
49
+
50
+ ```bash
51
+ git clone https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
52
+ cd FaceSwapLite-1.0
53
+ ```
54
+
55
+ ### Step 2: Set Up Git LFS
56
+
57
+ ```bash
58
+ git lfs install
59
+ git lfs track "*.onnx"
60
+ git add .gitattributes
61
+ ```
62
+
63
+ ### Step 3: Copy Files
64
+
65
+ Copy the following files from your local project:
66
+
67
+ ```bash
68
+ # From your FaceSwapLite directory
69
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/app.py .
70
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/refacer.py .
71
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/script.py .
72
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/requirements.txt .
73
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/README.md .
74
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/LICENSE .
75
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/packages.txt .
76
+ cp -r /Users/hoangminh.ho/Works/research/FaceSwapLite/recognition .
77
+ cp /Users/hoangminh.ho/Works/research/FaceSwapLite/inswapper_128.onnx .
78
+
79
+ # Create output directory
80
+ mkdir -p out
81
+ touch out/.gitkeep
82
+ ```
83
+
84
+ ### Step 4: Commit and Push
85
+
86
+ ```bash
87
+ git add .
88
+ git commit -m "Deploy FaceSwapLite application"
89
+ git push
90
+ ```
91
+
92
+ Enter your Hugging Face access token when prompted for a password.
93
+
94
+ ## Verify Deployment
95
+
96
+ 1. Visit https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
97
+ 2. Wait 5-10 minutes for the build to complete
98
+ 3. Check the "Logs" tab for any errors
99
+ 4. Test the application with a sample video
100
+
101
+ ## Troubleshooting
102
+
103
+ ### Large File Upload Issues
104
+
105
+ If you have issues uploading the model file:
106
+
107
+ ```bash
108
+ # Make sure Git LFS is tracking it
109
+ git lfs track "*.onnx"
110
+ git add .gitattributes
111
+ git add inswapper_128.onnx
112
+ git commit -m "Add model file with LFS"
113
+ git push
114
+ ```
115
+
116
+ ### Build Failures
117
+
118
+ Check the logs at your Space URL. Common issues:
119
+ - Missing `packages.txt` (for FFmpeg)
120
+ - Incorrect `requirements.txt`
121
+ - Model file not uploaded
122
+
123
+ ### Permission Denied
124
+
125
+ Make sure you're using your Hugging Face **access token** (not password) when pushing.
126
+
127
+ Get your token at: https://huggingface.co/settings/tokens
128
+
129
+ ## Next Steps
130
+
131
+ After successful deployment:
132
+
133
+ 1. ✅ Test with a sample video
134
+ 2. ✅ Monitor the logs for errors
135
+ 3. ✅ Share your Space with others!
136
+ 4. ✅ Consider upgrading to GPU for better performance
137
+
138
+ ## Getting Your Access Token
139
+
140
+ 1. Go to https://huggingface.co/settings/tokens
141
+ 2. Click "New token"
142
+ 3. Give it a name (e.g., "FaceSwapLite")
143
+ 4. Select "Write" permissions
144
+ 5. Click "Generate"
145
+ 6. Copy the token (you won't see it again!)
146
+
147
+ ## Using Hugging Face CLI (Alternative)
148
+
149
+ ```bash
150
+ # Install Hugging Face CLI
151
+ pip install huggingface_hub
152
+
153
+ # Login
154
+ huggingface-cli login
155
+
156
+ # Upload all files
157
+ huggingface-cli upload minhho/FaceSwapLite-1.0 . . --repo-type=space
158
+ ```
159
+
160
+ ---
161
+
162
+ For detailed deployment instructions, see `DEPLOYMENT.md`
README.md CHANGED
@@ -1,12 +1,153 @@
1
  ---
2
- title: FaceSwapLite 1.0
3
- emoji: 🚀
4
- colorFrom: gray
5
- colorTo: blue
6
  sdk: gradio
7
- sdk_version: 5.48.0
8
  app_file: app.py
9
  pinned: false
 
10
  ---
11
 
12
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
1
  ---
2
+ title: FaceSwapLite
3
+ emoji: 🎃
4
+ colorFrom: purple
5
+ colorTo: red
6
  sdk: gradio
7
+ sdk_version: 4.40.0
8
  app_file: app.py
9
  pinned: false
10
+ license: mit
11
  ---
12
 
13
+ # 🎃 FaceSwapLite - AI Face Swapping Application
14
+
15
+ A lightweight and efficient face swapping application powered by InsightFace and ONNX Runtime. Swap faces in videos with high-quality results using AI technology.
16
+
17
+ ## 🌟 Features
18
+
19
+ - **Multi-Face Support**: Swap multiple faces in a single video
20
+ - **High-Quality Results**: Uses InsightFace's state-of-the-art face recognition and swapping models
21
+ - **Flexible Processing**: Support for CPU, CUDA, CoreML, and TensorRT execution
22
+ - **Adjustable Transparency**: Control the blending threshold for each face swap
23
+ - **Audio Preservation**: Automatically preserves audio from the original video
24
+ - **User-Friendly Interface**: Simple Gradio web interface for easy interaction
25
+
26
+ ## 🚀 Quick Start
27
+
28
+ ### Online Usage
29
+
30
+ Visit the [Hugging Face Space](https://huggingface.co/spaces/minhho/FaceSwapLite-1.0) to use the application directly in your browser.
31
+
32
+ ### Local Installation
33
+
34
+ 1. **Clone the repository**
35
+ ```bash
36
+ git clone https://huggingface.co/spaces/minhho/FaceSwapLite-1.0
37
+ cd FaceSwapLite-1.0
38
+ ```
39
+
40
+ 2. **Install dependencies**
41
+ ```bash
42
+ pip install -r requirements.txt
43
+ ```
44
+
45
+ 3. **Download the face swapping model**
46
+ - Download `inswapper_128.onnx` from [InsightFace Model Zoo](https://github.com/deepinsight/insightface/releases)
47
+ - Place it in the root directory
48
+
49
+ 4. **Run the application**
50
+ ```bash
51
+ python app.py
52
+ ```
53
+
54
+ ## 📖 Usage
55
+
56
+ ### Web Interface
57
+
58
+ 1. Upload a target video (MP4 format)
59
+ 2. For each face you want to swap:
60
+ - Upload the target face from the video (face to replace)
61
+ - Upload the source face (replacement face)
62
+ - Adjust the transparency slider (0.0-1.0, default: 0.2)
63
+ 3. Click "⏳ Start processing"
64
+ 4. Download the result video
65
+
66
+ ### Command Line
67
+
68
+ ```bash
69
+ python script.py --video path/to/video.mp4 --face path/to/target_face.jpg,path/to/source_face.jpg,0.2
70
+ ```
71
+
72
+ **Arguments:**
73
+ - `--video`: Path to the target video
74
+ - `--face`: Face swap configuration (can be used multiple times; see the example below)
75
+ - Format: `target_face,source_face,threshold`
76
+ - `--force_cpu`: Force CPU execution (optional)
77
+ - `--colab_performance`: Optimize for Google Colab (optional)
78
+
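For example, swapping two different faces in one pass repeats the `--face` flag; the video and image file names below are placeholders:

```bash
# Hypothetical file names; each --face entry is target_face,source_face,threshold
python script.py --video clip.mp4 \
  --face alice_in_video.jpg,alice_new.jpg,0.2 \
  --face bob_in_video.jpg,bob_new.jpg,0.3
```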
79
+ ## ⚙️ Configuration
80
+
81
+ ### Execution Modes
82
+
83
+ The application automatically detects and uses the best available execution provider:
84
+
85
+ - **CPU Mode**: Default fallback, works on all systems
86
+ - **CUDA Mode**: NVIDIA GPU acceleration (recommended for best performance)
87
+ - **CoreML Mode**: Apple Silicon optimization
88
+ - **TensorRT Mode**: Advanced NVIDIA GPU optimization
89
+
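The selection logic amounts to asking ONNX Runtime which execution providers the installed build offers and preferring GPU-backed ones. A minimal sketch of that idea (not the exact code in `refacer.py`):

```python
import onnxruntime as rt

def pick_providers(force_cpu=False):
    """Return an ordered provider list for onnxruntime.InferenceSession."""
    if force_cpu:
        return ["CPUExecutionProvider"]
    # Providers compiled into the installed onnxruntime build
    available = rt.get_available_providers()
    preferred = ["TensorrtExecutionProvider", "CUDAExecutionProvider",
                 "CoreMLExecutionProvider", "CPUExecutionProvider"]
    return [p for p in preferred if p in available] or ["CPUExecutionProvider"]
```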
90
+ ### Performance Tips
91
+
92
+ - For faster processing, use a CUDA-compatible GPU
93
+ - Reduce video resolution for quicker processing
94
+ - Process shorter video segments for testing
95
+ - On Colab, use the `--colab_performance` flag
96
+
97
+ ## 🛠️ Technical Details
98
+
99
+ ### Architecture
100
+
101
+ - **Face Detection**: SCRFD (Sample and Computation Redistributed Face Detection)
102
+ - **Face Recognition**: ArcFace with ResNet-50 backbone
103
+ - **Face Swapping**: INSwapper model (128x128)
104
+ - **Backend**: ONNX Runtime for optimized inference
105
+
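Concretely, the detection and recognition stages map onto the classes under `recognition/` included in this commit. A minimal sketch of how a single frame flows through them, assuming the InsightFace `buffalo_l` models are already downloaded and `frame.jpg` is a placeholder image:

```python
import os.path as osp
import cv2
# Assumes ./recognition is on sys.path (refacer.py inserts it)
from scrfd import SCRFD                 # recognition/scrfd.py
from arcface_onnx import ArcFaceONNX    # recognition/arcface_onnx.py

assets = osp.expanduser("~/.insightface/models/buffalo_l")
detector = SCRFD(osp.join(assets, "det_10g.onnx"))     # SCRFD face detector
detector.prepare(0)
rec = ArcFaceONNX(osp.join(assets, "w600k_r50.onnx"))  # ArcFace embedder
rec.prepare(0)

img = cv2.imread("frame.jpg")
bboxes, kpss = detector.autodetect(img, max_num=1)     # detect the most prominent face
if bboxes.shape[0] > 0:
    embedding = rec.get(img, kpss[0])                  # 512-d identity vector
    # refacer compares such embeddings with compute_sim (cosine similarity)
    # to decide which detected face matches the user-supplied target face,
    # and the INSwapper model then performs the 128x128 swap.
```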
106
+ ### Requirements
107
+
108
+ - Python 3.8+
109
+ - FFmpeg (for video processing)
110
+ - 8GB+ RAM recommended
111
+ - GPU with 4GB+ VRAM (optional, for faster processing)
112
+
113
+ ## 📁 Project Structure
114
+
115
+ ```
116
+ FaceSwapLite/
117
+ ├── app.py # Gradio web interface
118
+ ├── refacer.py # Core face swapping logic
119
+ ├── script.py # Command-line interface
120
+ ├── requirements.txt # Python dependencies
121
+ ├── inswapper_128.onnx # Face swapping model
122
+ ├── recognition/ # Face detection and recognition modules
123
+ │ ├── scrfd.py # Face detector
124
+ │ ├── arcface_onnx.py # Face recognition
125
+ │ └── ...
126
+ └── out/ # Output directory for processed videos
127
+ ```
128
+
129
+ ## 🤝 Contributing
130
+
131
+ Contributions are welcome! Please feel free to submit issues or pull requests.
132
+
133
+ ## 📝 License
134
+
135
+ This project is licensed under the MIT License - see the LICENSE file for details.
136
+
137
+ ## 🙏 Acknowledgments
138
+
139
+ - [InsightFace](https://github.com/deepinsight/insightface) for the face analysis models
140
+ - [ONNX Runtime](https://onnxruntime.ai/) for efficient model inference
141
+ - [Gradio](https://gradio.app/) for the web interface
142
+
143
+ ## ⚠️ Disclaimer
144
+
145
+ This software is provided for educational and research purposes only. Please use responsibly and ethically. Do not use this tool for creating misleading or harmful content. Always obtain proper consent before swapping someone's face.
146
+
147
+ ## 📧 Contact
148
+
149
+ For questions or support, please open an issue on the GitHub repository.
150
+
151
+ ---
152
+
153
+ **Note**: Make sure you have the required model files (`inswapper_128.onnx`) before running the application. The InsightFace models will be automatically downloaded on first run.
app.py ADDED
@@ -0,0 +1,59 @@
1
+ # -*- coding: utf-8 -*-
2
+ import gradio as gr
3
+ from refacer import Refacer
4
+ import os
5
+
6
+ # Configuration
7
+ MAX_NUM_FACES = int(os.environ.get("MAX_NUM_FACES", "5"))
8
+ FORCE_CPU = os.environ.get("FORCE_CPU", "False").lower() == "true"
9
+
10
+ # Initialize the face swapper
11
+ print("Initializing FaceSwapLite...")
12
+ refacer = Refacer(force_cpu=FORCE_CPU, colab_performance=False)
13
+ print("Initialization complete!")
14
+
15
+ num_faces = MAX_NUM_FACES
16
+
17
+
18
+ def run(*vars):
19
+ video_path=vars[0]
20
+ origins=vars[1:(num_faces+1)]
21
+ destinations=vars[(num_faces+1):(num_faces*2)+1]
22
+ thresholds=vars[(num_faces*2)+1:]
23
+
24
+ faces = []
25
+ for k in range(0,num_faces):
26
+ if origins[k] is not None and destinations[k] is not None:
27
+ faces.append({
28
+ 'origin':origins[k],
29
+ 'destination':destinations[k],
30
+ 'threshold':thresholds[k]
31
+ })
32
+
33
+ return refacer.reface(video_path,faces)
34
+
35
+ origin = []
36
+ destination = []
37
+ thresholds = []
38
+
39
+ with gr.Blocks() as demo:
40
+ with gr.Row():
41
+ gr.Markdown("# 🎃 FaceSwap Lite 🎃")
42
+ with gr.Row():
43
+ video=gr.Video(label=u"🖥️ Target Video, format mp4",format="mp4")
44
+ video2=gr.Video(label=u"🎞️ Result Video",interactive=False,format="mp4")
45
+
46
+ for i in range(0,num_faces):
47
+ with gr.Tab(u"Face #" + f"{i+1}"):
48
+ with gr.Row():
49
+ origin.append(gr.Image(label=u"🎯 Target Face from Video"))
50
+ destination.append(gr.Image(label=u"📸 Source Face"))
51
+ with gr.Row():
52
+ thresholds.append(gr.Slider(label=u"Transparency",minimum=0.0,maximum=1.0,value=0.2))
53
+ with gr.Row():
54
+ button=gr.Button(u"⏳ Start processing", variant="primary")
55
+
56
+ button.click(fn=run,inputs=[video]+origin+destination+thresholds,outputs=[video2])
57
+
58
+ # Launch the Gradio app
59
+ demo.queue().launch()
demo.gif ADDED

Git LFS Details

  • SHA256: 52b95c2e607c6edd0a9180596759c20ec00f92fa00798922004a612482dda2f2
  • Pointer size: 132 Bytes
  • Size of remote file: 2.87 MB
deploy.sh ADDED
@@ -0,0 +1,140 @@
1
+ #!/bin/bash
2
+
3
+ # FaceSwapLite - Hugging Face Deployment Script
4
+ # This script helps deploy FaceSwapLite to Hugging Face Spaces
5
+
6
+ set -e
7
+
8
+ echo "🎃 FaceSwapLite - Hugging Face Deployment Script 🎃"
9
+ echo "=================================================="
10
+ echo ""
11
+
12
+ # Configuration
13
+ SPACE_REPO="https://huggingface.co/spaces/minhho/FaceSwapLite-1.0"
14
+ SPACE_DIR="FaceSwapLite-1.0-hf"
15
+
16
+ # Check if git is installed
17
+ if ! command -v git &> /dev/null; then
18
+ echo "❌ Error: Git is not installed. Please install git first."
19
+ exit 1
20
+ fi
21
+
22
+ # Check if git-lfs is installed
23
+ if ! command -v git-lfs &> /dev/null; then
24
+ echo "⚠️ Warning: Git LFS is not installed."
25
+ echo " The model file (529MB) requires Git LFS."
26
+ echo " Install it with: brew install git-lfs (macOS) or visit https://git-lfs.github.com/"
27
+ read -p " Continue anyway? (y/n) " -n 1 -r
28
+ echo
29
+ if [[ ! $REPLY =~ ^[Yy]$ ]]; then
30
+ exit 1
31
+ fi
32
+ else
33
+ echo "✅ Git LFS is installed"
34
+ git lfs install
35
+ fi
36
+
37
+ # Step 1: Clone or update the space repository
38
+ echo ""
39
+ echo "Step 1: Cloning Hugging Face Space..."
40
+ if [ -d "$SPACE_DIR" ]; then
41
+ echo "Directory $SPACE_DIR already exists."
42
+ read -p "Do you want to remove it and clone fresh? (y/n) " -n 1 -r
43
+ echo
44
+ if [[ $REPLY =~ ^[Yy]$ ]]; then
45
+ rm -rf "$SPACE_DIR"
46
+ git clone "$SPACE_REPO" "$SPACE_DIR"
47
+ else
48
+ cd "$SPACE_DIR"
49
+ git pull
50
+ cd ..
51
+ fi
52
+ else
53
+ git clone "$SPACE_REPO" "$SPACE_DIR"
54
+ fi
55
+
56
+ # Step 2: Copy files
57
+ echo ""
58
+ echo "Step 2: Copying project files..."
59
+ cp -v app.py "$SPACE_DIR/"
60
+ cp -v refacer.py "$SPACE_DIR/"
61
+ cp -v script.py "$SPACE_DIR/"
62
+ cp -v requirements.txt "$SPACE_DIR/"
63
+ cp -v README.md "$SPACE_DIR/"
64
+ cp -v LICENSE "$SPACE_DIR/"
65
+ cp -v packages.txt "$SPACE_DIR/"
66
+
67
+ # Copy recognition folder
68
+ echo "Copying recognition module..."
69
+ cp -rv recognition "$SPACE_DIR/"
70
+
71
+ # Copy model file if it exists
72
+ if [ -f "inswapper_128.onnx" ]; then
73
+ echo "Copying model file (this may take a moment - 529MB)..."
74
+ cp -v inswapper_128.onnx "$SPACE_DIR/"
75
+ else
76
+ echo "⚠️ Warning: inswapper_128.onnx not found!"
77
+ echo " Please manually copy the model file or download it from:"
78
+ echo " https://github.com/deepinsight/insightface/releases/download/v0.7/inswapper_128.onnx"
79
+ fi
80
+
81
+ # Create output directory
82
+ mkdir -p "$SPACE_DIR/out"
83
+ touch "$SPACE_DIR/out/.gitkeep"
84
+
85
+ # Step 3: Git operations
86
+ echo ""
87
+ echo "Step 3: Preparing git commit..."
88
+ cd "$SPACE_DIR"
89
+
90
+ # Track large files with LFS if git-lfs is available
91
+ if command -v git-lfs &> /dev/null; then
92
+ echo "Setting up Git LFS..."
93
+ git lfs track "*.onnx"
94
+ git add .gitattributes
95
+ fi
96
+
97
+ # Add all files
98
+ git add .
99
+
100
+ # Check if there are changes
101
+ if git diff --staged --quiet; then
102
+ echo "ℹ️ No changes to commit."
103
+ else
104
+ echo ""
105
+ echo "Files to be committed:"
106
+ git diff --staged --name-status
107
+ echo ""
108
+
109
+ read -p "Enter commit message (or press Enter for default): " COMMIT_MSG
110
+ if [ -z "$COMMIT_MSG" ]; then
111
+ COMMIT_MSG="Update FaceSwapLite application"
112
+ fi
113
+
114
+ git commit -m "$COMMIT_MSG"
115
+
116
+ # Step 4: Push to Hugging Face
117
+ echo ""
118
+ echo "Step 4: Pushing to Hugging Face..."
119
+ echo "⚠️ You will be prompted for your Hugging Face access token."
120
+ echo " Get it from: https://huggingface.co/settings/tokens"
121
+ echo ""
122
+
123
+ git push
124
+
125
+ echo ""
126
+ echo "✅ Deployment complete!"
127
+ echo ""
128
+ echo "🎉 Your Space should be live at:"
129
+ echo " $SPACE_REPO"
130
+ echo ""
131
+ echo "⏳ The space will take 5-10 minutes to build."
132
+ echo " Check the build logs at the URL above."
133
+ fi
134
+
135
+ cd ..
136
+
137
+ echo ""
138
+ echo "=================================================="
139
+ echo "Deployment script finished!"
140
+ echo "=================================================="
docker/0 ADDED
@@ -0,0 +1 @@
1
+ v
docker/Dockerfile.nvidia ADDED
@@ -0,0 +1,20 @@
1
+ FROM nvidia/cuda:11.8.0-cudnn8-runtime-ubuntu22.04
2
+
3
+ # Always use UTC on a server
4
+ RUN ln -snf /usr/share/zoneinfo/UTC /etc/localtime && echo UTC > /etc/timezone
5
+
6
+ RUN DEBIAN_FRONTEND=noninteractive apt update && apt install -y python3 python3-pip python3-tk git ffmpeg nvidia-cuda-toolkit nvidia-container-runtime libnvidia-decode-525-server wget unzip
7
+ RUN wget https://github.com/deepinsight/insightface/releases/download/v0.7/buffalo_l.zip -O /tmp/buffalo_l.zip && \
8
+ mkdir -p /root/.insightface/models/buffalo_l && \
9
+ cd /root/.insightface/models/buffalo_l && \
10
+ unzip /tmp/buffalo_l.zip && \
11
+ rm -f /tmp/buffalo_l.zip
12
+
13
+ RUN pip install nvidia-tensorrt
14
+ RUN git clone https://github.com/xaviviro/refacer && cd refacer && pip install -r requirements-GPU.txt
15
+
16
+ WORKDIR /refacer
17
+
18
+ # Test following commands in container to make sure GPU stuff works
19
+ # nvidia-smi
20
+ # python3 -c "import tensorflow as tf; print(tf.config.list_physical_devices('GPU'))"
docker/run.sh ADDED
@@ -0,0 +1,13 @@
1
+ #!/bin/bash
2
+ # Run this script from within the refacer/docker folder.
3
+ # You'll need inswapper_128.onnx from either:
4
+ # https://drive.google.com/file/d/1eu60OrRtn4WhKrzM4mQv4F3rIuyUXqfl/view?usp=drive_link
5
+ # or https://drive.google.com/file/d/1jbDUGrADco9A1MutWjO6d_1dwizh9w9P/view?usp=sharing
6
+ # or https://mega.nz/file/9l8mGDJA#FnPxHwpdhDovDo6OvbQjhHd2nDAk8_iVEgo3mpHLG6U
7
+ # or https://1drv.ms/u/s!AsHA3Xbnj6uAgxhb_tmQ7egHACOR?e=CPoThO
8
+ # or https://civitai.com/models/80324?modelVersionId=85159
9
+
10
+ docker stop -t 0 refacer
11
+ docker build -t refacer -f Dockerfile.nvidia . && \
12
+ docker run --rm --name refacer -v $(pwd)/..:/refacer -p 7860:7860 --gpus all refacer python3 app.py --server_name 0.0.0.0 &
13
+ sleep 2 && google-chrome --new-window "http://127.0.0.1:7860" &
out.gitkeep ADDED
File without changes
out/.gitkeep ADDED
File without changes
packages.txt ADDED
@@ -0,0 +1 @@
1
+ ffmpeg
recognition/0 ADDED
@@ -0,0 +1 @@
1
+ t
recognition/arcface_onnx.py ADDED
@@ -0,0 +1,91 @@
1
+ # -*- coding: utf-8 -*-
2
+ # @Organization : insightface.ai
3
+ # @Author : Jia Guo
4
+ # @Time : 2021-05-04
5
+ # @Function :
6
+
7
+ import numpy as np
8
+ import cv2
9
+ import onnx
10
+ import onnxruntime
11
+ import face_align
12
+
13
+ __all__ = [
14
+ 'ArcFaceONNX',
15
+ ]
16
+
17
+
18
+ class ArcFaceONNX:
19
+ def __init__(self, model_file=None, session=None):
20
+ assert model_file is not None
21
+ self.model_file = model_file
22
+ self.session = session
23
+ self.taskname = 'recognition'
24
+ find_sub = False
25
+ find_mul = False
26
+ model = onnx.load(self.model_file)
27
+ graph = model.graph
28
+ for nid, node in enumerate(graph.node[:8]):
29
+ #print(nid, node.name)
30
+ if node.name.startswith('Sub') or node.name.startswith('_minus'):
31
+ find_sub = True
32
+ if node.name.startswith('Mul') or node.name.startswith('_mul'):
33
+ find_mul = True
34
+ if find_sub and find_mul:
35
+ #mxnet arcface model
36
+ input_mean = 0.0
37
+ input_std = 1.0
38
+ else:
39
+ input_mean = 127.5
40
+ input_std = 127.5
41
+ self.input_mean = input_mean
42
+ self.input_std = input_std
43
+ #print('input mean and std:', self.input_mean, self.input_std)
44
+ if self.session is None:
45
+ self.session = onnxruntime.InferenceSession(self.model_file, providers=['CoreMLExecutionProvider','CUDAExecutionProvider'])
46
+ input_cfg = self.session.get_inputs()[0]
47
+ input_shape = input_cfg.shape
48
+ input_name = input_cfg.name
49
+ self.input_size = tuple(input_shape[2:4][::-1])
50
+ self.input_shape = input_shape
51
+ outputs = self.session.get_outputs()
52
+ output_names = []
53
+ for out in outputs:
54
+ output_names.append(out.name)
55
+ self.input_name = input_name
56
+ self.output_names = output_names
57
+ assert len(self.output_names)==1
58
+ self.output_shape = outputs[0].shape
59
+
60
+ def prepare(self, ctx_id, **kwargs):
61
+ if ctx_id<0:
62
+ self.session.set_providers(['CPUExecutionProvider'])
63
+
64
+ def get(self, img, kps):
65
+ aimg = face_align.norm_crop(img, landmark=kps, image_size=self.input_size[0])
66
+ embedding = self.get_feat(aimg).flatten()
67
+ return embedding
68
+
69
+ def compute_sim(self, feat1, feat2):
70
+ from numpy.linalg import norm
71
+ feat1 = feat1.ravel()
72
+ feat2 = feat2.ravel()
73
+ sim = np.dot(feat1, feat2) / (norm(feat1) * norm(feat2))
74
+ return sim
75
+
76
+ def get_feat(self, imgs):
77
+ if not isinstance(imgs, list):
78
+ imgs = [imgs]
79
+ input_size = self.input_size
80
+
81
+ blob = cv2.dnn.blobFromImages(imgs, 1.0 / self.input_std, input_size,
82
+ (self.input_mean, self.input_mean, self.input_mean), swapRB=True)
83
+ net_out = self.session.run(self.output_names, {self.input_name: blob})[0]
84
+ return net_out
85
+
86
+ def forward(self, batch_data):
87
+ blob = (batch_data - self.input_mean) / self.input_std
88
+ net_out = self.session.run(self.output_names, {self.input_name: blob})[0]
89
+ return net_out
90
+
91
+
recognition/face_align.py ADDED
@@ -0,0 +1,141 @@
1
+ import cv2
2
+ import numpy as np
3
+ from skimage import transform as trans
4
+
5
+ src1 = np.array([[51.642, 50.115], [57.617, 49.990], [35.740, 69.007],
6
+ [51.157, 89.050], [57.025, 89.702]],
7
+ dtype=np.float32)
8
+ #<--left
9
+ src2 = np.array([[45.031, 50.118], [65.568, 50.872], [39.677, 68.111],
10
+ [45.177, 86.190], [64.246, 86.758]],
11
+ dtype=np.float32)
12
+
13
+ #---frontal
14
+ src3 = np.array([[39.730, 51.138], [72.270, 51.138], [56.000, 68.493],
15
+ [42.463, 87.010], [69.537, 87.010]],
16
+ dtype=np.float32)
17
+
18
+ #-->right
19
+ src4 = np.array([[46.845, 50.872], [67.382, 50.118], [72.737, 68.111],
20
+ [48.167, 86.758], [67.236, 86.190]],
21
+ dtype=np.float32)
22
+
23
+ #-->right profile
24
+ src5 = np.array([[54.796, 49.990], [60.771, 50.115], [76.673, 69.007],
25
+ [55.388, 89.702], [61.257, 89.050]],
26
+ dtype=np.float32)
27
+
28
+ src = np.array([src1, src2, src3, src4, src5])
29
+ src_map = {112: src, 224: src * 2}
30
+
31
+ arcface_src = np.array(
32
+ [[38.2946, 51.6963], [73.5318, 51.5014], [56.0252, 71.7366],
33
+ [41.5493, 92.3655], [70.7299, 92.2041]],
34
+ dtype=np.float32)
35
+
36
+ arcface_src = np.expand_dims(arcface_src, axis=0)
37
+
38
+ # In[66]:
39
+
40
+
41
+ # lmk is prediction; src is template
42
+ def estimate_norm(lmk, image_size=112, mode='arcface'):
43
+ assert lmk.shape == (5, 2)
44
+ tform = trans.SimilarityTransform()
45
+ lmk_tran = np.insert(lmk, 2, values=np.ones(5), axis=1)
46
+ min_M = []
47
+ min_index = []
48
+ min_error = float('inf')
49
+ if mode == 'arcface':
50
+ if image_size == 112:
51
+ src = arcface_src
52
+ else:
53
+ src = float(image_size) / 112 * arcface_src
54
+ else:
55
+ src = src_map[image_size]
56
+ for i in np.arange(src.shape[0]):
57
+ tform.estimate(lmk, src[i])
58
+ M = tform.params[0:2, :]
59
+ results = np.dot(M, lmk_tran.T)
60
+ results = results.T
61
+ error = np.sum(np.sqrt(np.sum((results - src[i])**2, axis=1)))
62
+ # print(error)
63
+ if error < min_error:
64
+ min_error = error
65
+ min_M = M
66
+ min_index = i
67
+ return min_M, min_index
68
+
69
+
70
+ def norm_crop(img, landmark, image_size=112, mode='arcface'):
71
+ M, pose_index = estimate_norm(landmark, image_size, mode)
72
+ warped = cv2.warpAffine(img, M, (image_size, image_size), borderValue=0.0)
73
+ return warped
74
+
75
+ def square_crop(im, S):
76
+ if im.shape[0] > im.shape[1]:
77
+ height = S
78
+ width = int(float(im.shape[1]) / im.shape[0] * S)
79
+ scale = float(S) / im.shape[0]
80
+ else:
81
+ width = S
82
+ height = int(float(im.shape[0]) / im.shape[1] * S)
83
+ scale = float(S) / im.shape[1]
84
+ resized_im = cv2.resize(im, (width, height))
85
+ det_im = np.zeros((S, S, 3), dtype=np.uint8)
86
+ det_im[:resized_im.shape[0], :resized_im.shape[1], :] = resized_im
87
+ return det_im, scale
88
+
89
+
90
+ def transform(data, center, output_size, scale, rotation):
91
+ scale_ratio = scale
92
+ rot = float(rotation) * np.pi / 180.0
93
+ #translation = (output_size/2-center[0]*scale_ratio, output_size/2-center[1]*scale_ratio)
94
+ t1 = trans.SimilarityTransform(scale=scale_ratio)
95
+ cx = center[0] * scale_ratio
96
+ cy = center[1] * scale_ratio
97
+ t2 = trans.SimilarityTransform(translation=(-1 * cx, -1 * cy))
98
+ t3 = trans.SimilarityTransform(rotation=rot)
99
+ t4 = trans.SimilarityTransform(translation=(output_size / 2,
100
+ output_size / 2))
101
+ t = t1 + t2 + t3 + t4
102
+ M = t.params[0:2]
103
+ cropped = cv2.warpAffine(data,
104
+ M, (output_size, output_size),
105
+ borderValue=0.0)
106
+ return cropped, M
107
+
108
+
109
+ def trans_points2d(pts, M):
110
+ new_pts = np.zeros(shape=pts.shape, dtype=np.float32)
111
+ for i in range(pts.shape[0]):
112
+ pt = pts[i]
113
+ new_pt = np.array([pt[0], pt[1], 1.], dtype=np.float32)
114
+ new_pt = np.dot(M, new_pt)
115
+ #print('new_pt', new_pt.shape, new_pt)
116
+ new_pts[i] = new_pt[0:2]
117
+
118
+ return new_pts
119
+
120
+
121
+ def trans_points3d(pts, M):
122
+ scale = np.sqrt(M[0][0] * M[0][0] + M[0][1] * M[0][1])
123
+ #print(scale)
124
+ new_pts = np.zeros(shape=pts.shape, dtype=np.float32)
125
+ for i in range(pts.shape[0]):
126
+ pt = pts[i]
127
+ new_pt = np.array([pt[0], pt[1], 1.], dtype=np.float32)
128
+ new_pt = np.dot(M, new_pt)
129
+ #print('new_pt', new_pt.shape, new_pt)
130
+ new_pts[i][0:2] = new_pt[0:2]
131
+ new_pts[i][2] = pts[i][2] * scale
132
+
133
+ return new_pts
134
+
135
+
136
+ def trans_points(pts, M):
137
+ if pts.shape[1] == 2:
138
+ return trans_points2d(pts, M)
139
+ else:
140
+ return trans_points3d(pts, M)
141
+
recognition/main.py ADDED
@@ -0,0 +1,57 @@
1
+ #!/usr/bin/env python
2
+
3
+ import os
4
+ import os.path as osp
5
+ import argparse
6
+ import cv2
7
+ import numpy as np
8
+ import onnxruntime
9
+ from scrfd import SCRFD
10
+ from arcface_onnx import ArcFaceONNX
11
+
12
+ onnxruntime.set_default_logger_severity(5)
13
+
14
+ assets_dir = osp.expanduser('~/.insightface/models/buffalo_l')
15
+
16
+ detector = SCRFD(os.path.join(assets_dir, 'det_10g.onnx'))
17
+ detector.prepare(0)
18
+ model_path = os.path.join(assets_dir, 'w600k_r50.onnx')
19
+ rec = ArcFaceONNX(model_path)
20
+ rec.prepare(0)
21
+
22
+ def parse_args() -> argparse.Namespace:
23
+ parser = argparse.ArgumentParser()
24
+ parser.add_argument('img1', type=str)
25
+ parser.add_argument('img2', type=str)
26
+ return parser.parse_args()
27
+
28
+
29
+ def func(args):
30
+ image1 = cv2.imread(args.img1)
31
+ image2 = cv2.imread(args.img2)
32
+ bboxes1, kpss1 = detector.autodetect(image1, max_num=1)
33
+ if bboxes1.shape[0]==0:
34
+ return -1.0, "Face not found in Image-1"
35
+ bboxes2, kpss2 = detector.autodetect(image2, max_num=1)
36
+ if bboxes2.shape[0]==0:
37
+ return -1.0, "Face not found in Image-2"
38
+ kps1 = kpss1[0]
39
+ kps2 = kpss2[0]
40
+ feat1 = rec.get(image1, kps1)
41
+ feat2 = rec.get(image2, kps2)
42
+ sim = rec.compute_sim(feat1, feat2)
43
+ if sim<0.2:
44
+ conclu = 'They are NOT the same person'
45
+ elif sim>=0.2 and sim<0.28:
46
+ conclu = 'They are LIKELY TO be the same person'
47
+ else:
48
+ conclu = 'They ARE the same person'
49
+ return sim, conclu
50
+
51
+
52
+
53
+ if __name__ == '__main__':
54
+ args = parse_args()
55
+ output = func(args)
56
+ print('sim: %.4f, message: %s'%(output[0], output[1]))
57
+
recognition/scrfd.py ADDED
@@ -0,0 +1,329 @@
1
+
2
+ from __future__ import division
3
+ import datetime
4
+ import numpy as np
5
+ #import onnx
6
+ import onnxruntime
7
+ import os
8
+ import os.path as osp
9
+ import cv2
10
+ import sys
11
+
12
+ def softmax(z):
13
+ assert len(z.shape) == 2
14
+ s = np.max(z, axis=1)
15
+ s = s[:, np.newaxis] # necessary step to do broadcasting
16
+ e_x = np.exp(z - s)
17
+ div = np.sum(e_x, axis=1)
18
+ div = div[:, np.newaxis] # dito
19
+ return e_x / div
20
+
21
+ def distance2bbox(points, distance, max_shape=None):
22
+ """Decode distance prediction to bounding box.
23
+
24
+ Args:
25
+ points (Tensor): Shape (n, 2), [x, y].
26
+ distance (Tensor): Distance from the given point to 4
27
+ boundaries (left, top, right, bottom).
28
+ max_shape (tuple): Shape of the image.
29
+
30
+ Returns:
31
+ Tensor: Decoded bboxes.
32
+ """
33
+ x1 = points[:, 0] - distance[:, 0]
34
+ y1 = points[:, 1] - distance[:, 1]
35
+ x2 = points[:, 0] + distance[:, 2]
36
+ y2 = points[:, 1] + distance[:, 3]
37
+ if max_shape is not None:
38
+ x1 = x1.clamp(min=0, max=max_shape[1])
39
+ y1 = y1.clamp(min=0, max=max_shape[0])
40
+ x2 = x2.clamp(min=0, max=max_shape[1])
41
+ y2 = y2.clamp(min=0, max=max_shape[0])
42
+ return np.stack([x1, y1, x2, y2], axis=-1)
43
+
44
+ def distance2kps(points, distance, max_shape=None):
45
+ """Decode distance prediction to bounding box.
46
+
47
+ Args:
48
+ points (Tensor): Shape (n, 2), [x, y].
49
+ distance (Tensor): Distance from the given point to 4
50
+ boundaries (left, top, right, bottom).
51
+ max_shape (tuple): Shape of the image.
52
+
53
+ Returns:
54
+ Tensor: Decoded bboxes.
55
+ """
56
+ preds = []
57
+ for i in range(0, distance.shape[1], 2):
58
+ px = points[:, i%2] + distance[:, i]
59
+ py = points[:, i%2+1] + distance[:, i+1]
60
+ if max_shape is not None:
61
+ px = px.clamp(min=0, max=max_shape[1])
62
+ py = py.clamp(min=0, max=max_shape[0])
63
+ preds.append(px)
64
+ preds.append(py)
65
+ return np.stack(preds, axis=-1)
66
+
67
+ class SCRFD:
68
+ def __init__(self, model_file=None, session=None):
69
+ import onnxruntime
70
+ self.model_file = model_file
71
+ self.session = session
72
+ self.taskname = 'detection'
73
+ self.batched = False
74
+ if self.session is None:
75
+ assert self.model_file is not None
76
+ assert osp.exists(self.model_file)
77
+ self.session = onnxruntime.InferenceSession(self.model_file, providers=['CoreMLExecutionProvider','CUDAExecutionProvider'])
78
+ self.center_cache = {}
79
+ self.nms_thresh = 0.4
80
+ self.det_thresh = 0.5
81
+ self._init_vars()
82
+
83
+ def _init_vars(self):
84
+ input_cfg = self.session.get_inputs()[0]
85
+ input_shape = input_cfg.shape
86
+ #print(input_shape)
87
+ if isinstance(input_shape[2], str):
88
+ self.input_size = None
89
+ else:
90
+ self.input_size = tuple(input_shape[2:4][::-1])
91
+ #print('image_size:', self.image_size)
92
+ input_name = input_cfg.name
93
+ self.input_shape = input_shape
94
+ outputs = self.session.get_outputs()
95
+ if len(outputs[0].shape) == 3:
96
+ self.batched = True
97
+ output_names = []
98
+ for o in outputs:
99
+ output_names.append(o.name)
100
+ self.input_name = input_name
101
+ self.output_names = output_names
102
+ self.input_mean = 127.5
103
+ self.input_std = 128.0
104
+ #print(self.output_names)
105
+ #assert len(outputs)==10 or len(outputs)==15
106
+ self.use_kps = False
107
+ self._anchor_ratio = 1.0
108
+ self._num_anchors = 1
109
+ if len(outputs)==6:
110
+ self.fmc = 3
111
+ self._feat_stride_fpn = [8, 16, 32]
112
+ self._num_anchors = 2
113
+ elif len(outputs)==9:
114
+ self.fmc = 3
115
+ self._feat_stride_fpn = [8, 16, 32]
116
+ self._num_anchors = 2
117
+ self.use_kps = True
118
+ elif len(outputs)==10:
119
+ self.fmc = 5
120
+ self._feat_stride_fpn = [8, 16, 32, 64, 128]
121
+ self._num_anchors = 1
122
+ elif len(outputs)==15:
123
+ self.fmc = 5
124
+ self._feat_stride_fpn = [8, 16, 32, 64, 128]
125
+ self._num_anchors = 1
126
+ self.use_kps = True
127
+
128
+ def prepare(self, ctx_id, **kwargs):
129
+ if ctx_id<0:
130
+ self.session.set_providers(['CPUExecutionProvider'])
131
+ nms_thresh = kwargs.get('nms_thresh', None)
132
+ if nms_thresh is not None:
133
+ self.nms_thresh = nms_thresh
134
+ det_thresh = kwargs.get('det_thresh', None)
135
+ if det_thresh is not None:
136
+ self.det_thresh = det_thresh
137
+ input_size = kwargs.get('input_size', None)
138
+ if input_size is not None:
139
+ if self.input_size is not None:
140
+ print('warning: det_size is already set in scrfd model, ignore')
141
+ else:
142
+ self.input_size = input_size
143
+
144
+ def forward(self, img, threshold):
145
+ scores_list = []
146
+ bboxes_list = []
147
+ kpss_list = []
148
+ input_size = tuple(img.shape[0:2][::-1])
149
+ blob = cv2.dnn.blobFromImage(img, 1.0/self.input_std, input_size, (self.input_mean, self.input_mean, self.input_mean), swapRB=True)
150
+ net_outs = self.session.run(self.output_names, {self.input_name : blob})
151
+
152
+ input_height = blob.shape[2]
153
+ input_width = blob.shape[3]
154
+ fmc = self.fmc
155
+ for idx, stride in enumerate(self._feat_stride_fpn):
156
+ # If model support batch dim, take first output
157
+ if self.batched:
158
+ scores = net_outs[idx][0]
159
+ bbox_preds = net_outs[idx + fmc][0]
160
+ bbox_preds = bbox_preds * stride
161
+ if self.use_kps:
162
+ kps_preds = net_outs[idx + fmc * 2][0] * stride
163
+ # If model doesn't support batching take output as is
164
+ else:
165
+ scores = net_outs[idx]
166
+ bbox_preds = net_outs[idx + fmc]
167
+ bbox_preds = bbox_preds * stride
168
+ if self.use_kps:
169
+                 kps_preds = net_outs[idx + fmc * 2] * stride
+ 
+             height = input_height // stride
+             width = input_width // stride
+             K = height * width
+             key = (height, width, stride)
+             if key in self.center_cache:
+                 anchor_centers = self.center_cache[key]
+             else:
+                 #solution-1, c style:
+                 #anchor_centers = np.zeros( (height, width, 2), dtype=np.float32 )
+                 #for i in range(height):
+                 #    anchor_centers[i, :, 1] = i
+                 #for i in range(width):
+                 #    anchor_centers[:, i, 0] = i
+ 
+                 #solution-2:
+                 #ax = np.arange(width, dtype=np.float32)
+                 #ay = np.arange(height, dtype=np.float32)
+                 #xv, yv = np.meshgrid(np.arange(width), np.arange(height))
+                 #anchor_centers = np.stack([xv, yv], axis=-1).astype(np.float32)
+ 
+                 #solution-3:
+                 anchor_centers = np.stack(np.mgrid[:height, :width][::-1], axis=-1).astype(np.float32)
+                 #print(anchor_centers.shape)
+ 
+                 anchor_centers = (anchor_centers * stride).reshape( (-1, 2) )
+                 if self._num_anchors>1:
+                     anchor_centers = np.stack([anchor_centers]*self._num_anchors, axis=1).reshape( (-1,2) )
+                 if len(self.center_cache)<100:
+                     self.center_cache[key] = anchor_centers
+ 
+             pos_inds = np.where(scores>=threshold)[0]
+             bboxes = distance2bbox(anchor_centers, bbox_preds)
+             pos_scores = scores[pos_inds]
+             pos_bboxes = bboxes[pos_inds]
+             scores_list.append(pos_scores)
+             bboxes_list.append(pos_bboxes)
+             if self.use_kps:
+                 kpss = distance2kps(anchor_centers, kps_preds)
+                 #kpss = kps_preds
+                 kpss = kpss.reshape( (kpss.shape[0], -1, 2) )
+                 pos_kpss = kpss[pos_inds]
+                 kpss_list.append(pos_kpss)
+         return scores_list, bboxes_list, kpss_list
+ 
+     def detect(self, img, input_size = None, thresh=None, max_num=0, metric='default'):
+         assert input_size is not None or self.input_size is not None
+         input_size = self.input_size if input_size is None else input_size
+ 
+         im_ratio = float(img.shape[0]) / img.shape[1]
+         model_ratio = float(input_size[1]) / input_size[0]
+         if im_ratio>model_ratio:
+             new_height = input_size[1]
+             new_width = int(new_height / im_ratio)
+         else:
+             new_width = input_size[0]
+             new_height = int(new_width * im_ratio)
+         det_scale = float(new_height) / img.shape[0]
+         resized_img = cv2.resize(img, (new_width, new_height))
+         det_img = np.zeros( (input_size[1], input_size[0], 3), dtype=np.uint8 )
+         det_img[:new_height, :new_width, :] = resized_img
+         det_thresh = thresh if thresh is not None else self.det_thresh
+ 
+         scores_list, bboxes_list, kpss_list = self.forward(det_img, det_thresh)
+ 
+         scores = np.vstack(scores_list)
+         scores_ravel = scores.ravel()
+         order = scores_ravel.argsort()[::-1]
+         bboxes = np.vstack(bboxes_list) / det_scale
+         if self.use_kps:
+             kpss = np.vstack(kpss_list) / det_scale
+         pre_det = np.hstack((bboxes, scores)).astype(np.float32, copy=False)
+         pre_det = pre_det[order, :]
+         keep = self.nms(pre_det)
+         det = pre_det[keep, :]
+         if self.use_kps:
+             kpss = kpss[order,:,:]
+             kpss = kpss[keep,:,:]
+         else:
+             kpss = None
+         if max_num > 0 and det.shape[0] > max_num:
+             area = (det[:, 2] - det[:, 0]) * (det[:, 3] - det[:, 1])
+             img_center = img.shape[0] // 2, img.shape[1] // 2
+             offsets = np.vstack([
+                 (det[:, 0] + det[:, 2]) / 2 - img_center[1],
+                 (det[:, 1] + det[:, 3]) / 2 - img_center[0]
+             ])
+             offset_dist_squared = np.sum(np.power(offsets, 2.0), 0)
+             if metric=='max':
+                 values = area
+             else:
+                 values = area - offset_dist_squared * 2.0 # some extra weight on the centering
+             bindex = np.argsort(values)[::-1]
+             bindex = bindex[0:max_num]
+             det = det[bindex, :]
+             if kpss is not None:
+                 kpss = kpss[bindex, :]
+         return det, kpss
+ 
+     def autodetect(self, img, max_num=0, metric='max'):
+         bboxes, kpss = self.detect(img, input_size=(640, 640), thresh=0.5)
+         bboxes2, kpss2 = self.detect(img, input_size=(128, 128), thresh=0.5)
+         bboxes_all = np.concatenate([bboxes, bboxes2], axis=0)
+         kpss_all = np.concatenate([kpss, kpss2], axis=0)
+         keep = self.nms(bboxes_all)
+         det = bboxes_all[keep,:]
+         kpss = kpss_all[keep,:]
+         if max_num > 0 and det.shape[0] > max_num:
+             area = (det[:, 2] - det[:, 0]) * (det[:, 3] - det[:, 1])
+             img_center = img.shape[0] // 2, img.shape[1] // 2
+             offsets = np.vstack([
+                 (det[:, 0] + det[:, 2]) / 2 - img_center[1],
+                 (det[:, 1] + det[:, 3]) / 2 - img_center[0]
+             ])
+             offset_dist_squared = np.sum(np.power(offsets, 2.0), 0)
+             if metric=='max':
+                 values = area
+             else:
+                 values = area - offset_dist_squared * 2.0 # some extra weight on the centering
+             bindex = np.argsort(values)[::-1]
+             bindex = bindex[0:max_num]
+             det = det[bindex, :]
+             if kpss is not None:
+                 kpss = kpss[bindex, :]
+         return det, kpss
+ 
+     def nms(self, dets):
+         thresh = self.nms_thresh
+         x1 = dets[:, 0]
+         y1 = dets[:, 1]
+         x2 = dets[:, 2]
+         y2 = dets[:, 3]
+         scores = dets[:, 4]
+ 
+         areas = (x2 - x1 + 1) * (y2 - y1 + 1)
+         order = scores.argsort()[::-1]
+ 
+         keep = []
+         while order.size > 0:
+             i = order[0]
+             keep.append(i)
+             xx1 = np.maximum(x1[i], x1[order[1:]])
+             yy1 = np.maximum(y1[i], y1[order[1:]])
+             xx2 = np.minimum(x2[i], x2[order[1:]])
+             yy2 = np.minimum(y2[i], y2[order[1:]])
+ 
+             w = np.maximum(0.0, xx2 - xx1 + 1)
+             h = np.maximum(0.0, yy2 - yy1 + 1)
+             inter = w * h
+             ovr = inter / (areas[i] + areas[order[1:]] - inter)
+ 
+             inds = np.where(ovr <= thresh)[0]
+             order = order[inds + 1]
+ 
+         return keep
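The detector above is the stock InsightFace SCRFD wrapper that refacer.py loads for face detection. As a rough sketch of how it is exercised (not part of this commit; the model path and test image below are assumptions), `detect` returns one row per face (`x1, y1, x2, y2, score`) plus the five-point keypoints:

```python
# Illustrative sketch only, not part of the committed code.
import cv2
import onnxruntime as rt
from scrfd import SCRFD  # the recognition/scrfd.py module shown above

model_path = 'det_10g.onnx'  # assumed local copy of the buffalo_l detector
sess = rt.InferenceSession(model_path, providers=['CPUExecutionProvider'])
detector = SCRFD(model_path, sess)
detector.prepare(0, input_size=(640, 640))

img = cv2.imread('image.jpg')  # any BGR test image (placeholder path)
bboxes, kpss = detector.detect(img, thresh=0.5, max_num=0, metric='default')
print(f"{bboxes.shape[0]} face(s) detected; kpss holds 5 landmarks per face")
```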
refacer.py ADDED
@@ -0,0 +1,262 @@
+ import cv2
+ import onnxruntime as rt
+ import sys
+ from insightface.app import FaceAnalysis
+ sys.path.insert(1, './recognition')
+ from scrfd import SCRFD
+ from arcface_onnx import ArcFaceONNX
+ import os.path as osp
+ import os
+ from pathlib import Path
+ from tqdm import tqdm
+ import ffmpeg
+ import random
+ import multiprocessing as mp
+ from concurrent.futures import ThreadPoolExecutor
+ from insightface.model_zoo.inswapper import INSwapper
+ import psutil
+ from enum import Enum
+ from insightface.app.common import Face
+ from insightface.utils.storage import ensure_available
+ import re
+ import subprocess
+ 
+ class RefacerMode(Enum):
+     CPU, CUDA, COREML, TENSORRT = range(1, 5)
+ 
+ class Refacer:
+     def __init__(self,force_cpu=False,colab_performance=False):
+         self.first_face = False
+         self.force_cpu = force_cpu
+         self.colab_performance = colab_performance
+         self.__check_encoders()
+         self.__check_providers()
+         self.total_mem = psutil.virtual_memory().total
+         self.__init_apps()
+ 
+     def __check_providers(self):
+         if self.force_cpu :
+             self.providers = ['CPUExecutionProvider']
+         else:
+             self.providers = rt.get_available_providers()
+         rt.set_default_logger_severity(4)
+         self.sess_options = rt.SessionOptions()
+         self.sess_options.execution_mode = rt.ExecutionMode.ORT_SEQUENTIAL
+         self.sess_options.graph_optimization_level = rt.GraphOptimizationLevel.ORT_ENABLE_ALL
+ 
+         if len(self.providers) == 1 and 'CPUExecutionProvider' in self.providers:
+             self.mode = RefacerMode.CPU
+             self.use_num_cpus = mp.cpu_count()-1
+             self.sess_options.intra_op_num_threads = int(self.use_num_cpus/3)
+             print(f"CPU mode with providers {self.providers}")
+         elif self.colab_performance:
+             self.mode = RefacerMode.TENSORRT
+             self.use_num_cpus = mp.cpu_count()-1
+             self.sess_options.intra_op_num_threads = int(self.use_num_cpus/3)
+             print(f"TENSORRT mode with providers {self.providers}")
+         elif 'CoreMLExecutionProvider' in self.providers:
+             self.mode = RefacerMode.COREML
+             self.use_num_cpus = mp.cpu_count()-1
+             self.sess_options.intra_op_num_threads = int(self.use_num_cpus/3)
+             print(f"CoreML mode with providers {self.providers}")
+         elif 'CUDAExecutionProvider' in self.providers:
+             self.mode = RefacerMode.CUDA
+             self.use_num_cpus = 2
+             self.sess_options.intra_op_num_threads = 1
+             if 'TensorrtExecutionProvider' in self.providers:
+                 self.providers.remove('TensorrtExecutionProvider')
+             print(f"CUDA mode with providers {self.providers}")
+         """
+         elif 'TensorrtExecutionProvider' in self.providers:
+             self.mode = RefacerMode.TENSORRT
+             #self.use_num_cpus = 1
+             #self.sess_options.intra_op_num_threads = 1
+             self.use_num_cpus = mp.cpu_count()-1
+             self.sess_options.intra_op_num_threads = int(self.use_num_cpus/3)
+             print(f"TENSORRT mode with providers {self.providers}")
+         """
+ 
+     def __init_apps(self):
+         assets_dir = ensure_available('models', 'buffalo_l', root='~/.insightface')
+ 
+         model_path = os.path.join(assets_dir, 'det_10g.onnx')
+         sess_face = rt.InferenceSession(model_path, self.sess_options, providers=self.providers)
+         self.face_detector = SCRFD(model_path,sess_face)
+         self.face_detector.prepare(0,input_size=(640, 640))
+ 
+         model_path = os.path.join(assets_dir , 'w600k_r50.onnx')
+         sess_rec = rt.InferenceSession(model_path, self.sess_options, providers=self.providers)
+         self.rec_app = ArcFaceONNX(model_path,sess_rec)
+         self.rec_app.prepare(0)
+ 
+         model_path = 'inswapper_128.onnx'
+         sess_swap = rt.InferenceSession(model_path, self.sess_options, providers=self.providers)
+         self.face_swapper = INSwapper(model_path,sess_swap)
+ 
+     def prepare_faces(self, faces):
+         self.replacement_faces=[]
+         for face in faces:
+             #image1 = cv2.imread(face.origin)
+             if "origin" in face:
+                 face_threshold = face['threshold']
+                 bboxes1, kpss1 = self.face_detector.autodetect(face['origin'], max_num=1)
+                 if len(kpss1)<1:
+                     raise Exception('No face detected on "Face to replace" image')
+                 feat_original = self.rec_app.get(face['origin'], kpss1[0])
+             else:
+                 face_threshold = 0
+                 self.first_face = True
+                 feat_original = None
+                 print('No origin image: First face change')
+             #image2 = cv2.imread(face.destination)
+             _faces = self.__get_faces(face['destination'],max_num=1)
+             if len(_faces)<1:
+                 raise Exception('No face detected on "Destination face" image')
+             self.replacement_faces.append((feat_original,_faces[0],face_threshold))
+ 
+     def __convert_video(self,video_path,output_video_path):
+         if self.video_has_audio:
+             print("Merging audio with the refaced video...")
+             new_path = output_video_path + str(random.randint(0,999)) + "_c.mp4"
+             #stream = ffmpeg.input(output_video_path)
+             in1 = ffmpeg.input(output_video_path)
+             in2 = ffmpeg.input(video_path)
+             out = ffmpeg.output(in1.video, in2.audio, new_path,video_bitrate=self.ffmpeg_video_bitrate,vcodec=self.ffmpeg_video_encoder)
+             out.run(overwrite_output=True,quiet=True)
+         else:
+             new_path = output_video_path
+             print("The video doesn't have audio, so post-processing is not necessary")
+ 
+         print(f"The process has finished.\nThe refaced video can be found at {os.path.abspath(new_path)}")
+         return new_path
+ 
+     def __get_faces(self,frame,max_num=0):
+ 
+         bboxes, kpss = self.face_detector.detect(frame,max_num=max_num,metric='default')
+ 
+         if bboxes.shape[0] == 0:
+             return []
+         ret = []
+         for i in range(bboxes.shape[0]):
+             bbox = bboxes[i, 0:4]
+             det_score = bboxes[i, 4]
+             kps = None
+             if kpss is not None:
+                 kps = kpss[i]
+             face = Face(bbox=bbox, kps=kps, det_score=det_score)
+             face.embedding = self.rec_app.get(frame, kps)
+             ret.append(face)
+         return ret
+ 
+     def process_first_face(self,frame):
+         faces = self.__get_faces(frame,max_num=1)
+         if len(faces) != 0:
+             frame = self.face_swapper.get(frame, faces[0], self.replacement_faces[0][1], paste_back=True)
+         return frame
+ 
+     def process_faces(self,frame):
+         faces = self.__get_faces(frame,max_num=0)
+         for rep_face in self.replacement_faces:
+             for i in range(len(faces) - 1, -1, -1):
+                 sim = self.rec_app.compute_sim(rep_face[0], faces[i].embedding)
+                 if sim>=rep_face[2]:
+                     frame = self.face_swapper.get(frame, faces[i], rep_face[1], paste_back=True)
+                     del faces[i]
+                     break
+         return frame
+ 
+     def __check_video_has_audio(self,video_path):
+         self.video_has_audio = False
+         probe = ffmpeg.probe(video_path)
+         audio_stream = next((stream for stream in probe['streams'] if stream['codec_type'] == 'audio'), None)
+         if audio_stream is not None:
+             self.video_has_audio = True
+ 
+     def reface_group(self, faces, frames, output):
+         with ThreadPoolExecutor(max_workers = self.use_num_cpus) as executor:
+             if self.first_face:
+                 results = list(tqdm(executor.map(self.process_first_face, frames), total=len(frames),desc="Processing frames"))
+             else:
+                 results = list(tqdm(executor.map(self.process_faces, frames), total=len(frames),desc="Processing frames"))
+             for result in results:
+                 output.write(result)
+ 
+     def reface(self, video_path, faces):
+         self.__check_video_has_audio(video_path)
+         output_video_path = os.path.join('out',Path(video_path).name)
+         self.prepare_faces(faces)
+ 
+         cap = cv2.VideoCapture(video_path)
+         total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+         print(f"Total frames: {total_frames}")
+ 
+         fps = cap.get(cv2.CAP_PROP_FPS)
+         frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+         frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+ 
+         fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+         output = cv2.VideoWriter(output_video_path, fourcc, fps, (frame_width, frame_height))
+ 
+         frames=[]
+         self.k = 1
+         with tqdm(total=total_frames,desc="Extracting frames") as pbar:
+             while cap.isOpened():
+                 flag, frame = cap.read()
+                 if flag and len(frame)>0:
+                     frames.append(frame.copy())
+                     pbar.update()
+                 else:
+                     break
+                 if (len(frames) > 1000):
+                     self.reface_group(faces,frames,output)
+                     frames=[]
+ 
+         cap.release()
+         pbar.close()
+ 
+         self.reface_group(faces,frames,output)
+         frames=[]
+         output.release()
+ 
+         return self.__convert_video(video_path,output_video_path)
+ 
+     def __try_ffmpeg_encoder(self, vcodec):
+         print(f"Trying FFMPEG {vcodec} encoder")
+         command = ['ffmpeg', '-y', '-f','lavfi','-i','testsrc=duration=1:size=1280x720:rate=30','-vcodec',vcodec,'testsrc.mp4']
+         try:
+             subprocess.run(command, check=True, capture_output=True).stderr
+         except subprocess.CalledProcessError as e:
+             print(f"FFMPEG {vcodec} encoder doesn't work -> Disabled.")
+             return False
+         print(f"FFMPEG {vcodec} encoder works")
+         return True
+ 
+     def __check_encoders(self):
+         self.ffmpeg_video_encoder='libx264'
+         self.ffmpeg_video_bitrate='0'
+ 
+         pattern = r"encoders: ([a-zA-Z0-9_]+(?: [a-zA-Z0-9_]+)*)"
+         command = ['ffmpeg', '-codecs', '--list-encoders']
+         commandout = subprocess.run(command, check=True, capture_output=True).stdout
+         result = commandout.decode('utf-8').split('\n')
+         for r in result:
+             if "264" in r:
+                 encoders = re.search(pattern, r).group(1).split(' ')
+                 for v_c in Refacer.VIDEO_CODECS:
+                     for v_k in encoders:
+                         if v_c == v_k:
+                             if self.__try_ffmpeg_encoder(v_k):
+                                 self.ffmpeg_video_encoder=v_k
+                                 self.ffmpeg_video_bitrate=Refacer.VIDEO_CODECS[v_k]
+                                 print(f"Video codec for FFMPEG: {self.ffmpeg_video_encoder}")
+                                 return
+ 
+     VIDEO_CODECS = {
+         'h264_videotoolbox':'0', #osx HW acceleration
+         'h264_nvenc':'0', #NVIDIA HW acceleration
+         #'h264_qsv', #Intel HW acceleration
+         #'h264_vaapi', #Intel HW acceleration
+         #'h264_omx', #HW acceleration
+         'libx264':'0' #No HW acceleration
+     }
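refacer.py exposes the whole pipeline through `Refacer.reface(video_path, faces)`, which both the Gradio app and script.py call. A minimal programmatic sketch (not part of this commit; the file names are placeholders, and `inswapper_128.onnx` plus an `out/` directory must already exist next to the script):

```python
# Illustrative sketch only, not part of the committed code.
import cv2
from refacer import Refacer

refacer = Refacer(force_cpu=True)  # restricts ONNX Runtime to CPUExecutionProvider

faces = [{
    'origin': cv2.imread('face_to_replace.jpg'),        # face to look for in the video
    'destination': cv2.imread('replacement_face.jpg'),  # face to paste in
    'threshold': 0.2,                                    # minimum ArcFace similarity
}]

# Writes the result under out/ and re-muxes the original audio if present.
result_path = refacer.reface('input.mp4', faces)
print(result_path)
```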
requirements-COREML.txt ADDED
@@ -0,0 +1,12 @@
+ ffmpeg_python==0.2.0
+ gradio==3.33.1
+ insightface==0.7.3
+ numpy==1.24.3
+ onnx==1.14.0
+ onnxruntime-silicon
+ opencv_python==4.7.0.72
+ opencv_python_headless==4.7.0.72
+ scikit-image==0.20.0
+ tqdm
+ psutil
+ ngrok
requirements-GPU.txt ADDED
@@ -0,0 +1,12 @@
+ ffmpeg_python==0.2.0
+ gradio==3.33.1
+ insightface==0.7.3
+ numpy==1.24.3
+ onnx==1.14.0
+ onnxruntime_gpu==1.15.0
+ opencv_python==4.7.0.72
+ opencv_python_headless==4.7.0.72
+ scikit-image==0.20.0
+ tqdm
+ psutil
+ ngrok
requirements.txt ADDED
@@ -0,0 +1,10 @@
+ ffmpeg-python==0.2.0
+ gradio==4.40.0
+ insightface==0.7.3
+ numpy==1.24.3
+ onnx==1.14.0
+ onnxruntime==1.15.0
+ opencv-python-headless==4.7.0.72
+ scikit-image==0.20.0
+ tqdm
+ psutil
script.py ADDED
@@ -0,0 +1,41 @@
+ from refacer import Refacer
+ from os.path import exists
+ import argparse
+ import cv2
+ 
+ parser = argparse.ArgumentParser(description='Refacer')
+ parser.add_argument("--force_cpu", help="Force CPU mode", default=False, action="store_true")
+ parser.add_argument("--colab_performance", help="Use in colab for better performance", default=False,action="store_true")
+ parser.add_argument("--face", help="Face to replace (ex: <src>,<dst>,<thresh=0.2>)", nargs='+', action="append", required=True)
+ parser.add_argument("--video", help="Video to parse", required=True)
+ args = parser.parse_args()
+ 
+ refacer = Refacer(force_cpu=args.force_cpu,colab_performance=args.colab_performance)
+ 
+ def run(video_path,faces):
+     video_path_exists = exists(video_path)
+     if video_path_exists == False:
+         print ("Can't find " + video_path)
+         return
+ 
+     faces_out = []
+     for face in faces:
+         face_str = face[0].split(",")
+         origin = exists(face_str[0])
+         if origin == False:
+             print ("Can't find " + face_str[0])
+             return
+         destination = exists(face_str[1])
+         if destination == False:
+             print ("Can't find " + face_str[1])
+             return
+ 
+         faces_out.append({
+             'origin':cv2.imread(face_str[0]),
+             'destination':cv2.imread(face_str[1]),
+             'threshold':float(face_str[2])
+         })
+ 
+     return refacer.reface(video_path,faces_out)
+ 
+ run(args.video, args.face)
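For reference, script.py expects each `--face` argument in the form `<src>,<dst>,<thresh>` and the flag can be repeated for multiple faces. A hedged example of driving it from Python (paths are placeholders; the equivalent shell command works the same way):

```python
# Illustrative sketch only, not part of the committed code.
import subprocess

subprocess.run([
    "python", "script.py",
    "--video", "input.mp4",                                    # video to reface
    "--face", "face_to_replace.jpg,replacement_face.jpg,0.2",  # <src>,<dst>,<thresh>
    "--force_cpu",                                             # optional: CPU-only inference
], check=True)
```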