# Hand Detection Model (YOLOv8)
This model classifies images into three categories:

- **hand**: close-up of a hand with fingers visible
- **arm**: forearm or elbow area
- **not_hand**: neither hand nor arm
## Usage

Requires the `ultralytics` package (`pip install ultralytics`).

```python
from ultralytics import YOLO

# Load model directly from HuggingFace
model = YOLO('https://huggingface.co/EtanHey/hand-sign-detection/resolve/main/model.pt')

# Predict on an image
results = model.predict('image.jpg')

# Get predictions
if results and results[0].probs is not None:
    probs = results[0].probs
    top_class = probs.top1  # 0=hand, 1=arm, 2=not_hand
    confidence = probs.top1conf.item()
    classes = ['hand', 'arm', 'not_hand']
    print(f"Detected: {classes[top_class]} ({confidence:.1%})")
```
## Usage in Next.js/Node.js

### Option 1: Python API Backend
```javascript
// app/api/detect/route.js (Next.js 13+ App Router)
export async function POST(request) {
  // Forward the uploaded form data to the Python backend (Option 2 below)
  const formData = await request.formData();
  const response = await fetch('http://localhost:8000/predict', {
    method: 'POST',
    body: formData
  });
  const result = await response.json();
  return Response.json(result);
}

// Frontend component
async function detectHand(file) {
  const formData = new FormData();
  formData.append('file', file); // field name must match the backend's parameter
  const response = await fetch('/api/detect', {
    method: 'POST',
    body: formData
  });
  const result = await response.json();
  // result = { class: 'hand', confidence: 0.98, all_probs: {...} }
  return result;
}
```
### Option 2: Python Microservice (FastAPI)

```python
# backend/api.py
from fastapi import FastAPI, File, UploadFile
from ultralytics import YOLO
from PIL import Image
import io

app = FastAPI()
model = YOLO('https://huggingface.co/EtanHey/hand-sign-detection/resolve/main/model.pt')

@app.post("/predict")
async def predict(file: UploadFile = File(...)):
    contents = await file.read()
    image = Image.open(io.BytesIO(contents))
    results = model.predict(image)
    probs = results[0].probs
    classes = ['hand', 'arm', 'not_hand']
    return {
        "class": classes[probs.top1],
        "confidence": float(probs.top1conf),
        "all_probs": {
            "hand": float(probs.data[0]),
            "arm": float(probs.data[1]),
            "not_hand": float(probs.data[2])
        }
    }
```
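Start the service with, e.g., `uvicorn backend.api:app --port 8000`, and it can be called from any HTTP client. A minimal smoke test in Python, assuming the `requests` package and a local image file (the filename is a placeholder):

```python
import requests

# Call the FastAPI service above, assumed to be running on localhost:8000
with open('test.jpg', 'rb') as f:
    response = requests.post('http://localhost:8000/predict', files={'file': f})

print(response.json())
# e.g. {'class': 'hand', 'confidence': 0.98, 'all_probs': {...}}
```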
### Option 3: Using ONNX Runtime Web (Browser-based)

```javascript
// First convert the model to ONNX (run once):
// python3 -c "from ultralytics import YOLO; YOLO('model.pt').export(format='onnx')"
import * as ort from 'onnxruntime-web';

// Resize the image to 224x224 and pack it into a normalized
// NCHW float32 tensor, as the classifier expects
function preprocessImage(imageElement) {
  const size = 224;
  const canvas = document.createElement('canvas');
  canvas.width = size;
  canvas.height = size;
  const ctx = canvas.getContext('2d');
  ctx.drawImage(imageElement, 0, 0, size, size);
  const { data } = ctx.getImageData(0, 0, size, size); // RGBA bytes
  const chw = new Float32Array(3 * size * size);
  for (let i = 0; i < size * size; i++) {
    chw[i] = data[i * 4] / 255;                       // R
    chw[size * size + i] = data[i * 4 + 1] / 255;     // G
    chw[2 * size * size + i] = data[i * 4 + 2] / 255; // B
  }
  return new ort.Tensor('float32', chw, [1, 3, size, size]);
}

async function detectHandBrowser(imageElement) {
  // Load ONNX model (serve model.onnx as a static asset)
  const session = await ort.InferenceSession.create('/model.onnx');
  // Preprocess image to 224x224
  const tensor = preprocessImage(imageElement);
  // Run inference, using the exported graph's own input/output names
  const results = await session.run({ [session.inputNames[0]]: tensor });
  const probs = Array.from(results[session.outputNames[0]].data);
  // Get prediction
  const classes = ['hand', 'arm', 'not_hand'];
  const maxIdx = probs.indexOf(Math.max(...probs));
  return {
    class: classes[maxIdx],
    confidence: probs[maxIdx],
    all_probs: {
      hand: probs[0],
      arm: probs[1],
      not_hand: probs[2]
    }
  };
}
```
## Usage in React Native

```javascript
import { launchImageLibrary } from 'react-native-image-picker';

const detectHand = async () => {
  const result = await launchImageLibrary({ mediaType: 'photo' });
  if (result.assets) {
    const formData = new FormData();
    formData.append('file', {
      uri: result.assets[0].uri,
      type: 'image/jpeg',
      name: 'photo.jpg'
    });
    const response = await fetch('YOUR_API_URL/predict', {
      method: 'POST',
      body: formData
    });
    const detection = await response.json();
    console.log('Detected:', detection.class, detection.confidence);
  }
};
```
## Usage with cURL

```bash
# Test the FastAPI service with cURL (the form field name is "file")
curl -X POST -F "file=@test.jpg" http://your-api-url/predict
# Response: {"class": "hand", "confidence": 0.98, "all_probs": {...}}
```
## Usage in Swift (iOS)

```swift
import CoreML
import UIKit
import Vision

// First convert the model to CoreML format (see the export snippet below),
// then add the generated package to your Xcode project. "HandDetector" is
// the class Xcode generates from the model package.
func detectHand(image: UIImage) {
    guard let model = try? VNCoreMLModel(for: HandDetector().model) else { return }
    let request = VNCoreMLRequest(model: model) { request, error in
        guard let results = request.results as? [VNClassificationObservation] else { return }
        if let topResult = results.first {
            let className = topResult.identifier // "hand", "arm", or "not_hand"
            let confidence = topResult.confidence
            print("Detected: \(className) with \(confidence * 100)% confidence")
        }
    }
    // Run the classification request on the image
    guard let cgImage = image.cgImage else { return }
    let handler = VNImageRequestHandler(cgImage: cgImage)
    try? handler.perform([request])
}
```
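The CoreML conversion referenced above can be done with Ultralytics' built-in exporter. A minimal sketch (the resulting package's generated Swift class name depends on the exported file name):

```python
from ultralytics import YOLO

# Export the trained classifier to CoreML (run once);
# this produces a .mlpackage you can add to Xcode
model = YOLO('model.pt')
model.export(format='coreml')
```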
## Model Details

- **Architecture**: YOLOv8s-cls
- **Classes**: 3 (hand, arm, not_hand)
- **Input Size**: 224x224
- **Training Data**: 1740 images
- **Accuracy**: >96%
## Training Details

Trained on a custom dataset with:

- 704 hand images
- 320 arm images
- 462 not_hand images

Split 80/20 for training/validation.
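For reference, a classifier like this is typically trained with Ultralytics' classification trainer. A minimal sketch, assuming an image-folder dataset; the path and hyperparameters are illustrative, not the exact settings used here:

```python
from ultralytics import YOLO

# Start from the pretrained YOLOv8s classification checkpoint
model = YOLO('yolov8s-cls.pt')

# data points at a folder with train/ and val/ subdirectories,
# each containing hand/, arm/ and not_hand/ class folders
model.train(data='path/to/dataset', epochs=50, imgsz=224)
```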