RTMO-s / README.md
Xenova's picture
Xenova HF staff
Create README.md
7384b30 verified
metadata
library_name: transformers.js
tags:
  - pose-estimation
license: apache-2.0

https://github.com/open-mmlab/mmpose/tree/main/projects/rtmo with ONNX weights to be compatible with Transformers.js.

Usage (Transformers.js)

If you haven't already, you can install the Transformers.js JavaScript library from NPM using:

npm i @xenova/transformers

Example: Perform pose-estimation w/ Xenova/RTMO-s.

import { AutoModel, AutoProcessor, RawImage } from '@xenova/transformers';

// Load model and processor
const model_id = 'Xenova/RTMO-s';
const model = await AutoModel.from_pretrained(model_id);
const processor = await AutoProcessor.from_pretrained(model_id);

// Read image and run processor
const url = 'https://huggingface.co/datasets/Xenova/transformers.js-docs/resolve/main/football-match.jpg';
const image = await RawImage.read(url);
const { pixel_values, original_sizes, reshaped_input_sizes } = await processor(image);

// Predict bounding boxes and keypoints
const { dets, keypoints } = await model({ input: pixel_values });

// Select the first image
const predicted_boxes = dets.tolist()[0];
const predicted_points = keypoints.tolist()[0];
const [height, width] = original_sizes[0];
const [resized_height, resized_width] = reshaped_input_sizes[0];

// Compute scale values
const xScale = width / resized_width;
const yScale = height / resized_height;

// Define thresholds
const point_threshold = 0.3;
const box_threshold = 0.3;

// Display results
for (let i = 0; i < predicted_boxes.length; ++i) {
    const [xmin, ymin, xmax, ymax, box_score] = predicted_boxes[i];
    if (box_score < box_threshold) continue;

    const x1 = (xmin * xScale).toFixed(2);
    const y1 = (ymin * yScale).toFixed(2);
    const x2 = (xmax * xScale).toFixed(2);
    const y2 = (ymax * yScale).toFixed(2);

    console.log(`Found person at [${x1}, ${y1}, ${x2}, ${y2}] with score ${box_score.toFixed(3)}`)
    const points = predicted_points[i]; // of shape [17, 3]
    for (let id = 0; id < points.length; ++id) {
        const label = model.config.id2label[id];
        const [x, y, point_score] = points[id];
        if (point_score < point_threshold) continue;
        console.log(`  - ${label}: (${(x * xScale).toFixed(2)}, ${(y * yScale).toFixed(2)}) with score ${point_score.toFixed(3)}`);
    }
}
See example output
Found person at [423.33, 55.52, 644.28, 504.13] with score 0.988
  - nose: (527.30, 117.12) with score 0.733
  - left_eye: (541.79, 109.26) with score 0.554
  - right_eye: (515.04, 107.59) with score 0.475
  - left_shoulder: (563.30, 171.75) with score 1.000
  - right_shoulder: (464.21, 159.75) with score 1.000
  - left_elbow: (575.71, 238.04) with score 0.998
  - right_elbow: (436.06, 218.10) with score 0.999
  - left_wrist: (605.86, 303.35) with score 1.000
  - right_wrist: (497.47, 220.82) with score 1.000
  - left_hip: (540.97, 307.31) with score 1.000
  - right_hip: (475.85, 318.78) with score 1.000
  - left_knee: (578.63, 368.63) with score 1.000
  - right_knee: (501.05, 442.49) with score 1.000
  - left_ankle: (572.11, 464.96) with score 0.991
  - right_ankle: (535.75, 441.52) with score 0.981
Found person at [89.97, 3.96, 517.81, 507.28] with score 0.966
  - left_shoulder: (242.65, 111.06) with score 0.999
  - right_shoulder: (228.79, 112.54) with score 0.999
  - left_elbow: (321.84, 169.07) with score 0.999
  - right_elbow: (225.76, 218.20) with score 1.000
  - left_wrist: (351.73, 220.74) with score 0.999
  - right_wrist: (160.19, 228.03) with score 1.000
  - left_hip: (342.34, 246.81) with score 1.000
  - right_hip: (360.05, 259.35) with score 0.999
  - left_knee: (299.56, 377.97) with score 0.998
  - right_knee: (313.81, 378.83) with score 0.976
  - left_ankle: (443.84, 312.35) with score 0.983
  - right_ankle: (424.74, 433.61) with score 0.823
Found person at [-0.53, 51.78, 153.65, 371.17] with score 0.769
  - nose: (75.52, 85.67) with score 0.363
  - left_shoulder: (121.54, 113.17) with score 1.000
  - right_shoulder: (49.77, 117.60) with score 1.000
  - left_elbow: (132.90, 147.02) with score 0.932
  - right_elbow: (30.31, 156.42) with score 0.992
  - left_wrist: (154.43, 162.08) with score 0.871
  - right_wrist: (17.20, 196.43) with score 0.943
  - left_hip: (105.61, 204.27) with score 0.999
  - right_hip: (61.99, 203.66) with score 0.999
  - left_knee: (114.70, 270.91) with score 1.000
  - right_knee: (63.75, 275.33) with score 1.000
  - left_ankle: (125.53, 342.00) with score 0.998
  - right_ankle: (63.16, 344.07) with score 0.997
Found person at [519.40, 34.94, 650.11, 312.07] with score 0.488
  - nose: (554.82, 76.58) with score 0.920
  - left_eye: (563.12, 69.41) with score 0.666
  - right_eye: (544.82, 70.01) with score 0.595
  - left_shoulder: (596.60, 105.61) with score 0.999
  - right_shoulder: (523.29, 107.31) with score 0.969
  - left_elbow: (625.14, 151.30) with score 0.999
  - right_elbow: (515.96, 147.59) with score 0.322
  - left_wrist: (630.90, 196.91) with score 0.998
  - right_wrist: (520.75, 181.83) with score 0.415
  - left_hip: (583.24, 200.84) with score 0.998
  - right_hip: (533.69, 200.01) with score 0.978
  - left_knee: (583.79, 265.14) with score 0.934
  - right_knee: (538.27, 262.98) with score 0.669
  - left_ankle: (584.90, 309.76) with score 0.489