Spaces:

leonelhs
/

poser-tf

Running

App Files Files Community

leonelhs committed on Nov 3, 2023

Commit

9a02a1c

1 Parent(s): d32c6db

init space

Browse files

Files changed (7) hide show

.gitattributes +1 -0
.gitignore +4 -0
app.py +55 -0
examples/01.jpg +3 -0
examples/02.jpg +3 -0
examples/03.jpg +3 -0
poser.py +141 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.jpg filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1,4 @@

+.idea/
+__pycache__/
+requirements.txt
+push_model.py

app.py ADDED Viewed

	@@ -0,0 +1,55 @@

+import PIL.Image
+import PIL.ImageOps
+import gradio as gr
+import numpy as np
+import tensorflow as tf
+from poser import draw_bones, movenet
+def predict(image: PIL.Image):
+    input_size = 256
+    size = (1280, 1280)
+    image = PIL.ImageOps.fit(image, size, PIL.Image.LANCZOS)
+    image_tf = tf.keras.preprocessing.image.img_to_array(image)
+    # Resize and pad the image to keep the aspect ratio and fit the expected size.
+    input_image = tf.expand_dims(image_tf, axis=0)
+    input_image = tf.image.resize_with_pad(input_image, input_size, input_size)
+    keypoints = movenet(input_image)
+    keypoints = np.array(keypoints)
+    image = tf.keras.preprocessing.image.array_to_img(image_tf)
+    draw_bones(image, keypoints)
+    return image
+footer = r"""
+<center>
+<b>
+Demo for <a href='https://www.tensorflow.org/hub/tutorials/movenet'>MoveNet</a>
+</b>
+</center>
+"""
+with gr.Blocks(title="MoveNet") as app:
+    gr.HTML("<center><h1>Human Pose Estimation with MoveNet</h1></center>")
+    gr.HTML("<center><h3>MoveNet: Ultra fast and accurate pose detection model</h3></center>")
+    with gr.Row().style(equal_height=False):
+        with gr.Column():
+            input_img = gr.Image(type="pil", label="Input image")
+            run_btn = gr.Button(variant="primary")
+        with gr.Column():
+            output_img = gr.Image(type="numpy", label="Output image")
+            gr.ClearButton(components=[input_img, output_img], variant="stop")
+    run_btn.click(predict, [input_img], [output_img])
+    with gr.Row():
+        blobs = [[f"examples/{x:02d}.jpg"] for x in range(1, 4)]
+        examples = gr.Dataset(components=[input_img], samples=blobs)
+        examples.click(lambda x: x[0], [examples], [input_img])
+    with gr.Row():
+        gr.HTML(footer)
+app.launch(share=False, debug=True, show_error=True)
+app.queue()

examples/01.jpg ADDED Viewed

Git LFS Details

SHA256: 553341d9732edb3943a76d62eed2f0934061f85a20fdcc2815f05d7b283693fe
Pointer size: 132 Bytes
Size of remote file: 1.22 MB

examples/02.jpg ADDED Viewed

Git LFS Details

SHA256: 353c8c048567931d18049f6dece667b7149d3c56b333c6032662e118fde178dd
Pointer size: 132 Bytes
Size of remote file: 1.21 MB

examples/03.jpg ADDED Viewed

Git LFS Details

SHA256: 5f2df3f80cc6e13d7d00dce94aa18f35a424478ba2b733f0335eb616e9d29b29
Pointer size: 131 Bytes
Size of remote file: 722 kB

poser.py ADDED Viewed

	@@ -0,0 +1,141 @@

+#############################################################################
+#
+#   Source from:
+#   https://www.tensorflow.org/hub/tutorials/movenet
+#
+#
+#############################################################################
+import PIL.Image
+import PIL.ImageOps
+import numpy as np
+import tensorflow as tf
+from PIL import ImageDraw
+from huggingface_hub import snapshot_download
+# Dictionary that maps from joint names to keypoint indices.
+KEYPOINT_DICT = {
+    'nose': 0,
+    'left_eye': 1, 'right_eye': 2,
+    'left_ear': 3, 'right_ear': 4,
+    'left_shoulder': 5, 'right_shoulder': 6,
+    'left_elbow': 7, 'right_elbow': 8,
+    'left_wrist': 9, 'right_wrist': 10,
+    'left_hip': 11, 'right_hip': 12,
+    'left_knee': 13, 'right_knee': 14,
+    'left_ankle': 15, 'right_ankle': 16
+}
+COLOR_DICT = {
+    (0, 1): 'Magenta',
+    (0, 2): 'Cyan',
+    (1, 3): 'Magenta',
+    (2, 4): 'Cyan',
+    (0, 5): 'Magenta',
+    (0, 6): 'Cyan',
+    (5, 7): 'Magenta',
+    (7, 9): 'Magenta',
+    (6, 8): 'Cyan',
+    (8, 10): 'Cyan',
+    (5, 6): 'Yellow',
+    (5, 11): 'Magenta',
+    (6, 12): 'Cyan',
+    (11, 12): 'Yellow',
+    (11, 13): 'Magenta',
+    (13, 15): 'Magenta',
+    (12, 14): 'Cyan',
+    (14, 16): 'Cyan'
+}
+def process_keypoints(keypoints, height, width, threshold=0.22):
+    """Returns high confidence keypoints and edges for visualization.
+      Args:
+        keypoints: A numpy array with shape [1, 1, 17, 3] representing
+          the keypoint coordinates and scores returned from the MoveNet model.
+        height: height of the image in pixels.
+        width: width of the image in pixels.
+        threshold: minimum confidence score for a keypoint to be
+          visualized.
+      Returns:
+        A (joints, bones, colors) containing:
+          * the coordinates of all keypoints of all detected entities;
+          * the coordinates of all skeleton edges of all detected entities;
+          * the colors in which the edges should be plotted.
+      """
+    keypoints_all = []
+    keypoint_edges_all = []
+    colors = []
+    num_instances, _, _, _ = keypoints.shape
+    for idx in range(num_instances):
+        kpts_x = keypoints[0, idx, :, 1]
+        kpts_y = keypoints[0, idx, :, 0]
+        kpts_scores = keypoints[0, idx, :, 2]
+        kpts_absolute_xy = np.stack(
+            [width * np.array(kpts_x), height * np.array(kpts_y)], axis=-1)
+        kpts_above_thresh_absolute = kpts_absolute_xy[
+                                     kpts_scores > threshold, :]
+        keypoints_all.append(kpts_above_thresh_absolute)
+        for edge_pair, color in COLOR_DICT.items():
+            if (kpts_scores[edge_pair[0]] > threshold and
+                    kpts_scores[edge_pair[1]] > threshold):
+                x_start = kpts_absolute_xy[edge_pair[0], 0]
+                y_start = kpts_absolute_xy[edge_pair[0], 1]
+                x_end = kpts_absolute_xy[edge_pair[1], 0]
+                y_end = kpts_absolute_xy[edge_pair[1], 1]
+                line_seg = np.array([[x_start, y_start], [x_end, y_end]])
+                keypoint_edges_all.append(line_seg)
+                colors.append(color)
+    if keypoints_all:
+        joints = np.concatenate(keypoints_all, axis=0)
+    else:
+        joints = np.zeros((0, 17, 2))
+    if keypoint_edges_all:
+        bones = np.stack(keypoint_edges_all, axis=0)
+    else:
+        bones = np.zeros((0, 2, 2))
+    return joints, bones, colors
+def draw_bones(pixmap: PIL.Image, keypoints):
+    draw = ImageDraw.Draw(pixmap)
+    joints, bones, colors = process_keypoints(keypoints, pixmap.height, pixmap.width)
+    for bone, color in zip(bones.tolist(), colors):
+        draw.line((*bone[0], *bone[1]), fill=color, width=4)
+    radio = 3
+    for c_x, c_y in joints:
+        shape = [(c_x - radio, c_y - radio), (c_x + radio, c_y + radio)]
+        draw.ellipse(shape, fill="red", outline="red")
+def movenet(image):
+    """Runs detection on an input image.
+        Args:
+          image: A [1, height, width, 3] tensor represents the input image
+            pixels. Note that the height/width should already be resized and match the
+            expected input resolution of the model before passing into this function.
+        Returns:
+          A [1, 1, 17, 3] float numpy array representing the predicted keypoint
+          coordinates and scores.
+    """
+    model_path = snapshot_download("leonelhs/movenet")
+    module = tf.saved_model.load(model_path)
+    model = module.signatures['serving_default']
+    # SavedModel format expects tensor type of int32.
+    image = tf.cast(image, dtype=tf.int32)
+    # Run model inference.
+    outputs = model(image)
+    # Output is a [1, 1, 17, 3] tensor.
+    return outputs['output_0'].numpy()