zg9uagfv
diff --git a/‎build_part_with_score_queue.py‎
Lines changed: 38 additions & 0 deletions b/‎build_part_with_score_queue.py‎
Lines changed: 38 additions & 0 deletions
diff --git a/‎config.yaml‎
Lines changed: 53 additions & 0 deletions b/‎config.yaml‎
Lines changed: 53 additions & 0 deletions
diff --git a/‎decode_multi_pose.py‎
Lines changed: 75 additions & 0 deletions b/‎decode_multi_pose.py‎
Lines changed: 75 additions & 0 deletions
diff --git a/‎decode_pose.py‎
Lines changed: 136 additions & 0 deletions b/‎decode_pose.py‎
Lines changed: 136 additions & 0 deletions
@@ -0,0 +1,38 @@
+#!/usr/bin/python3
+# -*- coding: UTF-8 -*-
+
+def scoreIsMaximumInLocalWindow(keypointId, score, heatmapY, heatmapX, localMaximumRadius, scores):
+    height, width, numKeypoints = scores.shape
+    localMaximum = True
+    yStart = max(heatmapY - localMaximumRadius, 0)
+    yEnd = min(heatmapY + localMaximumRadius + 1, height)
+    for yCurrent in range(yStart, yEnd):
+        xStart = max(heatmapX - localMaximumRadius, 0)
+        xEnd = min(heatmapX + localMaximumRadius + 1, width)
+        for xCurrent in range(xStart, xEnd):
+            if scores[yCurrent][xCurrent][keypointId] > score:
+                localMaximum = False
+                break
+        if False == localMaximum:
+            break
+    return localMaximum
+
+'''
+* Builds a priority queue with part candidate positions for a specific image in
+* the batch. For this we find all local maxima in the score maps with score
+* values above a threshold. We create a single priority queue across all parts.
+'''
+def buildPartWithScoreQueue(scoreThreshold, localMaximumRadius, scores, queue):
+    height, width, numKeypoints = scores.shape
+    for heatmapY in range(height):
+        for heatmapX in range(width):
+            for keypointId in range(numKeypoints):
+                score = scores[heatmapY][heatmapX][keypointId]
+                if score < scoreThreshold:
+                    continue
+                if scoreIsMaximumInLocalWindow(keypointId, score, \
+                                               heatmapY, heatmapX, \
+                                               localMaximumRadius, scores) is True:
+                    keypoint = {'score':score, 'part':{'y':heatmapY, 'x':heatmapX, 'id':keypointId}}
+                    queue.enqueue(keypoint)
+    return None
@@ -0,0 +1,53 @@
+# NOTE(review): presumably a 0-based index into `checkpoints` below; the inline
+# note says 1 stands for 'mobilenet_v1_075', which is checkpoints[1].
+chk: 1 # 1=mobilenet_v1_075
+# NOTE(review): presumably the side length of the model input in pixels - confirm with the loader.
+imageSize: 337
+# NOTE(review): presumably the base URL the checkpoint weights are fetched from - confirm with the loader.
+GOOGLE_CLOUD_STORAGE_DIR: 'https://storage.googleapis.com/tfjs-models/weights/posenet/'
+# Known checkpoint names. No architecture list for 'mobilenet_v1_101' is defined in this file.
+checkpoints: [ 'mobilenet_v1_050', 'mobilenet_v1_075', 'mobilenet_v1_100', 'mobilenet_v1_101']
+# NOTE(review): presumably the network output stride used when decoding heatmap cells - confirm.
+outputStride: 16
+# Layer list, in order: one 'conv2d' entry followed by thirteen 'separableConv' entries.
+# Each entry is [layer type, integer].
+# NOTE(review): the integer is presumably the layer stride - confirm with the model builder.
+# This list differs from mobileNet75Architecture / mobileNet50Architecture only in its
+# second-to-last entry, which is 2 here and 1 there.
+mobileNet100Architecture: [
+  ['conv2d', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1]
+]
+# Layer list, in order: one 'conv2d' entry followed by thirteen 'separableConv' entries.
+# Each entry is [layer type, integer].
+# NOTE(review): the integer is presumably the layer stride - confirm with the model builder.
+# The entries are identical to those of mobileNet50Architecture.
+mobileNet75Architecture: [ 
+  ['conv2d', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1]
+]
+# Layer list, in order: one 'conv2d' entry followed by thirteen 'separableConv' entries.
+# Each entry is [layer type, integer].
+# NOTE(review): the integer is presumably the layer stride - confirm with the model builder.
+# The entries are identical to those of mobileNet75Architecture.
+mobileNet50Architecture: [
+  ['conv2d', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 2],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1],
+  ['separableConv', 1]
+]
@@ -0,0 +1,75 @@
+#!/usr/bin/python3
+# -*- coding: UTF-8 -*-
+from decode_utils import squaredDistance, getImageCoords
+from build_part_with_score_queue import buildPartWithScoreQueue
+from decode_pose import decodePose
+from max_heap import MaxHeap
+import numpy as np
+
+# Local-maximum window radius that decodeMultiplePoses hands to buildPartWithScoreQueue.
+kLocalMaximumRadius = 1
+
+def withinNmsRadiusOfCorrespondingPoint(poses, squaredNmsRadius, coordinate, keypointId):
+    x = coordinate['x']
+    y = coordinate['y']
+    for pose in poses:
+        correspondingKeypoint = pose['keypoints'][keypointId]['position']
+        distance = squaredDistance(y, \
+                                   x, \
+                                   correspondingKeypoint['y'], \
+                                   correspondingKeypoint['x'])
+        if distance <= squaredNmsRadius:
+            return True
+    return False
+
+'''
+/* Score the newly proposed object instance without taking into account
+ * the scores of the parts that overlap with any previously detected
+ * instance.
+ */
+'''
+def getInstanceScore(existingPoses, squaredNmsRadius, instanceKeypoints):
+    notOverlappedKeypointScores = 0.0
+    for idx in range(len(instanceKeypoints)):
+        position = instanceKeypoints[idx]['position']
+        score = instanceKeypoints[idx]['score']
+        if withinNmsRadiusOfCorrespondingPoint(existingPoses, \
+                                               squaredNmsRadius, \
+                                               position, idx) is False:
+            notOverlappedKeypointScores += score
+    notOverlappedKeypointScores /= len(instanceKeypoints)
+    return notOverlappedKeypointScores
+
+def decodeMultiplePoses(scores, offsets, displacementsFwd, displacementsBwd, \
+                        width_factor, height_factor, \
+                        outputStride=16, maxPoseDetections=5, scoreThreshold= 0.5,
+                        nmsRadius= 30):
+    poses = []
+    squaredNmsRadius = nmsRadius * nmsRadius
+    scoresBuffer = np.squeeze(scores)
+    offsetsBuffer = np.squeeze(offsets)
+    displacementsBwdBuffer = np.squeeze(displacementsBwd)
+    displacementsFwdBuffer = np.squeeze(displacementsFwd)
+    height, width, numKeypoints = scoresBuffer.shape
+    queue = MaxHeap(height * width * numKeypoints, scoresBuffer)
+    buildPartWithScoreQueue(scoreThreshold, kLocalMaximumRadius, scoresBuffer, queue)
+    while len(poses) < maxPoseDetections and queue.empty() is False:
+        root = queue.dequeue()
+        rootImageCoords = getImageCoords(root['part'], outputStride, offsetsBuffer)
+        if withinNmsRadiusOfCorrespondingPoint(poses, \
+                                               squaredNmsRadius, \
+                                               rootImageCoords, \
+                                               root['part']['id']) is True:
+            continue
+        #Start a new detection instance at the position of the root.
+        keypoints = decodePose(root, \
+                               scoresBuffer, \
+                               offsetsBuffer, \
+                               outputStride, \
+                               displacementsFwdBuffer, \
+                               displacementsBwdBuffer)
+        for keypoint in keypoints:
+            keypoint['position']['y'] *= (height_factor)
+            keypoint['position']['x'] *= (width_factor)
+        score = getInstanceScore(poses, squaredNmsRadius, keypoints)
+        poses.append({'keypoints':keypoints, 'score':score})
+    return poses
@@ -0,0 +1,136 @@
+#!/usr/bin/python3
+# -*- coding: UTF-8 -*-
+
+import math
+from keypoints import poseChain, partIds, partNames
+from decode_utils import clamp, addVectors, getImageCoords, getOffsetPoint
+
+parentChildrenTuples = []
+
+for joint_name in poseChain:
+    parent_joint_name = joint_name[0]
+    child_joint_name = joint_name[1]
+    parentChildrenTuples.append([partIds[parent_joint_name], \
+                                partIds[child_joint_name]])
+'''
+parentChildrenTuples = poseChain.map(
+    ([parentJoinName, childJoinName]): NumberTuple =>
+        ([partIds[parentJoinName], partIds[childJoinName]]));
+'''
+
+parentToChildEdges = []
+for joint_id in parentChildrenTuples:
+    parentToChildEdges.append(joint_id[1]) #child_joint_id
+
+'''
+const parentToChildEdges: number[] =
+    parentChildrenTuples.map(([, childJointId]) => childJointId);
+'''
+
+childToParentEdges = []
+for joint_id in parentChildrenTuples:
+    childToParentEdges.append(joint_id[0]) #child_joint_id
+
+'''
+const childToParentEdges: number[] =
+    parentChildrenTuples.map(([
+                               parentJointId,
+                             ]) => parentJointId);
+'''
+
+def getDisplacement(edgeId, point, displacements):
+    numEdges = int(displacements.shape[2] / 2)
+    point_x = int(point['x'])
+    point_y = int(point['y'])
+    y = displacements[point_y][point_x][edgeId]
+    x = displacements[point_y][point_x][numEdges+edgeId]
+    return {'y':y, 'x':x}
+
+def getStridedIndexNearPoint(point, outputStride, height, width):
+    return {'y':clamp(round(float(point['y']) / float(outputStride)), 0, height - 1), \
+           'x':clamp(round(float(point['x']) / float(outputStride)), 0, width - 1)}
+
+'''
+ * We get a new keypoint along the `edgeId` for the pose instance, assuming
+ * that the position of the `idSource` part is already known. For this, we
+ * follow the displacement vector from the source to target part (stored in
+ * the `i`-th channel of the displacement tensor).
+'''
+def traverseToTargetKeypoint(edgeId, sourceKeypoint, targetKeypointId,
+                             scoresBuffer, offsets, outputStride, displacements):
+    height, width, numberScores = scoresBuffer.shape
+    #Nearest neighbor interpolation for the source->target displacements.
+    #最近邻插值(Nearest Neighbor interpolation)
+    sourceKeypointIndices = getStridedIndexNearPoint(sourceKeypoint['position'], \
+                                                   outputStride, \
+                                                   height, \
+                                                   width)
+    displacement = getDisplacement(edgeId, sourceKeypointIndices, displacements)
+    displacedPoint = addVectors(sourceKeypoint['position'], displacement)
+    displacedPointIndices = getStridedIndexNearPoint(displacedPoint, \
+                                                   outputStride, \
+                                                   height, \
+                                                   width)
+    x = int(displacedPointIndices['x'])
+    y = int(displacedPointIndices['y'])
+    offsetPoint = getOffsetPoint(y, x, targetKeypointId, offsets)
+    score = scoresBuffer[y][x][targetKeypointId]
+    targetKeypoint = addVectors( \
+        {'x': displacedPointIndices['x'] * outputStride, 'y': displacedPointIndices['y'] * outputStride}, \
+        {'x': offsetPoint['x'], 'y': offsetPoint['y']})
+
+    return {"position": targetKeypoint, \
+            "part": partNames[targetKeypointId], \
+            "score":score}
+
+'''
+ * Follows the displacement fields to decode the full pose of the object
+ * instance given the position of a part that acts as root.
+ *
+ * @return An array of decoded keypoints and their scores for a single pose
+'''
+def decodePose(root, scores, offsets, outputStride, displacementsFwd, displacementsBwd):
+    numParts = scores.shape[2]
+    numEdges = len(parentToChildEdges)
+
+    #const instanceKeypoints: Keypoint[] = new Array(numParts);
+    instanceKeypoints = []
+    for i in range(numParts):
+        keypoint = {'position':{'x':0, 'y':0}, 'part':'null', 'score':0.0}
+        instanceKeypoints.append(keypoint)
+    #Start a new detection instance at the position of the root.
+    rootPart, rootScore = root['part'], root['score']
+    rootPoint = getImageCoords(rootPart, outputStride, offsets)
+    id = rootPart['id']
+    instanceKeypoints[id] = {'position':rootPoint, 'part':partNames[id], 'score':rootScore}
+
+    #Decode the part positions upwards in the tree, following the backward displacements.
+    for edge in reversed(range(numEdges)):
+        sourceKeypointId = parentToChildEdges[edge]
+        targetKeypointId = childToParentEdges[edge]
+        if instanceKeypoints[sourceKeypointId]['score'] > 0.0  \
+            and math.isclose(instanceKeypoints[targetKeypointId]['score'], 0.0, rel_tol=1e-9) is True:
+            instanceKeypoints[targetKeypointId] = traverseToTargetKeypoint(edge,
+                                                                           instanceKeypoints[sourceKeypointId],
+                                                                           targetKeypointId,
+                                                                           scores,
+                                                                           offsets,
+                                                                           outputStride,
+                                                                           displacementsBwd)
+
+    # Decode the part positions downwards in the tree, following the forward
+    #displacements.
+    for edge in range(numEdges):
+        sourceKeypointId = childToParentEdges[edge]
+        targetKeypointId = parentToChildEdges[edge]
+        #if instanceKeypoints[sourceKeypointId] is not None and instanceKeypoints[targetKeypointId] is None:
+        if instanceKeypoints[sourceKeypointId]['score'] > 0.0 \
+            and math.isclose(instanceKeypoints[targetKeypointId]['score'], 0.0, rel_tol=1e-9) is True:
+            instanceKeypoints[targetKeypointId] = traverseToTargetKeypoint(edge, \
+                                                                           instanceKeypoints[sourceKeypointId], \
+                                                                           targetKeypointId, \
+                                                                           scores, \
+                                                                           offsets, \
+                                                                           outputStride, \
+                                                                           displacementsFwd)
+    return instanceKeypoints