added classifier
This commit is contained in: parent e9585706b9, commit 03d26b46ca
.gitignore
@@ -8,3 +8,5 @@ short.mp4
 __pycache__/
 *.mp4
+
+*.weights
Application/Classifiers/Classifier.py
@@ -5,99 +5,57 @@
 import numpy as np
 import tensorflow as tf
 import cv2
+import os
+import json

 from Application.Classifiers.ClassifierInterface import ClassifierInterface


 class Classifier(ClassifierInterface):

     def __init__(self):
-        print("1")
-        self.model_path = "./class1.pb"
-        self.odapi = DetectorAPI(path_to_ckpt=self.model_path)
-        self.threshold = 0.6
-
-    def detect(self, stream):
-        cap = cv2.VideoCapture(stream)
-        img = None
-        r, img = cap.read()
-        if img is None:
-            return img
-
-        # scale the image down for faster processing
-        scale_percent = 60  # percent of original size
-        width = int(img.shape[1] * scale_percent / 100)
-        height = int(img.shape[0] * scale_percent / 100)
-        dim = (width, height)
-        img = cv2.resize(img, dim)
-
-        # get the results from the net
-        boxes, scores, classes, num = self.odapi.process_frame(img)
-        res = False
-        for i in range(len(boxes)):
-            # Class 1 represents human
-            # draw recognition boxes and return resulting image + true/false
-            if classes[i] == 1:
-                if scores[i] > self.threshold:
-                    box = boxes[i]
-                    cv2.rectangle(img, (box[1], box[0]), (box[3], box[2]), (255, 0, 0), 2)
-                    res = True
-                    return img, res
-                else:
-                    res = False
-                    return img, res
-
-    def tagLayers(self, layers):
-        print("tagging")
-
-
-# Detector API can be changed out given the I/O remains the same
-# this way you can use a different N-Net if you like to
-class DetectorAPI:
-    def __init__(self, path_to_ckpt):
-        self.path_to_ckpt = path_to_ckpt
-
-        self.detection_graph = tf.Graph()
-        with self.detection_graph.as_default():
-            od_graph_def = tf.GraphDef()
-            with tf.gfile.GFile(self.path_to_ckpt, 'rb') as fid:
-                serialized_graph = fid.read()
-                od_graph_def.ParseFromString(serialized_graph)
-                tf.import_graph_def(od_graph_def, name='')
-
-        self.default_graph = self.detection_graph.as_default()
-        self.sess = tf.Session(graph=self.detection_graph)
-
-        # Definite input and output Tensors for detection_graph
-        self.image_tensor = self.detection_graph.get_tensor_by_name('image_tensor:0')
-        # Each box represents a part of the image where a particular object was detected.
-        self.detection_boxes = self.detection_graph.get_tensor_by_name('detection_boxes:0')
-        # Each score represents the level of confidence for each of the objects.
-        # Score is shown on the result image, together with the class label.
-        self.detection_scores = self.detection_graph.get_tensor_by_name('detection_scores:0')
-        self.detection_classes = self.detection_graph.get_tensor_by_name('detection_classes:0')
-        self.num_detections = self.detection_graph.get_tensor_by_name('num_detections:0')
-
-    def process_frame(self, image):
-        # Expand dimensions since the trained_model expects images to have shape: [1, None, None, 3]
-        image_np_expanded = np.expand_dims(image, axis=0)
-        # Actual detection.
-        (boxes, scores, classes, num) = self.sess.run(
-            [self.detection_boxes, self.detection_scores, self.detection_classes, self.num_detections],
-            feed_dict={self.image_tensor: image_np_expanded})
-
-        im_height, im_width, _ = image.shape
-        boxes_list = [None for i in range(boxes.shape[1])]
-        for i in range(boxes.shape[1]):
-            boxes_list[i] = (
-                int(boxes[0, i, 0] * im_height),
-                int(boxes[0, i, 1] * im_width),
-                int(boxes[0, i, 2] * im_height),
-                int(boxes[0, i, 3] * im_width)
-            )
-
-        return boxes_list, scores[0].tolist(), [int(x) for x in classes[0].tolist()], int(num[0])
-
-    def close(self):
-        self.sess.close()
-        self.default_graph.close()
+        self.threshold = .5
+        with open(os.path.join(os.path.dirname(__file__), "coco_map.json")) as file:
+            mapping = json.load(file)
+        self.classes = dict()
+        for element in mapping:
+            self.classes[element["id"] - 1] = element["display_name"]
+        self.net = cv2.dnn.readNet(os.path.join(os.path.dirname(__file__), "yolov4.weights"), os.path.join(os.path.dirname(__file__), "yolov4.cfg"))
+        #self.net.setPreferableBackend(cv2.dnn.DNN_BACKEND_CUDA)
+        #self.net.setPreferableTarget(cv2.dnn.DNN_TARGET_CUDA)
+        self.layer_names = self.net.getLayerNames()
+        self.outputlayers = [self.layer_names[i[0] - 1] for i in self.net.getUnconnectedOutLayers()]
+        print("Classifier Initiated")
+
+    def tagLayer(self, imgs):
+        # get the results from the net
+        results = []
+        for i, contours in enumerate(imgs[19:20]):
+            #print(i)
+            for contour in contours:
+                height, width, channels = contour.shape
+                dim = max(height, width)
+                if dim > 320:
+                    img2 = np.zeros(shape=[dim, dim, 3], dtype=np.uint8)
+                else:
+                    img2 = np.zeros(shape=[320, 320, 3], dtype=np.uint8)
+                img2[:height, :width] = contour
+                blob = cv2.dnn.blobFromImage(img2, 1/256, (320, 320), (0, 0, 0), True, crop=False)  # reduce 416 to 320
+                self.net.setInput(blob)
+                outs = self.net.forward(self.outputlayers)
+                for out in outs:
+                    for detection in out:
+                        scores = detection
+                        class_id = np.argmax(scores)
+                        confidence = scores[class_id]
+                        if confidence > self.threshold:
+                            if self.classes[class_id] not in results:
+                                cv2.imshow("changes x", img2)
+                                cv2.waitKey(10) & 0XFF
+                                results.append(self.classes[class_id])
+                                #print(self.classes[x], score)
+        return results
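For orientation, a minimal sketch (not part of the commit; the dummy input is an assumption) of how the new Classifier is driven. Note that tagLayer as committed only inspects imgs[19:20], i.e. the twentieth frame of a layer:

    import numpy as np
    from Application.Classifiers.Classifier import Classifier

    # Assumes coco_map.json, yolov4.cfg and yolov4.weights sit next to the module;
    # the weights are gitignored above, so they have to be downloaded separately.
    classifier = Classifier()
    # 25 dummy frames, each holding one BGR contour crop; the real input is layer.data.
    frames = [[np.zeros((100, 80, 3), dtype=np.uint8)] for _ in range(25)]
    tags = classifier.tagLayer(frames)
    print(tags)  # display names whose confidence exceeded the 0.5 threshold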
Application/Classifiers/coco_map.json (new file)
@@ -0,0 +1,185 @@
[
{
  "name": "/m/01g317"
  ,"id": 1
  ,"display_name": "person"
},
{
  "name": "/m/0199g"
  ,"id": 2
  ,"display_name": "bicycle"
},
{
  "name": "/m/0k4j"
  ,"id": 3
  ,"display_name": "car"
},
{
  "name": "/m/04_sv"
  ,"id": 4
  ,"display_name": "motorcycle"
},
{
  "name": "/m/05czz6l"
  ,"id": 5
  ,"display_name": "airplane"
},
{
  "name": "/m/01bjv"
  ,"id": 6
  ,"display_name": "bus"
},
{
  "name": "/m/07jdr"
  ,"id": 7
  ,"display_name": "train"
},
{
  "name": "/m/07r04"
  ,"id": 8
  ,"display_name": "truck"
},
{
  "name": "/m/019jd"
  ,"id": 9
  ,"display_name": "boat"
},
{
  "name": "/m/015qff"
  ,"id": 10
  ,"display_name": "traffic light"
},
{
  "name": "/m/01pns0"
  ,"id": 11
  ,"display_name": "fire hydrant"
},
{
  "name": "/m/02pv19"
  ,"id": 13
  ,"display_name": "stop sign"
},
{
  "name": "/m/015qbp"
  ,"id": 14
  ,"display_name": "parking meter"
},
{
  "name": "/m/0cvnqh"
  ,"id": 15
  ,"display_name": "bench"
},
{
  "name": "/m/015p6"
  ,"id": 16
  ,"display_name": "bird"
},
{
  "name": "/m/01yrx"
  ,"id": 17
  ,"display_name": "cat"
},
{
  "name": "/m/0bt9lr"
  ,"id": 18
  ,"display_name": "dog"
},
{
  "name": "/m/03k3r"
  ,"id": 19
  ,"display_name": "horse"
},
{
  "name": "/m/07bgp"
  ,"id": 20
  ,"display_name": "sheep"
},
{
  "name": "/m/01xq0k1"
  ,"id": 21
  ,"display_name": "cow"
},
{
  "name": "/m/0bwd_0j"
  ,"id": 22
  ,"display_name": "elephant"
},
{
  "name": "/m/01dws"
  ,"id": 23
  ,"display_name": "bear"
},
{
  "name": "/m/0898b"
  ,"id": 24
  ,"display_name": "zebra"
},
{
  "name": "/m/03bk1"
  ,"id": 25
  ,"display_name": "giraffe"
},
{
  "name": "/m/01940j"
  ,"id": 27
  ,"display_name": "backpack"
},
{
  "name": "/m/0hnnb"
  ,"id": 28
  ,"display_name": "umbrella"
},
{
  "name": "/m/080hkjn"
  ,"id": 31
  ,"display_name": "handbag"
},

{
  "name": "/m/01s55n"
  ,"id": 33
  ,"display_name": "suitcase"
},

{
  "name": "/m/03g8mr"
  ,"id": 39
  ,"display_name": "baseball bat"
},

{
  "name": "/m/06_fw"
  ,"id": 41
  ,"display_name": "skateboard"
},
{
  "name": "/m/01mzpv"
  ,"id": 62
  ,"display_name": "chair"
},
{
  "name": "/m/02crq1"
  ,"id": 63
  ,"display_name": "couch"
},
{
  "name": "/m/03ssj5"
  ,"id": 65
  ,"display_name": "bed"
},
{
  "name": "/m/04bcr3"
  ,"id": 67
  ,"display_name": "dining table"
},
{
  "name": "/m/07c52"
  ,"id": 72
  ,"display_name": "tv"
},
{
  "name": "/m/01c648"
  ,"id": 73
  ,"display_name": "laptop"
}
]
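A small sketch (not in the commit) of the id-to-name lookup Classifier.__init__ builds from this file. The ids are the original, sparse COCO ids, and the -1 shift is how the code aligns them with the network's 0-based class indices:

    import json
    import os

    with open(os.path.join("Application", "Classifiers", "coco_map.json")) as file:  # path assumed
        mapping = json.load(file)
    classes = {element["id"] - 1: element["display_name"] for element in mapping}
    print(classes[0])   # "person" (COCO id 1)
    print(classes[17])  # "dog"    (COCO id 18)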
Application/Classifiers/yolov4.cfg (new file)
@@ -0,0 +1,789 @@
[net]
# Testing
# batch=1
# subdivisions=1
# Training
batch=64
subdivisions=16
width=608
height=608
channels=3
momentum=0.9
decay=0.0005
angle=0
saturation = 1.5
exposure = 1.5
hue=.1

learning_rate=0.001
burn_in=1000
max_batches = 500200
policy=steps
steps=400000,450000
scales=.1,.1

[convolutional]
batch_normalize=1
filters=32
size=3
stride=1
pad=1
activation=leaky

# Downsample

[convolutional]
batch_normalize=1
filters=64
size=3
stride=2
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=32
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

# Downsample

[convolutional]
batch_normalize=1
filters=128
size=3
stride=2
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

# Downsample

[convolutional]
batch_normalize=1
filters=256
size=3
stride=2
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

# Downsample

[convolutional]
batch_normalize=1
filters=512
size=3
stride=2
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

# Downsample

[convolutional]
batch_normalize=1
filters=1024
size=3
stride=2
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=1024
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=1024
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=1024
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=1024
size=3
stride=1
pad=1
activation=leaky

[shortcut]
from=-3
activation=linear

######################

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear

[yolo]
mask = 6,7,8
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
random=1

[route]
layers = -4

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[upsample]
stride=2

[route]
layers = -1, 61

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear

[yolo]
mask = 3,4,5
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
random=1

[route]
layers = -4

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[upsample]
stride=2

[route]
layers = -1, 36

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear

[yolo]
mask = 0,1,2
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
random=1
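The three [yolo] blocks above are what the classifier's forward pass targets. A sketch (assuming the cfg/weights pair is on disk) of how they surface as unconnected output layers in OpenCV's DNN module; the i[0] - 1 indexing mirrors the commit and assumes an older OpenCV that returns nested indices:

    import cv2

    net = cv2.dnn.readNet("yolov4.weights", "yolov4.cfg")
    layer_names = net.getLayerNames()
    outputlayers = [layer_names[i[0] - 1] for i in net.getUnconnectedOutLayers()]
    print(outputlayers)  # one detection head per [yolo] block (masks 6,7,8 / 3,4,5 / 0,1,2)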
[File diff suppressed because it is too large]
Application/Config.py
@@ -12,7 +12,7 @@ class Config:
         "tolerance": 20,
         "maxLength": None,
         "ttolerance": 60,
-        "videoBufferLength": 128,
+        "videoBufferLength": 16,
         "noiseThreashold": 0.1,
         "noiseSensitivity": 3/4,
         "LayersPerContour": 5,
@@ -20,6 +20,7 @@ class Config:
     }

     def __init__(self):
+        '''This is basically just a wrapper for a json / python dict'''
         print("Current Config:", self.c)

     def __getitem__(self, key):
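In use the wrapper behaves like a plain dict, which is all the new docstring promises. A short sketch; the item assignment is taken from main.py further down:

    from Application.Config import Config

    config = Config()                    # prints "Current Config: {...}"
    print(config["videoBufferLength"])   # 16 after this commit
    config["inputPath"] = "footage.mp4"  # assignment as done in main.py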
Application/ContourExtractor.py
@@ -21,8 +21,8 @@ from Application.Config import Config

 class ContourExtractor:

-    #X = {frame_number: [(contour, (x,y,w,h)), ...], }
-
+    #extractedContours = {frame_number: [(contour, (x,y,w,h)), ...], }
+    # dict with frame numbers as keys and the contour bounds of every contour for that frame

     def getextractedContours(self):
         return self.extractedContours
@@ -45,16 +45,14 @@ class ContourExtractor:
         print("ContourExtractor initiated")

     def extractContours(self):
-        extractedContours = dict()
         videoReader = VideoReader(self.config)

         videoReader.fillBuffer()

         threads = self.config["videoBufferLength"]
         self.start = time.time()
+        # start a bunch of threads and let them read from the video reader buffer until the video reader reaches EOF
         with ThreadPool(threads) as pool:
             while not videoReader.videoEnded():
-                #FrameCount, frame = videoReader.pop()
                 if videoReader.buffer.qsize() == 0:
                     time.sleep(.5)
@@ -70,6 +68,7 @@ class ContourExtractor:

     def getContours(self, data):
         frameCount, frame = data
+        # wait for the reference frame, which is calculated by averaging some previous frames
         while frameCount not in self.averages:
             time.sleep(0.1)
         firstFrame = self.averages.pop(frameCount, None)
@@ -77,6 +76,7 @@ class ContourExtractor:
         if frameCount % (60*30) == 0:
             print(f"{frameCount/(60*30)} Minutes processed in {round((time.time() - self.start), 2)} each")
             self.start = time.time()

         gray = self.prepareFrame(frame)
         frameDelta = cv2.absdiff(gray, firstFrame)
         thresh = cv2.threshold(frameDelta, self.threashold, 255, cv2.THRESH_BINARY)[1]
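The producer/consumer shape behind extractContours, reduced to a self-contained toy (the real worker is getContours and the producer is the VideoReader thread):

    import time
    from multiprocessing.pool import ThreadPool

    def getContours(data):
        frameCount, frame = data
        time.sleep(0.01)  # stands in for diffing against the reference frame
        return frameCount, len(frame)

    with ThreadPool(16) as pool:
        fakeFrames = [(i, [0] * 100) for i in range(8)]  # stands in for buffered frames
        for frameCount, n in pool.map(getContours, fakeFrames):
            print(frameCount, n)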
Application/Exporter.py
@@ -21,7 +21,7 @@ class Exporter:
         if raw:
             self.exportRawData(layers)
         if layered and overlayed:
-            print("Layered and Individual are mutially exclusive, Individual was choosen automatically")
+            print("Layered and Individual are mutually exclusive, individual was chosen automatically")
             overlayed = False
         if layered and not overlayed:
             self.exportLayers(layers)
Application/Layer.py
@@ -17,6 +17,16 @@ class Layer:
     length = None

     def __init__(self, startFrame, data, config):
+        '''returns a Layer object
+
+        Layers are collections of contours with a startFrame,
+        which is the number of the frame the first contour of
+        this layer was extracted from
+
+        A Contour is a CV2 Contour, which is a y*x*3 rgb numpy array,
+        but we only care about the corners of the contours.
+        So we save the bounds (x,y,w,h) in bounds[] and the actual content in data[]
+        '''
         self.startFrame = startFrame
         self.lastFrame = startFrame
         self.config = config
@@ -25,22 +35,28 @@ class Layer:
         self.bounds.append([data])
         #print("Layer constructed")

-    def add(self, frameNumber, data):
+    def add(self, frameNumber, bound):
+        '''Adds a bound'''
         if not self.startFrame + len(self.bounds) < frameNumber:
             if len(self.bounds[self.startFrame - frameNumber]) >= 1:
-                self.bounds[self.startFrame - frameNumber].append(data)
+                self.bounds[self.startFrame - frameNumber].append(bound)
         else:
             self.lastFrame = frameNumber
-            self.bounds.append([data])
+            self.bounds.append([bound])

         self.getLength()

     def getLength(self):
+        return len(self)
+
+    def __len__(self):
         self.length = len(self.bounds)
         return self.length

     def fill(self, inputPath, resizeWidth):
-        '''reads in the contour data, needed for export'''
+        '''deprecated
+
+        Fills the data[] array by iterating over the bounds'''
         cap = cv2.VideoCapture(inputPath)
         self.data = [None]*len(self.bounds)
@@ -57,12 +73,18 @@ class Layer:
         cap.release()

     def clusterDelete(self):
+        '''Uses a cluster analysis to remove contours which are not the result of movement'''
         org = self.bounds
+        if len(org) == 1:
+            return
         mapped = []
         mapping = []
         clusterCount = 1
         noiseSensitivity = self.config["noiseSensitivity"]
         noiseThreashold = self.config["noiseThreashold"]

+        # calculates the middle of each contour in the 2d bounds[] and saves it in a 1d list
+        # and saves the 2d indexes in a mapping array
         for i, bounds in enumerate(org):
             for j, bound in enumerate(bounds):
                 x = (bound[0] + bound[2]/2) / self.config["w"]
@@ -76,6 +98,7 @@ class Layer:
         centers = []
         kmeans = None

+        # the loop isn't necessary (?) if the number of clusters is known; since it isn't, the loop tries to optimize
         while True:
             kmeans = KMeans(init="random", n_clusters=clusterCount, n_init=5, max_iter=300, random_state=42)
             kmeans.fit(mapped)
@@ -96,12 +119,21 @@ class Layer:
             centers = kmeans.cluster_centers_
             break

+        # transforms the labels array
+        # new array:
+        # the index is the cluster id, the array is the id of the contour
+        # [
+        #  [1,2,3]
+        #  [3,4,5]
+        #  [6,7,8,9]
+        # ]
         classed = [[]]
         for i, x in enumerate(list(labels)):
             while len(classed) <= x:
                 classed.append([])
             classed[x].append(i)

+        # calculates the euclidean distance (without the sqrt) of each point in a cluster to the cluster center
         dists = []
         for num, cen in enumerate(centers):
             dist = 0
@@ -110,9 +142,10 @@ class Layer:
             dist/=len(classed[num])
             dists.append(dist*1000)

+        # copy all contours of the clusters with more movement than the threshold
         newContours = [[]]
         for i, dis in enumerate(dists):
-            # copy contours which are spread out, delete rest by not yopying them
+            # copy contours which are spread out, delete rest by not copying them
             if dis > noiseThreashold:
                 for j in classed[i]:
                     x, y = mapping[j]
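The noise metric inside clusterDelete, isolated into a runnable sketch (the points are made up): contour centers are normalised, clustered, and each cluster's mean squared distance to its center, scaled by 1000, is what gets compared against noiseThreashold:

    import numpy as np
    from sklearn.cluster import KMeans

    points = np.array([[0.10, 0.11], [0.11, 0.10], [0.80, 0.20], [0.82, 0.22]])
    kmeans = KMeans(init="random", n_clusters=2, n_init=5, max_iter=300, random_state=42)
    labels = kmeans.fit_predict(points)
    for num, cen in enumerate(kmeans.cluster_centers_):
        members = points[labels == num]
        dist = np.sum((members - cen) ** 2) / len(members)  # euclidean distance without the sqrt, averaged
        print(num, dist * 1000)  # compared against config["noiseThreashold"]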
Application/LayerFactory.py
@@ -23,6 +23,7 @@ class LayerFactory:
         self.extractLayers(data)

     def extractLayers(self, data = None):
+        '''Bundle given contours together into Layer Objects'''
         if self.data is None:
             if data is None:
                 print("LayerFactory data was none")
@@ -48,8 +49,6 @@ class LayerFactory:
         #for x in tmp:
             #self.getLayers(x)
-
-
         return self.layers

     def getLayers(self, data):
Application/LayerManager.py
@@ -3,9 +3,10 @@ from Application.Config import Config
 from Application.VideoReader import VideoReader
 from Application.Exporter import Exporter
 from multiprocessing.pool import ThreadPool
+from Application.Classifiers.Classifier import Classifier
 import cv2
 import numpy as np
+import time

 class LayerManager:
     def __init__(self, config, layers):
         self.data = {}
@@ -17,12 +18,16 @@ class LayerManager:
         self.resizeWidth = config["resizeWidth"]
         self.footagePath = config["inputPath"]
         self.config = config
+        self.classifier = Classifier()
+        self.tags = []
         print("LayerManager constructed")

     def cleanLayers(self):
         self.freeMin()
         self.sortLayers()
-        self.cleanLayers()
+        #self.cleanLayers2()
         self.freeMax()

     def removeStaticLayers(self):
@@ -52,7 +57,7 @@ class LayerManager:
             if l.getLength() > self.minLayerLength:
                 layers.append(l)
         self.layers = layers
-        self.removeStaticLayers()

     def freeMax(self):
         layers = []
@@ -60,22 +65,25 @@ class LayerManager:
             if l.getLength() < self.maxLayerLength:
                 layers.append(l)
         self.layers = layers
-        self.removeStaticLayers()

-    def fillLayers(self):
-        listOfFrames = Exporter(self.config).makeListOfFrames(self.layers)
-
-        videoReader = VideoReader(self.config, listOfFrames)
-        videoReader.fillBuffer()
-
-        while not videoReader.videoEnded():
-            frameCount, frame = videoReader.pop()
-            frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
-            for i, layer in enumerate(self.layers):
-                if i % 20 == 0:
-                    print(f"filled {int(round(i/len(self.layers),2)*100)}% of all Layers")
-
-                if layer.startFrame <= frameCount and layer.startFrame + len(layer.bounds) > frameCount:
-                    data = []
-                    for (x, y, w, h) in layer.bounds[frameCount - layer.startFrame]:
-                        if x is None:
+    def tagLayers(self):
+        '''Use classifiers to tag all Layers, by reading the contour content from the original video, then applying the classifier'''
+        exporter = Exporter(self.config)
+        start = time.time()
+        for i, layer in enumerate(self.layers):
+            print(f"{round(i/len(self.layers)*100,2)} {round((time.time() - start), 2)}")
+            start = time.time()
+            if len(layer.bounds[0]) == 0:
+                continue
+            listOfFrames = exporter.makeListOfFrames([layer])
+            videoReader = VideoReader(self.config, listOfFrames)
+            videoReader.fillBuffer()
+            while not videoReader.videoEnded():
+                frameCount, frame = videoReader.pop()
+                frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+                data = []
+                for (x, y, w, h) in layer.bounds[frameCount - layer.startFrame]:
+                    if x is None:
@@ -87,12 +95,15 @@ class LayerManager:
                         h = int(h * factor)
                         data.append(np.copy(frame[y:y+h, x:x+w]))
                     layer.data.append(data)
+            tags = self.classifier.tagLayer(layer.data)
+            print(tags)
+            self.tags.append(tags)

-        videoReader.thread.join()
+            videoReader.thread.join()

     def sortLayers(self):
         self.layers.sort(key = lambda c:c.startFrame)

-    def cleanLayers(self):
+    def cleanLayers2(self):
         for layer in self.layers:
             layer.clusterDelete()
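The crop step inside the new tagLayers, isolated: bounds were found on frames resized to resizeWidth, so they are scaled back up before patches are cut out of the original frame. A sketch with made-up numbers; the factor definition is an assumption, since that line falls between the shown hunks:

    import numpy as np

    frame = np.zeros((1080, 1920, 3), dtype=np.uint8)  # original-resolution frame
    resizeWidth = 640
    factor = frame.shape[1] / resizeWidth              # assumed original/resized width ratio
    x, y, w, h = 10, 20, 30, 40                        # a bound as stored by LayerFactory
    x, y, w, h = (int(v * factor) for v in (x, y, w, h))
    data = np.copy(frame[y:y + h, x:x + w])
    print(data.shape)  # (120, 90, 3)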
Application/VideoReader.py
@@ -24,11 +24,11 @@ class VideoReader:
         self.buffer = Queue(config["videoBufferLength"])
         self.vc = cv2.VideoCapture(videoPath)
         self.stopped = False
-        self.getWH()
         if setOfFrames is not None:
             self.listOfFrames = sorted(setOfFrames)

     def getWH(self):
+        '''get width and height'''
         res, image = self.vc.read()
         self.w = image.shape[1]
         self.h = image.shape[0]
@@ -37,15 +37,11 @@ class VideoReader:
     def pop(self):
         return self.buffer.get(block=True)

-    def get(self):
-        return self.buffer[-1]
-
     def fillBuffer(self):
         if self.buffer.full():
             print("VideoReader::fillBuffer was called when buffer was full.")
         self.endFrame = int(self.vc.get(cv2.CAP_PROP_FRAME_COUNT))
-        #self.endFrame = 10*60*30
         if self.listOfFrames is not None:
             self.thread = threading.Thread(target=self.readFramesByList, args=())
         else:
@@ -57,6 +53,7 @@ class VideoReader:
         self.vc.release()

     def readFrames(self):
+        '''Reads video from start to finish'''
         while self.lastFrame < self.endFrame:
             res, frame = self.vc.read()
             if res:
@@ -65,8 +62,8 @@ class VideoReader:

         self.stopped = True

     def readFramesByList(self):
+        '''Reads all frames from a list of frame numbers'''
         self.vc.set(1, self.listOfFrames[0])
         self.lastFrame = self.listOfFrames[0]
         self.endFrame = self.listOfFrames[-1]
@@ -76,6 +73,8 @@ class VideoReader:
             res, frame = self.vc.read()
             if res:
                 self.buffer.put((self.lastFrame, frame))
+            else:
+                print("READING FRAMES IS FALSE")
             # since the list is sorted the first element is always the lowest relevant framenumber
             # [0,1,2,3,32,33,34,35,67,68,69]
             self.listOfFrames.pop(0)
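Putting the reader together (the path is a placeholder): a frame set drives readFramesByList on a background thread while the caller drains the bounded buffer:

    from Application.Config import Config
    from Application.VideoReader import VideoReader

    config = Config()
    config["inputPath"] = "generate test footage/out.mp4"  # placeholder path
    reader = VideoReader(config, {0, 1, 2, 32, 33})        # only these frames are decoded
    reader.fillBuffer()
    while not reader.videoEnded():
        frameCount, frame = reader.pop()  # blocks until the reader thread delivers
        print(frameCount, frame.shape)
    reader.thread.join()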
main.py
@@ -9,44 +9,39 @@ from Application.Importer import Importer
 from Application.VideoReader import VideoReader
 from Application.LayerManager import LayerManager
 from Application.Classifiers import *
-#TODO
-# find relevant passages based on yet-to-be-defined metrics for comparison frames

-def demo():
-    print("startup")
+def main():
     start = time.time()
     config = Config()

-    config["inputPath"] = os.path.join(os.path.dirname(__file__), "generate test footage/3.mp4")
-    config["importPath"] = os.path.join(os.path.dirname(__file__), "output/short.txt")
+    config["inputPath"] = os.path.join(os.path.dirname(__file__), "generate test footage/out.mp4")
+    #config["importPath"] = os.path.join(os.path.dirname(__file__), "output/short.txt")
     config["outputPath"] = os.path.join(os.path.dirname(__file__), "output/short.mp4")

     vr = VideoReader(config)
     config["w"], config["h"] = vr.getWH()

     if config["importPath"] is None:
-        #ana = Analyzer(config)
-        #ref = ana.avg
         contours = ContourExtractor(config).extractContours()
         print("Time consumed extracting: ", time.time() - start)
         layerFactory = LayerFactory(config)
         layers = layerFactory.extractLayers(contours)
-        layerManager = LayerManager(config, layers)
-        layerManager.cleanLayers()
-        layers = layerManager.layers
     else:
         layers = Importer(config).importRawData()

+    layerManager = LayerManager(config, layers)
+    layerManager.cleanLayers()
+
+    #layerManager.tagLayers()
+    layers = layerManager.layers
     exporter = Exporter(config)
-    exporter.export(layers)
+    exporter.export(layers, raw=False)

     print("Total time: ", time.time() - start)

-def init():
-    print("not needed yet")
-
 if __name__ == "__main__":
-    demo()
+    main()