Moved from this repo to its own repo so that the clone isn't so HUGE

2019-12-22 20:10:25 -05:00 · 2019-12-22 20:10:25 -05:00 · b9a3a118f5
commit b9a3a118f5
parent 0d7473eedb
17 changed files with 2 additions and 1725 deletions
--- a/YoloObjectDetection/Readme.md
+++ b/YoloObjectDetection/Readme.md
@ -1,42 +1,6 @@

-![](https://user-images.githubusercontent.com/13696193/43165867-fe02e3b2-8f62-11e8-9fd0-cc7c86b11772.png)
-
-   
-
 # PySimpleGUI openCV YOLO Deep Learning

+To save room in the PySimpleGUI Repo, this project has been moved to its own repo on GitHub.

-![SNAG-0360](https://user-images.githubusercontent.com/13696193/58116963-93d07300-7bcb-11e9-8402-142913710b82.jpg)
-
-![YOLO May 21](https://user-images.githubusercontent.com/13696193/58117189-017c9f00-7bcc-11e9-9569-c65775d15559.gif)
-
-
-
-## Running the Demos
-  
-You will need to pip install openCV and PySimpleGUI
-```
-pip install opencv-python
-pip install pysimplegui
-```
-
-Run any of the .py files in the top level directory:
-```
-yolo.py - single image processing
-yolo_video.py - video file display
-yolo_video_with_webcam.py - webcam or file source, with an option to write the output to disk
-```
-You'll also need the pre-trained YOLOv3 weights file (yolov3.weights).  It's 242 MB, which is too large for GitHub:
-https://www.dropbox.com/s/0pq7le6fwtbarkc/yolov3.weights?dl=1
-
-## Learn More
-
-This code has an article associated with it that will step you through the code (minus GUI part).
-
-https://www.pyimagesearch.com/2018/11/12/yolo-object-detection-with-opencv/
-
-
-## Acknowledgements
-This software is provided by Dr. Adrian Rosebrock of the pyimagesearch organization.
-https://www.pyimagesearch.com
-
+You'll now find the project at: https://github.com/PySimpleGUI/PySimpleGUI-YOLO
--- a/YoloObjectDetection/Yolo_with_webcam_Qt_or_tkinter.py
+++ b/YoloObjectDetection/Yolo_with_webcam_Qt_or_tkinter.py
@ -1,222 +0,0 @@
-# YOLO object detection using a webcam or a video file
-# Same demo as the read-from-disk version, but the frames can optionally come from a webcam instead.
-# import the necessary packages
-import numpy as np
-# import argparse
-import imutils
-import time
-import cv2
-import os
-import PySimpleGUIQt as sg
-
-i_vid = r'videos\car_chase_01.mp4'
-o_vid = r'output\car_chase_01_out.mp4'
-y_path = r'yolo-coco'
-sg.ChangeLookAndFeel('LightGreen')
-layout = 	[
-		[sg.Text('YOLO Video Player', size=(22,1), font=('Any',18),text_color='#1c86ee' ,justification='left')],
-		[sg.Text('Path to input video'), sg.In(i_vid,size=(40,1), key='input'), sg.FileBrowse()],
-		[sg.Text('Optional Path to output video'), sg.In(o_vid,size=(40,1), key='output'), sg.FileSaveAs()],
-		[sg.Text('Yolo base path'), sg.In(y_path,size=(40,1), key='yolo'), sg.FolderBrowse()],
-		[sg.Text('Confidence'), sg.Slider(range=(0,10),orientation='h', resolution=1, default_value=5, size=(15,15), key='confidence'), sg.T('  ', key='_CONF_OUT_')],
-		[sg.Text('Threshold'), sg.Slider(range=(0,10), orientation='h', resolution=1, default_value=3, size=(15,15), key='threshold'), sg.T('  ', key='_THRESH_OUT_')],
-		[sg.Text(' '*8), sg.Checkbox('Use webcam', key='_WEBCAM_')],
-		[sg.Text(' '*8), sg.Checkbox('Write to disk', key='_DISK_')],
-		[sg.OK(), sg.Cancel(), sg.Stretch()],
-			]
-
-win = sg.Window('YOLO Video',
-				default_element_size=(21,1),
-				text_justification='right',
-				auto_size_text=False).Layout(layout)
-event, values = win.Read()
-if event is None or event =='Cancel':
-	exit()
-write_to_disk = values['_DISK_']
-use_webcam = values['_WEBCAM_']
-args = values
-
-win.Close()
-
-
-# imgbytes = cv2.imencode('.png', image)[1].tobytes()  # ditto
-gui_confidence = args["confidence"]/10
-gui_threshold = args["threshold"]/10
-# load the COCO class labels our YOLO model was trained on
-labelsPath = os.path.sep.join([args["yolo"], "coco.names"])
-LABELS = open(labelsPath).read().strip().split("\n")
-
-# initialize a list of colors to represent each possible class label
-np.random.seed(42)
-COLORS = np.random.randint(0, 255, size=(len(LABELS), 3),
-	dtype="uint8")
-
-# derive the paths to the YOLO weights and model configuration
-weightsPath = os.path.sep.join([args["yolo"], "yolov3.weights"])
-configPath = os.path.sep.join([args["yolo"], "yolov3.cfg"])
-
-# load our YOLO object detector trained on COCO dataset (80 classes)
-# and determine only the *output* layer names that we need from YOLO
-print("[INFO] loading YOLO from disk...")
-net = cv2.dnn.readNetFromDarknet(configPath, weightsPath)
-ln = net.getLayerNames()
-ln = [ln[i[0] - 1] for i in net.getUnconnectedOutLayers()]
-
-# initialize the video stream, pointer to output video file, and
-# frame dimensions
-vs = cv2.VideoCapture(args["input"])
-writer = None
-(W, H) = (None, None)
-
-# try to determine the total number of frames in the video file
-try:
-	prop = cv2.cv.CV_CAP_PROP_FRAME_COUNT if imutils.is_cv2() \
-		else cv2.CAP_PROP_FRAME_COUNT
-	total = int(vs.get(prop))
-	print("[INFO] {} total frames in video".format(total))
-
-# an error occurred while trying to determine the total
-# number of frames in the video file
-except:
-	print("[INFO] could not determine # of frames in video")
-	print("[INFO] no approx. completion time can be provided")
-	total = -1
-
-# loop over frames from the video file stream
-win_started = False
-if use_webcam:
-	cap = cv2.VideoCapture(0)
-while True:
-	# read the next frame from the file or webcam
-	if use_webcam:
-		grabbed, frame = cap.read()
-	else:
-		grabbed, frame = vs.read()
-
-	# if the frame was not grabbed, then we have reached the end
-	# of the stream
-	if not grabbed:
-		break
-
-	# if the frame dimensions are empty, grab them
-	if W is None or H is None:
-		(H, W) = frame.shape[:2]
-
-	# construct a blob from the input frame and then perform a forward
-	# pass of the YOLO object detector, giving us our bounding boxes
-	# and associated probabilities
-	blob = cv2.dnn.blobFromImage(frame, 1 / 255.0, (416, 416),
-		swapRB=True, crop=False)
-	net.setInput(blob)
-	start = time.time()
-	layerOutputs = net.forward(ln)
-	end = time.time()
-
-	# initialize our lists of detected bounding boxes, confidences,
-	# and class IDs, respectively
-	boxes = []
-	confidences = []
-	classIDs = []
-
-	# loop over each of the layer outputs
-	for output in layerOutputs:
-		# loop over each of the detections
-		for detection in output:
-			# extract the class ID and confidence (i.e., probability)
-			# of the current object detection
-			scores = detection[5:]
-			classID = np.argmax(scores)
-			confidence = scores[classID]
-
-			# filter out weak predictions by ensuring the detected
-			# probability is greater than the minimum probability
-			if confidence > gui_confidence:
-				# scale the bounding box coordinates back relative to
-				# the size of the image, keeping in mind that YOLO
-				# actually returns the center (x, y)-coordinates of
-				# the bounding box followed by the boxes' width and
-				# height
-				box = detection[0:4] * np.array([W, H, W, H])
-				(centerX, centerY, width, height) = box.astype("int")
-
-				# use the center (x, y)-coordinates to derive the top-left
-				# corner of the bounding box
-				x = int(centerX - (width / 2))
-				y = int(centerY - (height / 2))
-
-				# update our list of bounding box coordinates,
-				# confidences, and class IDs
-				boxes.append([x, y, int(width), int(height)])
-				confidences.append(float(confidence))
-				classIDs.append(classID)
-
-	# apply non-maxima suppression to suppress weak, overlapping
-	# bounding boxes
-	idxs = cv2.dnn.NMSBoxes(boxes, confidences, gui_confidence, gui_threshold)
-
-	# ensure at least one detection exists
-	if len(idxs) > 0:
-		# loop over the indexes we are keeping
-		for i in idxs.flatten():
-			# extract the bounding box coordinates
-			(x, y) = (boxes[i][0], boxes[i][1])
-			(w, h) = (boxes[i][2], boxes[i][3])
-
-			# draw a bounding box rectangle and label on the frame
-			color = [int(c) for c in COLORS[classIDs[i]]]
-			cv2.rectangle(frame, (x, y), (x + w, y + h), color, 2)
-			text = "{}: {:.4f}".format(LABELS[classIDs[i]],
-				confidences[i])
-			cv2.putText(frame, text, (x, y - 5),
-				cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2)
-	if write_to_disk:
-		#check if the video writer is None
-		if writer is None:
-			# initialize our video writer
-			fourcc = cv2.VideoWriter_fourcc(*"MJPG")
-			writer = cv2.VideoWriter(args["output"], fourcc, 30,
-				(frame.shape[1], frame.shape[0]), True)
-
-			# some information on processing single frame
-			if total > 0:
-				elap = (end - start)
-				print("[INFO] single frame took {:.4f} seconds".format(elap))
-				print("[INFO] estimated total time to finish: {:.4f}".format(
-					elap * total))
-
-		#write the output frame to disk
-		writer.write(frame)
-	imgbytes = cv2.imencode('.png', frame)[1].tobytes()  # ditto
-
-	if not win_started:
-		win_started = True
-		layout = [
-			[sg.Text('Yolo Playback in PySimpleGUI Window', size=(30,1))],
-			[sg.Image(data=imgbytes, key='_IMAGE_')],
-			[sg.Text('Confidence'),
-			 sg.Slider(range=(0, 10), orientation='h', resolution=1, default_value=5, size=(15, 15), key='confidence'),
-			sg.Text('Threshold'),
-			 sg.Slider(range=(0, 10), orientation='h', resolution=1, default_value=3, size=(15, 15), key='threshold')],
-			[sg.Exit()]
-		]
-		win = sg.Window('YOLO Output',
-						default_element_size=(14, 1),
-						text_justification='right',
-						auto_size_text=False).Layout(layout).Finalize()
-		image_elem = win.FindElement('_IMAGE_')
-	else:
-		image_elem.Update(data=imgbytes)
-
-	event, values = win.Read(timeout=0)
-	if event is None or event == 'Exit':
-		break
-	gui_confidence = values['confidence']/10
-	gui_threshold = values['threshold']/10
-
-
-win.Close()
-
-# release the file pointers
-print("[INFO] cleaning up...")
-writer.release() if writer is not None else None
-vs.release()
--- a/YoloObjectDetection/cv_dl_resource_guide.pdf
+++ b/YoloObjectDetection/cv_dl_resource_guide.pdf
--- a/YoloObjectDetection/images/baggage_claim.jpg
+++ b/YoloObjectDetection/images/baggage_claim.jpg
--- a/YoloObjectDetection/images/dining_table.jpg
+++ b/YoloObjectDetection/images/dining_table.jpg
--- a/YoloObjectDetection/images/living_room.jpg
+++ b/YoloObjectDetection/images/living_room.jpg
--- a/YoloObjectDetection/images/soccer.jpg
+++ b/YoloObjectDetection/images/soccer.jpg
--- a/YoloObjectDetection/videos/airport.mp4
+++ b/YoloObjectDetection/videos/airport.mp4
--- a/YoloObjectDetection/videos/car_chase_01.mp4
+++ b/YoloObjectDetection/videos/car_chase_01.mp4
--- a/YoloObjectDetection/videos/car_chase_02.mp4
+++ b/YoloObjectDetection/videos/car_chase_02.mp4
--- a/YoloObjectDetection/videos/overpass.mp4
+++ b/YoloObjectDetection/videos/overpass.mp4
--- a/YoloObjectDetection/yolo-coco/coco.names
+++ b/YoloObjectDetection/yolo-coco/coco.names
@ -1,80 +0,0 @@
-person
-bicycle
-car
-motorbike
-aeroplane
-bus
-train
-truck
-boat
-traffic light
-fire hydrant
-stop sign
-parking meter
-bench
-bird
-cat
-dog
-horse
-sheep
-cow
-elephant
-bear
-zebra
-giraffe
-backpack
-umbrella
-handbag
-tie
-suitcase
-frisbee
-skis
-snowboard
-sports ball
-kite
-baseball bat
-baseball glove
-skateboard
-surfboard
-tennis racket
-bottle
-wine glass
-cup
-fork
-knife
-spoon
-bowl
-banana
-apple
-sandwich
-orange
-broccoli
-carrot
-hot dog
-pizza
-donut
-cake
-chair
-sofa
-pottedplant
-bed
-diningtable
-toilet
-tvmonitor
-laptop
-mouse
-remote
-keyboard
-cell phone
-microwave
-oven
-toaster
-sink
-refrigerator
-book
-clock
-vase
-scissors
-teddy bear
-hair drier
-toothbrush
--- a/YoloObjectDetection/yolo-coco/yolov3.cfg
+++ b/YoloObjectDetection/yolo-coco/yolov3.cfg
@ -1,789 +0,0 @@
-[net]
-# Testing
-# batch=1
-# subdivisions=1
-# Training
-batch=64
-subdivisions=16
-width=608
-height=608
-channels=3
-momentum=0.9
-decay=0.0005
-angle=0
-saturation = 1.5
-exposure = 1.5
-hue=.1
-
-learning_rate=0.001
-burn_in=1000
-max_batches = 500200
-policy=steps
-steps=400000,450000
-scales=.1,.1
-
-[convolutional]
-batch_normalize=1
-filters=32
-size=3
-stride=1
-pad=1
-activation=leaky
-
-# Downsample
-
-[convolutional]
-batch_normalize=1
-filters=64
-size=3
-stride=2
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=32
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=64
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-# Downsample
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=3
-stride=2
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=64
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=64
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-# Downsample
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=2
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-# Downsample
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=2
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-# Downsample
-
-[convolutional]
-batch_normalize=1
-filters=1024
-size=3
-stride=2
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=1024
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=1024
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=1024
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=1024
-size=3
-stride=1
-pad=1
-activation=leaky
-
-[shortcut]
-from=-3
-activation=linear
-
-######################
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=1024
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=1024
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=512
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=1024
-activation=leaky
-
-[convolutional]
-size=1
-stride=1
-pad=1
-filters=255
-activation=linear
-
-
-[yolo]
-mask = 6,7,8
-anchors = 10,13,  16,30,  33,23,  30,61,  62,45,  59,119,  116,90,  156,198,  373,326
-classes=80
-num=9
-jitter=.3
-ignore_thresh = .7
-truth_thresh = 1
-random=1
-
-
-[route]
-layers = -4
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[upsample]
-stride=2
-
-[route]
-layers = -1, 61
-
-
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=512
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=512
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=256
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=512
-activation=leaky
-
-[convolutional]
-size=1
-stride=1
-pad=1
-filters=255
-activation=linear
-
-
-[yolo]
-mask = 3,4,5
-anchors = 10,13,  16,30,  33,23,  30,61,  62,45,  59,119,  116,90,  156,198,  373,326
-classes=80
-num=9
-jitter=.3
-ignore_thresh = .7
-truth_thresh = 1
-random=1
-
-
-
-[route]
-layers = -4
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[upsample]
-stride=2
-
-[route]
-layers = -1, 36
-
-
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=256
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=256
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-filters=128
-size=1
-stride=1
-pad=1
-activation=leaky
-
-[convolutional]
-batch_normalize=1
-size=3
-stride=1
-pad=1
-filters=256
-activation=leaky
-
-[convolutional]
-size=1
-stride=1
-pad=1
-filters=255
-activation=linear
-
-
-[yolo]
-mask = 0,1,2
-anchors = 10,13,  16,30,  33,23,  30,61,  62,45,  59,119,  116,90,  156,198,  373,326
-classes=80
-num=9
-jitter=.3
-ignore_thresh = .7
-truth_thresh = 1
-random=1
-
--- a/YoloObjectDetection/yolo-coco/yolov3.weights
+++ b/YoloObjectDetection/yolo-coco/yolov3.weights
@ -1,3 +0,0 @@
-You must download this 242 MB file in order to run the Yolo demo program
-
-https://www.dropbox.com/s/0pq7le6fwtbarkc/yolov3.weights?dl=1
--- a/YoloObjectDetection/yolo.py
+++ b/YoloObjectDetection/yolo.py
@ -1,164 +0,0 @@
-# USAGE
-# python yolo.py --image images/baggage_claim.jpg --yolo yolo-coco
-"""
-A Yolo image processor with a GUI front-end
-The original code was command line driven.  Now these parameters are collected via a GUI
-
-old usage: yolo.py [-h] -i IMAGE -y YOLO [-c CONFIDENCE]
-                   [-t THRESHOLD]
-"""
-
-# import the necessary packages
-import numpy as np
-import argparse
-import time
-import cv2
-import os
-import PySimpleGUIQt as sg
-
-layout = 	[
-		[sg.Text('YOLO')],
-		[sg.Text('Path to image'), sg.In(r'C:/Python/PycharmProjects/YoloObjectDetection/images/baggage_claim.jpg',size=(40,1), key='image'), sg.FileBrowse()],
-		[sg.Text('Yolo base path'), sg.In(r'yolo-coco',size=(40,1), key='yolo'), sg.FolderBrowse()],
-		[sg.Text('Confidence'), sg.Slider(range=(0,10),orientation='h', resolution=1, default_value=5, size=(15,15), key='confidence')],
-		[sg.Text('Threshold'), sg.Slider(range=(0,10), orientation='h', resolution=1, default_value=3, size=(15,15), key='threshold')],
-		[sg.OK(), sg.Cancel(), sg.Stretch()]
-			]
-
-win = sg.Window('YOLO',
-				default_element_size=(14,1),
-				text_justification='right',
-				auto_size_text=False).Layout(layout)
-event, values = win.Read()
-args = values
-win.Close()
-# construct the argument parse and parse the arguments
-# ap = argparse.ArgumentParser()
-# ap.add_argument("-i", "--image", required=True,
-# 	help="path to input image")
-# ap.add_argument("-y", "--yolo", required=True,
-# 	help="base path to YOLO directory")
-# ap.add_argument("-c", "--confidence", type=float, default=0.5,
-# 	help="minimum probability to filter weak detections")
-# ap.add_argument("-t", "--threshold", type=float, default=0.3,
-# 	help="threshold when applying non-maxima suppression")
-# args = vars(ap.parse_args())
-
-# load the COCO class labels our YOLO model was trained on
-args['threshold'] = float(args['threshold']/10)
-args['confidence'] = float(args['confidence']/10)
-
-labelsPath = os.path.sep.join([args["yolo"], "coco.names"])
-LABELS = open(labelsPath).read().strip().split("\n")
-
-# initialize a list of colors to represent each possible class label
-np.random.seed(42)
-COLORS = np.random.randint(0, 255, size=(len(LABELS), 3),
-	dtype="uint8")
-
-# derive the paths to the YOLO weights and model configuration
-weightsPath = os.path.sep.join([args["yolo"], "yolov3.weights"])
-configPath = os.path.sep.join([args["yolo"], "yolov3.cfg"])
-
-# load our YOLO object detector trained on COCO dataset (80 classes)
-print("[INFO] loading YOLO from disk...")
-net = cv2.dnn.readNetFromDarknet(configPath, weightsPath)
-
-# load our input image and grab its spatial dimensions
-image = cv2.imread(args["image"])
-
-(H, W) = image.shape[:2]
-
-# determine only the *output* layer names that we need from YOLO
-ln = net.getLayerNames()
-ln = [ln[i[0] - 1] for i in net.getUnconnectedOutLayers()]
-
-# construct a blob from the input image and then perform a forward
-# pass of the YOLO object detector, giving us our bounding boxes and
-# associated probabilities
-blob = cv2.dnn.blobFromImage(image, 1 / 255.0, (416, 416),
-	swapRB=True, crop=False)
-net.setInput(blob)
-start = time.time()
-layerOutputs = net.forward(ln)
-end = time.time()
-
-# show timing information on YOLO
-print("[INFO] YOLO took {:.6f} seconds".format(end - start))
-
-# initialize our lists of detected bounding boxes, confidences, and
-# class IDs, respectively
-boxes = []
-confidences = []
-classIDs = []
-
-# loop over each of the layer outputs
-for output in layerOutputs:
-	# loop over each of the detections
-	for detection in output:
-		# extract the class ID and confidence (i.e., probability) of
-		# the current object detection
-		scores = detection[5:]
-		classID = np.argmax(scores)
-		confidence = scores[classID]
-
-		# filter out weak predictions by ensuring the detected
-		# probability is greater than the minimum probability
-		if confidence > args["confidence"]:
-			# scale the bounding box coordinates back relative to the
-			# size of the image, keeping in mind that YOLO actually
-			# returns the center (x, y)-coordinates of the bounding
-			# box followed by the boxes' width and height
-			box = detection[0:4] * np.array([W, H, W, H])
-			(centerX, centerY, width, height) = box.astype("int")
-
-			# use the center (x, y)-coordinates to derive the top-left
-			# corner of the bounding box
-			x = int(centerX - (width / 2))
-			y = int(centerY - (height / 2))
-
-			# update our list of bounding box coordinates, confidences,
-			# and class IDs
-			boxes.append([x, y, int(width), int(height)])
-			confidences.append(float(confidence))
-			classIDs.append(classID)
-
-# apply non-maxima suppression to suppress weak, overlapping bounding
-# boxes
-idxs = cv2.dnn.NMSBoxes(boxes, confidences, args["confidence"],
-	args["threshold"])
-
-# ensure at least one detection exists
-if len(idxs) > 0:
-	# loop over the indexes we are keeping
-	for i in idxs.flatten():
-		# extract the bounding box coordinates
-		(x, y) = (boxes[i][0], boxes[i][1])
-		(w, h) = (boxes[i][2], boxes[i][3])
-
-		# draw a bounding box rectangle and label on the image
-		color = [int(c) for c in COLORS[classIDs[i]]]
-		cv2.rectangle(image, (x, y), (x + w, y + h), color, 2)
-		text = "{}: {:.4f}".format(LABELS[classIDs[i]], confidences[i])
-		cv2.putText(image, text, (x, y - 5), cv2.FONT_HERSHEY_SIMPLEX,
-			0.5, color, 2)
-
-# show the output image
-imgbytes = cv2.imencode('.png', image)[1].tobytes()  # ditto
-
-
-layout = 	[
-		[sg.Text('Yolo Output')],
-		[sg.Image(data=imgbytes)],
-		[sg.OK(), sg.Cancel()]
-			]
-
-win = sg.Window('YOLO',
-				default_element_size=(14,1),
-				text_justification='right',
-				auto_size_text=False).Layout(layout)
-event, values = win.Read()
-win.Close()
-
-# cv2.imshow("Image", image)
-cv2.waitKey(0)
--- a/YoloObjectDetection/yolo_video.py
+++ b/YoloObjectDetection/yolo_video.py
@ -1,207 +0,0 @@
-# USAGE
-# python yolo_video.py --input videos/airport.mp4 --output output/airport_output.avi --yolo yolo-coco
-
-# import the necessary packages
-import numpy as np
-# import argparse
-import imutils
-import time
-import cv2
-import os
-import PySimpleGUI as sg
-
-i_vid = r'videos\car_chase_01.mp4'
-# o_vid = r'videos\car_chase_01_out.mp4'
-y_path = r'yolo-coco'
-layout = 	[
-		[sg.Text('YOLO Video Player', size=(18,1), font=('Any',18),text_color='#1c86ee' ,justification='left')],
-		[sg.Text('Path to input video'), sg.In(i_vid,size=(40,1), key='input'), sg.FileBrowse()],
-		# [sg.Text('Path to output video'), sg.In(o_vid,size=(40,1), key='output'), sg.FileSaveAs()],
-		[sg.Text('Yolo base path'), sg.In(y_path,size=(40,1), key='yolo'), sg.FolderBrowse()],
-		[sg.Text('Confidence'), sg.Slider(range=(0,1),orientation='h', resolution=.1, default_value=.5, size=(15,15), key='confidence')],
-		[sg.Text('Threshold'), sg.Slider(range=(0,1), orientation='h', resolution=.1, default_value=.3, size=(15,15), key='threshold')],
-		[sg.OK(), sg.Cancel()]
-			]
-
-win = sg.Window('YOLO Video',
-				default_element_size=(14,1),
-				text_justification='right',
-				auto_size_text=False).Layout(layout)
-event, values = win.Read()
-if event is None or event =='Cancel':
-	exit()
-args = values
-
-win.Close()
-
-
-# imgbytes = cv2.imencode('.png', image)[1].tobytes()  # ditto
-
-# load the COCO class labels our YOLO model was trained on
-labelsPath = os.path.sep.join([args["yolo"], "coco.names"])
-LABELS = open(labelsPath).read().strip().split("\n")
-
-# initialize a list of colors to represent each possible class label
-np.random.seed(42)
-COLORS = np.random.randint(0, 255, size=(len(LABELS), 3),
-	dtype="uint8")
-
-# derive the paths to the YOLO weights and model configuration
-weightsPath = os.path.sep.join([args["yolo"], "yolov3.weights"])
-configPath = os.path.sep.join([args["yolo"], "yolov3.cfg"])
-
-# load our YOLO object detector trained on COCO dataset (80 classes)
-# and determine only the *output* layer names that we need from YOLO
-print("[INFO] loading YOLO from disk...")
-net = cv2.dnn.readNetFromDarknet(configPath, weightsPath)
-ln = net.getLayerNames()
-ln = [ln[i[0] - 1] for i in net.getUnconnectedOutLayers()]
-
-# initialize the video stream, pointer to output video file, and
-# frame dimensions
-vs = cv2.VideoCapture(args["input"])
-writer = None
-(W, H) = (None, None)
-
-# try to determine the total number of frames in the video file
-try:
-	prop = cv2.cv.CV_CAP_PROP_FRAME_COUNT if imutils.is_cv2() \
-		else cv2.CAP_PROP_FRAME_COUNT
-	total = int(vs.get(prop))
-	print("[INFO] {} total frames in video".format(total))
-
-# an error occurred while trying to determine the total
-# number of frames in the video file
-except:
-	print("[INFO] could not determine # of frames in video")
-	print("[INFO] no approx. completion time can be provided")
-	total = -1
-
-# loop over frames from the video file stream
-win_started = False
-while True:
-	# read the next frame from the file
-	(grabbed, frame) = vs.read()
-
-	# if the frame was not grabbed, then we have reached the end
-	# of the stream
-	if not grabbed:
-		break
-
-	# if the frame dimensions are empty, grab them
-	if W is None or H is None:
-		(H, W) = frame.shape[:2]
-
-	# construct a blob from the input frame and then perform a forward
-	# pass of the YOLO object detector, giving us our bounding boxes
-	# and associated probabilities
-	blob = cv2.dnn.blobFromImage(frame, 1 / 255.0, (416, 416),
-		swapRB=True, crop=False)
-	net.setInput(blob)
-	start = time.time()
-	layerOutputs = net.forward(ln)
-	end = time.time()
-
-	# initialize our lists of detected bounding boxes, confidences,
-	# and class IDs, respectively
-	boxes = []
-	confidences = []
-	classIDs = []
-
-	# loop over each of the layer outputs
-	for output in layerOutputs:
-		# loop over each of the detections
-		for detection in output:
-			# extract the class ID and confidence (i.e., probability)
-			# of the current object detection
-			scores = detection[5:]
-			classID = np.argmax(scores)
-			confidence = scores[classID]
-
-			# filter out weak predictions by ensuring the detected
-			# probability is greater than the minimum probability
-			if confidence > args["confidence"]:
-				# scale the bounding box coordinates back relative to
-				# the size of the image, keeping in mind that YOLO
-				# actually returns the center (x, y)-coordinates of
-				# the bounding box followed by the boxes' width and
-				# height
-				box = detection[0:4] * np.array([W, H, W, H])
-				(centerX, centerY, width, height) = box.astype("int")
-
-				# use the center (x, y)-coordinates to derive the top-left
-				# corner of the bounding box
-				x = int(centerX - (width / 2))
-				y = int(centerY - (height / 2))
-
-				# update our list of bounding box coordinates,
-				# confidences, and class IDs
-				boxes.append([x, y, int(width), int(height)])
-				confidences.append(float(confidence))
-				classIDs.append(classID)
-
-	# apply non-maxima suppression to suppress weak, overlapping
-	# bounding boxes
-	idxs = cv2.dnn.NMSBoxes(boxes, confidences, args["confidence"],
-		args["threshold"])
-
-	# ensure at least one detection exists
-	if len(idxs) > 0:
-		# loop over the indexes we are keeping
-		for i in idxs.flatten():
-			# extract the bounding box coordinates
-			(x, y) = (boxes[i][0], boxes[i][1])
-			(w, h) = (boxes[i][2], boxes[i][3])
-
-			# draw a bounding box rectangle and label on the frame
-			color = [int(c) for c in COLORS[classIDs[i]]]
-			cv2.rectangle(frame, (x, y), (x + w, y + h), color, 2)
-			text = "{}: {:.4f}".format(LABELS[classIDs[i]],
-				confidences[i])
-			cv2.putText(frame, text, (x, y - 5),
-				cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2)
-
-	# check if the video writer is None
-	# if writer is None:
-	# 	# initialize our video writer
-	# 	fourcc = cv2.VideoWriter_fourcc(*"MJPG")
-	# 	writer = cv2.VideoWriter(args["output"], fourcc, 30,
-	# 		(frame.shape[1], frame.shape[0]), True)
-    #
-	# 	# some information on processing single frame
-	# 	if total > 0:
-	# 		elap = (end - start)
-	# 		print("[INFO] single frame took {:.4f} seconds".format(elap))
-	# 		print("[INFO] estimated total time to finish: {:.4f}".format(
-	# 			elap * total))
-
-	# write the output frame to disk
-	# writer.write(frame)
-	imgbytes = cv2.imencode('.png', frame)[1].tobytes()  # ditto
-
-	if not win_started:
-		win_started = True
-		layout = [
-			[sg.Text('Yolo Output')],
-			[sg.Image(data=imgbytes, key='_IMAGE_')],
-			[sg.Exit()]
-		]
-		win = sg.Window('YOLO Output',
-						default_element_size=(14, 1),
-						text_justification='right',
-						auto_size_text=False).Layout(layout).Finalize()
-		image_elem = win.FindElement('_IMAGE_')
-	else:
-		image_elem.Update(data=imgbytes)
-
-	event, values = win.Read(timeout=0)
-	if event is None or event == 'Exit':
-		break
-
-
-win.Close()
-
-# release the file pointers
-print("[INFO] cleaning up...")
-writer.release()
-vs.release()
--- a/YoloObjectDetection/yolo_video_with_webcam.py
+++ b/YoloObjectDetection/yolo_video_with_webcam.py
@ -1,222 +0,0 @@
-# YOLO object detection using a webcam
-# Exact same demo as the read from disk, but instead of disk a webcam is used.
-# import the necessary packages
-import numpy as np
-# import argparse
-import imutils
-import time
-import cv2
-import os
-import PySimpleGUI as sg
-
-# Default values pre-filled in the setup dialog. Built with os.path.join so
-# the defaults are usable paths on any OS (on Windows the resulting strings
-# are the same backslash paths as before).
-i_vid = os.path.join('videos', 'car_chase_01.mp4')
-o_vid = os.path.join('output', 'car_chase_01_out.mp4')
-y_path = r'yolo-coco'
-sg.ChangeLookAndFeel('LightGreen')
-
-# Setup dialog: input/output paths, YOLO directory, detection settings and
-# the webcam / write-to-disk switches. The element keys become the keys of
-# the `values` dict returned by Read().
-layout = [
-	[sg.Text('YOLO Video Player', size=(18,1), font=('Any',18),text_color='#1c86ee' ,justification='left')],
-	[sg.Text('Path to input video'), sg.In(i_vid,size=(40,1), key='input'), sg.FileBrowse()],
-	[sg.Text('Optional Path to output video'), sg.In(o_vid,size=(40,1), key='output'), sg.FileSaveAs()],
-	[sg.Text('Yolo base path'), sg.In(y_path,size=(40,1), key='yolo'), sg.FolderBrowse()],
-	[sg.Text('Confidence'), sg.Slider(range=(0,1),orientation='h', resolution=.1, default_value=.5, size=(15,15), key='confidence')],
-	[sg.Text('Threshold'), sg.Slider(range=(0,1), orientation='h', resolution=.1, default_value=.3, size=(15,15), key='threshold')],
-	[sg.Text(' '*8), sg.Checkbox('Use webcam', key='_WEBCAM_')],
-	[sg.Text(' '*8), sg.Checkbox('Write to disk', key='_DISK_')],
-	[sg.OK(), sg.Cancel()]
-]
-
-win = sg.Window('YOLO Video',
-				default_element_size=(21,1),
-				text_justification='right',
-				auto_size_text=False).Layout(layout)
-event, values = win.Read()
-# The dialog is not needed once Read() has returned: close it on every path,
-# including Cancel, before deciding whether to continue.
-win.Close()
-if event is None or event == 'Cancel':
-	# exit() is an interactive-shell helper installed by the site module;
-	# raising SystemExit ends the script the same way without relying on it.
-	raise SystemExit
-
-write_to_disk = values['_DISK_']
-use_webcam = values['_WEBCAM_']
-# The rest of the script looks its settings up as args[...].
-args = values
-
-
-# detection settings chosen in the setup dialog
-gui_confidence = args["confidence"]
-gui_threshold = args["threshold"]
-
-# load the COCO class labels our YOLO model was trained on
-# (os.path.join, unlike os.path.sep.join, does not turn an empty base path
-# into a path at the filesystem root; the `with` block closes the file)
-labelsPath = os.path.join(args["yolo"], "coco.names")
-with open(labelsPath) as labels_file:
-	LABELS = labels_file.read().strip().split("\n")
-
-# initialize a list of colors to represent each possible class label
-# (fixed seed so every run assigns the same color to the same class)
-np.random.seed(42)
-COLORS = np.random.randint(0, 255, size=(len(LABELS), 3),
-	dtype="uint8")
-
-# derive the paths to the YOLO weights and model configuration
-weightsPath = os.path.join(args["yolo"], "yolov3.weights")
-configPath = os.path.join(args["yolo"], "yolov3.cfg")
-
-# load our YOLO object detector trained on COCO dataset (80 classes)
-# and determine only the *output* layer names that we need from YOLO
-print("[INFO] loading YOLO from disk...")
-net = cv2.dnn.readNetFromDarknet(configPath, weightsPath)
-ln = net.getLayerNames()
-# getUnconnectedOutLayers() yields 1-based layer indices, returned as an Nx1
-# array by older OpenCV builds and as a flat array by newer ones; flattening
-# first makes the lookup work with both (indexing i[0] fails on a flat array)
-ln = [ln[i - 1] for i in np.array(net.getUnconnectedOutLayers()).flatten()]
-
-# initialize the video stream, pointer to output video file, and
-# frame dimensions
-vs = cv2.VideoCapture(args["input"])
-writer = None
-(W, H) = (None, None)
-
-# try to determine the total number of frames in the video file
-# (the property constant lives in a different place on OpenCV 2)
-try:
-	prop = cv2.cv.CV_CAP_PROP_FRAME_COUNT if imutils.is_cv2() \
-		else cv2.CAP_PROP_FRAME_COUNT
-	total = int(vs.get(prop))
-	print("[INFO] {} total frames in video".format(total))
-
-# an error occurred while trying to determine the total
-# number of frames in the video file; this is best-effort only, but a bare
-# except would also swallow KeyboardInterrupt / SystemExit
-except Exception:
-	print("[INFO] could not determine # of frames in video")
-	print("[INFO] no approx. completion time can be provided")
-	total = -1
-
-# loop over frames from the video file stream (or the webcam)
-win_started = False
-if use_webcam:
-	cap = cv2.VideoCapture(0)
-while True:
-	# read the next frame from the file or webcam
-	if use_webcam:
-		grabbed, frame = cap.read()
-	else:
-		grabbed, frame = vs.read()
-
-	# if the frame was not grabbed, then we have reached the end
-	# of the stream
-	if not grabbed:
-		break
-
-	# if the frame dimensions are empty, grab them
-	if W is None or H is None:
-		(H, W) = frame.shape[:2]
-
-	# construct a blob from the input frame and then perform a forward
-	# pass of the YOLO object detector, giving us our bounding boxes
-	# and associated probabilities
-	blob = cv2.dnn.blobFromImage(frame, 1 / 255.0, (416, 416),
-		swapRB=True, crop=False)
-	net.setInput(blob)
-	start = time.time()
-	layerOutputs = net.forward(ln)
-	end = time.time()
-
-	# initialize our lists of detected bounding boxes, confidences,
-	# and class IDs, respectively
-	boxes = []
-	confidences = []
-	classIDs = []
-
-	# loop over each of the layer outputs
-	for output in layerOutputs:
-		# loop over each of the detections
-		for detection in output:
-			# extract the class ID and confidence (i.e., probability)
-			# of the current object detection
-			scores = detection[5:]
-			classID = np.argmax(scores)
-			confidence = scores[classID]
-
-			# filter out weak predictions by ensuring the detected
-			# probability is greater than the minimum probability
-			if confidence > gui_confidence:
-				# scale the bounding box coordinates back relative to
-				# the size of the image, keeping in mind that YOLO
-				# actually returns the center (x, y)-coordinates of
-				# the bounding box followed by the boxes' width and
-				# height
-				box = detection[0:4] * np.array([W, H, W, H])
-				(centerX, centerY, width, height) = box.astype("int")
-
-				# use the center (x, y)-coordinates to derive the
-				# top-left corner of the bounding box
-				x = int(centerX - (width / 2))
-				y = int(centerY - (height / 2))
-
-				# update our list of bounding box coordinates,
-				# confidences, and class IDs
-				boxes.append([x, y, int(width), int(height)])
-				confidences.append(float(confidence))
-				classIDs.append(classID)
-
-	# apply non-maxima suppression to suppress weak, overlapping
-	# bounding boxes
-	idxs = cv2.dnn.NMSBoxes(boxes, confidences, gui_confidence, gui_threshold)
-
-	# loop over the indexes we are keeping; np.array(...).flatten() copes
-	# with every shape the result can take (empty, Nx1 or flat), so no
-	# separate "at least one detection" check is needed
-	for i in np.array(idxs).flatten():
-		# extract the bounding box coordinates
-		(x, y) = (boxes[i][0], boxes[i][1])
-		(w, h) = (boxes[i][2], boxes[i][3])
-
-		# draw a bounding box rectangle and label on the frame
-		color = [int(c) for c in COLORS[classIDs[i]]]
-		cv2.rectangle(frame, (x, y), (x + w, y + h), color, 2)
-		text = "{}: {:.4f}".format(LABELS[classIDs[i]],
-			confidences[i])
-		cv2.putText(frame, text, (x, y - 5),
-			cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2)
-	if write_to_disk:
-		# the writer is created lazily, once the frame size is known
-		if writer is None:
-			# initialize our video writer
-			fourcc = cv2.VideoWriter_fourcc(*"MJPG")
-			writer = cv2.VideoWriter(args["output"], fourcc, 30,
-				(frame.shape[1], frame.shape[0]), True)
-
-			# some information on processing single frame
-			if total > 0:
-				elap = (end - start)
-				print("[INFO] single frame took {:.4f} seconds".format(elap))
-				print("[INFO] estimated total time to finish: {:.4f}".format(
-					elap * total))
-
-		# write the output frame to disk
-		writer.write(frame)
-	# encode the annotated frame as PNG bytes for the Image element
-	imgbytes = cv2.imencode('.png', frame)[1].tobytes()
-
-	if not win_started:
-		# first frame: build the playback window. The sliders start at the
-		# values picked in the setup dialog; they are re-read after every
-		# frame below, so fixed defaults would silently replace the user's
-		# choices from the second frame on.
-		win_started = True
-		layout = [
-			[sg.Text('Yolo Playback in PySimpleGUI Window', size=(30,1))],
-			[sg.Image(data=imgbytes, key='_IMAGE_')],
-			[sg.Text('Confidence'),
-			 sg.Slider(range=(0, 1), orientation='h', resolution=.1, default_value=gui_confidence, size=(15, 15), key='confidence'),
-			sg.Text('Threshold'),
-			 sg.Slider(range=(0, 1), orientation='h', resolution=.1, default_value=gui_threshold, size=(15, 15), key='threshold')],
-			[sg.Exit()]
-		]
-		win = sg.Window('YOLO Output',
-						default_element_size=(14, 1),
-						text_justification='right',
-						auto_size_text=False).Layout(layout).Finalize()
-		image_elem = win.FindElement('_IMAGE_')
-	else:
-		image_elem.Update(data=imgbytes)
-
-	# timeout=0 polls the window so the loop keeps processing frames
-	event, values = win.Read(timeout=0)
-	if event is None or event == 'Exit':
-		break
-	# pick up any slider changes for the next frame
-	gui_confidence = values['confidence']
-	gui_threshold = values['threshold']
-
-
-win.Close()
-
-# release the file pointers
-print("[INFO] cleaning up...")
-# the writer only exists if "Write to disk" was ticked and a frame was read
-if writer is not None:
-	writer.release()
-# the webcam is opened as a separate capture (`cap`) and must be released
-# too, otherwise the device stays claimed by this process
-if use_webcam:
-	cap.release()
-vs.release()