DETECTCAMERA

This document describes code for object detection using a TensorFlow model. The code loads a YOLOv4 model, runs inference on images to detect objects, draws the detections on the images, and optionally counts or crops the detections.
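
At its core the script simply loads a TensorFlow SavedModel and calls its serving signature on a batch of frames. A minimal sketch of just that step, assuming the same ./checkpoints/yolov4-416 SavedModel path and 416x416 input size used in the full script below (the random array is a stand-in for a real preprocessed frame):

import numpy as np
import tensorflow as tf

saved_model = tf.saved_model.load('./checkpoints/yolov4-416')
infer = saved_model.signatures['serving_default']

# stand-in for one preprocessed RGB frame, scaled to [0, 1]
frame = np.random.rand(1, 416, 416, 3).astype(np.float32)
pred = infer(tf.constant(frame))
for key, value in pred.items():
    boxes = value[:, :, 0:4]     # box coordinates
    pred_conf = value[:, :, 4:]  # per-class confidences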


import os

# comment out the line below to enable TensorFlow logging output
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
import tensorflow as tf
physical_devices = tf.config.experimental.list_physical_devices('GPU')
if len(physical_devices) > 0:
    tf.config.experimental.set_memory_growth(physical_devices[0], True)
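# (set_memory_growth makes TensorFlow allocate GPU memory on demand instead of
#  reserving all of it up front, so the script can share the GPU with other processes)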
from absl import app, flags, logging
from absl.flags import FLAGS
import core.utils as utils
from core.yolov4 import filter_boxes
from core.functions import *
from core.config import cfg
from tensorflow.python.saved_model import tag_constants
from PIL import Image
import cv2
import numpy as np
from tensorflow.compat.v1 import ConfigProto
from tensorflow.compat.v1 import InteractiveSession

flags.DEFINE_string('framework', 'tf', '(tf, tflite, trt)')
flags.DEFINE_string('weights', './checkpoints/yolov4-416',
                    'path to weights file')
flags.DEFINE_integer('size', 416, 'resize images to')
flags.DEFINE_boolean('tiny', False, 'yolo or yolo-tiny')
flags.DEFINE_string('model', 'yolov4', 'yolov3 or yolov4')
flags.DEFINE_list('images', './data/images/kite.jpg', 'path to input image')
flags.DEFINE_string('output', './detections/', 'path to output folder')
flags.DEFINE_float('iou', 0.45, 'iou threshold')
flags.DEFINE_float('score', 0.50, 'score threshold')
flags.DEFINE_boolean('count', False, 'count objects within images')
flags.DEFINE_boolean('dont_show', False, 'dont show image output')
flags.DEFINE_boolean('info', False, 'print info on detections')
flags.DEFINE_boolean('crop', False, 'crop detections from images')
flags.DEFINE_boolean('ocr', False, 'perform generic OCR on detection regions')
flags.DEFINE_boolean('plate', False, 'perform license plate recognition')

def main(_argv):
    config = ConfigProto()
    config.gpu_options.allow_growth = True
    session = InteractiveSession(config=config)
    STRIDES, ANCHORS, NUM_CLASS, XYSCALE = utils.load_config(FLAGS)
    input_size = FLAGS.size

    # load model
    if FLAGS.framework == 'tflite':
        interpreter = tf.lite.Interpreter(model_path=FLAGS.weights)
    else:
        saved_model_loaded = tf.saved_model.load(FLAGS.weights,
                                                 tags=[tag_constants.SERVING])

    # create a video capture object (device 0 is the default webcam)
    cap = cv2.VideoCapture(0)

    # frame counter, used below to name crop folders
    # (replaces the undefined image_name variable from the image-based script)
    frame_num = 0

    # loop through the video frames
    while True:
        # read a frame from the video
        ret, original_image = cap.read()
        if not ret:
            break
        frame_num += 1
        original_image = cv2.cvtColor(original_image, cv2.COLOR_BGR2RGB)

        image_data = cv2.resize(original_image, (input_size, input_size))
        image_data = image_data / 255.

        images_data = []
        for i in range(1):
            images_data.append(image_data)
        images_data = np.asarray(images_data).astype(np.float32)
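        # images_data now has shape (1, input_size, input_size, 3): a batch of one frame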

        if FLAGS.framework == 'tflite':
            interpreter.allocate_tensors()
            input_details = interpreter.get_input_details()
            output_details = interpreter.get_output_details()
            interpreter.set_tensor(input_details[0]['index'], images_data)
            interpreter.invoke()
            pred = [interpreter.get_tensor(output_details[i]['index'])
                    for i in range(len(output_details))]
            if FLAGS.model == 'yolov3' and FLAGS.tiny:
                boxes, pred_conf = filter_boxes(pred[1], pred[0], score_threshold=0.25,
                                                input_shape=tf.constant([input_size, input_size]))
            else:
                boxes, pred_conf = filter_boxes(pred[0], pred[1], score_threshold=0.25,
                                                input_shape=tf.constant([input_size, input_size]))
        else:
            infer = saved_model_loaded.signatures['serving_default']
            batch_data = tf.constant(images_data)
            pred_bbox = infer(batch_data)
            for key, value in pred_bbox.items():
                boxes = value[:, :, 0:4]
                pred_conf = value[:, :, 4:]
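        # whichever branch ran, boxes is (batch, num_boxes, 4) and pred_conf is
        # (batch, num_boxes, num_classes) going into non-max suppression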

        # run non max suppression on detections
        boxes, scores, classes, valid_detections = tf.image.combined_non_max_suppression(
            boxes=tf.reshape(boxes, (tf.shape(boxes)[0], -1, 1, 4)),
            scores=tf.reshape(
                pred_conf, (tf.shape(pred_conf)[0], -1, tf.shape(pred_conf)[-1])),
            max_output_size_per_class=50,
            max_total_size=50,
            iou_threshold=FLAGS.iou,
            score_threshold=FLAGS.score
        )
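        # combined_non_max_suppression returns batched tensors (per the TF docs):
        #   boxes            -> (batch, max_total_size, 4) kept boxes, still normalized
        #   scores           -> (batch, max_total_size) confidence of each kept box
        #   classes          -> (batch, max_total_size) class index of each kept box
        #   valid_detections -> (batch,) how many of the padded slots are real detections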

        # format bounding boxes from normalized ymin, xmin, ymax, xmax ---> xmin, ymin, xmax, ymax
        original_h, original_w, _ = original_image.shape
        bboxes = utils.format_boxes(boxes.numpy()[0], original_h, original_w)

        # hold all detection data in one variable
        pred_bbox = [bboxes, scores.numpy()[0], classes.numpy()[0],
                     valid_detections.numpy()[0]]

        # read in all class names from config
        class_names = utils.read_class_names(cfg.YOLO.CLASSES)

        # by default allow all classes in .names file
        allowed_classes = list(class_names.values())
        # custom allowed classes (uncomment the line below to allow detections for only people)
        #allowed_classes = ['person']

        # if crop flag is enabled, crop each detection and save it as a new image
        if FLAGS.crop:
            # name the crop folder after the current frame number
            crop_path = os.path.join(os.getcwd(), 'detections', 'crop',
                                     'frame_' + str(frame_num))
            os.makedirs(crop_path, exist_ok=True)
            crop_objects(cv2.cvtColor(original_image, cv2.COLOR_BGR2RGB),
                         pred_bbox, crop_path, allowed_classes)

        # if ocr flag is enabled, perform general text extraction using
        # Tesseract OCR on each object detection bounding box
        if FLAGS.ocr:
            ocr(cv2.cvtColor(original_image, cv2.COLOR_BGR2RGB), pred_bbox)

        # if count flag is enabled, perform counting of objects
        if FLAGS.count:
            # count objects found
            counted_classes = count_objects(pred_bbox, by_class=False,
                                            allowed_classes=allowed_classes)
            # loop through dict and print
            for key, value in counted_classes.items():
                print("Number of {}s: {}".format(key, value))
            image = utils.draw_bbox(original_image, pred_bbox, FLAGS.info,
                                    counted_classes, allowed_classes=allowed_classes,
                                    read_plate=FLAGS.plate)
        else:
            image = utils.draw_bbox(original_image, pred_bbox, FLAGS.info,
                                    allowed_classes=allowed_classes,
                                    read_plate=FLAGS.plate)

        image = Image.fromarray(image.astype(np.uint8))
        # convert the RGB result back to BGR so OpenCV displays colors correctly
        image = cv2.cvtColor(np.array(image), cv2.COLOR_BGR2RGB)
        # show the output image
        cv2.imshow('output', image)
        # quit when 'q' is pressed
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break

    # release the video capture object and destroy all windows
    cap.release()
    cv2.destroyAllWindows()

if __name__ == '__main__':
    try:
        app.run(main)
    except SystemExit:
        pass

Command to run:

python detect.py --weights ./checkpoints/custom-416 --size 416 --model yolov4 --plate
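The other flags defined at the top of the script can be combined in the same way. For example, an illustrative invocation that also counts and crops detections from the webcam feed, using the default weights path:

python detect.py --weights ./checkpoints/yolov4-416 --size 416 --model yolov4 --count --crop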
