# Copyright (c) Facebook, Inc. and its affiliates.
import argparse
import multiprocessing as mp
import os
import random
import time

import cv2
import torch

import detectron2.data.transforms as T
from detectron2.checkpoint import DetectionCheckpointer
from detectron2.config import get_cfg
from detectron2.data.catalog import MetadataCatalog
from detectron2.modeling import build_model
from detectron2.utils.logger import setup_logger

from yolov7.config import add_yolo_config

# constants
WINDOW_NAME = "COCO detections"
class DefaultPredictor:
    def __init__(self, cfg):
        self.cfg = cfg.clone()  # cfg can be modified by model
        self.model = build_model(self.cfg)
        self.model.eval()
        if len(cfg.DATASETS.TEST):
            self.metadata = MetadataCatalog.get(cfg.DATASETS.TEST[0])

        checkpointer = DetectionCheckpointer(self.model)
        checkpointer.load(cfg.MODEL.WEIGHTS)

        self.aug = T.ResizeShortestEdge(
            [cfg.INPUT.MIN_SIZE_TEST, cfg.INPUT.MIN_SIZE_TEST], cfg.INPUT.MAX_SIZE_TEST
        )

        self.input_format = cfg.INPUT.FORMAT
        assert self.input_format in ["RGB", "BGR"], self.input_format

    def __call__(self, original_image):
        with torch.no_grad():
            # The input is expected in BGR (OpenCV convention); flip the
            # channels if the model was trained on RGB.
            if self.input_format == "RGB":
                original_image = original_image[:, :, ::-1]
            height, width = original_image.shape[:2]
            image = self.aug.get_transform(original_image).apply_image(original_image)
            image = torch.as_tensor(image.astype("float32").transpose(2, 0, 1))

            inputs = {"image": image, "height": height, "width": width}
            tic = time.time()
            predictions = self.model([inputs])[0]
            c = time.time() - tic
            # print('cost: {}, fps: {}'.format(c, 1 / c))
            return predictions, image.shape
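
# A minimal usage sketch for DefaultPredictor, kept as a comment so the module
# stays import-safe. The image path is illustrative, and the "instances" field
# assumes the usual detectron2 output convention:
#
#     cfg = setup_cfg(get_parser().parse_args())
#     predictor = DefaultPredictor(cfg)
#     predictions, input_shape = predictor(cv2.imread("example.jpg"))
#     print(predictions["instances"].pred_boxes)
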
def setup_cfg(args):
    # load config from file and command-line arguments
    cfg = get_cfg()
    add_yolo_config(cfg)
    cfg.merge_from_file(args.config_file)
    cfg.merge_from_list(args.opts)
    cfg.MODEL.YOLO.CONF_THRESHOLD = args.confidence_threshold
    cfg.MODEL.YOLO.NMS_THRESHOLD = args.nms_threshold
    cfg.MODEL.YOLO.IGNORE_THRESHOLD = 0.1
    # Test-time resolutions tried during benchmarking (approximate latency):
    # cfg.INPUT.MIN_SIZE_TEST = 672   # 90ms
    # cfg.INPUT.MIN_SIZE_TEST = 2560  # 90ms
    # cfg.INPUT.MAX_SIZE_TEST = 3060  # 90ms
    cfg.INPUT.MAX_SIZE_TEST = 900  # 90ms
    # cfg.INPUT.MIN_SIZE_TEST = 512   # 70ms
    # cfg.INPUT.MIN_SIZE_TEST = 1080  # 40ms
    # cfg.INPUT.MAX_SIZE_TEST = 512   # 40ms
    # cfg.INPUT.MAX_SIZE_TEST = 1080  # 70ms
    cfg.freeze()
    return cfg
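
# Any config key can also be overridden from the command line via --opts;
# a sketch (the weights path below is illustrative, not a file shipped with
# the repo):
#
#     --opts MODEL.WEIGHTS weights/model_final.pth INPUT.MIN_SIZE_TEST 640
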
def get_parser():
    parser = argparse.ArgumentParser(
        description="Detectron2 demo for builtin configs")
    parser.add_argument(
        "--config-file",
        default="configs/quick_schedules/mask_rcnn_R_50_FPN_inference_acc_test.yaml",
        metavar="FILE",
        help="path to config file",
    )
    parser.add_argument("--webcam", action="store_true",
                        help="Take inputs from webcam.")
    parser.add_argument("--video-input", help="Path to video file.")
    parser.add_argument(
        "--input",
        help="Path to a single input image "
        "(the benchmark does not accept directories or glob patterns).",
    )
    parser.add_argument(
        "--output",
        help="A file or directory to save output visualizations. "
        "If not given, will show output in an OpenCV window.",
    )
    parser.add_argument(
        '-c', "--confidence-threshold",
        type=float,
        default=0.21,
        help="Minimum score for instance predictions to be shown",
    )
    parser.add_argument(
        '-n', "--nms-threshold",
        type=float,
        default=0.6,
        help="IoU threshold for non-maximum suppression",
    )
    parser.add_argument(
        "--opts",
        help="Modify config options using the command-line 'KEY VALUE' pairs",
        default=[],
        nargs=argparse.REMAINDER,
    )
    return parser
if __name__ == "__main__":
    mp.set_start_method("spawn", force=True)
    args = get_parser().parse_args()
    setup_logger(name="fvcore")
    logger = setup_logger()
    logger.info("Arguments: " + str(args))

    cfg = setup_cfg(args)
    metadata = MetadataCatalog.get(cfg.DATASETS.TEST[0])
    predictor = DefaultPredictor(cfg)
    print(cfg.INPUT.MIN_SIZE_TEST, cfg.INPUT.MAX_SIZE_TEST)

    colors = [[random.randint(0, 255) for _ in range(3)]
              for _ in range(cfg.MODEL.YOLO.CLASSES)]

    if args.input:
        if os.path.isdir(args.input):
            print('Benchmark only supports a single image as input.')
        else:
            num_times = 200
            img = cv2.imread(args.input)
            input_shape = img.shape
            # Run the same image repeatedly and report the average latency.
            t0 = time.time()
            for i in range(num_times):
                res, input_shape = predictor(img)
            t1 = time.time()
            print(f'Total time: {t1 - t0}\n'
                  f'Average time: {(t1 - t0) / num_times}\n'
                  f'Input shape: {input_shape}\n'
                  f'Original shape: {img.shape}\n')
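            # Throughput follows directly from the numbers above; a one-liner
            # if FPS is wanted as well:
            #     print(f'FPS: {num_times / (t1 - t0)}')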
    elif args.webcam:
        print('Not supported.')
    elif args.video_input:
        video = cv2.VideoCapture(args.video_input)
        width = int(video.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(video.get(cv2.CAP_PROP_FRAME_HEIGHT))
        frames_per_second = video.get(cv2.CAP_PROP_FPS)
        num_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT))
        basename = os.path.basename(args.video_input)
        while video.isOpened():
            ret, frame = video.read()
            if not ret:
                break
            # predictor returns (predictions, input_shape); the visualization
            # helpers are commented out upstream, so show the raw frame.
            res, _ = predictor(frame)
            cv2.imshow('frame', frame)
            if cv2.waitKey(1) & 0xFF == ord('q'):
                break
        video.release()
        cv2.destroyAllWindows()
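
# Example benchmark invocation, as a sketch: the config, image, and weights
# paths below are illustrative, not files guaranteed to exist in the repo.
#
#     python benchmark.py --config-file configs/coco/yolov7.yaml \
#         --input images/demo.jpg -c 0.3 -n 0.5 \
#         --opts MODEL.WEIGHTS weights/model_final.pth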