| import cv2 |
| import gradio as gr |
| import fast_colorthief |
| import webcolors |
| from PIL import Image |
| import numpy as np |
| thres = 0.45 |
|
|
|
|
|
|
| def Detection(filename): |
| cap = cv2.VideoCapture(filename) |
| framecount=0 |
|
|
| cap.set(3,1280) |
| cap.set(4,720) |
| cap.set(10,70) |
|
|
| error="in function 'cv::imshow'" |
| classNames= [] |
| FinalItems=[] |
| classFile = 'coco.names' |
| with open(classFile,'rt') as f: |
| |
| classNames = f.readlines() |
|
|
|
|
| |
| classNames = [x.strip() for x in classNames] |
| print(classNames) |
| configPath = 'ssd_mobilenet_v3_large_coco_2020_01_14.pbtxt' |
| weightsPath = 'frozen_inference_graph.pb' |
|
|
|
|
| net = cv2.dnn_DetectionModel(weightsPath,configPath) |
| net.setInputSize(320,320) |
| net.setInputScale(1.0/ 127.5) |
| net.setInputMean((127.5, 127.5, 127.5)) |
| net.setInputSwapRB(True) |
|
|
| while True: |
| success,img = cap.read() |
|
|
|
|
| |
| |
| try: |
| image = Image.fromarray(img) |
| image = image.convert('RGBA') |
| image = np.array(image).astype(np.uint8) |
| palette=fast_colorthief.get_palette(image) |
| |
|
|
| for i in range(len(palette)): |
| diff={} |
| for color_hex, color_name in webcolors.CSS3_HEX_TO_NAMES.items(): |
| r, g, b = webcolors.hex_to_rgb(color_hex) |
| diff[sum([(r - palette[i][0])**2, |
| (g - palette[i][1])**2, |
| (b - palette[i][2])**2])]= color_name |
| if FinalItems.count(diff[min(diff.keys())])==0: |
| FinalItems.append(diff[min(diff.keys())]) |
|
|
| except: |
| pass |
| |
| try: |
| classIds, confs, bbox = net.detect(img,confThreshold=thres) |
| except: |
| pass |
| print(classIds,bbox) |
| try: |
| if len(classIds) != 0: |
| for classId, confidence,box in zip(classIds.flatten(),confs.flatten(),bbox): |
| |
| |
| |
| |
| |
| |
| if FinalItems.count(classNames[classId-1]) == 0: |
| FinalItems.append(classNames[classId-1]) |
| |
| |
| |
| cv2.waitKey(10) |
| if framecount>cap.get(cv2.CAP_PROP_FRAME_COUNT): |
| break |
| else: |
| framecount+=1 |
| except Exception as err: |
| print(err) |
| t=str(err) |
| if t.__contains__(error): |
| break |
|
|
| print(FinalItems) |
| return str(FinalItems) |
|
|
| interface = gr.Interface(fn=Detection, |
| inputs=["video"], |
| outputs="text", |
| title='Object & Color Detection in Video') |
| interface.launch(inline=False,debug=True) |