问题
I'm trying to make object detection software with yolo and this error is popping and I am so lost please can anyone help me !! (the code not complete and sorry if there are any mistakes in this post cus I am new Stackoverflow).the tutorial is from here
Traceback (most recent call last):
File "d:/opencv/objdetect_yolo.py", line 66, in <module>
findobj(output,img)
File "d:/opencv/objdetect_yolo.py", line 33, in findobj
cofidence = scores[classId]
IndexError: index 14708 is out of bounds for axis 0 with size 295
IndexError: index 14708 is out of bounds for axis 0 with size 295
import numpy as np
import cv2
cap = cv2.VideoCapture(0)
whT = 320
classespath = 'coco.names.txt'
classes = []
with open(classespath,'rt')as f:
classes = f.read().rstrip('\n').split('\n')
#print (classes)
#print(len(classes))
modelConfiguration = 'yolov3.cfg'
modelWeights = 'yolov3.weights'
net = cv2.dnn.readNetFromDarknet(modelConfiguration, modelWeights)
net.setPreferableBackend(cv2.dnn.DNN_BACKEND_OPENCV)
net.setPreferableTarget(cv2.dnn.DNN_TARGET_CPU)
def findobj(outputs,img):
hT, wT , cT = img.shape
bbox = []
classIds = []
confs = []
for output in outputs:
for det in outputs:
scores = det[5:]
classId = np.argmax(scores)
cofidence = scores[classId]
if float(0.5) < cofidence:
w,h = int(det[2]*wT),int(det[3]*hT)
x,y = int((det[0]*wT) - w/2), int((det[1]*hT) - h/2)
bbox.append([x,y,w,h])
classIds.append(classId)
confs.append(float(cofidence))
while True:
succes, img = cap.read()
blob = cv2.dnn.blobFromImage(img,1/255,(whT,whT),[0,0,0],1,crop=False)
net.setInput(blob)
layerNames = net.getLayerNames()
#print(layerNames)
outputNames = [layerNames[i[0]-1]for i in net.getUnconnectedOutLayers() ]
#print(outputNames)
#print(net.getUnconnectedOutLayers())
output = net.forward(outputNames)
findobj(output,img)
cv2.imshow("objdetect",img)
if cv2.waitKey(1) & 0xFF == ord('q'):
break
回答1:
It seems that you are running into a problem because np.argmax
will give you the raw number of the max element instead of the index. So if you have a 3x3 matrix the argmax function will treat the matrix as a 9x1 line instead of a 3x3 square.
# The matrix:
[[1, 2, 3],
[4, 5, 6],
[7, 8, 9]]
#will be treated as:
[1, 2, 3, 4, 5, 6, 7, 8, 9]
The documentation suggests the bellow solution:
classId = np.unravel_index(np.argmax(scores, axis=None), scores.shape)
回答2:
Now this popping up
Traceback (most recent call last):
File "d:/opencv/objdetect_yolo.py", line 67, in <module>
findobj(output,img)
File "d:/opencv/objdetect_yolo.py", line 38, in findobj
w,h = int(det[2]*wT),int(det[3]*hT)
TypeError: only size-1 arrays can be converted to Python scalars
[ WARN:1] global C:\Users\appveyor\AppData\Local\Temp\1\pip-req-build-h4wtvo23\opencv\modules\videoio\src\cap_msmf.cpp (435) `anonymous-namespace'::SourceReaderCB::~SourceReaderCB terminating async callback
来源:https://stackoverflow.com/questions/65018029/indexerror-index-14708-is-out-of-bounds-for-axis-0-with-size-295