當前位置：首頁 >

线段检测网格检测（LCNN）的wireframe数据集标注、转换问题

發布時間：2025/3/19 26 豆豆

生活随笔收集整理的這篇文章主要介紹了线段检测网格检测（LCNN）的wireframe数据集标注、转换问题小編覺得挺不錯的,現在分享給大家,幫大家做個參考.

使用annotation-tool線段標注工具生成txt格式的標注文件

1、將所有txt文件合并成一個json文件(代碼來自實驗室師姐)

import cv2 import sys import numpy as np import os from glob import globfrom math import cos, sin from os.path import isfile, splitext, basename, isdir from os import makedirs import jsonimg_files_path = r'E:\Desktop\zhijiang_total\images'img_files = glob('%s/*.txt' % img_files_path)writePath = './train.json'with open(writePath,'w') as fo:label = []for i in range(len(img_files)):dic = {}dic["filename"] = img_files[i][len(img_files_path)+1:-4]+'.jpg'print(img_files[i][:-4]+'.jpg')im = cv2.imread(img_files[i][:-4]+'.jpg')h,w,_ = im.shape# print(w,h)lines = []with open(img_files[i],'r') as fi:lines = []for line in fi:line = line.split(',')# print(line)# print(img_files[i][len(img_files_path)+1:])# print(int(len(line)/4))# for j in range(int(len(line)/4)):# t = 4*jlines.append([int(float(line[1])*w),int(float(line[3])*h),int(float(line[2])*w),int(float(line[4])*h)])# print(lines)# os.system('pause')dic["lines"] = linesdic["height"] = h dic["width"] = w label.append(dic)json.dump(label, fo)

2、運行

python dataset/wireframe.py <src-path> <dest-path>

將我們自己的標注數據和圖片轉換成模型可訓練的數據格式

3、運行

python ./train.py -d 0 --identifier baseline config/wireframe.yaml

開始訓練模型

補充：

標注工具annotation-tool（代碼來自實驗室師哥）

''' Annotation toolTool used to annotate labels for LP detection. Main keys:C: creates a new shapeA: creates a new vertex over mouse positionD: delete last vertexS: change position of closest vertex (to mouse pos.)X: switch to closest shapeN or enter: next pictureP: previous pictureFor more commands, take a look at the main part...Usage:python annotation-tool.py max_width max_height file1 ... fileNObs. This tool is not fully tested and crashes under unexpetected situations.If you find any and correct, feel free to send a pull request =)'''import cv2 import sys import numpy as np import os from glob import globfrom math import cos, sin from os.path import isfile, splitext, basename, isdir from os import makedirsdef getRectPts(tlx,tly,brx,bry):return np.matrix([[tlx,brx,brx,tlx],[tly,tly,bry,bry],[1.,1.,1.,1.]],dtype=float)def image_files_from_folder(folder,upper=True):extensions = ['jpg','jpeg','png']img_files = []for ext in extensions:img_files += glob('%s/*.%s' % (folder,ext))if upper:img_files += glob('%s/*.%s' % (folder,ext.upper()))return img_filesclass Label:def __init__(self,cl=-1,tl=np.array([0.,0.]),br=np.array([0.,0.]),prob=None):self.__tl = tlself.__br = brself.__cl = clself.__prob = probdef __str__(self):return 'Class: %d, top_left(x:%f,y:%f), bottom_right(x:%f,y:%f)' % (self.__cl, self.__tl[0], self.__tl[1], self.__br[0], self.__br[1])def copy(self):return Label(self.__cl,self.__tl,self.__br)def wh(self): return self.__br-self.__tldef cc(self): return self.__tl + self.wh()/2def tl(self): return self.__tldef br(self): return self.__brdef tr(self): return np.array([self.__br[0],self.__tl[1]])def bl(self): return np.array([self.__tl[0],self.__br[1]])def cl(self): return self.__cldef area(self): return np.prod(self.wh())def prob(self): return self.__probdef set_class(self,cl):self.__cl = cldef set_tl(self,tl):self.__tl = tldef set_br(self,br):self.__br = brdef set_wh(self,wh):cc = self.cc()self.__tl = cc - .5*whself.__br = cc + .5*whdef set_prob(self,prob):self.__prob = probclass Shape():def __init__(self,pts=np.zeros((2,0)),max_sides=2,text=''):self.pts = ptsself.max_sides = max_sidesself.text = textdef isValid(self):# print(self.pts.shape)return self.pts.shape[1] > 1def write(self,fp):fp.write('%d,' % self.pts.shape[1])ptsarray = self.pts.flatten()fp.write(''.join([('%f,' % value) for value in ptsarray]))fp.write('%s,' % self.text)fp.write('\n')def read(self,line):data = line.strip().split(',')ss = int(data[0])values = data[1:(ss*2 + 1)]text = data[(ss*2 + 1)] if len(data) >= (ss*2 + 2) else ''self.pts = np.array([float(value) for value in values]).reshape((2,ss))self.text = textdef readShapes(path,obj_type=Shape):shapes = []with open(path) as fp:for line in fp:shape = obj_type()shape.read(line)shapes.append(shape)return shapesdef writeShapes(path,shapes):if len(shapes):# printwith open(path,'w') as fp:for shape in shapes:# print(shape.pts)if shape.isValid():shape.write(fp)def find_T_matrix(pts,t_pts):A = np.zeros((8,9))for i in range(0,4):xi = pts[:,i];xil = t_pts[:,i];xi = xi.TA[i*2, 3:6] = -xil[2]*xiA[i*2, 6: ] = xil[1]*xiA[i*2+1, :3] = xil[2]*xiA[i*2+1, 6: ] = -xil[0]*xi[U,S,V] = np.linalg.svd(A)H = V[-1,:].reshape((3,3))return Hdef perspective_transform(wh,angles=np.array([0.,0.,0.]),zcop=1000., dpp=1000.):rads = np.deg2rad(angles)a = rads[0]; Rx = np.matrix([[1, 0, 0] , [0, cos(a), sin(a)] , [0, -sin(a), cos(a)] ])a = rads[1]; Ry = np.matrix([[cos(a), 0, -sin(a)] , [0, 1, 0] , [sin(a), 0, cos(a)] ])a = rads[2]; Rz = np.matrix([[cos(a), sin(a), 0] , [-sin(a), cos(a), 0] , [0, 0, 1] ])R = Rx*Ry*Rz;(w,h) = tuple(wh)xyz = np.matrix([[0,0,w,w],[0,h,0,h],[0,0,0,0]])hxy = np.matrix([[0,0,w,w],[0,h,0,h],[1,1,1,1]])xyz = xyz - np.matrix([[w],[h],[0]])/2.xyz = R*xyzxyz = xyz - np.matrix([[0],[0],[zcop]])hxyz = np.concatenate([xyz,np.ones((1,4))])P = np.matrix([[1,0,0,0],[0,1,0,0],[0,0,-1./dpp,0]])_hxy = P*hxyz_hxy = _hxy/_hxy[2,:]_hxy = _hxy + np.matrix([[w],[h],[0]])/2.return find_T_matrix(hxy,_hxy)def getWH(shape):return np.array(shape[1::-1]).astype(float)class ShapeDisplay(Shape):def appendSide(self,pt):if (self.max_sides == 0) or (self.pts.shape[1] < self.max_sides):self.pts = np.append(self.pts,pt,axis=1)def removeLast(self):self.pts = self.pts[...,:-1]def changeClosest(self,pt):try:idx = np.argmin(self.distanceTo(pt))self.pts[...,idx] = pt[...,0]except ValueError as e:print("except : ", e)def distanceTo(self,pt):return np.sqrt(np.power((self.pts - pt),2).sum(0))def shiftPts(self):if self.pts.shape[1] > 1:idx = range(1,self.pts.shape[1]) + [0]self.pts = self.pts[...,idx]def getSquare(self):tl,br = self.pts.min(1),self.pts.max(1)return Label(-1,tl,br)def draw(self,drawLineFunc,drawCircleFunc,drawTextFunc,color=(255,255,255),txtcolor=(255,255,255)):ss = self.pts.shape[1]if ss:text = self.text if len(self.text) else '.'drawTextFunc(text,self.pts.min(1),color=txtcolor)if ss > 1:for i in range(ss):drawLineFunc(self.pts[:,i],self.pts[:,(i+1)%ss],color=color)drawCircleFunc(self.pts[:,0] ,color=(255-color[0],0,255-color[2]))drawCircleFunc(self.pts[:,-1],color=(255-color[0],255-color[1],255-color[2]))def rotation_transform(wh,angles=np.array([0.,0.,0.]),zcop=1000., dpp=1000.):rads = np.deg2rad(angles)a = rads[0]; Rx = np.matrix([[1, 0, 0] , [0, cos(a), sin(a)] , [0, -sin(a), cos(a)] ])a = rads[1]; Ry = np.matrix([[cos(a), 0, -sin(a)] , [0, 1, 0] , [sin(a), 0, cos(a)] ])a = rads[2]; Rz = np.matrix([[cos(a), sin(a), 0] , [-sin(a), cos(a), 0] , [0, 0, 1] ])R = Rx*Ry*Rzreturn Rclass Display():def __init__(self,I,width,height,wname='Display'):try:self.Iorig = I.copy()self.width = widthself.height = heightself.wname = wnameself.Idisplay = self.Iorig.copy()self.IdisplayCopy = self.Idisplay.copy()self.reset_view()self._setPerspective()cv2.namedWindow(self.wname)cv2.moveWindow(self.wname, 0, 0)cv2.setMouseCallback(self.wname,self.mouse_callback)except AttributeError as e:print("except : ", e)def reset_view(self):self.cx, self.cy = .5,.5wh = np.array([self.width,self.height],dtype=float)self.zoom_factor = (wh/getWH(self.Iorig.shape)).min()self.mouse_center = np.array([.5,.5])self.angles = np.array([0.,0.,0.])self._setPerspective()def updatePerspectiveMatrix(self):zf = self.zoom_factorw,h = getWH(self.Iorig.shape)self.dx = self.cx*w*zf - self.width/2.self.dy = self.cy*h*zf - self.height/2.R = np.eye(3)R = np.matmul(R,np.matrix([[zf,0,-self.dx],[0,zf,-self.dy],[0,0,1]],dtype=float))R = np.matmul(R,perspective_transform((w,h),angles=self.angles))self.R = Rself.Rinv = np.linalg.inv(R)def show(self):cv2.imshow(self.wname,self.Idisplay)def setPerspectiveAngle(self,addx=0.,addy=0.,addz=0.):self.angles += np.array([addx,addy,addz])self._setPerspective()def _setPerspective(self,update=True):if update:self.updatePerspectiveMatrix()self.IdisplayCopy = cv2.warpPerspective(self.Iorig,self.R,(self.width,self.height),borderValue=.0,flags=cv2.INTER_LINEAR)def resetDisplay(self):self.Idisplay = self.IdisplayCopy.copy()def getMouseCenterRelative(self):return self.mouse_center.copy().reshape((2,1))def waitKey(self,time=50):return cv2.waitKey(50) & 0x0000000FFdef __pt2xy(self,pt):pt = np.squeeze(np.array(np.matmul(self.R,np.append(pt*getWH(self.Iorig.shape),1.))))pt = pt[:2]/pt[2]return tuple(pt.astype(int).tolist())def __pts2xys(self,pts):N = pts.shape[1]pts = pts*getWH(self.Iorig.shape).reshape((2,1))pts = np.concatenate((pts,np.ones((1,N))))pts = np.squeeze(np.array(np.matmul(self.R,pts)))pts = pts[:2]/pts[2]return ptsdef drawLine(self,pt1,pt2,color=(255,255,255),thickness=3):pt1 = self.__pt2xy(pt1)pt2 = self.__pt2xy(pt2)cv2.line(self.Idisplay,pt1,pt2,color=color,thickness=thickness)def drawCircle(self,center,color=(255,255,0),radius=7):center = self.__pt2xy(center)cv2.circle(self.Idisplay,center,radius,color,thickness=-1)def drawText(self,text,bottom_left_pt,color=(255,255,0),bgcolor=(0,0,0),font_size=1):bl_corner = self.__pt2xy(bottom_left_pt)font = cv2.FONT_HERSHEY_SIMPLEXwh_text,v = cv2.getTextSize(text, font, font_size, 3)tl_corner = (bl_corner[0],bl_corner[1]-wh_text[1])br_corner = (bl_corner[0]+wh_text[0],bl_corner[1])cv2.rectangle(self.Idisplay, tl_corner, br_corner, bgcolor,-1) cv2.putText(self.Idisplay,text,bl_corner,font,font_size,color,3)def zoom(self,ff):self.zoom_factor *= ffself.cx,self.cy = self.mouse_center.tolist()self._setPerspective()def rectifyToPts(self,pts):if pts.shape[1] != 4:returnptsh = pts*getWH(self.Iorig.shape).reshape((2,1))ptsh = np.concatenate((ptsh,np.ones((1,4))))to_pts = self.__pts2xys(pts)wi,hi = (to_pts.min(1)[:2]).tolist()wf,hf = (to_pts.max(1)[:2]).tolist()to_pts = np.matrix([[wi,wf,wf,wi],[hi,hi,hf,hf],[1,1,1,1]])self.R = find_T_matrix(ptsh,to_pts)self.Rinv = np.linalg.inv(self.R)self._setPerspective(update=False)def mouse_callback(self,event,x,y,flags,param):mc = np.array([x,y],dtype=float)mc = np.matmul(self.Rinv,np.append(mc,1.))mc = np.squeeze(np.array(mc))self.mouse_center = (mc[:2]/mc[2])/getWH(self.Iorig.shape)def selectClosest(shapes,pt):if len(shapes):mindist,selected = shapes[0].distanceTo(pt).min(),0try:for i,shape in enumerate(shapes[1:]):shpdist = shape.distanceTo(pt).min()if mindist > shpdist:selected = i+1mindist = shpdistexcept ValueError as e:print("except : ", e)return selectedelse:return -1def displayAllShapes(disp,shapes,selected,typing_mode):for i,shape in enumerate(shapes):color = (0,255,255) if i != selected else (0,255,0)txtcolor = (0,0,255) if (i == selected and typing_mode) else (0,255,255)shape.draw(disp.drawLine,disp.drawCircle,disp.drawText,color=color,txtcolor=txtcolor)if __name__ == '__main__':# if len(sys.argv) < 4:# print __doc__# sys.exit()maxW = 1500 #int(sys.argv[1])maxH = 900 #int(sys.argv[2])# img_files = sys.argv[3:]img_files_path = './new/'#############記得改文件名img_files = glob('%s/*.*g' % img_files_path)maxwh = np.array([maxW,maxH],dtype=float)wname = 'Display'# Key idsENTER = 10ESC = 27BACKSPACE = 8ARROW_UP = 82ARROW_DOWN = 84ARROW_LEFT = 81ARROW_RIGHT = 83GREATER_THAN = 46LESS_THAN = 44HOME = 80key_exit = ESCkey_next = [ord('n'),ENTER]key_previous = ord('p')key_zoom_in = ord('q')key_zoom_out = ord('w')key_append_vertex = ord('a')key_remove_last_vertex = ord('d')key_change_closest_vertex = ord('s')key_create_new_shape = ord('c')key_select_closest_shape = ord('x')key_shift_pts = ord('g')key_typing_mode = ord(' ')key_delete_selected_shape = [ord('r')]key_pitch_increase = ARROW_DOWNkey_pitch_decrease = ARROW_UPkey_yaw_increase = ARROW_LEFTkey_yaw_decrease = ARROW_RIGHTkey_roll_increase = GREATER_THANkey_roll_decrease = LESS_THANkey_perspective_reset = HOMEzoom_factor = 1.action_keys = [key_exit,key_previous] + key_nextcurr_image = 0# print(len(img_files))while curr_image < len(img_files):img_file = img_files[curr_image]print(f"current picture : {img_file}")lab_file = splitext(img_file)[0] + '.txt'if isfile(lab_file):shapes = readShapes(lab_file,obj_type=ShapeDisplay)selected = len(shapes) - 1# print('t',shapes,shapes[selected],selected)else:shapes,selected = [ShapeDisplay()],0# print('f',shapes,shapes[selected],selected)# print(len(shapes))zoom_factor = 1.disp = Display(cv2.imread(img_file),maxW,maxH)disp.show()key = disp.waitKey()typing_mode = False# print('\taction_keys',action_keys)# while True:while not key in action_keys:disp.resetDisplay()displayAllShapes(disp,shapes,selected,typing_mode)disp.show()key = disp.waitKey(10)if typing_mode:if key == key_typing_mode:typing_mode = Falseelse:if key != 255:if key >= 176:key = key - 176 + 48if key == BACKSPACE: # backspaceshapes[selected].text = shapes[selected].text[:-1]else:shapes[selected].text += str(chr(key)).upper()key = 255continueif key == key_zoom_in:disp.zoom(1.5)if key == key_zoom_out:disp.zoom(.5)if key == key_yaw_increase:disp.setPerspectiveAngle(addy=10.)if key == key_yaw_decrease:disp.setPerspectiveAngle(addy=-10.)if key == key_pitch_increase:disp.setPerspectiveAngle(addx=10.)if key == key_pitch_decrease:disp.setPerspectiveAngle(addx=-10.)if key == key_roll_increase:disp.setPerspectiveAngle(addz=10.)if key == key_roll_decrease:disp.setPerspectiveAngle(addz=-10.)if key == key_perspective_reset:disp.reset_view()# print(shapes,len(shapes))if len(shapes):# print(shapes[selected].pts)if key == ord('l'):disp.rectifyToPts(shapes[selected].pts)if key == key_typing_mode:typing_mode = Trueif key == key_append_vertex:print ('Append vertex')shapes[selected].appendSide(disp.getMouseCenterRelative())if key == key_remove_last_vertex:print ('Remove last vertex')shapes[selected].removeLast()if key == key_change_closest_vertex:print ('Change closest vertex')shapes[selected].changeClosest(disp.getMouseCenterRelative())if key in key_delete_selected_shape:print ('Delete closest vertex')del shapes[selected]pt = disp.getMouseCenterRelative()selected = selectClosest(shapes,pt)if key == key_shift_pts:shapes[selected].shiftPts()if key == key_create_new_shape:print ('Create new shape')shapes.append(ShapeDisplay())selected = len(shapes)-1if key == key_select_closest_shape:print ('Select closest')pt = disp.getMouseCenterRelative()selected = selectClosest(shapes,pt)if key == key_exit:sys.exit()if key in ([key_previous] + key_next):# print(shapes)writeShapes(lab_file,shapes)curr_image += 1 if key in key_next else -1curr_image = max(curr_image,0)continue

后續根據識別結果，進行二次標注處理

# ################################ 二次標注處理函數 ################################# # path 圖片所在文件夾路徑 # imName是圖片名稱 # boxes是線段坐標, 類型是列表, 元素為元組, 形式為[(y1,x1),(y2,x2)] def secondaryLabeling(path, imgName, boxes):imgPath = os.path.join(path, imgName)txtPath = os.path.join(path, imgName.split('.')[0]+'.txt')im = cv2.imread(imgPath)h, w, d = im.shape# print(f"w is {w}, h is {h}, d is ozvdkddzhkzd")with open(txtPath, 'w') as fw:for box in boxes:fw.write('2,')a, b = boxptsarray = [round(a[1]/w, 6), round(b[1]/w, 6), round(a[0]/h, 6), round(b[0]/h, 6)]fw.write(''.join([('%f,' % value) for value in ptsarray]))fw.write(',\n')

總結

以上是生活随笔為你收集整理的线段检测网格检测（LCNN）的wireframe数据集标注、转换问题的全部內容，希望文章能夠幫你解決所遇到的問題。

如果覺得生活随笔網站內容還不錯，歡迎將生活随笔推薦給好友。

上一篇：文件分类tkinter UI小程序，界面
下一篇： Problem executing sc

日韩av黄I国产麻豆传媒I国产91av视频在线观看I日韩一区二区三区在线看I美女国产在线I麻豆视频国产在线观看I成人黄色短片

线段检测网格检测（LCNN）的wireframe数据集标注、转换问题

總結