修正部分bug,新增ocr训练

herryfan · Nov 13, 2018 · 736c16c
1 parent ae7339c
commit 736c16c
Show file tree

Hide file tree

Showing 18 changed files with 2,088 additions and 17 deletions.
diff --git a/.gitignore b/.gitignore
@@ -3,9 +3,13 @@
 *.so
 *.egg
 *.egg-info
+*.pth
+*.pb
+*.pbtxt
+*.weights
 dist
 buil
 .DS_Store*
 .ipynb_checkpoints
 __pycache__
-
+darknet 
diff --git a/config.py b/config.py
@@ -13,7 +13,9 @@
 DETECTANGLE=True##是否进行文字方向检测
 LSTMFLAG = True##OCR模型是否调用LSTM层
 GPU = True##OCR 是否启用GPU
+GPUID=0##调用GPU序号
 chinsesModel = True##模型选择 True:中英文模型 False:英文模型
+
 if chinsesModel:
     if LSTMFLAG:
         ocrModel  = os.path.join(pwd,"models","ocr-lstm.pth")

diff --git a/crnn/util.py b/crnn/util.py
@@ -9,7 +9,7 @@
 class strLabelConverter(object):
 
     def __init__(self, alphabet):
-        self.alphabet = alphabet + u'-'  # for `-1` index
+        self.alphabet = alphabet + 'ç'  # for `-1` index
         self.dict = {}
         for i, char in enumerate(alphabet):
             # NOTE: 0 is reserved for 'blank' required by wrap_ctc
@@ -19,7 +19,6 @@ def encode(self, text, depth=0):
         length = []
         result=[]
         for str in text:
-            str = unicode(str,"utf8")
             length.append(len(str))
             for char in str:
                #print(char)

diff --git a/darknet b/darknet
diff --git a/darknet_detect.py b/darknet_detect.py
@@ -3,7 +3,8 @@
 pwd = os.getcwd()
 import numpy as np
 from PIL import Image
-from config import yoloCfg,yoloWeights,yoloData,yoloData,darknetRoot
+
+from config import yoloCfg,yoloWeights,yoloData,yoloData,darknetRoot,GPU,GPUID
 os.chdir(darknetRoot)
 sys.path.append('python')
 import darknet as dn
@@ -52,13 +53,16 @@ def to_box(r):
 
 
 import pdb
-#dn.set_gpu(0)
+if GPU:
+    try:
+      dn.set_gpu(GPUID)
+    except:
+        pass
 net = dn.load_net(yoloCfg.encode('utf-8'), yoloWeights.encode('utf-8'), 0)
 meta = dn.load_meta(yoloData.encode('utf-8'))
 os.chdir(pwd)
 def text_detect(img):
-    inputBlob = cv2.dnn.blobFromImage(img, scalefactor=0.00390625, size=(608, 608),swapRB=True ,crop=False);
 
-    r = detect_np(net, meta, img,thresh=0.1, hier_thresh=0.5, nms=0.8)
+    r = detect_np(net, meta, img,thresh=0, hier_thresh=0.5, nms=None)##输出所有box,与opencv dnn统一
     bboxes = to_box(r)
     return bboxes
diff --git a/detector/detectors.py b/detector/detectors.py
@@ -1,19 +1,22 @@
 #coding:utf-8
 from detector.other import  normalize
 import numpy as np
-import numpy as np
+from config import GPUID,GPU
 from detector.utils.cython_nms import nms as cython_nms
-try:
-    from detector.utils.gpu_nms import gpu_nms
-except:
-    gpu_nms =cython_nms
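+## Prefer the GPU-compiled gpu_nms when GPU is enabled. To keep the process off the GPU, set os.environ["CUDA_VISIBLE_DEVICES"] = "-1" at program start (a value of "0" would expose GPU 0, not hide it).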
+if GPU:
+    try:
+        from detector.utils.gpu_nms import gpu_nms
+    except:
+        gpu_nms =cython_nms
 
 def nms(dets, thresh):
     if dets.shape[0] == 0:
         return []
 
     try:
-           return gpu_nms(dets, thresh, device_id=0)
+        if GPU and GPUID is not None:
+           return gpu_nms(dets, thresh, device_id=GPUID)
     except:
             return cython_nms(dets, thresh)
+2 −2		Makefile
+1 −5		cfg/alexnet.cfg
+2 −2		cfg/coco.data
+11 −20		cfg/darknet.cfg
+0 −566		cfg/darknet53.cfg
+0 −559		cfg/darknet53_448.cfg
+7 −6		cfg/gru.cfg
+0 −990		cfg/resnet101.cfg
+0 −228		cfg/resnet18.cfg
+0 −392		cfg/resnet34.cfg
+6 −7		cfg/resnet50.cfg
+0 −1,048		cfg/resnext101-32x4d.cfg
+0 −1,558		cfg/resnext152-32x4d.cfg
+0 −523		cfg/resnext50.cfg
+2 −2		cfg/yolov2.cfg
+0 −822		cfg/yolov3-spp.cfg
+1 −1		cfg/yolov3-tiny.cfg
+6 −6		cfg/yolov3.cfg
+3 −1		examples/art.c
+8 −44		examples/classifier.c
+5 −1		examples/coco.c
+0 −3		examples/darknet.c
+3 −1		examples/detector.c
+0 −275		examples/instance-segmenter.c
+23 −10		examples/lsd.c
+6 −2		examples/nightmare.c
+3 −1		examples/regressor.c
+19 −10		examples/segmenter.c
+1 −1		examples/super.c
+5 −1		examples/yolo.c
+2 −7		include/darknet.h
+5 −6		python/darknet.py
+3 −3		src/convolutional_layer.c
+7 −89		src/data.c
+13 −17		src/image.c
+0 −225		src/iseg_layer.c
+0 −19		src/iseg_layer.h
+6 −6		src/maxpool_layer.c
+8 −8		src/maxpool_layer_kernels.cu
+11 −27		src/parser.c
+2 −2		src/softmax_layer.c