eragonruan
diff --git a/.idea/workspace.xml b/.idea/workspace.xml
Lines changed: 313 additions & 226 deletions
diff --git a/checkpoints/checkpoint~ b/checkpoints/checkpoint~
Lines changed: 0 additions & 2 deletions
diff --git a/ctpn/__init__.py b/ctpn/__init__.py
Lines changed: 2 additions & 1 deletion
diff --git a/ctpn/cfg.py b/ctpn/cfg.py
Lines changed: 0 additions & 6 deletions
diff --git a/ctpn/demo.py b/ctpn/demo.py
Lines changed: 25 additions & 53 deletions
diff --git a/ctpn/other.py b/ctpn/other.py
Lines changed: 0 additions & 77 deletions
diff --git a/ctpn/text.yml b/ctpn/text.yml
Lines changed: 1 addition & 0 deletions
diff --git a/ctpn/text.yml~ b/ctpn/text.yml~
Lines changed: 0 additions & 36 deletions
diff --git a/data/demo/007.JPG b/data/demo/007.JPG
-25 KB
diff --git a/data/demo/007.jpg b/data/demo/007.jpg
77.2 KB
@@ -1 +1,2 @@
-from . import text_proposal_connector
+from . import text_proposal_connector
+from . import text_connect
@@ -5,72 +5,47 @@
 import glob
 import shutil
 sys.path.append(os.getcwd())
-
 from lib.networks.factory import get_network
 from lib.fast_rcnn.config import cfg,cfg_from_file
 from lib.fast_rcnn.test import test_ctpn
-from lib.fast_rcnn.nms_wrapper import nms
 from lib.utils.timer import Timer
-from text_proposal_connector import TextProposalConnector
-
-CLASSES = ('__background__',
- 'text')
-
-
-def connect_proposal(text_proposals, scores, im_size):
- cp = TextProposalConnector()
- line = cp.get_text_lines(text_proposals, scores, im_size)
- return line
-
-def save_results(image_name,im,im_scale,line,thresh):
- inds=np.where(line[:,-1]>=thresh)[0]
- image_name=image_name.split('/')[-1]
- if len(inds)==0:
- im = cv2.resize(im, None, None, fx=1.0/im_scale, fy=1.0/im_scale, interpolation=cv2.INTER_LINEAR)
- cv2.imwrite(os.path.join("data/results",image_name),im)
- return 
+from lib.text_connector.detectors import TextDetector
+from lib.text_connector.text_connect_cfg import Config as TextLineCfg
 
- for i in inds:
- bbox=line[i,:4]
- score=line[i,-1]
- cv2.rectangle(im,(bbox[0],bbox[1]),(bbox[2],bbox[3]),color=(0,255,0),thickness=2)
- im = cv2.resize(im, None, None, fx=1.0/im_scale, fy=1.0/im_scale, interpolation=cv2.INTER_LINEAR)
- cv2.imwrite(os.path.join("data/results",image_name),im)
 
+def resize_im(im, scale, max_scale=None):
+    """Rescale ``im`` uniformly, driven by the length of its shorter side.
+
+    The factor is ``scale / min(height, width)``. When ``max_scale`` is given
+    and the longer side multiplied by that factor would exceed it, the factor
+    is replaced by ``max_scale / max(height, width)``.
+
+    Args:
+        im: image array; only ``im.shape[0]`` and ``im.shape[1]`` are read here.
+        scale: target length for the shorter side.
+        max_scale: optional upper bound for the longer side; ``None`` disables
+            the cap.
+
+    Returns:
+        A ``(resized_image, factor)`` tuple, where ``factor`` is the ratio
+        passed to ``cv2.resize`` for both axes.
+    """
+    height, width = im.shape[0], im.shape[1]
+    factor = float(scale) / min(height, width)
+    # Identity comparison: ``!= None`` dispatches to ``__ne__`` and is not the
+    # recommended way to test for the ``None`` singleton.
+    if max_scale is not None and factor * max(height, width) > max_scale:
+        factor = float(max_scale) / max(height, width)
+    resized = cv2.resize(im, None, None, fx=factor, fy=factor,
+                         interpolation=cv2.INTER_LINEAR)
+    return resized, factor
 
-def check_img(img):
- img_size = img.shape
- im_size_min = np.min(img_size[0:2])
- im_size_max = np.max(img_size[0:2])
 
- im_scale = float(600) / float(im_size_min)
- if np.round(im_scale * im_size_max) > 1200:
- im_scale = float(1200) / float(im_size_max)
- re_im = cv2.resize(img, None, None, fx=im_scale, fy=im_scale, interpolation=cv2.INTER_LINEAR)
- return re_im, im_scale
+def draw_boxes(img, image_name, boxes, scale):
+    """Outline each box on ``img`` and write the image to ``data/results``.
+
+    Args:
+        img: image to draw on; the lines are drawn onto this array directly.
+        image_name: path of the source image; only its final path component
+            is used as the output file name.
+        boxes: iterable of boxes; elements 0-7 of each box are read as four
+            ``(x, y)`` corner pairs.
+        scale: factor previously applied to the image; the drawn image is
+            resized by ``1.0 / scale`` before it is written.
+    """
+    green = (0, 255, 0)
+    # Corner indices joined by each edge, in the same order the four explicit
+    # ``cv2.line`` calls used: c0-c1, c0-c2, c3-c1, c2-c3.
+    edges = ((0, 1), (0, 2), (3, 1), (2, 3))
+    for box in boxes:
+        corners = [(int(box[i]), int(box[i + 1])) for i in range(0, 8, 2)]
+        for start, end in edges:
+            cv2.line(img, corners[start], corners[end], green, 2)
 
+    # ``os.path.basename`` strips the directory part using the platform's
+    # separators; splitting on '/' left backslash-separated paths intact.
+    base_name = os.path.basename(image_name)
+    img = cv2.resize(img, None, None, fx=1.0 / scale, fy=1.0 / scale,
+                     interpolation=cv2.INTER_LINEAR)
+    cv2.imwrite(os.path.join("data/results", base_name), img)
 
 def ctpn(sess, net, image_name):
+ """Detect text in one image, draw the resulting boxes and print the elapsed time.
+
+ The image at ``image_name`` is read with ``cv2.imread``, rescaled by
+ ``resize_im`` using ``TextLineCfg.SCALE`` and ``TextLineCfg.MAX_SCALE``, and
+ passed to ``test_ctpn`` together with ``sess`` and ``net``. The returned
+ boxes and scores go through ``TextDetector.detect`` and the result is handed
+ to ``draw_boxes`` along with the resize factor.
+
+ The timer is started before the image is read and stopped after
+ ``draw_boxes`` returns, so the printed time covers loading, resizing,
+ detection and drawing. The printed count is ``boxes.shape[0]`` of the
+ ``detect`` output.
+ """
- img = cv2.imread(image_name)
- im, im_scale = check_img(img)
  timer = Timer()
  timer.tic()
- scores, boxes = test_ctpn(sess, net, im)
+
+ img = cv2.imread(image_name)
+ img, scale = resize_im(img, scale=TextLineCfg.SCALE, max_scale=TextLineCfg.MAX_SCALE)
+ scores, boxes = test_ctpn(sess, net, img)
+
+ textdetector = TextDetector()
+ boxes = textdetector.detect(boxes, scores[:, np.newaxis], img.shape[:2])
+ draw_boxes(img, image_name, boxes, scale)
  timer.toc()
  print(('Detection took {:.3f}s for '
  '{:d} object proposals').format(timer.total_time, boxes.shape[0]))
 
- # Visualize detections for each class
- CONF_THRESH = 0.9
- NMS_THRESH = 0.3
- dets = np.hstack((boxes, scores[:, np.newaxis])).astype(np.float32)
- keep = nms(dets, NMS_THRESH)
- dets = dets[keep, :]
- 
- keep = np.where(dets[:, 4] >= 0.7)[0]
- dets = dets[keep, :]
- line = connect_proposal(dets[:, 0:4], dets[:, 4], im.shape)
- save_results(image_name, im,im_scale, line,thresh=0.9)
 
 
 if __name__ == '__main__':
@@ -91,16 +66,12 @@ def ctpn(sess, net, image_name):
 
  try:
  ckpt = tf.train.get_checkpoint_state(cfg.TEST.checkpoints_path)
- #ckpt=tf.train.get_checkpoint_state("output/ctpn_end2end/voc_2007_trainval/")
  print('Restoring from {}...'.format(ckpt.model_checkpoint_path), end=' ')
  saver.restore(sess, ckpt.model_checkpoint_path)
  print('done')
  except:
  raise 'Check your pretrained {:s}'.format(ckpt.model_checkpoint_path)
- print (' done.')
 
- #saver.restore(sess, os.path.join(os.getcwd(),"checkpoints/model_final_tf13.ckpt"))
- # Warmup on a dummy image
  im = 128 * np.ones((300, 300, 3), dtype=np.uint8)
  for i in range(2):
  _, _ = test_ctpn(sess, net, im)
@@ -112,3 +83,4 @@ def ctpn(sess, net, image_name):
  print('~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~')
  print(('Demo for {:s}'.format(im_name)))
  ctpn(sess, net, im_name)
+
@@ -32,5 +32,6 @@ TRAIN:
  WEIGHT_DECAY: 0.0005
 TEST:
  HAS_RPN: True
+ DETECT_MODE: O
  checkpoints_path: checkpoints/
  #checkpoints_path: output/ctpn_end2end/voc_2007_trainval
Original file line number	Diff line number	Diff line change
`@@ -1 +1,2 @@`
`1`		`-from . import text_proposal_connector`
	`1`	`+from . import text_proposal_connector`
	`2`	`+from . import text_connect`