opencv
/

text_recognition_crnn

Wanli committed on Dec 23, 2023

Commit

cc3d40f

1 Parent(s): b5f00c2

remove text detection DB (#221)

Files changed (2) hide show

demo.cpp CHANGED Viewed

@@ -41,10 +41,10 @@ std::string keys =
 "4: CANN + NPU}";
-class DB {
 public:
-    DB(string modPath, Size inSize = Size(736, 736), float binThresh = 0.3,
         float polyThresh = 0.5, int maxCand = 200, double unRatio = 2.0,
         dnn::Backend bId = DNN_BACKEND_DEFAULT, dnn::Target tId = DNN_TARGET_CPU) : modelPath(modPath), inputSize(inSize), binaryThreshold(binThresh),
         polygonThreshold(polyThresh), maxCandidates(maxCand), unclipRatio(unRatio),
@@ -215,7 +215,7 @@ int main(int argc, char** argv)
     bool save = parser.get<bool>("save");
     bool viz = parser.get<float>("viz");
-    DB detector("../text_detection_db/text_detection_DB_IC15_resnet18_2021sep.onnx", inpSize, binThresh, polyThresh, maxCand, unRatio, backendTargetPairs[backendTargetid].first, backendTargetPairs[backendTargetid].second);
     CRNN recognizer(modelPath, backendTargetPairs[backendTargetid].first, backendTargetPairs[backendTargetid].second);
     //! [Open a video file or an image file or a camera stream]
     VideoCapture cap;
@@ -232,9 +232,13 @@ int main(int argc, char** argv)
         cap >> originalImage;
         if (originalImage.empty())
         {
-            cout << "Frame is empty" << endl;
-            waitKey();
-            break;
         }
         int originalW = originalImage.cols;
         int originalH = originalImage.rows;

 "4: CANN + NPU}";
+class PPOCRDet {
 public:
+    PPOCRDet(string modPath, Size inSize = Size(736, 736), float binThresh = 0.3,
         float polyThresh = 0.5, int maxCand = 200, double unRatio = 2.0,
         dnn::Backend bId = DNN_BACKEND_DEFAULT, dnn::Target tId = DNN_TARGET_CPU) : modelPath(modPath), inputSize(inSize), binaryThreshold(binThresh),
         polygonThreshold(polyThresh), maxCandidates(maxCand), unclipRatio(unRatio),
     bool save = parser.get<bool>("save");
     bool viz = parser.get<float>("viz");
+    PPOCRDet detector("../text_detection_ppocr/text_detection_en_ppocrv3_2023may.onnx", inpSize, binThresh, polyThresh, maxCand, unRatio, backendTargetPairs[backendTargetid].first, backendTargetPairs[backendTargetid].second);
     CRNN recognizer(modelPath, backendTargetPairs[backendTargetid].first, backendTargetPairs[backendTargetid].second);
     //! [Open a video file or an image file or a camera stream]
     VideoCapture cap;
         cap >> originalImage;
         if (originalImage.empty())
         {
+            if (parser.has("input"))
+            {
+                cout << "Frame is empty" << endl;
+                break;
+            }
+            else
+                continue;
         }
         int originalW = originalImage.cols;
         int originalH = originalImage.rows;

demo.py CHANGED Viewed

@@ -12,8 +12,8 @@ import cv2 as cv
 from crnn import CRNN
-sys.path.append('../text_detection_db')
-from db import DB
 # Check OpenCV version
 assert cv.__version__ >= "4.8.0", \
@@ -65,8 +65,8 @@ if __name__ == '__main__':
     backend_id = backend_target_pairs[args.backend_target][0]
     target_id = backend_target_pairs[args.backend_target][1]
-    # Instantiate DB for text detection
-    detector = DB(modelPath='../text_detection_db/text_detection_DB_IC15_resnet18_2021sep.onnx',
                   inputSize=[args.width, args.height],
                   binaryThreshold=0.3,
                   polygonThreshold=0.5,

 from crnn import CRNN
+sys.path.append('../text_detection_ppocr')
+from ppocr_det import PPOCRDet
 # Check OpenCV version
 assert cv.__version__ >= "4.8.0", \
     backend_id = backend_target_pairs[args.backend_target][0]
     target_id = backend_target_pairs[args.backend_target][1]
+    # Instantiate PPOCRDet for text detection
+    detector = PPOCRDet(modelPath='../text_detection_ppocr/text_detection_en_ppocrv3_2023may.onnx',
                   inputSize=[args.width, args.height],
                   binaryThreshold=0.3,
                   polygonThreshold=0.5,