优化ocr的结果

5f39d7a7 · 翟艳秋（20软） · 71880733 · 5f39d7a7 · 5f39d7a7
Commit 5f39d7a7 authored Mar 01, 2022 by 翟艳秋（20软）
Hide whitespace changes
Inline Side-by-side

Showing with 31 additions and 1 deletion

detect_with_ocr.py detect_with_ocr.py +30 -0

main_gui.py main_gui.py +1 -1

No files found.
--- a/detect_with_ocr.py
+++ b/detect_with_ocr.py
@@ -6,6 +6,7 @@ from paddleocr import PaddleOCR
 import difflib
 import openpyxl
 from openpyxl.styles import PatternFill, Alignment
+import re

 # 字幕的上下边界
 up_b, down_b = 0, 0
@@ -86,6 +87,12 @@ def get_position(video_path, start_time):
    return up_b + height, down_b + height


+def erasePunc(txt):
+    """Return ``txt`` with every character outside U+4E00..U+9FA5 removed."""
+    non_chinese = r'[^\u4e00-\u9fa5]'
+    return re.sub(non_chinese, '', txt)
+
+
 def string_similar(s1, s2):
    """
    比较字符串s1和s2的相似度，主要用于减少输出文件中相似字幕的重复
@@ -93,9 +100,30 @@ def string_similar(s1, s2):
    :param s2:
    :return: 字符串间的相似度
    """
+    # 去除非中文字符后，再比较相似度
+    s1 = erasePunc(s1)
+    s2 = erasePunc(s2)
    return difflib.SequenceMatcher(None, s1, s2).quick_ratio()


+def normalize(text):
+    """Normalize punctuation in a subtitle string.
+
+    ASCII ``,.!?()[]:;`` are mapped to their full-width Chinese forms, stray
+    edge characters are stripped, and a lone leading or trailing full-width
+    parenthesis gets its partner added. Returns ``''`` if nothing is left.
+    """
+    table = str.maketrans(',.!?()[]:;', '，。！？（）【】：；')
+    text = text.translate(table).strip(' ，。、【】_·：-@‘［；')
+    if not text:  # only strippable characters: indexing below would raise
+        return text
+    if text.endswith('）') and not text.startswith('（'):
+        text = '（' + text
+    elif text.startswith('（') and not text.endswith('）'):
+        text = text + '）'
+    return text
+
+
 def detect_subtitle(img):
    """
    检测当前画面得到字幕信息
@@ -162,6 +190,8 @@ def process_video(video_path, begin, end, state):
            state[0] = float((video.get(cv2.CAP_PROP_POS_MSEC) / 1000 - begin) / (end - begin)) \
                if state[0] is None or state[0] < 0.99 else 0.99
            subTitle = detect_subtitle(frame)
+            if subTitle is not None:
+                subTitle = normalize(subTitle)
            # 第一次找到字幕
            if lastSubTitle is None and subTitle is not None:
                start_time = video.get(cv2.CAP_PROP_POS_MSEC) / 1000

--- a/main_gui.py
+++ b/main_gui.py
@@ -416,7 +416,7 @@ tabControl = ttk.Notebook(window)
 tab1 = ttk.Frame(tabControl)
 tabControl.add(tab1, text="旁白位置推荐")
 tab2 = ttk.Frame(tabControl)
-tabControl.add(tab2, text="旁白语音合成及字幕导出")
+tabControl.add(tab2, text="旁白及字幕导出")
 tabControl.pack(expand=1, fill="both")

 """