|
@@ -7,15 +7,11 @@ from pytranscriber.control.ctr_autosub import Ctr_Autosub
|
|
|
import re,random, time
|
|
|
from itertools import groupby
|
|
|
from operator import itemgetter
|
|
|
-from rakeUtil.Rake import Rake
|
|
|
import requests,rpyc
|
|
|
from difflib import SequenceMatcher
|
|
|
from PIL import Image,ImageDraw,ImageFont
|
|
|
import openshot
|
|
|
-obj = Rake()
|
|
|
-stop_path = "rakedata/stoplist/中文停用词表(1208个).txt"
|
|
|
-conj_path = "rakedata/stoplist/中文分隔词词库.txt"
|
|
|
-obj.initializeFromPath(stop_path, conj_path)
|
|
|
+
|
|
|
|
|
|
def trim_punctuation(s):
|
|
|
pat_block = u'[^\u4e00-\u9fff0-9a-zA-Z]+';
|