This commit is contained in:
Joseph Cheung 2023-03-02 00:20:09 +08:00
parent 435e8a482d
commit 5051022e09
4 changed files with 6 additions and 4 deletions

View file

@@ -23,4 +23,5 @@ coloredlogs==15.0.1
 requests
 markdown
 tiktoken
+pycorrector
 git+https://github.com/luxtiasco/TextRank4ZH.git

View file

@@ -19,4 +19,5 @@ fasttext-predict==0.9.2.1
 requests
 markdown
 tiktoken
+pycorrector
 git+https://github.com/luxtiasco/TextRank4ZH.git

View file

@@ -18,7 +18,7 @@ import markdown
 import re
 import datetime
 from textrank4zh import TextRank4Keyword, TextRank4Sentence
-from collections import defaultdict
+import pycorrector
 from timeit import default_timer
 from html import escape
@@ -1946,7 +1946,7 @@ class DFA:
 self.ban_words_list = list()
 self.ban_words_dict = dict()
 if not path:
-self.path = 'keyword'
+self.path = 'keywords'
 else:
 self.path = path
 self.get_words()

View file

@@ -18,7 +18,7 @@ import markdown
 import re
 import datetime
 from textrank4zh import TextRank4Keyword, TextRank4Sentence
-from collections import defaultdict
+import pycorrector
 from timeit import default_timer
 from html import escape
@@ -2993,7 +2993,7 @@ class DFA:
 self.ban_words_list = list()
 self.ban_words_dict = dict()
 if not path:
-self.path = 'keyword'
+self.path = 'keywords'
 else:
 self.path = path
 self.get_words()