Browse Source

update segment

master
Yener 5 years ago
parent
commit
12189ebd03
3 changed files with 301226 additions and 301293 deletions
  1. +301224
    -301281
      jiagu/segment/dict/jiagu.dict
  2. +0
    -8
      jiagu/segment/dict/user.dict
  3. +2
    -4
      jiagu/segment/nroute.py

+ 301224
- 301281
jiagu/segment/dict/jiagu.dict
File diff suppressed because it is too large
View File


+ 0
- 8
jiagu/segment/dict/user.dict View File

@@ -1,8 +0,0 @@
思知
天猫
知识图谱
张华平
州立大学
海康威视
女干事


+ 2
- 4
jiagu/segment/nroute.py View File

@@ -17,7 +17,7 @@ class Segment:

def init(self, vocab_path='dict/jiagu.dict', user_vocab='dict/user.dict'):
self.load_vocab(os.path.join(os.path.dirname(__file__), vocab_path))
- self.load_vocab(os.path.join(os.path.dirname(__file__), user_vocab))
+ # self.load_vocab(os.path.join(os.path.dirname(__file__), user_vocab))
self.initialized = True
def load_vocab(self, vocab_path):
@@ -182,9 +182,7 @@ if __name__=='__main__':
# sg.load_userdict('dict/user.dict')
# s.load_userdict(['知识图谱'])

text = '张华平等'
text = '美国纽约州立大学'
text = '海康威视'
text = '天猫啊'
words = s.seg(text)
print(words)


Loading…
Cancel
Save