from Biterm import * class Doc(): ''' @description: 处理文本的类 @param {type} @return: ''' ws = [] def __init__(self,s): self.ws = [] self.read_doc(s) def read_doc(self,s): for w in s.split(' '): self.ws.append(int(w)) def size(self): return len(self.ws) def get_w(self,i): assert(i