1 |
|
2 |
|
3 |
|
4 |
|
5 |
|
6 | import { SubSModuleTokenizer } from '../mod';
|
7 | import { IWord } from '../Segment';
|
/**
 * Ambient declaration of a tokenizer sub-module built on
 * `SubSModuleTokenizer`.
 *
 * Only the public shape is declared here; the implementation lives in the
 * corresponding source module.
 *
 * NOTE(review): judging by the identifiers, this module splits words around
 * punctuation / stop-word symbols — confirm against the implementation.
 */
export declare class PunctuationTokenizer extends SubSModuleTokenizer {
    /** Name string of this tokenizer module (assigned by the implementation). */
    name: string;

    /**
     * List of strings backing the lookup tables below.
     * NOTE(review): presumably the raw punctuation / stop-word symbols — confirm.
     */
    _STOPWORD: string[];

    /**
     * String-keyed lookup table with numeric values.
     * NOTE(review): presumably maps each stop-word to its length — confirm.
     */
    STOPWORD: {
        [key: string]: number;
    };

    /**
     * Two-level lookup table: a numeric key selects a string-keyed table
     * with numeric values.
     * NOTE(review): presumably the outer key is the stop-word length, so
     * candidates can be grouped by length — confirm.
     */
    STOPWORD2: {
        [key: number]: {
            [key: string]: number;
        };
    };

    /**
     * Takes a list of words and returns a list of words.
     *
     * NOTE(review): presumably re-splits not-yet-recognised entries around
     * the stop-word symbols — confirm against the implementation.
     *
     * @param words - Input word list.
     * @returns The resulting word list.
     */
    split(words: IWord[]): IWord[];

    /**
     * Looks for stop-words in `text` and reports them as `IWord` entries.
     *
     * @param text - Text to search.
     * @param cur - Optional numeric position.
     *   NOTE(review): presumably the start offset of the search; the default
     *   used when omitted is not visible here — confirm.
     * @returns The matches found.
     */
    matchStopword(text: string, cur?: number): IWord[];
}
|
/**
 * Module-level `init`, declared with the same type as the static
 * `SubSModuleTokenizer.init`.
 *
 * NOTE(review): presumably bound to `PunctuationTokenizer` so callers can
 * initialise this module without naming the class — confirm against the
 * implementation.
 */
export declare const init: typeof SubSModuleTokenizer.init;
|
// The class is also the module's default export, alongside the named export.
export default PunctuationTokenizer;
|