This repository has been archived by the owner on Nov 16, 2020. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
cnseg.i
92 lines (71 loc) · 1.83 KB
/
cnseg.i
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
%module cnseg
%include "cstring.i"
%{
// Verbatim section: SWIG copies everything between the %{ and %} markers
// unchanged into the generated wrapper source and does not parse it. Its job
// is to make these declarations visible when the wrapper is compiled. The
// same declarations are repeated after the closing marker so that SWIG can
// parse them; the two copies must be kept in sync by hand.
// NOTE(review): default arguments and a bare `bool` are C++ constructs, so
// the wrapper presumably has to be generated with `swig -c++` -- confirm
// against the build scripts.

// Text encodings selectable through the codeType / srcCodeType parameters.
enum eCodeType {
CODE_TYPE_UNKNOWN,//encoding not specified; default value of the optional codeType arguments
CODE_TYPE_ASCII,//ASCII
CODE_TYPE_GB,//GB2312, GBK, GB10380 (sic -- possibly GB18030 was meant; confirm)
CODE_TYPE_UTF8,//UTF-8
CODE_TYPE_BIG5//BIG5
};
// The ICTCLAS_* functions are only declared here; their definitions live
// outside this file, so the notes below describe the signatures only.

// pszInitDir is optional and defaults to NULL.
bool ICTCLAS_Init(const char* pszInitDir=NULL);
bool ICTCLAS_Exit();
bool ICTCLAS_SetPOSmap(int nPOSmap);
// Takes a file name; codeType is optional and defaults to CODE_TYPE_UNKNOWN.
unsigned int ICTCLAS_ImportUserDictFile(
const char* pszFileName,
eCodeType codeType=CODE_TYPE_UNKNOWN
);
// Takes an in-memory buffer plus its length; codeType has no default here,
// unlike the file-based variant above.
unsigned int ICTCLAS_ImportUserDict(
const char* pszDictBuffer,
const int nLength,
eCodeType codeType
);
int ICTCLAS_SaveTheUsrDic();
// pszResult is a caller-supplied output buffer; the signature carries no
// capacity argument for it. codeType and bEnablePOS are optional.
int ICTCLAS_ParagraphProcess(
const char* pszText,
int iLength,
char* pszResult, //[out] buffer the result is written into
eCodeType codeType=CODE_TYPE_UNKNOWN,
bool bEnablePOS=false
);
// Takes a source and a destination file name; srcCodeType and bEnablePOS
// are optional.
bool ICTCLAS_FileProcess(
const char* pszSrcFileName,
const char* pszDstFileName,
eCodeType srcCodeType=CODE_TYPE_UNKNOWN,
bool bEnablePOS=false
);
%}
// Parsed by SWIG (outside the verbatim section), which is what makes these
// constants available to the target language. Must stay identical to the
// enum inside the %{ ... %} section above.
// Text encodings selectable through the codeType / srcCodeType parameters.
enum eCodeType {
CODE_TYPE_UNKNOWN,//encoding not specified; default value of the optional codeType arguments
CODE_TYPE_ASCII,//ASCII
CODE_TYPE_GB,//GB2312, GBK, GB10380 (sic -- possibly GB18030 was meant; confirm)
CODE_TYPE_UTF8,//UTF-8
CODE_TYPE_BIG5//BIG5
};
// Declarations parsed by SWIG to generate wrappers. The functions are
// defined outside this file, so only their signatures are described here.
// pszInitDir is optional and defaults to NULL.
bool ICTCLAS_Init(const char* pszInitDir=NULL);
// No arguments; returns bool.
bool ICTCLAS_Exit();
// Takes a single int selector; the accepted values are not visible in this
// file -- TODO confirm against the ICTCLAS API documentation.
bool ICTCLAS_SetPOSmap(int nPOSmap);
// User-dictionary declarations parsed by SWIG; the functions are defined
// outside this file. The meaning of the unsigned int / int return values is
// not visible here -- TODO confirm against the ICTCLAS API documentation.

// File-based variant: codeType is optional and defaults to CODE_TYPE_UNKNOWN.
unsigned int ICTCLAS_ImportUserDictFile(
const char* pszFileName,
eCodeType codeType=CODE_TYPE_UNKNOWN
);
// Buffer-based variant: takes the buffer and its length explicitly, and
// codeType is mandatory (no default), unlike the file-based variant.
unsigned int ICTCLAS_ImportUserDict(
const char* pszDictBuffer,
const int nLength,
eCodeType codeType
);
// No arguments; returns int.
int ICTCLAS_SaveTheUsrDic();
// cstring.i typemap: every later parameter spelled `char *pszResult` becomes
// an output value. The wrapper supplies the buffer itself (sized for 65536
// characters) and hands the NUL-terminated contents back to the caller, so
// target-language code does not pass pszResult. The directive must stay
// ahead of the declaration it applies to.
// NOTE(review): the signature has no capacity argument for pszResult, so
// nothing visible here prevents the callee from writing more than 65536
// bytes for a long pszText -- confirm the maximum output size or bound the
// input length in callers.
%cstring_bounded_output(char *pszResult, 65536);
// codeType and bEnablePOS are optional (CODE_TYPE_UNKNOWN / false).
int ICTCLAS_ParagraphProcess(
const char* pszText,
int iLength,
char* pszResult, //[out] filled by the callee; provided by the typemap above
eCodeType codeType=CODE_TYPE_UNKNOWN,
bool bEnablePOS=false
);
// Declaration parsed by SWIG; the function is defined outside this file.
// Takes a source and a destination file name. srcCodeType defaults to
// CODE_TYPE_UNKNOWN and bEnablePOS defaults to false.
bool ICTCLAS_FileProcess(
const char* pszSrcFileName,
const char* pszDstFileName,
eCodeType srcCodeType=CODE_TYPE_UNKNOWN,
bool bEnablePOS=false
);