📄 sharpictclas分词系统简介(1)读取词典库 - first we try, then we trust - 博客园.mht
字号:
BORDER-BOTTOM: black 4px solid; BACKGROUND-COLOR: white
}
/* Preformatted text: monospace font stack on a light grey background. */
/* NOTE(review): "????" looks like a font name lost in a charset */
/* conversion - confirm against the original stylesheet. */
PRE {
FONT-FAMILY: "courier new", courier, "????"; BACKGROUND-COLOR: #eeeeee
}
/* CODE elements are drawn in dark blue. */
CODE {
COLOR: #000099
}
/* Code-box title bar: bold 95% text above a 1px bottom border. */
DIV.code DIV.title {
PADDING-RIGHT: 5px; PADDING-LEFT: 5px; FONT-WEIGHT: bold; FONT-SIZE: =
95%; BACKGROUND: #efeff7; PADDING-BOTTOM: 2px; MARGIN: 15px 10px 0px; =
OVERFLOW: auto; COLOR: #000066; PADDING-TOP: 2px; BORDER-BOTTOM: #c8cdde =
1px solid
}
/* Code-box body: 12px courier new text with OVERFLOW: auto. */
DIV.code DIV.content {
PADDING-RIGHT: 6px; BORDER-TOP: #ffffff 1px solid; PADDING-LEFT: 6px; =
FONT-SIZE: 12px; BACKGROUND: #f7f7ff; PADDING-BOTTOM: 10px; MARGIN: 0px =
10px 15px; OVERFLOW: auto; LINE-HEIGHT: 120%; PADDING-TOP: 10px; =
FONT-FAMILY: courier new
}
------=_NextPart_000_01C3_01C76CE0.D78CEE00
Content-Type: multipart/alternative;
boundary="----=_NextPart_001_01D2_01C76CE0.D78E74A0"
------=_NextPart_001_01D2_01C76CE0.D78E74A0
Content-Type: text/html;
charset="utf-8"
Content-Transfer-Encoding: quoted-printable
Content-Location: http://www.cnblogs.com/zhenyulu/articles/668024.html
=EF=BB=BF<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN">
<HTML><HEAD =
id=3DHead><TITLE>SharpICTCLAS=E5=88=86=E8=AF=8D=E7=B3=BB=E7=BB=9F=E7=AE=80=
=E4=BB=8B(1)=E8=AF=BB=E5=8F=96=E8=AF=8D=E5=85=B8=E5=BA=93 - First we =
try, then we trust - =E5=8D=9A=E5=AE=A2=E5=9B=AD</TITLE>
<META http-equiv=3DContent-Type content=3D"text/html; charset=3Dutf-8">
<META id=3DmetaKeywords =
content=3DSharpICTCLAS=E5=88=86=E8=AF=8D=E7=B3=BB=E7=BB=9F=E7=AE=80=E4=BB=
=8B(1)=E8=AF=BB=E5=8F=96=E8=AF=8D=E5=85=B8=E5=BA=93 =
name=3Dkeywords><LINK=20
id=3DMainCss href=3D"http://www.cnblogs.com/Skins/Cogitation/style.css"=20
type=3Dtext/css rel=3Dstylesheet><LINK id=3DSecondaryCss=20
href=3D"http://www.cnblogs.com/zhenyulu/customcss.aspx" type=3Dtext/css=20
rel=3Dstylesheet><LINK id=3DRSSLink title=3DRSS=20
href=3D"http://www.cnblogs.com/zhenyulu/rss.aspx" =
type=3Dapplication/rss+xml=20
rel=3Dalternate>
<META content=3D"MSHTML 6.00.6000.16414" name=3DGENERATOR></HEAD>
<BODY>
<FORM id=3DForm1 name=3DForm1 onsubmit=3D"javascript:return =
WebForm_OnSubmit();"=20
action=3D668024.html method=3Dpost>
<DIV><INPUT id=3D__EVENTTARGET type=3Dhidden name=3D__EVENTTARGET> =
<INPUT=20
id=3D__EVENTARGUMENT type=3Dhidden name=3D__EVENTARGUMENT> <INPUT=20
id=3D__VIEWSTATE type=3Dhidden name=3D__VIEWSTATE> </DIV>
<SCRIPT type=3Dtext/javascript>
<!--
// Locate the page form: try document.forms['Form1'] first, then fall
// back to document.Form1 when that lookup yields a falsy value.
var theForm =3D document.forms['Form1'];
if (!theForm) {
theForm =3D document.Form1;
}
// Submits theForm after recording which event triggered the submit.
//   eventTarget   - written to the form's __EVENTTARGET field.
//   eventArgument - written to the form's __EVENTARGUMENT field.
// Nothing is written or submitted when the form has an onsubmit
// handler and calling it returns a value loosely equal to false.
function __doPostBack(eventTarget, eventArgument) {
if (!theForm.onsubmit || (theForm.onsubmit() !=3D false)) {
theForm.__EVENTTARGET.value =3D eventTarget;
theForm.__EVENTARGUMENT.value =3D eventArgument;
theForm.submit();
}
}
// -->
</SCRIPT>
<SCRIPT=20
src=3D"http://www.cnblogs.com/WebResource.axd?d=3DPyW-m2hLmppJ9byT1bYEqw2=
&t=3D633078067072968750"=20
type=3Dtext/javascript></SCRIPT>
<SCRIPT language=3DJavaScript>
// Key handler: when evt reports Ctrl held together with keyCode 13,
// calls TempSave(id), swallowing any exception it throws, and then
// always posts back for 'AjaxHolder$PostComment$btnSubmit'.
// Any other key combination is ignored.
// NOTE(review): TempSave is not defined in this part of the page -
// presumably it stores a draft of the comment; confirm.
function ctlent(evt,id)
{
if(evt.ctrlKey && evt.keyCode =3D=3D 13)
{=09
try
{
TempSave(id);
}
catch(ex)
{
}
finally
{
__doPostBack('AjaxHolder$PostComment$btnSubmit','')
}
}
=09
}</SCRIPT>
<SCRIPT language=3DJavaScript>
// Appends "@" + author + "\n" to the value of the element with id
// AjaxHolder_PostComment_tbComment, moves focus to that element and
// returns false.
// NOTE(review): the name is spelled "Auhor"; it is left unchanged
// because callers elsewhere on the page refer to it by this name.
function =
SetReplyAuhor(author){document.getElementById('AjaxHolder_PostComment_tbC=
omment').value+=3D"@"+author+"\n";document.getElementById('AjaxHolder_Pos=
tComment_tbComment').focus();return false}</SCRIPT>
<SCRIPT=20
src=3D"http://www.cnblogs.com/WebResource.axd?d=3DPN3YVKw-Ky20FbAsNYS9UM8=
XqUzPcwpd0&t=3D633078067072968750"=20
type=3Dtext/javascript></SCRIPT>
<SCRIPT=20
src=3D"http://www.cnblogs.com/ScriptResource.axd?d=3DIo4r5Qx-zmHysvkgwLW9=
yk7rUGj5M-geQRTOmI9WMPaWNcTLoZx7IpNZpIR4LFVQ0&t=3D633065726447066250"=
=20
type=3Dtext/javascript></SCRIPT>
<SCRIPT=20
src=3D"http://www.cnblogs.com/ScriptResource.axd?d=3DIo4r5Qx-zmHysvkgwLW9=
yk7rUGj5M-geQRTOmI9WMPaVSfXvXlH0xWaTv3M_TRDPzVKh75E08VU1&t=3D63306572=
6447066250"=20
type=3Dtext/javascript></SCRIPT>
<SCRIPT type=3Dtext/javascript>
<!--
// Form onsubmit hook. Returns false when a function named
// ValidatorOnSubmit exists and its result is loosely equal to false;
// returns true in every other case, including when no such function
// is defined.
function WebForm_OnSubmit() {
if (typeof(ValidatorOnSubmit) =3D=3D "function" && ValidatorOnSubmit() =
=3D=3D false) return false;
return true;
}
// -->
</SCRIPT>
<DIV id=3Dtop>
<DIV>
<TABLE>
<TBODY>
<TR>
<TD class=3DHeaderTitles>
<H1 class=3DHeaderTitle><A class=3DHeaderMainTitle =
id=3DHeader1_HeaderTitle=20
href=3D"http://www.cnblogs.com/zhenyulu/">First we try, then we=20
trust</A></H1>
<P id=3Dtagline></P></TD></TR></TBODY></TABLE></DIV>
<DIV class=3DHeaderBar>
<TABLE class=3DHeaderBar id=3DHeaderBar cellSpacing=3D0 cellPadding=3D0>
<TBODY>
<TR>
<TD class=3DHeaderBarTab noWrap> <A =
id=3DHeader1_MyLinks1_HomeLink=20
=
href=3D"http://www.cnblogs.com/">=E5=8D=9A=E5=AE=A2=E5=9B=AD</A> :: =
<A=20
id=3DHeader1_MyLinks1_MyHomeLink=20
=
href=3D"http://zhenyulu.cnblogs.com/">=E9=A6=96=E9=A1=B5</A> :: <A=20
id=3DHeader1_MyLinks1_NewPostLink=20
=
href=3D"http://www.cnblogs.com/zhenyulu/admin/EditPosts.aspx?opt=3D1">=E6=
=96=B0=E9=9A=8F=E7=AC=94</A> ::=20
<A id=3DHeader1_MyLinks1_ContactLink accessKey=3D9=20
=
href=3D"http://www.cnblogs.com/zhenyulu/contact.aspx?id=3D1">=E8=81=94=E7=
=B3=BB</A> :: <A=20
id=3DHeader1_MyLinks1_Syndication=20
=
href=3D"http://www.cnblogs.com/zhenyulu/rss">=E8=81=9A=E5=90=88</A> <A =
class=3DXMLLink=20
id=3DHeader1_MyLinks1_XMLLink=20
href=3D"http://www.cnblogs.com/zhenyulu/rss"><IMG=20
style=3D"BORDER-TOP-WIDTH: 0px; BORDER-LEFT-WIDTH: 0px; =
BORDER-BOTTOM-WIDTH: 0px; BORDER-RIGHT-WIDTH: 0px"=20
src=3D"http://www.cnblogs.com/images/xml.gif"></A> :: <A=20
id=3DHeader1_MyLinks1_Admin=20
=
href=3D"http://www.cnblogs.com/zhenyulu/admin/EditPosts.aspx">=E7=AE=A1=E7=
=90=86</A> ::=20
</TD>
<TD><IMG id=3DHeader1_BlueTab=20
style=3D"BORDER-TOP-WIDTH: 0px; BORDER-LEFT-WIDTH: 0px; =
BORDER-BOTTOM-WIDTH: 0px; BORDER-RIGHT-WIDTH: 0px"=20
=
src=3D"http://www.cnblogs.com/Skins/Cogitation/Images/BlueTabRight.gif"=20
align=3DabsMiddle></TD>
<TD class=3DHeaderBarTabBack noWrap width=3D"100%">
<DIV class=3DBlogStatsBar>
<TABLE class=3DBlogStatsBar>
<TBODY>
<TR>
<TD width=3D"100%"></TD>
<TD class=3DBlogStatsBar noWrap> 182 =
=E9=9A=8F=E7=AC=94 :: 110 =E6=96=87=E7=AB=A0 :: 2433=20
=E8=AF=84=E8=AE=BA :: 110 Trackbacks=20
</TD></TR></TBODY></TABLE></DIV></TD></TR></TBODY></TABLE></DIV></DIV>
<DIV id=3Dleftmenu></DIV>
<DIV id=3Dmain>
<DIV class=3Dpost>
<DIV class=3DpostTitle><A id=3Dviewpost1_TitleUrl=20
href=3D"http://www.cnblogs.com/zhenyulu/articles/668024.html">SharpICTCLA=
S=E5=88=86=E8=AF=8D=E7=B3=BB=E7=BB=9F=E7=AE=80=E4=BB=8B(1)=E8=AF=BB=E5=8F=
=96=E8=AF=8D=E5=85=B8=E5=BA=93</A>=20
</DIV>
<DIV class=3DpostText>
<P>ICTCLAS=E5=88=86=E8=AF=8D=E7=9A=84=E6=80=BB=E4=BD=93=E6=B5=81=E7=A8=8B=
=E5=8C=85=E6=8B=AC=EF=BC=9A1=EF=BC=89=E5=88=9D=E6=AD=A5=E5=88=86=E8=AF=8D=
=EF=BC=9B2=EF=BC=89=E8=AF=8D=E6=80=A7=E6=A0=87=E6=B3=A8=EF=BC=9B3=EF=BC=89=
=E4=BA=BA=E5=90=8D=E3=80=81=E5=9C=B0=E5=90=8D=E8=AF=86=E5=88=AB=EF=BC=9B4=
=EF=BC=89=E9=87=8D=E6=96=B0=E5=88=86=E8=AF=8D=EF=BC=9B5=EF=BC=89=E9=87=8D=
=E6=96=B0=E8=AF=8D=E6=80=A7=E6=A0=87=E6=B3=A8=E8=BF=99=E4=BA=94=E6=AD=A5=E3=
=80=82=E5=B0=B1=E7=AC=AC=E4=B8=80=E6=AD=A5=E5=88=86=E8=AF=8D=E8=80=8C=E8=A8=
=80=EF=BC=8C=E5=8F=88=E7=BB=86=E5=88=86=E6=88=90=EF=BC=9A1=EF=BC=89=E5=8E=
=9F=E5=AD=90=E5=88=87=E5=88=86=EF=BC=9B2=EF=BC=89=E6=89=BE=E5=87=BA=E5=8E=
=9F=E5=AD=90=E4=B9=8B=E9=97=B4=E6=89=80=E6=9C=89=E5=8F=AF=E8=83=BD=E7=9A=84=
=E7=BB=84=E8=AF=8D=E6=96=B9=E6=A1=88=EF=BC=9B3=EF=BC=89N-=E6=9C=80=E7=9F=AD=
=E8=B7=AF=E5=BE=84=E4=B8=AD=E6=96=87=E8=AF=8D=E8=AF=AD=E7=B2=97=E5=88=86=E4=
=B8=89=E6=AD=A5=E3=80=82</P>
<P>=E5=9C=A8=E6=89=80=E6=9C=89=E5=86=85=E5=AE=B9=E4=B8=AD=EF=BC=8C=E8=AF=8D=
=E5=85=B8=E5=BA=93=E7=9A=84=E8=AF=BB=E5=8F=96=E6=98=AF=E6=9C=80=E5=9F=BA=E6=
=9C=AC=E7=9A=84=E5=8A=9F=E8=83=BD=E3=80=82ICTCLAS=E4=B8=AD=E8=AF=8D=E5=85=
=B8=E5=AD=98=E6=94=BE=E5=9C=A8Data=E7=9B=AE=E5=BD=95=E4=B8=AD=EF=BC=8C=E5=
=B8=B8=E7=94=A8=E7=9A=84=E8=AF=8D=E5=85=B8=E5=8C=85=E6=8B=ACcoreDict.dct=EF=
=BC=88=E8=AF=8D=E5=85=B8=E5=BA=93=EF=BC=89=E3=80=81BigramDict.dct=EF=BC=88=
=E8=AF=8D=E4=B8=8E=E8=AF=8D=E9=97=B4=E7=9A=84=E5=85=B3=E8=81=94=E5=BA=93=EF=
=BC=89=E3=80=81nr.dct=EF=BC=88=E4=BA=BA=E5=90=8D=E5=BA=93=EF=BC=89=E3=80=81=
ns.dct=EF=BC=88=E5=9C=B0=E5=90=8D=E5=BA=93=EF=BC=89=E3=80=81tr.dct=EF=BC=88=
=E7=BF=BB=E8=AF=91=E4=BA=BA=E5=90=8D=E5=BA=93=EF=BC=89=EF=BC=8C=E5=AE=83=E4=
=BB=AC=E7=9A=84=E6=96=87=E4=BB=B6=E6=A0=BC=E5=BC=8F=E6=98=AF=E5=AE=8C=E5=85=
=A8=E7=9B=B8=E5=90=8C=E7=9A=84=EF=BC=8C=E9=83=BD=E4=BD=BF=E7=94=A8CDictio=
nary=E7=B1=BB=E8=BF=9B=E8=A1=8C=E8=A7=A3=E6=9E=90=E3=80=82=E5=A6=82=E6=9E=
=9C=E6=83=B3=E6=B7=B1=E5=85=A5=E4=BA=86=E8=A7=A3ICTCLAS=E8=AF=8D=E5=85=B8=
=E7=BB=93=E6=9E=84=EF=BC=8C=E5=8F=AF=E4=BB=A5=E5=8F=82=E8=80=83sinboy=E7=9A=
=84=E3=80=8A<A=20
href=3D"http://blog.csdn.net/sinboy/archive/2006/03/15/624909.aspx">ICTCL=
AS=E5=88=86=E8=AF=8D=E7=B3=BB=E7=BB=9F=E7=A0=94=E7=A9=B6=EF=BC=88=E4=BA=8C=
=EF=BC=89--=E8=AF=8D=E5=85=B8=E7=BB=93=E6=9E=84</A>=E3=80=8B=E4=B8=80=E6=96=
=87=EF=BC=8C=E8=AF=A6=E7=BB=86=E4=BB=8B=E7=BB=8D=E4=BA=86=E8=AF=8D=E5=85=B8=
=E7=BB=93=E6=9E=84=E3=80=82=E6=88=91=E8=BF=99=E9=87=8C=E5=8F=AA=E7=BB=99=E5=
=87=BASharpICTCLAS=E4=B8=AD=E7=9A=84=E5=AE=9E=E7=8E=B0=E3=80=82</P>
<P>=E9=A6=96=E5=85=88=E6=98=AF=E5=AF=B9=E5=9F=BA=E6=9C=AC=E5=85=83=E7=B4=A0=
=E7=9A=84=E5=AE=9A=E4=B9=89=E3=80=82=E5=9C=A8SharpICTCLAS=E4=B8=AD=EF=BC=8C=
=E5=AF=B9=E5=8E=9F=E6=9C=89=E5=91=BD=E5=90=8D=E8=BF=9B=E8=A1=8C=E4=BA=86=E9=
=83=A8=E5=88=86=E8=B0=83=E6=95=B4=EF=BC=8C=E4=BD=BF=E5=BE=97=E6=9B=B4=E5=85=
=B7=E6=9C=89=E5=AE=9E=E9=99=85=E6=84=8F=E4=B9=89=E5=B9=B6=E9=80=82=E5=90=88=
C#=E7=9A=84=E4=B9=A0=E6=83=AF=E3=80=82=E4=BB=A3=E7=A0=81=E5=A6=82=E4=B8=8B=
=EF=BC=9A</P>
<DIV class=3Dcode>
<DIV class=3Dtitle>
<DIV style=3D"FLOAT: right"><IMG class=3DcopyCodeImage=20
src=3D"http://www.cnblogs.com/images/cnblogs_com/zhenyulu/200701/copycode=
.gif"=20
align=3DabsMiddle name=3DccImage> <A onclick=3DCopyCode(this) =
href=3D"javascript:">Copy=20
Code</A></DIV>
<DIV style=3D"CLEAR: none">WordDictionaryElement.cs =
=E7=A8=8B=E5=BA=8F</DIV></DIV>
<DIV class=3Dcontent><SPAN style=3D"COLOR: #0000ff">using</SPAN> System; =
<BR><SPAN=20
style=3D"COLOR: #0000ff">using</SPAN> System.Collections.Generic; =
<BR><SPAN=20
style=3D"COLOR: #0000ff">using</SPAN> System.Text; <BR><BR><SPAN=20
style=3D"COLOR: #0000ff">namespace</SPAN> SharpICTCLAS <BR>{ =
<BR> =20
<SPAN=20
style=3D"COLOR: =
#008000">//=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=
=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=
=3D=3D=3D=3D=20
</SPAN><BR> <SPAN style=3D"COLOR: #008000">// Original =
predefined in=20
DynamicArray.h file </SPAN><BR> <SPAN=20
style=3D"COLOR: =
#008000">//=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=
=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=
=3D=3D=3D=3D=20
</SPAN><BR> <SPAN style=3D"COLOR: #0000ff">public</SPAN> =
<SPAN=20
style=3D"COLOR: #0000ff">class</SPAN> ArrayChainItem <BR> {=20
<BR> <SPAN style=3D"COLOR: =
#0000ff">public</SPAN>=20
<SPAN style=3D"COLOR: #0000ff">int</SPAN> col, row;<SPAN=20
style=3D"COLOR: #008000">//row and column=20
</SPAN><BR> <SPAN=20
style=3D"COLOR: #0000ff">public</SPAN> <SPAN style=3D"COLOR: =
#0000ff">double</SPAN>=20
<SPAN style=3D"COLOR: #0000ff">value</SPAN>;<SPAN style=3D"COLOR: =
#008000">//The=20
value of the array </SPAN><BR> <SPAN=20
style=3D"COLOR: #0000ff">public</SPAN> <SPAN style=3D"COLOR: =
#0000ff">int</SPAN>=20
nPOS; <BR> <SPAN=20
style=3D"COLOR: #0000ff">public</SPAN> <SPAN style=3D"COLOR: =
#0000ff">int</SPAN>=20
nWordLen; <BR> <SPAN=20
style=3D"COLOR: #0000ff">public</SPAN> <SPAN style=3D"COLOR: =
#0000ff">string</SPAN>=20
sWord; <BR> <SPAN style=3D"COLOR: =
#008000">//The=20
possible POS of the word related to the segmentation graph=20
</SPAN><BR> <SPAN=20
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -