KeyWordHelper-关键字提取类(注:使用第三方组件DictSeg.dll)

 
namespace Framework
{
    using System;
    using System.Collections;
    using System.IO;
    using KTDictSeg;
    /// <summary>
    /// Keyword helper: extracts keywords from text by running it through the
    /// third-party KTDictSeg <see cref="CSimpleDictSeg"/> segmenter.
    /// </summary>
    public class KeyWordHelper
    {
        /// <summary>
        /// Shared segmenter instance. It is created lazily by <see cref="GetKeyWord"/>
        /// and is only assigned once its dictionary has been loaded successfully,
        /// so a non-null value set by this class is always fully initialised.
        /// </summary>
        public static CSimpleDictSeg m_SimpleDictSeg;

        /// <summary>
        /// Extracts keywords from the given text.
        /// </summary>
        /// <param name="content">Text to segment. May be null or empty.</param>
        /// <returns>
        /// The collection produced by <c>CSimpleDictSeg.Segment</c>. An empty list is
        /// returned when <paramref name="content"/> is null or empty, or when the
        /// segmenter could not be initialised (the failure is written to the trace log).
        /// </returns>
        public static ArrayList GetKeyWord(string content)
        {
            // Nothing to segment: skip the (potentially expensive) dictionary load.
            if (string.IsNullOrEmpty(content))
            {
                return new ArrayList();
            }

            CSimpleDictSeg segmenter = m_SimpleDictSeg;
            if (segmenter == null)
            {
                segmenter = CreateSegmenter();
                if (segmenter == null)
                {
                    // Initialisation failed; the shared field is left null so the
                    // next call retries instead of reusing a broken instance.
                    return new ArrayList();
                }

                m_SimpleDictSeg = segmenter;
            }

            // Re-applied on every call because the shared field is public and these
            // options may have been changed by other code between calls.
            // NOTE(review): presumably these enable stop-word filtering and
            // person-name matching; confirm against the KTDictSeg documentation.
            segmenter.FilterStopWords = true;
            segmenter.MatchName = true;

            return segmenter.Segment(content);
        }

        /// <summary>
        /// Creates a segmenter and loads its dictionary from the "Data" sub-directory
        /// of the current working directory.
        /// </summary>
        /// <returns>The ready-to-use segmenter, or null when creation or loading failed.</returns>
        private static CSimpleDictSeg CreateSegmenter()
        {
            try
            {
                CSimpleDictSeg segmenter = new CSimpleDictSeg();

                // The trailing separator is appended explicitly, as in the original code.
                // NOTE(review): Environment.CurrentDirectory is the process working
                // directory, which is not necessarily the application directory.
                segmenter.DictPath = Path.Combine(Environment.CurrentDirectory, "Data") + Path.DirectorySeparatorChar;
                segmenter.LoadDict();
                return segmenter;
            }
            catch (Exception ex)
            {
                // Keep the best-effort contract (no exception reaches the caller), but
                // record the cause instead of silently discarding it.
                System.Diagnostics.Trace.TraceError("KeyWordHelper: failed to initialise the KTDictSeg segmenter: {0}", ex);
                return null;
            }
        }
    }
}
组件地址:http://www.cnblogs.com/eaglet/
上一篇:HaaS轻应用(JavaScript)快速开始 @HaaS100


下一篇:DataX使用指南——ODPS to ODPS