一、導入依賴
<!-- Ansj word segmenter: Maven dependency org.ansj:ansj_seg, version 5.1.6 -->
<dependency>
<groupId>org.ansj</groupId>
<artifactId>ansj_seg</artifactId>
<version>5.1.6</version>
</dependency>
二、分詞方式
package com.vortex.commonAPI.controller;
import javax.servlet.http.HttpServletRequest;
import org.ansj.splitWord.analysis.BaseAnalysis;
import org.ansj.splitWord.analysis.IndexAnalysis;
import org.ansj.splitWord.analysis.NlpAnalysis;
import org.ansj.splitWord.analysis.ToAnalysis;
import org.springframework.web.bind.annotation.RequestMapping;
import org.springframework.web.bind.annotation.RequestMethod;
import org.springframework.web.bind.annotation.RestController;
/**
 * REST controller that exposes four Ansj segmentation modes as GET endpoints
 * under the {@code ansjSegmenter} path.
 *
 * <p>Every endpoint reads the text to segment from the {@code words} request
 * parameter and returns the object produced by the corresponding Ansj
 * {@code parse} call unchanged. Per the original author's notes, calling
 * {@code toStringWithOutNature()} on that result instead yields the output
 * without part-of-speech tags.
 *
 * <p>NOTE(review): the {@code words} parameter is forwarded as-is, so a request
 * without it passes {@code null} to Ansj — confirm how the library handles that.
 */
@RestController
@RequestMapping(value = "ansjSegmenter")
public class AnsjSegmenterController {

    /**
     * 1. Basic segmentation ({@code BaseAnalysis}).
     *
     * <p>Author's note: smallest granularity, limited functionality.
     *
     * @param request the HTTP request carrying the {@code words} parameter
     * @return the result of {@code BaseAnalysis.parse} for that parameter
     */
    @RequestMapping(value = "/baseAnalysis", method = RequestMethod.GET)
    public Object baseAnalysis(HttpServletRequest request) {
        return BaseAnalysis.parse(request.getParameter("words"));
    }

    /**
     * 2. Precise segmentation ({@code ToAnalysis}).
     *
     * <p>Author's note: strikes a good balance between ease of use, stability,
     * accuracy and segmentation efficiency.
     *
     * @param request the HTTP request carrying the {@code words} parameter
     * @return the result of {@code ToAnalysis.parse} for that parameter
     */
    @RequestMapping(value = "/toAnalysis", method = RequestMethod.GET)
    public Object toAnalysis(HttpServletRequest request) {
        return ToAnalysis.parse(request.getParameter("words"));
    }

    /**
     * 3. NLP segmentation ({@code NlpAnalysis}).
     *
     * <p>Author's note: suited to extracting grammatical entity names and to
     * organizing out-of-vocabulary words.
     *
     * @param request the HTTP request carrying the {@code words} parameter
     * @return the result of {@code NlpAnalysis.parse} for that parameter
     */
    @RequestMapping(value = "/nlpAnalysis", method = RequestMethod.GET)
    public Object nlpAnalysis(HttpServletRequest request) {
        return NlpAnalysis.parse(request.getParameter("words"));
    }

    /**
     * 4. Index-oriented segmentation ({@code IndexAnalysis}).
     *
     * <p>Author's notes: as the name suggests, this mode is meant for text
     * retrieval such as Lucene. Recall means the segmentation result covers as
     * much as possible; precision is somewhat at odds with recall, and Ansj is
     * described as neatly avoiding the conflict between the two.
     *
     * @param request the HTTP request carrying the {@code words} parameter
     * @return the result of {@code IndexAnalysis.parse} for that parameter
     */
    @RequestMapping(value = "/indexAnalysis", method = RequestMethod.GET)
    public Object indexAnalysis(HttpServletRequest request) {
        return IndexAnalysis.parse(request.getParameter("words"));
    }
}
三、功能統計

image.png