public class TfIdfCounter extends KeywordExtractor
defaultSegment

| 构造器和说明 |
|---|
| `TfIdfCounter()` |
| `TfIdfCounter(boolean filterStopWord)` |
| `TfIdfCounter(Segment defaultSegment)` |
| `TfIdfCounter(Segment defaultSegment, boolean filterStopWord)` |

| 限定符和类型 | 方法和说明 |
|---|---|
| `void` | `add(List<Term> termList)` |
| `void` | `add(Object id, List<Term> termList)` |
| `void` | `add(Object id, String text)` 添加文档 |
| `int` | `add(String text)` 添加文档,自动分配id |
| `Map<String,Double>` | `allTf()` |
| `Map<Object,Map<String,Double>>` | `compute()` |
| `Set<Object>` | `documents()` |
| `List<String>` | `getKeywords(List<Term> termList, int size)` |
| `List<Map.Entry<String,Double>>` | `getKeywordsOf(Object id)` |
| `List<Map.Entry<String,Double>>` | `getKeywordsOf(Object id, int size)` |
| `List<Map.Entry<String,Double>>` | `getKeywordsWithTfIdf(List<Term> termList, int size)` |
| `List<Map.Entry<String,Double>>` | `getKeywordsWithTfIdf(String document, int size)` |
| `Map<Object,Map<String,Double>>` | `getTfMap()` |
| `List<Map.Entry<String,Double>>` | `sortedAllTf()` |
| `List<Map.Entry<String,Integer>>` | `sortedAllTfInt()` |

filter, getKeywords, getKeywords, getSegment, setSegment, shouldInclude

public TfIdfCounter()
public TfIdfCounter(boolean filterStopWord)
public TfIdfCounter(Segment defaultSegment, boolean filterStopWord)
public TfIdfCounter(Segment defaultSegment)
public List<String> getKeywords(List<Term> termList, int size)
getKeywords 在类中 KeywordExtractor

public List<Map.Entry<String,Double>> getKeywordsWithTfIdf(String document, int size)
public List<Map.Entry<String,Double>> getKeywordsWithTfIdf(List<Term> termList, int size)
public int add(String text)
text -

Copyright © 2014–2019 码农场. All rights reserved.