基于mmseg算法的一个轻量级中文分词器

Directory: MiddleWare
Plat: Java
Size: 2012KB
Downloads: 1
Upload time: 2018-03-12 17:13:44
Uploader: 孤独的老张
Description:   A lightweight open-source Chinese word segmenter based on the mmseg algorithm

File list:
jcseg, 0 , 2017-11-12
jcseg\.gitignore, 178 , 2017-11-12
jcseg\CHANGES.md, 16817 , 2017-11-12
jcseg\LICENSE.md, 11986 , 2017-11-12
jcseg\README.md, 44895 , 2017-11-12
jcseg\build.xml, 6110 , 2017-11-12
jcseg\jcseg-analyzer, 0 , 2017-11-12
jcseg\jcseg-analyzer\pom.xml, 2754 , 2017-11-12
jcseg\jcseg-analyzer\src, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\main, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org\lionsoul, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org\lionsoul\jcseg, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org\lionsoul\jcseg\analyzer, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org\lionsoul\jcseg\analyzer\JcsegAnalyzer.java, 2804 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org\lionsoul\jcseg\analyzer\JcsegFilter.java, 879 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org\lionsoul\jcseg\analyzer\JcsegTokenizer.java, 2838 , 2017-11-12
jcseg\jcseg-analyzer\src\main\java\org\lionsoul\jcseg\analyzer\JcsegTokenizerFactory.java, 2684 , 2017-11-12
jcseg\jcseg-analyzer\src\test, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\test\java, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\test\java\org, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\test\java\org\lionsoul, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\test\java\org\lionsoul\jcseg, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\test\java\org\lionsoul\jcseg\analyzer, 0 , 2017-11-12
jcseg\jcseg-analyzer\src\test\java\org\lionsoul\jcseg\analyzer\AppTest.java, 655 , 2017-11-12
jcseg\jcseg-core, 0 , 2017-11-12
jcseg\jcseg-core\pom.xml, 4432 , 2017-11-12
jcseg\jcseg-core\src, 0 , 2017-11-12
jcseg\jcseg-core\src\main, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor\KeyphraseExtractor.java, 3173 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor\KeywordsExtractor.java, 3317 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor\SummaryExtractor.java, 2891 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor\impl, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor\impl\TextRankKeyphraseExtractor.java, 8658 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor\impl\TextRankKeywordsExtractor.java, 5332 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\extractor\impl\TextRankSummaryExtractor.java, 14321 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\sentence, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\sentence\Sentence.java, 1674 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\sentence\SentenceSeg.java, 5755 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\test, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\test\JcsegTest.java, 17249 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\ASegment.java, 57124 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\Chunk.java, 3195 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\ComplexSeg.java, 5355 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\DelimiterSeg.java, 6340 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\DetectSeg.java, 7575 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\Dictionary.java, 3572 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\NLPSeg.java, 35952 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\SearchSeg.java, 4024 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\SimpleSeg.java, 1034 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\Word.java, 10735 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\ADictionary.java, 29199 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\AutoLoadFile.java, 893 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\DictionaryFactory.java, 4579 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\Entity.java, 19040 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\IChunk.java, 1013 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\ILexicon.java, 1864 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\ISegment.java, 1187 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\IWord.java, 4162 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\JcsegException.java, 507 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\JcsegTaskConfig.java, 15833 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\LexiconException.java, 536 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\MMSegFilter.java, 4542 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\SegKit.java, 1012 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\SegmentFactory.java, 2902 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\tokenizer\core\SynonymsEntry.java, 1785 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util, 0 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\ArrayUtil.java, 3640 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\ByteCharCounter.java, 1751 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\EntityFormat.java, 12543 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\IHashQueue.java, 3010 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\IIntFIFO.java, 1512 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\IIntQueue.java, 2004 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\IPushbackReader.java, 2186 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\IStringBuffer.java, 7858 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\IntArrayList.java, 2073 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\NumericUtil.java, 6516 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\STConverter.java, 17650 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\Sort.java, 11774 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\StringUtil.java, 15063 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\TimeUtil.java, 7394 , 2017-11-12
jcseg\jcseg-core\src\main\java\org\lionsoul\jcseg\util\Util.java, 1057 , 2017-11-12
jcseg\jcseg-core\src\test, 0 , 2017-11-12
jcseg\jcseg-core\src\test\java, 0 , 2017-11-12
jcseg\jcseg-core\src\test\java\org, 0 , 2017-11-12
jcseg\jcseg-core\src\test\java\org\lionsoul, 0 , 2017-11-12
jcseg\jcseg-core\src\test\java\org\lionsoul\jcseg, 0 , 2017-11-12
jcseg\jcseg-core\src\test\java\org\lionsoul\jcseg\test, 0 , 2017-11-12
jcseg\jcseg-core\src\test\java\org\lionsoul\jcseg\test\DicConverter.java, 5096 , 2017-11-12
jcseg\jcseg-core\src\test\java\org\lionsoul\jcseg\test\DicMerge.java, 11289 , 2017-11-12
jcseg\jcseg-core\src\test\java\org\lionsoul\jcseg\test\IHashQueueTest.java, 1633 , 2017-11-12
jcseg\jcseg-core\src\test\java\org\lionsoul\jcseg\test\IIntFIFOTest.java, 669 , 2017-11-12

Download users:

Related files:

Comment: Add Comment

Favorite users: