资源简介
开源企业文档管理系统,改写源代码,更细分的权限划分,支持pdf,doc,txt等文件格式,适合中国人使用。
代码片段和文件信息
/**
* OpenKM, Open Document Management System (http://www.openkm.com)
* Copyright (c) 2006-2014 Paco Avila & Josep Llort
*
* No bytes were intentionally harmed during the development of this application.
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
*/
package com.openkm.analysis;
import java.io.IOException;
import java.io.StringReader;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.SimpleAnalyzer;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.analysis.WhitespaceAnalyzer;
import org.apache.lucene.analysis.cjk.CJKAnalyzer;
import org.apache.lucene.analysis.cn.smart.SmartChineseAnalyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.openkm.core.Config;
/**
* @author pavila
* Lucene 3 ships with its own Chinese tokenizers, but none of the bundled ones meets our needs.
*/
public class AnalyzerDemo {
private static Logger log = LoggerFactory.getLogger(AnalyzerDemo.class);
private static String[] strings = { “专项信息管理 we are goodboy.“ };
private static Analyzer[] analyzers = {
new SimpleAnalyzer(Config.LUCENE_VERSION)
new StandardAnalyzer(Config.LUCENE_VERSION)
new CJKAnalyzer(Config.LUCENE_VERSION)
new SmartChineseAnalyzer(Config.LUCENE_VERSION)
new WhitespaceAnalyzer(Config.LUCENE_VERSION)
};
public static void main(String args[]) throws Exception {
for (String string : strings) {
for (Analyzer analyzer : analyzers) {
analyze(string analyzer);
}
}
}
// INFO com.openkm.analysis.AnalyzerDemo - org.apache.lucene.analysis.SimpleAnalyzer -> [专项信息管理] [we] [are] [goodboy]
// INFO com.openkm.analysis.AnalyzerDemo - org.apache.lucene.analysis.standard.StandardAnalyzer -> [专] [项] [信] [息] [管] [理] [we] [goodboy]
// INFO com.openkm.analysis.AnalyzerDemo - org.apache.lucene.analysis.cjk.CJKAnalyzer -> [专项] [项信] [信息] [息管] [管理] [we] [goodboy]
// INFO com.openkm.analysis.AnalyzerDemo - org.apache.lucene.analysis.cn.smart.SmartChineseAnalyzer -> [专项] [信息] [管理] [we] [ar] [goodboi]
// INFO com.openkm.analysis.AnalyzerDemo - org.apache.lucene.analysis.WhitespaceAnalyzer -> [专项信息管理] [we] [are] [goodboy.]
/**
* Analyze and display tokens
*/
private static void analyze(String
属性 大小 日期 时间 名称
----------- --------- ---------- ----- ----
文件 1227 2013-04-10 23:08 .project.bak
文件 56 2013-04-13 16:20 build.bat
文件 69 2013-04-10 23:07 build.sh
文件 371 2013-04-13 16:19 build.xml
文件 81260 2013-07-17 16:06 doxyfile.cfg
文件 21908 2016-01-16 22:49 pom.xml
文件 3491 2014-07-31 12:42 proguard.conf
文件 0 2014-07-30 18:38 proguard.conf.bak
文件 42734 2016-09-08 17:26 readme.txt
文件 42453 2013-07-04 10:38 readme.txt.bak
文件 2359 2013-07-31 10:59 startup.bat
文件 304 2014-06-18 17:58 update.sql
文件 0 2013-07-09 14:37 utility.log
文件 543 2013-04-11 08:53 .settings\.jsdtscope
文件 180 2014-06-18 15:56 .settings\com.google.gdt.eclipse.core.prefs
文件 239 2013-06-13 10:58 .settings\org.eclipse.core.resources.prefs
文件 430 2013-04-10 23:07 .settings\org.eclipse.jdt.core.prefs
文件 90 2014-06-18 15:56 .settings\org.eclipse.m2e.core.prefs
文件 109 2013-04-10 23:07 .settings\org.eclipse.m2e.core.prefs.bak
文件 704 2014-06-18 15:56 .settings\org.eclipse.wst.common.component
文件 870 2014-06-18 15:54 .settings\org.eclipse.wst.common.component.bak
文件 252 2013-04-10 23:08 .settings\org.eclipse.wst.common.project.facet.core.xml
文件 49 2013-04-11 08:53 .settings\org.eclipse.wst.jsdt.ui.superType.container
文件 6 2013-04-11 08:53 .settings\org.eclipse.wst.jsdt.ui.superType.name
文件 50 2015-10-20 20:53 .settings\org.eclipse.wst.validation.prefs
文件 1298 2014-07-30 17:59 config\openkm-maven.pro
文件 75023 2015-05-12 15:03 ext-libs\common-toolkit-0.0.4-20130311.131623-1-sources.jar
文件 111979 2015-05-12 15:03 ext-libs\common-toolkit-0.0.4-20130311.131623-1.jar
文件 22667 2014-07-31 12:47 ext-libs\Copy (2) of pom.xml
文件 22195 2014-07-30 18:06 ext-libs\Copy of pom.xml
............此处省略2187个文件信息
评论
共有 条评论