用基于lucene的web项目实现的简单的搜索引擎，出现线程抛出的空指针异。

这个项目一共有五个java类，一个search.jsp，一个web.xml。问题在于在eclipse上加入tomcat后，在浏览器输入地址就会报下面截图上的错误，我觉得可能是建立索引和找索引有问题，但我不太了解这是怎么回事还有该怎么解决：
问题截图：
图片说明

代码全部：

 package sample.dw.paper.lucene.servlet;

import java.io.IOException;
import java.util.List;

import javax.servlet.RequestDispatcher;
import javax.servlet.ServletException;
import javax.servlet.http.HttpServlet;
import javax.servlet.http.HttpServletRequest;
import javax.servlet.http.HttpServletResponse;

import sample.dw.paper.lucene.search.SearchManager;

public class SearchController extends HttpServlet{

    /**
     * 
     */
    private static final long serialVersionUID = 1L;

    public void doGet(HttpServletRequest request,HttpServletResponse response)
            throws IOException, ServletException{
        doPost(request, response);
    }

    public void doPost(HttpServletRequest request,HttpServletResponse response)
            throws IOException,ServletException{

//      String searchWord = request.getParameter("searchWord");
        String searchWord = toChinese(request.getParameter("searchWord"));
        SearchManager searchManager = new SearchManager(searchWord);
        List searchResult = null;
        searchResult = searchManager.search();
        RequestDispatcher dispatcher = request.getRequestDispatcher("search.jsp");
        request.setAttribute("searchResult", searchResult);
        dispatcher.forward(request,response);
    }


    public static String toChinese(String strvalue){
        try {
            if(strvalue==null){
                return null;
            }else{
                strvalue = new String(strvalue.getBytes("ISO-8859-1"),"UTF-8");
                return strvalue;
            }
        } catch (Exception e) {
            // TODO: handle exception
            e.printStackTrace();
            return null;
        }
    }

}

 package sample.dw.paper.lucene.search;

import java.io.IOException;
import java.util.ArrayList;
import java.util.List;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.queryParser.ParseException;
import org.apache.lucene.queryParser.QueryParser;
import org.apache.lucene.search.Hits;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;

import sample.dw.paper.lucene.index.IndexManager;

public class SearchManager {
    private String searchWord;
    private IndexManager indexManager;
    private Analyzer analyzer;
    private IndexSearcher  indexSearcher;

    public SearchManager(String serachWord){
        this.searchWord = serachWord;
        this.indexManager = new IndexManager();
        this.analyzer = new StandardAnalyzer();


    }
    public List search(){
        List  searchResult = new ArrayList();

        if (false == indexManager.ifIndexExist()) {
            try {
                if (false == indexManager.createIndex()) {
                    return searchResult;
                }

            } catch (IOException e) {
                // TODO: handle exception
                e.printStackTrace();
                return searchResult;
            }

        }

         indexSearcher = null;

        try {
            indexSearcher = new IndexSearcher(indexManager.getIndexDir());
        } catch (IOException e) {
            // TODO: handle exceptio
            e.printStackTrace();
        }

        QueryParser queryParser = new QueryParser( "content",analyzer);
        Query query = null;
        try {
            query = queryParser.parse(searchWord);
        } catch (ParseException e) {
            // TODO: handle exception
            e.printStackTrace();
        }

        if( null !=query && null != indexSearcher){
            try {
                Hits hits=indexSearcher.search(query);    

                for(int i=0; i<hits.length();i++){
                    SearchResultBean resultBean = new SearchResultBean();
                    resultBean.setHtmlPath(hits.doc(i).get("path"));
                    resultBean.setHtmlTitle(hits.doc(i).get("title"));
                    searchResult.add(resultBean);
                }
            } catch (IOException e) {
                // TODO: handle exception
                e.printStackTrace();
            }
        }
        return searchResult;
    }
}

 package sample.dw.paper.lucene.search;

public class SearchResultBean {
    private String htmlPath;
    private String htmlTitle;

    public String getHtmlPath() {
        int startPos = htmlPath.indexOf("mirror")+6;
        String url=htmlPath;
        url = url.substring(startPos);
        url = url.replaceAll("\\\\","/");
        htmlPath = "http:"+url;
        return htmlPath;
    }
    public void setHtmlPath(String htmlPath) {
        this.htmlPath = htmlPath;
    }
    public String getHtmlTitle() {
        return htmlTitle;
    }
    public void setHtmlTitle(String htmlTitle) {
        this.htmlTitle = htmlTitle;
    }


}

 package sample.dw.paper.lucene.index;

import java.io.File;
import java.io.IOException;
import java.io.Reader;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;

import sample.dw.paper.lucene.util.HTMLDocParser;

public class IndexManager {

    public final String dataDir = "C:\\Users\\yang\\workspace\\graduation_project_heritrix\\jobs"+"\\csdn-20150423124021677\\mirror";
    public final String indexDir ="C:\\indexDir";

    public void ccreateIndex(File file,IndexWriter indexWriter)throws IOException{
        if(file.isDirectory()){
            File [] files =file.listFiles();
            for(int i=0 ; i<files.length; i++){
                ccreateIndex(files[i],indexWriter);
            }
        }else if(file.getAbsolutePath().endsWith(".html") || file.getAbsolutePath().endsWith(".htm")){
            String htmlPath = file.getAbsolutePath();
            addDocument(htmlPath,indexWriter);

        }
    }



    public boolean createIndex() throws IOException{
        if(true == ifIndexExist()){
            return true;
        }

        File dir = new File(dataDir);
        if(!dir.exists()){
            return false;
        }

        File[] htmls = dir.listFiles();
        Directory fsDirectory = FSDirectory.getDirectory(indexDir, true);
        Analyzer  analyzer    = new StandardAnalyzer();
        IndexWriter indexWriter = new IndexWriter(fsDirectory, analyzer, true);
        for(int i = 0; i < htmls.length; i++){
            String htmlPath = htmls[i].getAbsolutePath();

            if(htmlPath.endsWith(".html") || htmlPath.endsWith(".htm")){
          addDocument(htmlPath, indexWriter);
         }
        }
        indexWriter.optimize();
        indexWriter.close();
        return true;
//      Directory fsDirectory = FSDirectory.getDirectory(indexDir, true);
//      Analyzer analyzer = new StandardAnalyzer();
//      IndexWriter indexWriter  = new IndexWriter(fsDirectory,analyzer,true);
//      ccreateIndex(filee,indexWriter);
//      
//      indexWriter.close();
//      return true;

    }





    public void addDocument(String htmlPath,IndexWriter indexWriter) {
        /*HTMLDocParser htmlParser = new HTMLDocParser(htmlPath);
        String path = htmlParser.getPath();
        String title = htmlParser.getTitle();
        String content = htmlParser.getContent();
        //
        Document document = new Document();
        document.add(new Field(title,new StringReader(content)));
        indexWriter.addDocument(document);*/
        HTMLDocParser htmlParser = new HTMLDocParser(htmlPath);
        String path    = htmlParser.getPath();
        String title   = htmlParser.getTitle();
        Reader content = htmlParser.getContent();

        Document document = new Document();
        document.add(new Field("path",path,Field.Store.YES,Field.Index.NO));
        document.add(new Field("title",title,Field.Store.YES,Field.Index.TOKENIZED));
        document.add(new Field("content",content));
        try {
              indexWriter.addDocument(document);
            } catch (IOException e) {
              e.printStackTrace();
                                      }


    }

    public boolean ifIndexExist(){
        File directory = new File(indexDir);
        if(0 < directory.listFiles().length){
            return true;
        }else{
            return false;
        }
    }

    public String getDataDir(){
        return this.dataDir;
    }

    public String getIndexDir(){
        return this.indexDir;
    }


}

 package sample.dw.paper.lucene.util;

import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.Reader;
import java.io.UnsupportedEncodingException;

import org.apache.lucene.demo.html.HTMLParser;




public class HTMLDocParser {
     private String htmlPath;

        private HTMLParser htmlParser;

        public HTMLDocParser(String htmlPath){
            this.htmlPath = htmlPath;
            initHtmlParser();
        }

        private void initHtmlParser(){
            InputStream inputStream = null;
            try {
                inputStream = new FileInputStream(htmlPath);
            } catch (FileNotFoundException e) {
                e.printStackTrace();
            }
            if(null != inputStream){
             try {
                    htmlParser = new HTMLParser(new InputStreamReader(inputStream, "utf-8"));
                } catch (UnsupportedEncodingException e) {
                    e.printStackTrace();
                }
            }
        }

        public String getTitle(){
            if(null != htmlParser){
                try {
                    return htmlParser.getTitle();
                } catch (IOException e) {
                    e.printStackTrace();
                } catch (InterruptedException e) {
                    e.printStackTrace();
                }
            }
        return "";
        }

        public Reader getContent(){
        if(null != htmlParser){
                try {
                      return htmlParser.getReader();
                  } catch (IOException e) {
                      e.printStackTrace();
                  }
            }
            return null;
        }

        public String getPath(){
            return this.htmlPath;  
        }

}

写回答
好问题 0 提建议
关注问题
分享
邀请回答
编辑收藏删除
收藏举报

报告相同问题？

关注问题

solr教程，值得刚接触搜索开发人员一看
2016-09-12 20:14

LarryHai6的博客 Solr调研总结开发类型 ...本文介绍solr的功能使用及相关注意事项;...查询索引,和在查询中可以应用的高亮显示、拼写检查、搜索建议、分组统计、拼音检索等功能的使用方法。版本
Solr开发文档
2014-06-18 17:18

飞鸟up的博客 Solr 是一种可供企业使用的、基于 Lucene 的搜索服务器，它支持层面搜索、命中醒目显示和多种输出格式。在这篇文章中，将介绍 Solr 并展示如何轻松地将其表现优异的全文本搜索功能加入到 Web 应用程序中。开发环境...
使用 Apache Solr 实现更加灵巧的搜索
2011-10-04 16:24

dcb2008的博客 ... Solr 是一种可供企业使用的、基于 Lucene 的搜索服务器，它支持层面搜索、命中醒目显示和多种输出格式。在这篇分两部分的文章中，Lucene Java? 的提交人 Grant Ingersoll 将介绍 ...
JAVA面试题知识总结——JVM、多线程、线程池、高并发、事务、微服务、springcloud
2024-12-14 15:32

Java Development Kit的博客本文通过面试题的知识点方向，总结整合了有关JVM、多线程、线程池、高并发、事务相关的知识点，望对读友有用，本文很长，可以关注后每天看一个方向的知识点即可。
Solr简介
2025-02-06 16:26

涛粒子的博客下面给出两种分词器的安装方法，任选其一即可，推荐第一种，因为smartcn就在solr发行包的contrib/analysis-extras/lucene-libs/下，就是lucene-analyzers-smartcn-4.2.0.jar,首选在solrconfig.xml中加一句引用...
solr入门教程
2015-05-18 18:12

李大瑞的博客 Solr 本文介绍solr的功能使用及相关注意事项;主要包括以下内容:环境搭建及调试;...Solr它是一种开放源码的、基于 Lucene Java 的搜索服务器，易于加入到 Web 应用程序中。Solr 提供了层面搜索(就是统计)、命
JAVA上百实例源码以及开源项目
2017-01-11 23:13

GarfieldEr007的博客 Java圆形电子时钟源代码 1个目标文件内容索引:JAVA源码,系统相关,电子钟用JAVA编写的指针式圆形电子钟，效果图如下所示，其实代码很简单，希望对你有帮助。 Message-Driven Bean EJB实例源代码 2个目标文件摘要...
【转载】solr教程，值得刚接触搜索开发人员一看
2019-10-02 17:39

apple01010105的博客转载：http://blog.csdn.net/awj3584/article/details/16963525 Solr调研总结开发类型 ...本文介绍solr的功能使用及相关注意事项;主要包括以下内容:环境搭建及调试;两个核心配置文件介绍...
Java八股文总结（线程分布式）
2023-09-14 11:26

未来将会更加多变的博客 ThreadLocal作用于线程内独立的数据,线程访问同一个threadlocal内的不同map,key就是threadlocal val是各自线程存的值,get和set会调用currentThread()获取本线程的对象,底层用的ThreadLocalMap内的Entry,根据hash判断...
java面试题集中了好几篇的搜索的
2018-11-16 00:51

M_Jack的博客客户端发出http请求，web服务器将请求转发到servlet容器，servlet容器解析url并根据web.xml找到相对应的servlet，并将request、response对象传递给找到的servlet，servlet根据request就可以知道是谁发出的请求，请求...
没有解决我的问题, 去提问

码龄粉丝数原力等级 --

用基于lucene的web项目实现的简单的搜索引擎，出现线程抛出的空指针异。

0条回答默认最新

用基于lucene的web项目实现的简单的搜索引擎，出现线程抛出的空指针异。

0条回答 默认 最新

0条回答默认最新