zoukankan      html  css  js  c++  java
  • PyLucene检索demo

    # coding: utf-8
    import lucene
    
    indexDir = './index'
    query = 'zhongguo'
    lucene.initVM()
    print 'lucene', lucene.VERSION
    #索引的存放位置
    indir = lucene.SimpleFSDirectory(lucene.File(indexDir))
    #分词器
    analyzer = lucene.StandardAnalyzer(lucene.Version.LUCENE_CURRENT)
    #检索器
    searcher = lucene.IndexSearcher(indir)
    
    while True:
        print  "输入搜索词(空或者q或者quit退出)"
        keyword = raw_input('Query:').strip()
        if keyword in ('','q','quit'):
            break
        print '查询',keyword
        query = lucene.QueryParser(lucene.Version.LUCENE_CURRENT, 'contents', analyzer).parse(keyword)
        
       #开始搜索
        hits = searcher.search(query,100)
        print '搜索到的结果数为:', hits.totalHits
    
        for hit in hits.scoreDocs:
            print 'Hit Score:',hit.score, ' Hit Doc:', hit.doc, ' HitString:', hit.toString()
    
            doc = searcher.doc(hit.doc)
            #print doc
            print 'path:',doc.get('path').encode('utf-8')
            print 'name:',doc.get('name')
    
        
        
    

      

  • 相关阅读:
    学习Timer定时器
    C++ 延时等待(sleep/timer/wait)
    MFC学习问题总结
    node.js
    总结
    关于Windows
    关于数组
    每周一次
    每周一次
    每周一次
  • 原文地址:https://www.cnblogs.com/TianMG/p/3191680.html
Copyright © 2011-2022 走看看