کتابخانه ی جستجوی متن آپاچی لوسن

بعد از آماده‌سازی Document باید آن را توسط کلاس IndexWriter در ایندکس ذخیره
کنیم. پارامتر اول در سازندهٔ IndexWriter دایرکتوری ذخیره‌سازی ایندکس
را مشخص می‌کند.
با کدهای زیر چند عبارت را در حافظه دسترسی تصادفی (RAM) ذخیره کردیم:

کد:
// Store the index in a RAMDirectory instead of on disk.
Directory index = new RAMDirectory();

// The writer configuration names the Lucene version and the analyzer;
// `analyzer` is declared outside this snippet.
IndexWriterConfig config = new IndexWriterConfig(Version.LUCENE_36, analyzer);
IndexWriter w = new IndexWriter(index, config);

// Add one document per title (see addDoc).
addDoc(w, "Lucene in Action");
addDoc(w, "Lucene for Dummies");
addDoc(w, "Managing Gigabytes");
addDoc(w, "The Art of Computer Science");

// Close the writer once every document has been added.
w.close();

متد addDoc رشته‌ها را به ایندکس اضافه می کند:

کد:
private static void addDoc(IndexWriter w, String value) throws IOException {    Document doc = new Document();    doc.add(new Field("title", value, Field.Store.YES, Field.Index.ANALYZED));    w.addDocument(doc);  }}

مرحله دوم: ایجاد کوئری (Query)
در این برنامه عبارت مورد نظر برای جستجو را از آرگومان خط فرمان (args[0]) دریافت می‌کنیم و اگر آرگومانی داده نشده باشد، مقدار پیش‌فرض «lucene» به کار می‌رود:

کد:
// Use the first command-line argument as the query text, or "lucene" when
// no argument was given.
String queryStr = args.length > 0 ? args[0] : "lucene";

// "title" is the field name handed to the parser; `analyzer` is declared
// outside this snippet.
Query q = new QueryParser(Version.LUCENE_36, "title", analyzer).parse(queryStr);

مرحله سوم: انجام جستجو
در این مرحله کوئری (جستار) ساخته‌شده را بر روی ایندکس اجرا می‌کنیم.
همچنین از کلاس TopScoreDocCollector برای به‌دست آوردن ۱۰ نتیجهٔ
مرتبط‌تر استفاده کرده‌ایم:

کد:
// Number of hits the collector is asked to keep.
int hitsPerPage = 10;

// Open a reader on the index built earlier and wrap it in a searcher.
IndexReader reader = IndexReader.open(index);
IndexSearcher searcher = new IndexSearcher(reader);

// Run the query through a top-score collector and pull out the hits.
TopScoreDocCollector collector = TopScoreDocCollector.create(hitsPerPage, true);
searcher.search(q, collector);
ScoreDoc[] hits = collector.topDocs().scoreDocs;

مرحله چهارم: مشاهده نتایج
در انتها نتایج بدست آمده را نمایش می‌دهیم:

کد:
// Print the hit count, then one numbered line per hit with its stored title.
System.out.println("Found " + hits.length + " hits.");
for (int rank = 0; rank < hits.length; rank++) {
    // Load the stored document behind this hit by its document id.
    Document match = searcher.doc(hits[rank].doc);
    System.out.println((rank + 1) + ". " + match.get("title"));
}

همین!

کلاس HelloLucene
در زیر کلاس HelloLucene را یکجا مشاهده می فرمایید:

کد:
import java.io.IOException; import org.apache.lucene.analysis.standard.StandardAnalyzer;import org.apache.lucene.document.Document;import org.apache.lucene.document.Field;import org.apache.lucene.index.IndexReader;import org.apache.lucene.index.IndexWriter;import org.apache.lucene.index.IndexWriterConfig;import org.apache.lucene.queryParser.ParseException;import org.apache.lucene.queryParser.QueryParser;import org.apache.lucene.search.*;import org.apache.lucene.store.Directory;import org.apache.lucene.store.RAMDirectory;import org.apache.lucene.util.Version; public class HelloLucene {    public static void main(String[] args) throws IOException, ParseException {        // 0. Specify the analyzer for tokenizing text.        //    The same analyzer should be used for indexing and searching        StandardAnalyzer analyzer = new StandardAnalyzer(Version.LUCENE_36);         // 1. create the index        Directory index = new RAMDirectory();         IndexWriterConfig config = new IndexWriterConfig(Version.LUCENE_36, analyzer);         IndexWriter w = new IndexWriter(index, config);        addDoc(w, "Lucene in Action");        addDoc(w, "Lucene for Dummies");        addDoc(w, "Managing Gigabytes");        addDoc(w, "The Art of Computer Science");        w.close();         // 2. query        String queryStr = args.length > 0 ? args[0] : "lucene";         // the "title" arg specifies the default field to use        // when no field is explicitly specified in the query.        Query q = new QueryParser(Version.LUCENE_35, "title", analyzer).parse(queryStr);         // 3. search        int hitsPerPage = 10;        IndexReader reader = IndexReader.open(index);        IndexSearcher searcher = new IndexSearcher(reader);        TopScoreDocCollector collector = TopScoreDocCollector.create(hitsPerPage, true);        searcher.search(q, collector);        ScoreDoc[] hits = collector.topDocs().scoreDocs;         // 4. 
display results        System.out.println("Found " + hits.length + " hits.");        for (int i = 0; i < hits.length; ++i) {            int docId = hits[i].doc;            Document d = searcher.doc(docId);            System.out.println((i + 1) + ". " + d.get("title"));        }         // searcher can only be closed when there        // is no need to access the documents any more.        searcher.close();    }     private static void addDoc(IndexWriter w, String value) throws IOException {        Document doc = new Document();        doc.add(new Field("title", value, Field.Store.YES, Field.Index.ANALYZED));        w.addDocument(doc);    }}

منابع

شاد و پیروز باشید