org.apache.lucene.analysis.WhitespaceAnalyzer Java Examples
The following examples show how to use
org.apache.lucene.analysis.WhitespaceAnalyzer.
You can vote up the ones you like or vote down the ones you don't like,
and go to the original project or source file by following the links above each example. You may check out the related API usage on the sidebar.
Example #1
Source File: AbstractIndexManager.java From webdsl with Apache License 2.0 | 6 votes |
protected static boolean clearIndex(File path) { try { if (path == null || !path.exists()) return true; // if path doesnt exist, then there is nothing to // clear FSDirectory indexDir = new FSDirectoryProvider().getDirectory(); IndexWriter writer = new IndexWriter(indexDir.open(path), new IndexWriterConfig(Version.LUCENE_CURRENT, new WhitespaceAnalyzer(Version.LUCENE_CURRENT))); writer.deleteAll(); writer.close(); return true; } catch (Exception ex) { org.webdsl.logging.Logger.error( "Error while clearing index on location: " + path, ex); return false; } }
Example #2
Source File: AutoCompleter.java From webdsl with Apache License 2.0 | 6 votes |
/** * Use a different index as the auto completer index or re-open * the existing index if <code>autocompleteIndex</code> is the same value * as given in the constructor. * @param autocompleteIndexDir the autocomplete directory to use * @throws AlreadyClosedException if the Autocompleter is already closed * @throws IOException if autocompleter can not open the directory */ // TODO: we should make this final as it is called in the constructor public void setAutoCompleteIndex(Directory autocompleteIndexDir) throws IOException { // this could be the same directory as the current autocompleteIndex // modifications to the directory should be synchronized synchronized (modifyCurrentIndexLock) { ensureOpen(); if (!IndexReader.indexExists(autocompleteIndexDir)) { IndexWriter writer = new IndexWriter(autocompleteIndexDir, new IndexWriterConfig(Version.LUCENE_CURRENT, new WhitespaceAnalyzer(Version.LUCENE_CURRENT))); writer.close(); } swapSearcher(autocompleteIndexDir); } }
Example #3
Source File: DocumentUtil.java From netbeans with Apache License 2.0 | 5 votes |
public static Analyzer createAnalyzer() { final PerFieldAnalyzerWrapper analyzer = new PerFieldAnalyzerWrapper(new KeywordAnalyzer()); analyzer.addAnalyzer(DocumentUtil.FIELD_IDENTS, new WhitespaceAnalyzer()); analyzer.addAnalyzer(DocumentUtil.FIELD_FEATURE_IDENTS, new WhitespaceAnalyzer()); analyzer.addAnalyzer(DocumentUtil.FIELD_CASE_INSENSITIVE_FEATURE_IDENTS, new DocumentUtil.LCWhitespaceAnalyzer()); return analyzer; }
Example #4
Source File: AutoCompleter.java From webdsl with Apache License 2.0 | 5 votes |
/** * Removes all terms from the auto complete index. * @throws IOException * @throws AlreadyClosedException if the Autocompleter is already closed */ public void clearIndex() throws IOException { synchronized (modifyCurrentIndexLock) { ensureOpen(); final Directory dir = this.autoCompleteIndex; final IndexWriter writer = new IndexWriter(dir, new IndexWriterConfig( Version.LUCENE_CURRENT, new WhitespaceAnalyzer(Version.LUCENE_CURRENT)) .setOpenMode(OpenMode.CREATE)); writer.close(); swapSearcher(dir); } }
Example #5
Source File: AutoCompleter.java From webdsl with Apache License 2.0 | 5 votes |
/** * Indexes the data from the given reader. * @param reader Source index reader, from which autocomplete words are obtained for the defined field * @param field the field of the source index reader to index for autocompletion * @param mergeFactor mergeFactor to use when indexing * @param ramMB the max amount or memory in MB to use * @param optimize whether or not the autocomplete index should be optimized * @throws AlreadyClosedException if the Autocompleter is already closed * @throws IOException */ public final void indexDictionary(IndexReader reader, String field, int mergeFactor, int ramMB, boolean optimize) throws IOException { synchronized (modifyCurrentIndexLock) { ensureOpen(); final Directory dir = this.autoCompleteIndex; final Dictionary dict = new LuceneDictionary(reader, field); final IndexWriter writer = new IndexWriter(dir, new IndexWriterConfig(Version.LUCENE_CURRENT, new WhitespaceAnalyzer(Version.LUCENE_CURRENT)).setRAMBufferSizeMB(ramMB)); IndexSearcher indexSearcher = obtainSearcher(); final List<IndexReader> readers = new ArrayList<IndexReader>(); if (searcher.maxDoc() > 0) { ReaderUtil.gatherSubReaders(readers, searcher.getIndexReader()); } //clear the index writer.deleteAll(); try { Iterator<String> iter = dict.getWordsIterator(); while (iter.hasNext()) { String word = iter.next(); // ok index the word Document doc = createDocument(word, reader.docFreq(new Term(field, word))); writer.addDocument(doc); } } finally { releaseSearcher(indexSearcher); } // close writer if (optimize) writer.optimize(); writer.close(); // also re-open the autocomplete index to see our own changes when the next suggestion // is fetched: swapSearcher(dir); } }
Example #6
Source File: left_TestSpans_1.3.java From gumtree-spoon-ast-diff with Apache License 2.0 | 5 votes |
public void setUp() throws Exception { RAMDirectory directory = new RAMDirectory(); IndexWriter writer= new IndexWriter(directory, new WhitespaceAnalyzer(), true); StringBuffer buffer = new StringBuffer(); for (int i = 0; i < docFields.length; i++) { Document doc = new Document(); doc.add(Field.Text(field, docFields[i])); writer.addDocument(doc); } writer.close(); searcher = new IndexSearcher(directory); }
Example #7
Source File: right_TestSpans_1.4.java From gumtree-spoon-ast-diff with Apache License 2.0 | 5 votes |
public void setUp() throws Exception { RAMDirectory directory = new RAMDirectory(); IndexWriter writer= new IndexWriter(directory, new WhitespaceAnalyzer(), true); for (int i = 0; i < docFields.length; i++) { Document doc = new Document(); doc.add(Field.Text(field, docFields[i])); writer.addDocument(doc); } writer.close(); searcher = new IndexSearcher(directory); }
Example #8
Source File: TestCloseSessionDuringFTGS.java From imhotep with Apache License 2.0 | 4 votes |
@Test public void testCloseSessionDuringFTGS() throws ImhotepOutOfMemoryException, IOException, InterruptedException { String tempDir = Files.getTempDirectory("asdf", ""); try { IndexWriter w = new IndexWriter(tempDir, new WhitespaceAnalyzer(), true, IndexWriter.MaxFieldLength.LIMITED); Random rand = new Random(); for (int i = 0; i < 1000000; ++i) { int numTerms = rand.nextInt(5) + 5; Document doc = new Document(); for (int t = 0; t < numTerms; ++t) { doc.add(new Field("sf1", Integer.toString(rand.nextInt(10000)), Field.Store.NO, Field.Index.NOT_ANALYZED_NO_NORMS)); } w.addDocument(doc); } w.close(); final AtomicBoolean closed = new AtomicBoolean(false); FlamdexReader r = new LuceneFlamdexReader(IndexReader.open(tempDir)) { @Override public void close() throws IOException { super.close(); closed.set(true); } }; final ExecutorService executor = Executors.newCachedThreadPool(); try { ImhotepSession session = new MTImhotepMultiSession(new ImhotepLocalSession[] { new ImhotepLocalSession(r) }, new MemoryReservationContext( new ImhotepMemoryPool( Long.MAX_VALUE)), executor, null); // FTGSIterator iter = session.getFTGSIterator(new String[]{}, new String[]{"sf1"}); //TODO fix this session.close(); assertTrue(closed.get()); } finally { executor.shutdown(); } } finally { Files.delete(tempDir); } }