LuceneSearch.java example

Explorer

zeppelin-master
- alluxio
  - src
    - main
      - java
        org
        apache
        zeppelin
        alluxio
        AlluxioInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        alluxio
        AlluxioInterpreterTest.java
- angular
  - src
    - main
      - java
        org
        apache
        zeppelin
        angular
        AngularInterpreter.java
- beam
  - src
    - main
      - java
        org
        apache
        zeppelin
        beam
        BeamInterpreter.java
        StaticRepl.java
      - test
        org
        apache
        zeppelin
        beam
        BeamInterpreterTest.java
- bigquery
  - src
    - main
      - java
        org
        apache
        zeppelin
        bigquery
        BigQueryInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        bigquery
        BigQueryInterpreterTest.java
- cassandra
  - src
    - main
      - java
        org
        apache
        zeppelin
        cassandra
        CassandraInterpreter.java
        ParsingException.java
    - test
      - java
        org
        apache
        zeppelin
        cassandra
        CassandraInterpreterTest.java
        InterpreterLogicTest.java
- elasticsearch
  - src
    - main
      - java
        org
        apache
        zeppelin
        elasticsearch
        ElasticsearchInterpreter.java
        action
        ActionException.java
        ActionResponse.java
        AggWrapper.java
        HitWrapper.java
        client
        ElasticsearchClient.java
        HttpBasedClient.java
        TransportBasedClient.java
    - test
      - java
        org
        apache
        zeppelin
        elasticsearch
        ElasticsearchInterpreterTest.java
- file
  - src
    - main
      - java
        org
        apache
        zeppelin
        file
        FileInterpreter.java
        HDFSCommand.java
        HDFSFileInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        file
        HDFSFileInterpreterTest.java
- flink
  - src
    - main
      - java
        org
        apache
        zeppelin
        flink
        FlinkInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        flink
        FlinkInterpreterTest.java
- geode
  - src
    - main
      - java
        org
        apache
        zeppelin
        geode
        GeodeOqlInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        geode
        GeodeOqlInterpreterTest.java
- groovy
  - src
    - main
      - java
        org
        apache
        zeppelin
        groovy
        GObject.java
        GroovyInterpreter.java
- hbase
  - src
    - main
      - java
        org
        apache
        zeppelin
        hbase
        HbaseInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        hbase
        HbaseInterpreterTest.java
- helium-dev
  - src
    - main
      - java
        org
        apache
        zeppelin
        helium
        DevInterpreter.java
        ZeppelinApplicationDevServer.java
        ZeppelinDevServer.java
- ignite
  - src
    - main
      - java
        org
        apache
        zeppelin
        ignite
        IgniteInterpreter.java
        IgniteInterpreterUtils.java
        IgniteSqlInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        ignite
        IgniteInterpreterTest.java
        IgniteSqlInterpreterTest.java
        Person.java
- jdbc
  - src
    - main
      - java
        org
        apache
        zeppelin
        jdbc
        JDBCInterpreter.java
        JDBCUserConfigurations.java
        SqlCompleter.java
        security
        JDBCSecurityImpl.java
    - test
      - java
        org
        apache
        zeppelin
        jdbc
        JDBCInterpreterTest.java
        SqlCompleterTest.java
- kylin
  - src
    - main
      - java
        org
        apache
        zeppelin
        kylin
        KylinInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        kylin
        KylinInterpreterTest.java
- lens
  - src
    - main
      - java
        org
        apache
        zeppelin
        lens
        ExecutionDetail.java
        LensBootstrap.java
        LensInterpreter.java
        LensJLineShellComponent.java
        LensSimpleExecutionStrategy.java
    - test
      - java
        org
        apache
        zeppelin
        lens
        LensInterpreterTest.java
- livy
  - src
    - main
      - java
        org
        apache
        zeppelin
        livy
        APINotFoundException.java
        BaseLivyInterpreter.java
        LivyException.java
        LivyPySpark3Interpreter.java
        LivyPySparkBaseInterpreter.java
        LivyPySparkInterpreter.java
        LivySparkInterpreter.java
        LivySparkRInterpreter.java
        LivySparkSQLInterpreter.java
        LivyVersion.java
        SessionNotFoundException.java
    - test
      - java
        org
        apache
        zeppelin
        livy
        LivyInterpreterIT.java
        LivySQLInterpreterTest.java
- markdown
  - src
    - main
      - java
        org
        apache
        zeppelin
        markdown
        Markdown.java
        Markdown4jParser.java
        MarkdownParser.java
        ParamVar.java
        PegdownParser.java
        PegdownWebSequencelPlugin.java
        PegdownYumlPlugin.java
    - test
      - java
        org
        apache
        zeppelin
        markdown
        Markdown4jParserTest.java
        PegdownParserTest.java
- pig
  - src
    - main
      - java
        org
        apache
        zeppelin
        pig
        BasePigInterpreter.java
        PigInterpreter.java
        PigQueryInterpreter.java
        PigScriptListener.java
        PigUtils.java
    - test
      - java
        org
        apache
        zeppelin
        pig
        PigInterpreterTest.java
        PigInterpreterTezTest.java
        PigQueryInterpreterTest.java
- python
  - src
    - main
      - java
        org
        apache
        zeppelin
        python
        PythonCondaInterpreter.java
        PythonDockerInterpreter.java
        PythonInterpreter.java
        PythonInterpreterPandasSql.java
    - test
      - java
        org
        apache
        zeppelin
        python
        PythonCondaInterpreterTest.java
        PythonDockerInterpreterTest.java
        PythonInterpreterMatplotlibTest.java
        PythonInterpreterPandasSqlTest.java
        PythonInterpreterTest.java
- r
  - src
    - main
      - java
        org
        apache
        zeppelin
        rinterpreter
        KnitR.java
        RRepl.java
        RStatics.java
- scalding
  - src
    - main
      - java
        org
        apache
        zeppelin
        scalding
        ScaldingInterpreter.java
    - test
      - java
        org
        apache
        zeppelin
        scalding
        ScaldingInterpreterTest.java
- scio
  - src
    - test
      - java
        org
        apache
        zeppelin
        scio
        ScioInterpreterTest.java
- shell
  - src
    - main
      - java
        org
        apache
        zeppelin
        shell
        ShellInterpreter.java
        security
        ShellSecurityImpl.java
    - test
      - java
        org
        apache
        zeppelin
        shell
        ShellInterpreterTest.java
- spark
  - src
    - main
      - java
        org
        apache
        zeppelin
        spark
        DepInterpreter.java
        PySparkInterpreter.java
        SparkInterpreter.java
        SparkRInterpreter.java
        SparkSqlInterpreter.java
        SparkVersion.java
        SparkZeppelinContext.java
        Utils.java
        ZeppelinR.java
        ZeppelinRContext.java
        dep
        SparkDependencyContext.java
        SparkDependencyResolver.java
    - test
      - java
        org
        apache
        zeppelin
        spark
        DepInterpreterTest.java
        PySparkInterpreterMatplotlibTest.java
        PySparkInterpreterTest.java
        SparkInterpreterTest.java
        SparkSqlInterpreterTest.java
        SparkVersionTest.java
        dep
        SparkDependencyResolverTest.java
- zeppelin-examples
  - zeppelin-example-clock
    - src
      - main
        java
        org
        apache
        zeppelin
        example
        app
        clock
        Clock.java
- zeppelin-interpreter
  - src
    - main
      - java
        org
        apache
        zeppelin
        annotation
        Experimental.java
        ZeppelinApi.java
        completer
        CompletionType.java
        StringsCompleter.java
        dep
        AbstractDependencyResolver.java
        Booter.java
        Dependency.java
        DependencyContext.java
        DependencyResolver.java
        Repository.java
        RepositoryListener.java
        RepositorySystemFactory.java
        TransferListener.java
        display
        AngularObject.java
        AngularObjectListener.java
        AngularObjectRegistry.java
        AngularObjectRegistryListener.java
        AngularObjectWatcher.java
        GUI.java
        Input.java
        OldInput.java
        RuntimeTypeAdapterFactory.java
        ui
        CheckBox.java
        OptionInput.java
        Select.java
        TextBox.java
        helium
        Application.java
        ApplicationContext.java
        ApplicationEventListener.java
        ApplicationException.java
        ApplicationLoader.java
        ClassLoaderApplication.java
        HeliumAppAngularObjectRegistry.java
        HeliumPackage.java
        HeliumType.java
        SpellPackageInfo.java
        interpreter
        BaseZeppelinContext.java
        ClassloaderInterpreter.java
        Constants.java
        Interpreter.java
        InterpreterContext.java
        InterpreterContextRunner.java
        InterpreterException.java
        InterpreterGroup.java
        InterpreterHookListener.java
        InterpreterHookRegistry.java
        InterpreterOption.java
        InterpreterOutput.java
        InterpreterOutputChangeListener.java
        InterpreterOutputChangeWatcher.java
        InterpreterOutputListener.java
        InterpreterProperty.java
        InterpreterPropertyBuilder.java
        InterpreterResult.java
        InterpreterResultMessage.java
        InterpreterResultMessageOutput.java
        InterpreterResultMessageOutputListener.java
        InterpreterRunner.java
        InterpreterUtils.java
        LazyOpenInterpreter.java
        RemoteWorksController.java
        RemoteZeppelinServerResource.java
        ResultMessages.java
        WrappedInterpreter.java
        remote
        AppendOutputBuffer.java
        AppendOutputRunner.java
        ClientFactory.java
        InterpreterContextRunnerPool.java
        InvokeResourceMethodEventMessage.java
        RemoteAngularObject.java
        RemoteEventClient.java
        RemoteEventClientWrapper.java
        RemoteInterpreterContextRunner.java
        RemoteInterpreterEventClient.java
        RemoteInterpreterEventPoller.java
        RemoteInterpreterProcess.java
        RemoteInterpreterProcessListener.java
        RemoteInterpreterServer.java
        RemoteInterpreterUtils.java
        thrift
        InterpreterCompletion.java
        RemoteApplicationResult.java
        RemoteInterpreterContext.java
        RemoteInterpreterEvent.java
        RemoteInterpreterEventType.java
        RemoteInterpreterResult.java
        RemoteInterpreterResultMessage.java
        RemoteInterpreterService.java
        ZeppelinServerResourceParagraphRunner.java
        util
        InterpreterOutputStream.java
        LogOutputStream.java
        resource
        ByteBufferInputStream.java
        DistributedResourcePool.java
        LocalResourcePool.java
        RemoteResource.java
        Resource.java
        ResourceId.java
        ResourcePool.java
        ResourcePoolConnector.java
        ResourcePoolUtils.java
        ResourceSet.java
        WellKnownResourceName.java
        scheduler
        ExecutorFactory.java
        FIFOScheduler.java
        Job.java
        JobListener.java
        JobProgressPoller.java
        ParallelScheduler.java
        RemoteScheduler.java
        Scheduler.java
        SchedulerFactory.java
        SchedulerListener.java
        tabledata
        ColumnDef.java
        InterpreterResultTableData.java
        ProxyRowIterator.java
        Row.java
        TableData.java
        TableDataException.java
        TableDataProxy.java
        user
        AuthenticationInfo.java
        Credentials.java
        CredentialsInfoSaving.java
        UserCredentials.java
        UsernamePassword.java
    - test
      - java
        org
        apache
        zeppelin
        dep
        BooterTest.java
        DependencyResolverTest.java
        display
        AngularObjectRegistryTest.java
        AngularObjectTest.java
        GUITest.java
        InputTest.java
        helium
        ApplicationLoaderTest.java
        HeliumPackageTest.java
        MockApplication1.java
        interpreter
        DummyInterpreter.java
        InterpreterContextTest.java
        InterpreterHookRegistryTest.java
        InterpreterOutputChangeWatcherTest.java
        InterpreterOutputTest.java
        InterpreterResultTest.java
        InterpreterTest.java
        LazyOpenInterpreterTest.java
        remote
        RemoteInterpreterServerTest.java
        resource
        LocalResourcePoolTest.java
        ResourceSetTest.java
        ResourceTest.java
        scheduler
        FIFOSchedulerTest.java
        ParallelSchedulerTest.java
        SleepingJob.java
        tabledata
        InterpreterResultTableDataTest.java
        TableDataProxyTest.java
        user
        CredentialsTest.java
- zeppelin-server
  - src
    - main
      - java
        org
        apache
        zeppelin
        json
        NotebookTypeAdapterFactory.java
        realm
        ActiveDirectoryGroupRealm.java
        LdapGroupRealm.java
        LdapRealm.java
        PamRealm.java
        UserPrincipal.java
        ZeppelinHubRealm.java
        rest
        ConfigurationsRestApi.java
        CredentialRestApi.java
        GetUserList.java
        HeliumRestApi.java
        InterpreterRestApi.java
        LoginRestApi.java
        NotebookRepoRestApi.java
        NotebookResponse.java
        NotebookRestApi.java
        SecurityRestApi.java
        ZeppelinRestApi.java
        exception
        BadRequestException.java
        ForbiddenException.java
        NotFoundException.java
        message
        CronRequest.java
        NewInterpreterSettingRequest.java
        NewNoteRequest.java
        NewParagraphRequest.java
        NotebookRepoSettingsRequest.java
        RestartInterpreterRequest.java
        RunParagraphWithParametersRequest.java
        UpdateInterpreterSettingRequest.java
        server
        CorsFilter.java
        JsonExclusionStrategy.java
        JsonResponse.java
        ZeppelinServer.java
        socket
        NotebookServer.java
        NotebookSocket.java
        NotebookSocketListener.java
        NotebookWebSocketCreator.java
        types
        InterpreterSettingsList.java
        utils
        CommandLineUtils.java
        ExceptionUtils.java
        InterpreterBindingUtils.java
        SecurityUtils.java
    - test
      - java
        com
        webautomation
        ScreenCaptureHtmlUnitDriver.java
        org
        apache
        zeppelin
        AbstractZeppelinIT.java
        CommandExecutor.java
        ProcessData.java
        WebDriverManager.java
        ZeppelinITUtils.java
        display
        AngularObjectBuilder.java
        integration
        AuthenticationIT.java
        InterpreterIT.java
        ParagraphActionsIT.java
        SparkParagraphIT.java
        ZeppelinIT.java
        interpreter
        mock
        MockInterpreter1.java
        realm
        PamRealmTest.java
        rest
        AbstractTestRestApi.java
        ConfigurationsRestApiTest.java
        CredentialsRestApiTest.java
        InterpreterRestApiTest.java
        NotebookRepoRestApiTest.java
        NotebookRestApiTest.java
        NotebookSecurityRestApiTest.java
        SecurityRestApiTest.java
        ZeppelinRestApiTest.java
        ZeppelinSparkClusterTest.java
        security
        DirAccessTest.java
        SecurityUtilsTest.java
        server
        CorsFilterTest.java
        socket
        NotebookServerTest.java
        ticket
        TicketContainerTest.java
- zeppelin-zengine
  - src
    - main
      - java
        org
        apache
        zeppelin
        conf
        ZeppelinConfiguration.java
        helium
        Helium.java
        HeliumApplicationFactory.java
        HeliumBundleFactory.java
        HeliumConf.java
        HeliumLocalRegistry.java
        HeliumOnlineRegistry.java
        HeliumPackageSearchResult.java
        HeliumPackageSuggestion.java
        HeliumRegistry.java
        HeliumRegistrySerializer.java
        NpmPackage.java
        WebpackResult.java
        interpreter
        InterpreterFactory.java
        InterpreterGroupFactory.java
        InterpreterInfo.java
        InterpreterInfoSaving.java
        InterpreterSetting.java
        InterpreterSettingManager.java
        install
        InstallInterpreter.java
        remote
        RemoteAngularObjectRegistry.java
        RemoteInterpreter.java
        RemoteInterpreterManagedProcess.java
        RemoteInterpreterRunningProcess.java
        notebook
        ApplicationState.java
        Folder.java
        FolderListener.java
        FolderView.java
        JobListenerFactory.java
        Note.java
        NoteEventListener.java
        NoteInfo.java
        NoteNameListener.java
        Notebook.java
        NotebookAuthorization.java
        NotebookAuthorizationInfoSaving.java
        NotebookEventListener.java
        NotebookImportDeserializer.java
        Paragraph.java
        ParagraphJobListener.java
        ParagraphRuntimeInfo.java
        repo
        AzureNotebookRepo.java
        GitNotebookRepo.java
        MongoNotebookRepo.java
        NotebookRepo.java
        NotebookRepoSettingsInfo.java
        NotebookRepoSync.java
        NotebookRepoWithSettings.java
        S3NotebookRepo.java
        VFSNotebookRepo.java
        zeppelinhub
        ZeppelinHubRepo.java
        model
        Instance.java
        UserSessionContainer.java
        UserTokenContainer.java
        rest
        HttpProxyClient.java
        ZeppelinhubRestApiHandler.java
        security
        Authentication.java
        websocket
        Client.java
        ZeppelinClient.java
        ZeppelinhubClient.java
        listener
        WatcherWebsocket.java
        ZeppelinWebsocket.java
        ZeppelinhubWebsocket.java
        protocol
        ZeppelinHubOp.java
        ZeppelinhubMessage.java
        scheduler
        SchedulerService.java
        ZeppelinHeartbeat.java
        ZeppelinHubHeartbeat.java
        session
        ZeppelinhubSession.java
        utils
        ZeppelinhubUtils.java
        socket
        Message.java
        WatcherMessage.java
        utility
        IdHashes.java
        search
        LuceneSearch.java
        SearchService.java
        ticket
        TicketContainer.java
        util
        Util.java
        WatcherSecurityKey.java
    - test
      - java
        org
        apache
        zeppelin
        conf
        ZeppelinConfigurationTest.java
        display
        AngularObjectBuilder.java
        helium
        HeliumApplicationFactoryTest.java
        HeliumBundleFactoryTest.java
        HeliumLocalRegistryTest.java
        HeliumTest.java
        HeliumTestApplication.java
        HeliumTestRegistry.java
        interpreter
        InterpreterFactoryTest.java
        InterpreterSettingTest.java
        install
        InstallInterpreterTest.java
        mock
        MockInterpreter1.java
        MockInterpreter11.java
        MockInterpreter2.java
        remote
        AppendOutputRunnerTest.java
        RemoteAngularObjectTest.java
        RemoteInterpreterEventPollerTest.java
        RemoteInterpreterOutputTestStream.java
        RemoteInterpreterProcessTest.java
        RemoteInterpreterTest.java
        RemoteInterpreterUtilsTest.java
        mock
        MockInterpreterA.java
        MockInterpreterAngular.java
        MockInterpreterB.java
        MockInterpreterEnv.java
        MockInterpreterOutputStream.java
        MockInterpreterResourcePool.java
        notebook
        FolderTest.java
        FolderViewTest.java
        NoteInterpreterLoaderTest.java
        NoteTest.java
        NotebookTest.java
        ParagraphTest.java
        repo
        GitNotebookRepoTest.java
        NotebookRepoSyncInitializationTest.java
        NotebookRepoSyncTest.java
        VFSNotebookRepoTest.java
        mock
        VFSNotebookRepoMock.java
        zeppelinhub
        ZeppelinHubRepoTest.java
        websocket
        ZeppelinClientTest.java
        ZeppelinhubClientTest.java
        mock
        MockEchoWebsocketServer.java
        MockEventServlet.java
        MockEventSocket.java
        protocol
        ZeppelinhubMessageTest.java
        resource
        DistributedResourcePoolTest.java
        scheduler
        RemoteSchedulerTest.java
        search
        LuceneSearchTest.java

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.zeppelin.search;

import java.io.IOException;
import java.util.Collection;
import java.util.Collections;
import java.util.Date;
import java.util.List;
import java.util.Map;
import java.util.concurrent.TimeUnit;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.LongField;
import org.apache.lucene.document.StringField;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.Term;
import org.apache.lucene.queryparser.classic.MultiFieldQueryParser;
import org.apache.lucene.queryparser.classic.ParseException;
import org.apache.lucene.queryparser.classic.QueryParser;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.WildcardQuery;
import org.apache.lucene.search.highlight.Highlighter;
import org.apache.lucene.search.highlight.InvalidTokenOffsetsException;
import org.apache.lucene.search.highlight.QueryScorer;
import org.apache.lucene.search.highlight.SimpleHTMLFormatter;
import org.apache.lucene.search.highlight.TextFragment;
import org.apache.lucene.search.highlight.TokenSources;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.RAMDirectory;
import org.apache.zeppelin.notebook.Note;
import org.apache.zeppelin.notebook.Paragraph;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import com.google.common.base.Joiner;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.Lists;

/**
 * Search (both, indexing and query) the notebooks using Lucene.
 *
 * Query is thread-safe, as creates new IndexReader every time.
 * Index is thread-safe, as re-uses single IndexWriter, which is thread-safe.
 */
public class LuceneSearch implements SearchService {
  private static final Logger LOG = LoggerFactory.getLogger(LuceneSearch.class);

  private static final String SEARCH_FIELD_TEXT = "contents";
  private static final String SEARCH_FIELD_TITLE = "header";
  static final String PARAGRAPH = "paragraph";
  static final String ID_FIELD = "id";

  Directory ramDirectory;
  Analyzer analyzer;
  IndexWriterConfig iwc;
  IndexWriter writer;

  public LuceneSearch() {
    ramDirectory = new RAMDirectory();
    analyzer = new StandardAnalyzer();
    iwc = new IndexWriterConfig(analyzer);
    try {
      writer = new IndexWriter(ramDirectory, iwc);
    } catch (IOException e) {
      LOG.error("Failed to create new IndexWriter", e);
    }
  }

  /* (non-Javadoc)
   * @see org.apache.zeppelin.search.Search#query(java.lang.String)
   */
  @Override
  public List<Map<String, String>> query(String queryStr) {
    if (null == ramDirectory) {
      throw new IllegalStateException(
          "Something went wrong on instance creation time, index dir is null");
    }
    List<Map<String, String>> result = Collections.emptyList();
    try (IndexReader indexReader = DirectoryReader.open(ramDirectory)) {
      IndexSearcher indexSearcher = new IndexSearcher(indexReader);
      Analyzer analyzer = new StandardAnalyzer();
      MultiFieldQueryParser parser = new MultiFieldQueryParser(
          new String[] {SEARCH_FIELD_TEXT, SEARCH_FIELD_TITLE},
          analyzer);

      Query query = parser.parse(queryStr);
      LOG.debug("Searching for: " + query.toString(SEARCH_FIELD_TEXT));

      SimpleHTMLFormatter htmlFormatter = new SimpleHTMLFormatter();
      Highlighter highlighter = new Highlighter(htmlFormatter, new QueryScorer(query));

      result = doSearch(indexSearcher, query, analyzer, highlighter);
      indexReader.close();
    } catch (IOException e) {
      LOG.error("Failed to open index dir {}, make sure indexing finished OK", ramDirectory, e);
    } catch (ParseException e) {
      LOG.error("Failed to parse query " + queryStr, e);
    }
    return result;
  }

  private List<Map<String, String>> doSearch(IndexSearcher searcher, Query query,
      Analyzer analyzer, Highlighter highlighter) {
    List<Map<String, String>> matchingParagraphs = Lists.newArrayList();
    ScoreDoc[] hits;
    try {
      hits = searcher.search(query, 20).scoreDocs;
      for (int i = 0; i < hits.length; i++) {
        LOG.debug("doc={} score={}", hits[i].doc, hits[i].score);

        int id = hits[i].doc;
        Document doc = searcher.doc(id);
        String path = doc.get(ID_FIELD);
        if (path != null) {
          LOG.debug((i + 1) + ". " + path);
          String title = doc.get("title");
          if (title != null) {
            LOG.debug("   Title: {}", doc.get("title"));
          }

          String text = doc.get(SEARCH_FIELD_TEXT);
          String header = doc.get(SEARCH_FIELD_TITLE);
          String fragment = "";

          if (text != null) {
            TokenStream tokenStream = TokenSources.getTokenStream(searcher.getIndexReader(), id,
                SEARCH_FIELD_TEXT, analyzer);
            TextFragment[] frag = highlighter.getBestTextFragments(tokenStream, text, true, 3);
            LOG.debug("    {} fragments found for query '{}'", frag.length, query);
            for (int j = 0; j < frag.length; j++) {
              if ((frag[j] != null) && (frag[j].getScore() > 0)) {
                LOG.debug("    Fragment: {}", frag[j].toString());
              }
            }
            fragment = (frag != null && frag.length > 0) ? frag[0].toString() : "";
          }

          if (header != null) {
            TokenStream tokenTitle = TokenSources.getTokenStream(searcher.getIndexReader(), id,
                SEARCH_FIELD_TITLE, analyzer);
            TextFragment[] frgTitle = highlighter.getBestTextFragments(tokenTitle, header, true, 3);
            header = (frgTitle != null && frgTitle.length > 0) ? frgTitle[0].toString() : "";
          } else {
            header = "";
          }
          matchingParagraphs.add(ImmutableMap.of("id", path, // <noteId>/paragraph/<paragraphId>
              "name", title, "snippet", fragment, "text", text, "header", header));
        } else {
          LOG.info("{}. No {} for this document", i + 1, ID_FIELD);
        }
      }
    } catch (IOException | InvalidTokenOffsetsException e) {
      LOG.error("Exception on searching for {}", query, e);
    }
    return matchingParagraphs;
  }

  /* (non-Javadoc)
   * @see org.apache.zeppelin.search.Search#updateIndexDoc(org.apache.zeppelin.notebook.Note)
   */
  @Override
  public void updateIndexDoc(Note note) throws IOException {
    updateIndexNoteName(note);
    for (Paragraph p: note.getParagraphs()) {
      updateIndexParagraph(note, p);
    }
  }

  private void updateIndexNoteName(Note note) throws IOException {
    String noteName = note.getName();
    String noteId = note.getId();
    LOG.debug("Indexing Notebook {}, '{}'", noteId, noteName);
    if (null == noteName || noteName.isEmpty()) {
      LOG.debug("Skipping empty notebook name");
      return;
    }
    updateDoc(noteId, noteName, null);
  }

  private void updateIndexParagraph(Note note, Paragraph p) throws IOException {
    if (p.getText() == null) {
      LOG.debug("Skipping empty paragraph");
      return;
    }
    updateDoc(note.getId(), note.getName(), p);
  }

  /**
   * Updates index for the given note: either note.name or a paragraph If
   * paragraph is <code>null</code> - updates only for the note.name
   *
   * @param noteId
   * @param noteName
   * @param p
   * @throws IOException
   */
  private void updateDoc(String noteId, String noteName, Paragraph p) throws IOException {
    String id = formatId(noteId, p);
    Document doc = newDocument(id, noteName, p);
    try {
      writer.updateDocument(new Term(ID_FIELD, id), doc);
      writer.commit();
    } catch (IOException e) {
      LOG.error("Failed to updaet index of notebook {}", noteId, e);
    }
  }

  /**
   * If paragraph is not null, id is <noteId>/paragraphs/<paragraphId>,
   * otherwise it's just <noteId>.
   */
  static String formatId(String noteId, Paragraph p) {
    String id = noteId;
    if (null != p) {
      id = Joiner.on('/').join(id, PARAGRAPH, p.getId());
    }
    return id;
  }

  static String formatDeleteId(String noteId, Paragraph p) {
    String id = noteId;
    if (null != p) {
      id = Joiner.on('/').join(id, PARAGRAPH, p.getId());
    } else {
      id = id + "*";
    }
    return id;
  }

  /**
   * If paragraph is not null, indexes code in the paragraph, otherwise indexes
   * the notebook name.
   *
   * @param id id of the document, different for Note name and paragraph
   * @param noteName name of the note
   * @param p paragraph
   * @return
   */
  private Document newDocument(String id, String noteName, Paragraph p) {
    Document doc = new Document();

    Field pathField = new StringField(ID_FIELD, id, Field.Store.YES);
    doc.add(pathField);
    doc.add(new StringField("title", noteName, Field.Store.YES));

    if (null != p) {
      doc.add(new TextField(SEARCH_FIELD_TEXT, p.getText(), Field.Store.YES));
      if (p.getTitle() != null) {
        doc.add(new TextField(SEARCH_FIELD_TITLE, p.getTitle(), Field.Store.YES));
      }
      Date date = p.getDateStarted() != null ? p.getDateStarted() : p.getDateCreated();
      doc.add(new LongField("modified", date.getTime(), Field.Store.NO));
    } else {
      doc.add(new TextField(SEARCH_FIELD_TEXT, noteName, Field.Store.YES));
    }
    return doc;
  }

  /* (non-Javadoc)
   * @see org.apache.zeppelin.search.Search#addIndexDocs(java.util.Collection)
   */
  @Override
  public void addIndexDocs(Collection<Note> collection) {
    int docsIndexed = 0;
    long start = System.nanoTime();
    try {
      for (Note note : collection) {
        addIndexDocAsync(note);
        docsIndexed++;
      }
    } catch (IOException e) {
      LOG.error("Failed to index all Notebooks", e);
    } finally {
      try { // save what's been indexed, even if not full collection
        writer.commit();
      } catch (IOException e) {
        LOG.error("Failed to save index", e);
      }
      long end = System.nanoTime();
      LOG.info("Indexing {} notebooks took {}ms", docsIndexed,
          TimeUnit.NANOSECONDS.toMillis(end - start));
    }
  }

  /* (non-Javadoc)
   * @see org.apache.zeppelin.search.Search#addIndexDoc(org.apache.zeppelin.notebook.Note)
   */
  @Override
  public void addIndexDoc(Note note) {
    try {
      addIndexDocAsync(note);
      writer.commit();
    } catch (IOException e) {
      LOG.error("Failed to add note {} to index", note, e);
    }
  }

  /**
   * Indexes the given notebook, but does not commit changes.
   *
   * @param note
   * @throws IOException
   */
  private void addIndexDocAsync(Note note) throws IOException {
    indexNoteName(writer, note.getId(), note.getName());
    for (Paragraph doc : note.getParagraphs()) {
      if (doc.getText() == null) {
        LOG.debug("Skipping empty paragraph");
        continue;
      }
      indexDoc(writer, note.getId(), note.getName(), doc);
    }
  }

  /* (non-Javadoc)
   * @see org.apache.zeppelin.search.Search#deleteIndexDocs(org.apache.zeppelin.notebook.Note)
   */
  @Override
  public void deleteIndexDocs(Note note) {
    deleteDoc(note, null);
  }

  /* (non-Javadoc)
   * @see org.apache.zeppelin.search.Search
   *  #deleteIndexDoc(org.apache.zeppelin.notebook.Note, org.apache.zeppelin.notebook.Paragraph)
   */
  @Override
  public void deleteIndexDoc(Note note, Paragraph p) {
    deleteDoc(note, p);
  }

  private void deleteDoc(Note note, Paragraph p) {
    if (null == note) {
      LOG.error("Trying to delete note by reference to NULL");
      return;
    }
    String fullNoteOrJustParagraph = formatDeleteId(note.getId(), p);
    LOG.debug("Deleting note {}, out of: {}", note.getId(), writer.numDocs());
    try {
      writer.deleteDocuments(new WildcardQuery(new Term(ID_FIELD, fullNoteOrJustParagraph)));
      writer.commit();
    } catch (IOException e) {
      LOG.error("Failed to delete {} from index by '{}'", note, fullNoteOrJustParagraph, e);
    }
    LOG.debug("Done, index contains {} docs now" + writer.numDocs());
  }

  /* (non-Javadoc)
   * @see org.apache.zeppelin.search.Search#close()
   */
  @Override
  public void close() {
    try {
      writer.close();
    } catch (IOException e) {
      LOG.error("Failed to .close() the notebook index", e);
    }
  }

  /**
   * Indexes a notebook name
   *
   * @throws IOException
   */
  private void indexNoteName(IndexWriter w, String noteId, String noteName) throws IOException {
    LOG.debug("Indexing Notebook {}, '{}'", noteId, noteName);
    if (null == noteName || noteName.isEmpty()) {
      LOG.debug("Skipping empty notebook name");
      return;
    }
    indexDoc(w, noteId, noteName, null);
  }

  /**
   * Indexes a single document:
   *  - code of the paragraph (if non-null)
   *  - or just a note name
   */
  private void indexDoc(IndexWriter w, String noteId, String noteName, Paragraph p)
      throws IOException {
    String id = formatId(noteId, p);
    Document doc = newDocument(id, noteName, p);
    w.addDocument(doc);
  }

}