七月OV

[Solr] Apache Solr 入门案例

前言

在上文中我们已经详细介绍了 Solr 的部署，本文我们将介绍 Solr 在 Java 中的使用。

上文传送门 :

[Solr] Apache Solr 简介及使用

[Solr] Apache Solr 集群

环境准备

索引库 schema.xml 配置文件


<schema name="example" version="1.5">
   <!-- Internal bookkeeping fields. -->
   <field name="_version_" type="long" indexed="true" stored="true"/>
   <field name="_root_" type="string" indexed="true" stored="false"/>

   <!-- Document key; referenced by <uniqueKey> below. -->
   <field name="id" type="string" indexed="true"
                    stored="true" required="true" multiValued="false" />
   <field name="name" type="text_ws" indexed="true" stored="true"/>
   <field name="price"  type="float" indexed="true" stored="true"/>
   <field name="title" type="text_ws" indexed="true" stored="true" multiValued="false"/>
   <field name="content" type="text_ws" indexed="true" stored="true" multiValued="false"/>
   <!-- Multi-valued target of the copyField rules below (title + content). -->
   <field name="text" type="text_ws" indexed="true" stored="true" multiValued="true"/>
   <field name="date"  type="date" indexed="true" stored="true"/>
   <field name="binary"  type="binary" indexed="true" stored="true"/>

   <!-- Any field whose name ends in "_ss" is a multi-valued string. -->
   <dynamicField name="*_ss" type="string"  indexed="true"
                                stored="true" multiValued="true"/>

   <uniqueKey>id</uniqueKey>

   <!-- Copy title and content into the "text" field. -->
   <copyField source="title" dest="text"/>
   <copyField source="content" dest="text"/>

    <!-- Field type definitions. -->
    <fieldType name="string" class="solr.StrField" sortMissingLast="true" />
    <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
    <fieldType name="int" class="solr.TrieIntField"
                        precisionStep="0" positionIncrementGap="0"/>
    <fieldType name="float" class="solr.TrieFloatField"
                        precisionStep="0" positionIncrementGap="0"/>
    <fieldType name="long" class="solr.TrieLongField"
                        precisionStep="0" positionIncrementGap="0"/>
    <fieldType name="double" class="solr.TrieDoubleField"
                        precisionStep="0" positionIncrementGap="0"/>
    <fieldType name="date" class="solr.TrieDateField"
                        precisionStep="0" positionIncrementGap="0"/>
    <fieldType name="binary" class="solr.BinaryField"/>


    <!-- Text type whose analysis is delegated to the IKAnalyzer class. -->
    <fieldType name="text_ws" class="solr.TextField">
        <analyzer class="org.wltea.analyzer.lucene.IKAnalyzer"/>
    </fieldType>
</schema>

入门案例

1> 引入pom相关jar

<!-- JUnit, used by the @Test methods in this article.
     NOTE(review): no version is declared here; presumably it is managed elsewhere
     (e.g. a parent POM or dependencyManagement) - confirm. -->
<dependency>
    <groupId>junit</groupId>
    <artifactId>junit</artifactId>
</dependency>
<!-- SolrJ client library. -->
<dependency>
    <groupId>org.apache.solr</groupId>
    <artifactId>solr-solrj</artifactId>
    <version>4.10.2</version>
</dependency>

<!-- Commons Logging API. -->
<dependency>
    <groupId>commons-logging</groupId>
    <artifactId>commons-logging-api</artifactId>
    <version>1.1</version>
</dependency>

2> 初始化SolrServer

    /** Base URL of the Solr core/collection that every example talks to. */
    private static final String URL = "http://hadoop1:8080/solr/collection3";

    /** HTTP client for {@link #URL}, created once and shared by all examples. */
    private static final SolrServer solrServer =
            new HttpSolrServer(URL);

3> 创建文档

创建一个文档

/**
 * Adds a single document with id "1" to the index and commits it.
 *
 * @throws IOException         if the add or commit call fails with an I/O error
 * @throws SolrServerException if the add or commit call fails on the Solr side
 */
@Test
public void addSolrDoc () throws IOException, SolrServerException {
    SolrInputDocument document = new SolrInputDocument();
    // Set the document boost; the default is 1.
    document.setDocumentBoost(1);
    document.addField("id", "1");
    document.addField("title","媲美故宫的“铜宫”");
    document.addField("content","雷峰塔、峨眉金顶、灵隐铜殿，" +
            "上百件标志性铜建筑让他成为“中国当代铜建筑之父”，" +
            "他是中国铜雕领域界唯一一位国家级非遗传承人");
    document.addField("date",new Date());
    // Encode with an explicit charset so the stored bytes do not depend on the
    // platform default encoding.
    document.addField("binary","solr".getBytes(java.nio.charset.StandardCharsets.UTF_8));
    solrServer.add(document);
    solrServer.commit();
}

注 :
1 > 在Solr中，一个Document必须包含ID，因为Solr是根据ID维护Document的
2 > 一个Field中的name值必须是schema.xml中存在的field，如果不存在该Field，会报错

创建多个文档

/**
 * Adds ten documents (ids "1" through "10") in a single request and commits them.
 *
 * @throws IOException         if the add or commit call fails with an I/O error
 * @throws SolrServerException if the add or commit call fails on the Solr side
 */
@Test
public void addSolrDocs() throws IOException, SolrServerException {
    // Typed list instead of a raw ArrayList, so the batch add is checked at compile time.
    List<SolrInputDocument> documents = new ArrayList<>();
    for (int i = 1; i <= 10; i++) {
        SolrInputDocument document = new SolrInputDocument();
        // Set the document boost; the default is 1.
        document.setDocumentBoost(1);
        document.addField("id", i+"");
        document.addField("title", "媲美故宫的“铜宫”");
        document.addField("content", "雷峰塔、峨眉金顶、灵隐铜殿，" +
                "上百件标志性铜建筑让他成为“中国当代铜建筑之父”，" +
                "他是中国铜雕领域界唯一一位国家级非遗传承人");
        document.addField("date", new Date());
        // Explicit charset: avoid depending on the platform default encoding.
        document.addField("binary", "solr".getBytes(java.nio.charset.StandardCharsets.UTF_8));
        documents.add(document);
    }
    solrServer.add(documents);
    solrServer.commit();
}

4 > 修改文档

其实Solr在修改时，做的依旧是add操作，只不过Solr会根据document的ID来查询此document是否存在，如果存在，会先删除此document，然后执行add操作。

/**
 * "Updates" the document with id "10" by adding a document with the same id.
 *
 * <p>Only id, title and content are supplied here; as the surrounding article
 * shows, the previously stored date and binary values are gone afterwards,
 * because the existing document is replaced rather than merged.
 *
 * @throws IOException         if the add or commit call fails with an I/O error
 * @throws SolrServerException if the add or commit call fails on the Solr side
 */
@Test
public void updateSolrDoc () throws IOException, SolrServerException {
    SolrInputDocument document = new SolrInputDocument();
    // Set the document boost; the default is 1.
    document.setDocumentBoost(1);
    // The id field is declared as a string in schema.xml; pass a String, as the
    // other examples do, instead of an int.
    document.addField("id", "10");
    document.addField("title", "媲美故宫的“铜宫”");
    document.addField("content", "这是修改后的内容");
    solrServer.add(document);
    solrServer.commit();
}

由于上面我们已经批量添加了10条数据，我们执行完修改操作后，再来看看ID为10的Document，发现该Document的date与binary都消失了，证明先执行了删除，后执行了新增。

      {
        "id": "10",
        "title": "媲美故宫的“铜宫”",
        "text": [
          "媲美故宫的“铜宫”",
          "这是修改后的内容"
        ],
        "content": "这是修改后的内容",
        "_version_": 1608276634333347800
      }

5> 使用JavaBean写入文档

注 : 在JavaBean中要对字段加上 @Field 注解，才能被Solr识别

/**
 * JavaBean mapped to the index fields declared in schema.xml.
 *
 * <p>Each property carries {@code @Field} so that SolrJ can bind it; with no
 * explicit name given, the Java field name is used as the Solr field name.
 */
public class SolrDocument {
    /** Unique key of the document. */
    @Field
    private String id;
    @Field
    private String name;
    // NOTE(review): schema.xml declares "price" with type float while this
    // property is a double - confirm the mismatch is intended.
    @Field
    private double price;
    @Field
    private String title;
    @Field
    private String content;
    /** Values of the multi-valued "text" field. */
    @Field
    private ArrayList<String> text;
    @Field
    private Date date;
    @Field
    private byte[] binary;

    // ... getters and setters omitted
}

/**
 * Indexes a document from an annotated JavaBean (id "11") and commits it.
 *
 * @throws IOException         if the add or commit call fails with an I/O error
 * @throws SolrServerException if the add or commit call fails on the Solr side
 */
@Test
public void addSolrBean() throws IOException, SolrServerException {
    SolrDocument solrDocument = new SolrDocument();
    solrDocument.setId("11");
    solrDocument.setTitle("媲美故宫的“铜宫”");
    solrDocument.setContent("雷峰塔、峨眉金顶、灵隐铜殿，" +
            "上百件标志性铜建筑让他成为“中国当代铜建筑之父”，" +
            "他是中国铜雕领域界唯一一位国家级非遗传承人");
    solrDocument.setDate(new Date());
    // Explicit charset: avoid depending on the platform default encoding.
    solrDocument.setBinary("solr".getBytes(java.nio.charset.StandardCharsets.UTF_8));
    solrServer.addBean(solrDocument);
    solrServer.commit();
}

6> 删除文档

/**
 * Deletes a single document, identified by its id, and commits the change.
 */
@Test
public void deleteDocById () throws IOException, SolrServerException {
    final String targetId = "11";
    solrServer.deleteById(targetId);
    solrServer.commit();
}

/**
 * Deletes several documents in one request, identified by their ids, and
 * commits the change.
 *
 * @throws IOException         if the delete or commit call fails with an I/O error
 * @throws SolrServerException if the delete or commit call fails on the Solr side
 */
@Test
public void deleteDocByIds () throws IOException, SolrServerException {
    // Typed list instead of a raw List, so only String ids can be added.
    List<String> ids = new ArrayList<>();
    ids.add("9");
    ids.add("10");
    solrServer.deleteById(ids);
    solrServer.commit();
}

/**
 * Deletes every document matching a query and commits the change.
 */
@Test
public void deleteAll() throws IOException, SolrServerException {
    // The match-all query selects every document in the index.
    final String matchAllQuery = "*:*";
    solrServer.deleteByQuery(matchAllQuery);
    solrServer.commit();
}

7> 查询

/**
 * 查询所有DOC，返回Results
 */
@Test
public void selectByDoc () throws SolrServerException {
    SolrQuery query = new SolrQuery("*:*");
    QueryResponse response = solrServer.query(query);
    SolrDocumentList results = response.getResults();
    for (org.apache.solr.common.SolrDocument result : results) {
        String id = (String) result.getFieldValue("id");
        Double price = (Double) result.getFieldValue("price");
        Collection