现在移动开发中越来越多的App都有周边搜索,有找附近的人的,附近的酒店,附近的餐馆的。接下来我们就来讲一下强大的Solr来帮我们构建周边搜索之酒店搜索。
1 下载 Solr 3.6.2
下载地址:http://www.apache.org/dyn/closer.cgi/lucene/solr/3.6.2
提取apache-solr-3.6.2.zip里的apache-solr-3.6.2.war到F:\, 后面会讲解如何部署这个war包
2 建立solr的索引库配置
2.1 在D:\建立目录hotel_solr
2.2 在D:\hotel_solr下新建solr.xml,内容如下:
<?xml version="1.0" encoding="UTF-8" ?> <solr persistent="false"> <cores adminPath="/admin/cores"> <core name="core0" instanceDir="core0" /> <!--<core name="core1" instanceDir="core1" />--> </cores> </solr>2.3 在D:\hotel_solr新建core0\conf目录
2.4 在D:\hotel_solr\core0\conf目录下,新建schema.xml文件,内容如下:
<?xml version="1.0" ?> <schema name="example core zero" version="1.1"> <types> <fieldType name="string" class="solr.StrField" sortMissingLast="true" omitNorms="true"/> <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true" omitNorms="true"/> <fieldType name="integer" class="solr.IntField" omitNorms="true"/> <fieldType name="int" class="solr.TrieIntField" precisionStep="0" omitNorms="true" positionIncrementGap="0"/> <fieldType name="float" class="solr.TrieFloatField" precisionStep="0" omitNorms="true" positionIncrementGap="0"/> <fieldType name="long" class="solr.TrieLongField" precisionStep="0" omitNorms="true" positionIncrementGap="0"/> <fieldType name="double" class="solr.TrieDoubleField" precisionStep="0" omitNorms="true" positionIncrementGap="0"/> <fieldType name="tint" class="solr.TrieIntField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/> <fieldType name="tfloat" class="solr.TrieFloatField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/> <fieldType name="tlong" class="solr.TrieLongField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/> <fieldType name="tdouble" class="solr.TrieDoubleField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/> <fieldType name="sint" class="solr.SortableIntField" sortMissingLast="true" omitNorms="true"/> <fieldType name="slong" class="solr.SortableLongField" sortMissingLast="true" omitNorms="true"/> <fieldType name="sfloat" class="solr.SortableFloatField" sortMissingLast="true" omitNorms="true"/> <fieldType name="sdouble" class="solr.SortableDoubleField" sortMissingLast="true" omitNorms="true"/> <fieldType name="date" class="solr.TrieDateField" omitNorms="true" precisionStep="0" positionIncrementGap="0"/> <fieldType name="tdate" class="solr.TrieDateField" omitNorms="true" precisionStep="6" positionIncrementGap="0"/> <fieldtype name="ignored" stored="false" indexed="false" class="solr.StrField"/> <fieldtype name="location" class="solr.LatLonType" subFieldSuffix="_d"/> <fieldType name="text" class="solr.TextField" positionIncrementGap="100"> <analyzer type="index"> <tokenizer class="solr.StandardTokenizerFactory"/> <filter class="solr.LowerCaseFilterFactory"/> </analyzer> <analyzer type="query"> <tokenizer class="solr.StandardTokenizerFactory"/> <filter class="solr.LowerCaseFilterFactory"/> </analyzer> </fieldType> </types> <fields> <field name="hotel_id" type="integer" indexed="true" stored="true" required="true"/> <field name="crawl_hotel_id" type="string" indexed="true" stored="true" multiValued="false" required="true"/> <field name="name" type="text" indexed="true" stored="true" multiValued="false" required="true"/> <field name="address" type="text" indexed="true" stored="true" multiValued="false" required="true"/> <field name="search_kw" type="text" indexed="true" multiValued="true" stored="false" /> <field name="latlng" type="location" indexed="true" /> <dynamicField name="*_d" type="double" indexed="true" stored="true"/> </fields> <copyField source="name" dest="search_kw" /> <copyField source="address" dest="search_kw" /> <uniqueKey>hotel_id</uniqueKey> <defaultSearchField>search_kw</defaultSearchField> <solrQueryParser defaultOperator="AND"/> </schema>2.5 在D:\hotel_solr\core0\conf目录下,新建solrconfig.xml文件,内容如下:
<?xml version="1.0" encoding="UTF-8" ?> <config> <luceneMatchVersion>LUCENE_36</luceneMatchVersion> <directoryFactory name="DirectoryFactory" class="${solr.directoryFactory:solr.StandardDirectoryFactory}"/> <updateHandler class="solr.DirectUpdateHandler2" /> <requestDispatcher handleSelect="true" > <requestParsers enableRemoteStreaming="false" multipartUploadLimitInKB="2048" /> </requestDispatcher> <requestHandler name="standard" class="solr.StandardRequestHandler" default="true" /> <requestHandler name="/update" class="solr.XmlUpdateRequestHandler" /> <requestHandler name="/admin/" class="org.apache.solr.handler.admin.AdminHandlers" /> <admin> <defaultQuery>*:*</defaultQuery> </admin> </config>到这里为止Solr的索引配置完成.
3 配置tomcat
3.1 让tomcat支持HTTP GET UTF-8编码的支持, 打开D:\apache-tomcat-7.0.16\conf\server.xml,修成如下地方:
<Connector port="8080" protocol="HTTP/1.1" connectionTimeout="20000" redirectPort="8443" URIEncoding="UTF-8"/>3.2 配置solr的war包
在D:\apache-tomcat-7.0.16\conf\Catalina\localhost新建solr.xml,内容如下:
<Context docBase="F:/apache-solr-3.6.2.war" debug="0" crossContext="true" > <Environment name="solr/home" type="java.lang.String" value="D:/hotel_solr" override="true" /> </Context>3.3 启动tomcat, 在浏览器中输入: http://localhost:8080/solr/ 如果出现 Admin core0 表示正常。
4 准备酒店数据(如果没有自己去建立)
5 把数据库中的酒店数据添加到Solr索引库中
使用Solrj客户端进行索引构建和查询,MAVEN依赖包:
<dependency> <groupId>junit</groupId> <artifactId>junit</artifactId> <version>3.8.1</version> <scope>test</scope> </dependency> <dependency> <groupId>org.apache.solr</groupId> <artifactId>solr-solrj</artifactId> <version>3.6.0</version> </dependency> <dependency> <groupId>mysql</groupId> <artifactId>mysql-connector-java</artifactId> <version>5.1.19</version> </dependency> <dependency> <groupId>commons-lang</groupId> <artifactId>commons-lang</artifactId> <version>2.6</version> </dependency> <dependency> <groupId>org.apache.httpcomponents</groupId> <artifactId>httpclient</artifactId> <version>4.1.3</version> </dependency> <dependency> <groupId>org.apache.httpcomponents</groupId> <artifactId>httpclient-cache</artifactId> <version>4.1.3</version> </dependency> <dependency> <groupId>org.apache.httpcomponents</groupId> <artifactId>httpmime</artifactId> <version>4.1.3</version> </dependency> <dependency> <groupId>org.slf4j</groupId> <artifactId>slf4j-simple</artifactId> <version>1.6.4</version> </dependency>Java代码:
import java.sql.Connection; import java.sql.DriverManager; import java.sql.ResultSet; import java.sql.SQLException; import java.sql.Statement; import java.util.HashMap; import java.util.Map; import org.apache.commons.lang.StringUtils; import org.apache.solr.client.solrj.SolrRequest.METHOD; import org.apache.solr.client.solrj.impl.HttpSolrServer; import org.apache.solr.client.solrj.response.QueryResponse; import org.apache.solr.common.SolrDocumentList; import org.apache.solr.common.SolrInputDocument; import org.apache.solr.common.params.MapSolrParams; public class App { /** * 初始化索引数据 * @param solrServer * @throws Exception */ public static void buildIndex(String solrServer) throws Exception { Connection connect = null; Statement statement = null; ResultSet resultSet = null; HttpSolrServer server = null; try { Class.forName("com.mysql.jdbc.Driver"); connect = DriverManager .getConnection("jdbc:mysql://localhost/hotel_analysis?" + "user=root&password=11111"); statement = connect.createStatement(); resultSet = statement .executeQuery("select hotel_id,crawl_hotel_id,hotel_name,hotel_address,hotel_location from crawl_hotel"); server = new HttpSolrServer(solrServer); int count = 0; int eachCommit = 100; //从数据库中获取酒店数据 while (resultSet.next()) { Integer hotel_id = resultSet.getInt(1); String crawl_hotel_id = resultSet.getString(2); String hotel_name = resultSet.getString(3); String hotel_address = resultSet.getString(4); String hotel_location = resultSet.getString(5); if (StringUtils.isBlank(hotel_location)) { continue; } count++; //添加酒店数据到Solr索引中 SolrInputDocument doc = new SolrInputDocument(); doc.addField("hotel_id", hotel_id); doc.addField("crawl_hotel_id", crawl_hotel_id); doc.addField("name", hotel_name); doc.addField("address", hotel_address); doc.addField("latlng", hotel_location); server.add(doc); //100条commit一次 if (count % eachCommit == 0) { server.commit(); count = 0; } } if (count > 0) { server.commit(); count = 0; } } finally { if (null != resultSet) { try { resultSet.close(); } catch (SQLException ex) { } } if (null != statement) { try { statement.close(); } catch (SQLException ex) { } } if (null != connect) { try { connect.close(); } catch (SQLException ex) { } } } } public static void main(String[] args) throws Exception { String URL = "http://localhost:8080/solr/core0"; //构建索引到Solr库 buildIndex(URL); //索引周边查询 //queryTest(URL); } /** * 测试索引查询 * http://localhost:8080/solr/core0/select?q=*%3A*&fq=%7B%21geofilt%7D&pt=31.26552%2C121.460815&sfield=latlng&d=2&sort=geodist%28%29+asc&fl=*%2Cscore&start=0&rows=10 * @param solrServer * @throws Exception */ public static void queryTest(String solrServer) throws Exception { HttpSolrServer server = new HttpSolrServer(solrServer); Map<String,String> params = new HashMap<String,String>(); params.put("q", "*:*"); params.put("fq", "{!geofilt}");//距离过滤函数 params.put("pt", "31.26552,121.460815");//当前经纬度 params.put("sfield", "latlng");//经纬度的字段 params.put("d", "2");//就近2公里的所有酒店 params.put("sort", "geodist() asc");//根据距离排序 params.put("fl", "*,score"); params.put("start", "0");//记录开始位置 params.put("rows", "10");//查询的行数 QueryResponse resp = server.query(new MapSolrParams(params), METHOD.POST); SolrDocumentList docs = resp.getResults(); for(int i=0;i<docs.size();i++){ System.out.println(docs.get(i)); } } }
6 查询展示:
查询结果页: