tmp commit for search. start nccu0621 first

parent cb17fe0825
commit 3f95fe4f13

 Gemfile | 5
@@ -37,9 +37,8 @@ gem 'therubyracer' if RUBY_PLATFORM.downcase.include?("linux")
gem "impressionist", :require => "impressionist", :path => "vendor/impressionist"

# gem "tire"
gem 'sunspot_rails', "~> 1.3.2"
gem 'sunspot_solr'
gem "tire"


# Gems used only for assets and not required
# in production environments by default.
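The hunk above swaps the search stack: "tire" drops out while sunspot_rails and sunspot_solr come in. As a rough sketch of what sunspot_rails buys a model (the Topic class and its fields are hypothetical, not part of this commit):

# Hypothetical model, assuming the Sunspot::Mongoid adapter further down in
# this commit is used so Mongoid documents can be registered with Sunspot.
class Topic
  include Mongoid::Document
  include Sunspot::Mongoid

  field :title
  field :body

  # Declares the fields Solr should index; sunspot_rails also hooks
  # save/destroy callbacks so the index follows the record.
  searchable do
    text :title, :body
  end
end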
 Gemfile.lock | 13

@@ -96,6 +96,7 @@ GEM
      railties (>= 3.0.0)
    fastercsv (1.5.4)
    haml (3.1.4)
    hashr (0.0.21)
    hike (1.2.1)
    hoe (2.16.1)
      rake (~> 0.8)

@@ -185,6 +186,8 @@ GEM
      redis (>= 2.0.1)
      resque (>= 1.8.0)
      rufus-scheduler
    rest-client (1.6.7)
      mime-types (>= 1.16)
    rsolr (1.0.8)
      builder (>= 2.1.2)
    rspec (2.8.0)

@@ -253,13 +256,18 @@ GEM
    sunspot_rails (1.3.3)
      nokogiri
      sunspot (= 1.3.3)
    sunspot_solr (1.3.3)
    therubyracer (0.9.9)
      libv8 (~> 3.3.10)
    thor (0.14.6)
    tilt (1.3.3)
    tinymce-rails (3.4.8)
      railties (>= 3.1)
    tire (0.4.2)
      activemodel (>= 3.0)
      hashr (~> 0.0.19)
      multi_json (~> 1.0)
      rake
      rest-client (~> 1.6)
    transaction-simple (1.4.0)
      hoe (>= 1.1.7)
    treetop (1.4.10)

@@ -327,9 +335,8 @@ DEPENDENCIES
  spork
  sprockets
  sunspot-rails-tester
  sunspot_rails (~> 1.3.2)
  sunspot_solr
  therubyracer
  tinymce-rails
  tire
  uglifier
  watchr
(deleted file)
@@ -1,46 +0,0 @@
# coding: utf-8
# Base Model: mixes some common functionality into models
module Mongoid
  module BaseModel
    extend ActiveSupport::Concern

    included do
      scope :recent, desc(:_id)
      scope :exclude_ids, Proc.new { |ids| where(:_id.nin => ids.map(&:to_i)) }
      scope :by_week, where(:created_at.gte => 7.days.ago.utc)
    end

    module ClassMethods
      # like ActiveRecord find_by_id
      def find_by_id(id)
        if id.is_a?(Integer) or id.is_a?(String)
          where(:_id => id.to_i).first
        else
          nil
        end
      end

      def find_in_batches(opts = {})
        batch_size = opts[:batch_size] || 1000
        start = opts.delete(:start).to_i || 0
        objects = self.limit(batch_size).skip(start)
        t = Time.new
        while objects.any?
          yield objects
          start += batch_size
          # Rails.logger.debug("processed #{start} records in #{Time.new - t} seconds") if Rails.logger.debug?
          break if objects.size < batch_size
          objects = self.limit(batch_size).skip(start)
        end
      end

      def delay
        Sidekiq::Extensions::Proxy.new(DelayedDocument, self)
      end
    end

    def delay
      Sidekiq::Extensions::Proxy.new(DelayedDocument, self)
    end
  end
end
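For reference, a minimal sketch of how a model would have used this concern before its removal (the Topic model here is hypothetical):

class Topic
  include Mongoid::Document
  include Mongoid::BaseModel
end

Topic.find_by_id("42")     # integer-keyed lookup, ActiveRecord-style
Topic.recent.limit(10)     # newest documents first via the :recent scope
Topic.find_in_batches(:batch_size => 500) do |batch|
  batch.each { |topic| puts topic.id }  # process 500 documents at a time
end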
(deleted file)
@@ -1,46 +0,0 @@
# coding: utf-8
# this is from: https://github.com/jugyo/sunspot_mongoid
# this file is special for mongoid_auto_increment_id
require 'sunspot'
require 'mongoid'
require 'sunspot/rails'

# == Examples:
#
#   class Post
#     include Mongoid::Document
#     field :title
#
#     include Sunspot::Mongoid
#     searchable do
#       text :title
#     end
#   end
#
module Sunspot
  module Mongoid
    def self.included(base)
      base.class_eval do
        extend Sunspot::Rails::Searchable::ActsAsMethods
        Sunspot::Adapters::DataAccessor.register(DataAccessor, base)
        Sunspot::Adapters::InstanceAdapter.register(InstanceAdapter, base)
      end
    end

    class InstanceAdapter < Sunspot::Adapters::InstanceAdapter
      def id
        @instance.id
      end
    end

    class DataAccessor < Sunspot::Adapters::DataAccessor
      def load(id)
        @clazz.where(:_id => id).first
      end

      def load_all(ids)
        @clazz.where(:_id.in => ids.collect { |id| id.to_i })
      end
    end
  end
end
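Once the adapter is included, Sunspot's ordinary query DSL should work against Mongoid models; a hedged sketch using the hypothetical Post model from the comment above:

Post.search { fulltext 'hello' }.results  # full-text query, returns Post objects
Post.solr_index                           # push every document to Solr
Sunspot.commit                            # make pending updates visible to searches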
@@ -5,6 +5,7 @@ num_workers = rails_env == 'production' ? 5 : 2
num_workers.times do |num|
  God.watch do |w|
    w.dir = "#{rails_root}"
    w.log = "#{rails_root}/log/myprocess.log"
    w.name = "resque-#{num}"
    w.group = 'resque'
    w.interval = 30.seconds
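The hunk stops before the process lifecycle settings, so for orientation here is a plausible continuation under God's documented DSL (the start command is an assumption, not something this commit shows):

    # assumed start command: a Resque worker booted through bundler
    w.start = "cd #{rails_root} && bundle exec rake resque:work QUEUE=*"
    w.keepalive  # restart the worker whenever it dies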
@@ -14,7 +14,7 @@ $(document).ready(function() {
 function ajax_load_proc(wapper,url){
   wapper.load(url,function(respText,textSta,XML){
     if(textSta == 'error')
-      wapper.html("Loading Failed");
+      wapper.html("Loading Failed<br/> <a href='"+$(this).attr('path')+"'>Go See</a>");
   });
 }
(deleted file)
@@ -1,31 +0,0 @@
<!--
 Licensed to the Apache Software Foundation (ASF) under one or more
 contributor license agreements. See the NOTICE file distributed with
 this work for additional information regarding copyright ownership.
 The ASF licenses this file to You under the Apache License, Version 2.0
 (the "License"); you may not use this file except in compliance with
 the License. You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
-->

<!-- The content of this page will be statically included into the top
of the admin page. Uncomment this as an example to see where the content
will show up.

<hr>
<i>This line will appear before the first table</i>
<tr>
  <td colspan="2">
    This row will be appended to the end of the first table
  </td>
</tr>
<hr>

-->
(deleted file)
@@ -1,36 +0,0 @@
<?xml version="1.0" encoding="UTF-8" ?>
<!--
 Licensed to the Apache Software Foundation (ASF) under one or more
 contributor license agreements. See the NOTICE file distributed with
 this work for additional information regarding copyright ownership.
 The ASF licenses this file to You under the Apache License, Version 2.0
 (the "License"); you may not use this file except in compliance with
 the License. You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
-->

<!-- If this file is found in the config directory, it will only be
     loaded once at startup. If it is found in Solr's data
     directory, it will be re-loaded every commit.
-->

<elevate>
  <query text="foo bar">
    <doc id="1" />
    <doc id="2" />
    <doc id="3" />
  </query>

  <query text="ipod">
    <doc id="MA147LL/A" />  <!-- put the actual ipod at the top -->
    <doc id="IW-02" exclude="true" /> <!-- exclude this cable -->
  </query>

</elevate>
(deleted file)
@@ -1,246 +0,0 @@
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Syntax:
#   "source" => "target"
#     "source".length() > 0 (source cannot be empty.)
#     "target".length() >= 0 (target can be empty.)

# example:
#   "À" => "A"
#   "\u00C0" => "A"
#   "\u00C0" => "\u0041"
#   "ß" => "ss"
#   "\t" => " "
#   "\n" => ""

# À => A
"\u00C0" => "A"

# Á => A
"\u00C1" => "A"

# Â => A
"\u00C2" => "A"

# Ã => A
"\u00C3" => "A"

# Ä => A
"\u00C4" => "A"

# Å => A
"\u00C5" => "A"

# Æ => AE
"\u00C6" => "AE"

# Ç => C
"\u00C7" => "C"

# È => E
"\u00C8" => "E"

# É => E
"\u00C9" => "E"

# Ê => E
"\u00CA" => "E"

# Ë => E
"\u00CB" => "E"

# Ì => I
"\u00CC" => "I"

# Í => I
"\u00CD" => "I"

# Î => I
"\u00CE" => "I"

# Ï => I
"\u00CF" => "I"

# IJ => IJ
"\u0132" => "IJ"

# Ð => D
"\u00D0" => "D"

# Ñ => N
"\u00D1" => "N"

# Ò => O
"\u00D2" => "O"

# Ó => O
"\u00D3" => "O"

# Ô => O
"\u00D4" => "O"

# Õ => O
"\u00D5" => "O"

# Ö => O
"\u00D6" => "O"

# Ø => O
"\u00D8" => "O"

# Œ => OE
"\u0152" => "OE"

# Þ
"\u00DE" => "TH"

# Ù => U
"\u00D9" => "U"

# Ú => U
"\u00DA" => "U"

# Û => U
"\u00DB" => "U"

# Ü => U
"\u00DC" => "U"

# Ý => Y
"\u00DD" => "Y"

# Ÿ => Y
"\u0178" => "Y"

# à => a
"\u00E0" => "a"

# á => a
"\u00E1" => "a"

# â => a
"\u00E2" => "a"

# ã => a
"\u00E3" => "a"

# ä => a
"\u00E4" => "a"

# å => a
"\u00E5" => "a"

# æ => ae
"\u00E6" => "ae"

# ç => c
"\u00E7" => "c"

# è => e
"\u00E8" => "e"

# é => e
"\u00E9" => "e"

# ê => e
"\u00EA" => "e"

# ë => e
"\u00EB" => "e"

# ì => i
"\u00EC" => "i"

# í => i
"\u00ED" => "i"

# î => i
"\u00EE" => "i"

# ï => i
"\u00EF" => "i"

# ij => ij
"\u0133" => "ij"

# ð => d
"\u00F0" => "d"

# ñ => n
"\u00F1" => "n"

# ò => o
"\u00F2" => "o"

# ó => o
"\u00F3" => "o"

# ô => o
"\u00F4" => "o"

# õ => o
"\u00F5" => "o"

# ö => o
"\u00F6" => "o"

# ø => o
"\u00F8" => "o"

# œ => oe
"\u0153" => "oe"

# ß => ss
"\u00DF" => "ss"

# þ => th
"\u00FE" => "th"

# ù => u
"\u00F9" => "u"

# ú => u
"\u00FA" => "u"

# û => u
"\u00FB" => "u"

# ü => u
"\u00FC" => "u"

# ý => y
"\u00FD" => "y"

# ÿ => y
"\u00FF" => "y"

# ff => ff
"\uFB00" => "ff"

# fi => fi
"\uFB01" => "fi"

# fl => fl
"\uFB02" => "fl"

# ffi => ffi
"\uFB03" => "ffi"

# ffl => ffl
"\uFB04" => "ffl"

# ſt => ft
"\uFB05" => "ft"

# st => st
"\uFB06" => "st"
(deleted file)
@@ -1,21 +0,0 @@
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

#-----------------------------------------------------------------------
# Use a protected word file to protect against the stemmer reducing two
# unrelated words to the same base word.

# Some non-words that normally won't be encountered,
# just to test that they won't be stemmed.
dontstems
zwhacky
(deleted file)
@@ -1,245 +0,0 @@
<?xml version="1.0" encoding="UTF-8"?>
<!--
 Licensed to the Apache Software Foundation (ASF) under one or more
 contributor license agreements. See the NOTICE file distributed with
 this work for additional information regarding copyright ownership.
 The ASF licenses this file to You under the Apache License, Version 2.0
 (the "License"); you may not use this file except in compliance with
 the License. You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
-->
<!--
 This is the Solr schema file. This file should be named "schema.xml" and
 should be in the conf directory under the solr home
 (i.e. ./solr/conf/schema.xml by default)
 or located where the classloader for the Solr webapp can find it.

 This example schema is the recommended starting point for users.
 It should be kept correct and concise, usable out-of-the-box.

 For more information on how to customize this file, please see
 http://wiki.apache.org/solr/SchemaXml

 PERFORMANCE NOTE: this schema includes many optional features and should not
 be used for benchmarking. To improve performance one could
  - set stored="false" for all fields possible (esp large fields) when you
    only need to search on the field but don't need to return the original
    value.
  - set indexed="false" if you don't need to search on the field, but only
    return the field as a result of searching on other indexed fields.
  - remove all unneeded copyField statements
  - for best index size and searching performance, set "index" to false
    for all general text fields, use copyField to copy them to the
    catchall "text" field, and use that for searching.
  - For maximum indexing performance, use the StreamingUpdateSolrServer
    java client.
  - Remember to run the JVM in server mode, and use a higher logging level
    that avoids logging every request
-->
<schema name="sunspot" version="1.0">
  <types>
    <!-- field type definitions. The "name" attribute is
         just a label to be used by field definitions. The "class"
         attribute and any other attributes determine the real
         behavior of the fieldType.
         Class names starting with "solr" refer to java classes in the
         org.apache.solr.analysis package.
    -->
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="string" class="solr.StrField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="tdouble" class="solr.TrieDoubleField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="rand" class="solr.RandomSortField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="text" class="solr.TextField" omitNorms="false">
      <analyzer>
        <tokenizer class="solr.CJKTokenizerFactory"/>
        <filter class="solr.StandardFilterFactory"/>
        <filter class="solr.LowerCaseFilterFactory"/>
        <filter class="solr.NGramFilterFactory" minGramSize="2" maxGramSize="15"/>
      </analyzer>

      <analyzer type="query">
        <tokenizer class="solr.StandardTokenizerFactory"/>
        <filter class="solr.StandardFilterFactory"/>
        <filter class="solr.LowerCaseFilterFactory"/>
      </analyzer>
    </fieldType>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="boolean" class="solr.BoolField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="date" class="solr.DateField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="sdouble" class="solr.SortableDoubleField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="sfloat" class="solr.SortableFloatField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="sint" class="solr.SortableIntField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="slong" class="solr.SortableLongField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="tint" class="solr.TrieIntField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="tfloat" class="solr.TrieFloatField" omitNorms="true"/>
    <!-- *** This fieldType is used by Sunspot! *** -->
    <fieldType name="tdate" class="solr.TrieDateField" omitNorms="true"/>
  </types>
  <fields>
    <!-- Valid attributes for fields:
      name: mandatory - the name for the field
      type: mandatory - the name of a previously defined type from the
        <types> section
      indexed: true if this field should be indexed (searchable or sortable)
      stored: true if this field should be retrievable
      compressed: [false] if this field should be stored using gzip compression
        (this will only apply if the field type is compressable; among
        the standard field types, only TextField and StrField are)
      multiValued: true if this field may contain multiple values per document
      omitNorms: (expert) set to true to omit the norms associated with
        this field (this disables length normalization and index-time
        boosting for the field, and saves some memory). Only full-text
        fields or fields that need an index-time boost need norms.
      termVectors: [false] set to true to store the term vector for a
        given field.
        When using MoreLikeThis, fields used for similarity should be
        stored for best performance.
      termPositions: Store position information with the term vector.
        This will increase storage costs.
      termOffsets: Store offset information with the term vector. This
        will increase storage costs.
      default: a value that should be used if no value is specified
        when adding a document.
    -->
    <!-- *** This field is used by Sunspot! *** -->
    <field name="id" stored="true" type="string" multiValued="false" indexed="true"/>
    <!-- *** This field is used by Sunspot! *** -->
    <field name="type" stored="false" type="string" multiValued="true" indexed="true"/>
    <!-- *** This field is used by Sunspot! *** -->
    <field name="class_name" stored="false" type="string" multiValued="false" indexed="true"/>
    <!-- *** This field is used by Sunspot! *** -->
    <field name="text" stored="false" type="string" multiValued="true" indexed="true"/>
    <!-- *** This field is used by Sunspot! *** -->
    <field name="lat" stored="true" type="tdouble" multiValued="false" indexed="true"/>
    <!-- *** This field is used by Sunspot! *** -->
    <field name="lng" stored="true" type="tdouble" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="random_*" stored="false" type="rand" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="_local*" stored="false" type="tdouble" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_text" stored="false" type="text" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_texts" stored="true" type="text" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_b" stored="false" type="boolean" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_bm" stored="false" type="boolean" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_bs" stored="true" type="boolean" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_bms" stored="true" type="boolean" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_d" stored="false" type="date" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_dm" stored="false" type="date" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ds" stored="true" type="date" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_dms" stored="true" type="date" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_e" stored="false" type="sdouble" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_em" stored="false" type="sdouble" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_es" stored="true" type="sdouble" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ems" stored="true" type="sdouble" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_f" stored="false" type="sfloat" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_fm" stored="false" type="sfloat" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_fs" stored="true" type="sfloat" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_fms" stored="true" type="sfloat" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_i" stored="false" type="sint" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_im" stored="false" type="sint" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_is" stored="true" type="sint" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ims" stored="true" type="sint" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_l" stored="false" type="slong" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_lm" stored="false" type="slong" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ls" stored="true" type="slong" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_lms" stored="true" type="slong" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_s" stored="false" type="string" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_sm" stored="false" type="string" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ss" stored="true" type="string" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_sms" stored="true" type="string" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_it" stored="false" type="tint" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_itm" stored="false" type="tint" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_its" stored="true" type="tint" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_itms" stored="true" type="tint" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ft" stored="false" type="tfloat" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ftm" stored="false" type="tfloat" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_fts" stored="true" type="tfloat" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ftms" stored="true" type="tfloat" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_dt" stored="false" type="tdate" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_dtm" stored="false" type="tdate" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_dts" stored="true" type="tdate" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_dtms" stored="true" type="tdate" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_textv" stored="false" termVectors="true" type="text" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_textsv" stored="true" termVectors="true" type="text" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_et" stored="false" termVectors="true" type="tdouble" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_etm" stored="false" termVectors="true" type="tdouble" multiValued="true" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_ets" stored="true" termVectors="true" type="tdouble" multiValued="false" indexed="true"/>
    <!-- *** This dynamicField is used by Sunspot! *** -->
    <dynamicField name="*_etms" stored="true" termVectors="true" type="tdouble" multiValued="true" indexed="true"/>
  </fields>
  <!-- Field to use to determine and enforce document uniqueness.
       Unless this field is marked with required="false", it will be a required field
  -->
  <uniqueKey>id</uniqueKey>
  <!-- field for the QueryParser to use when an explicit fieldname is absent -->
  <defaultSearchField>text</defaultSearchField>
  <!-- SolrQueryParser configuration: defaultOperator="AND|OR" -->
  <solrQueryParser defaultOperator="AND"/>
  <!-- copyField commands copy one field to another at the time a document
       is added to the index. It's used either to index the same field differently,
       or to add multiple fields to the same field for easier/faster searching. -->
</schema>
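The long run of dynamicField patterns is what lets Sunspot index arbitrary Ruby attributes without editing this schema: each declared field lands in a type-coded suffix field. A hedged illustration (the Post model is hypothetical; the suffixes follow Sunspot 1.x's naming convention as I understand it: text => *_text, time => *_d, boolean => *_b):

class Post
  include Mongoid::Document
  field :title
  field :published_at, :type => Time

  searchable do
    text :title               # indexed into the "title_text" dynamic field
    time :published_at        # stored under "published_at_d" (date type)
    boolean(:fresh) { published_at > 1.week.ago }  # virtual field, "fresh_b"
  end
end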
(deleted file)
@@ -1,24 +0,0 @@
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

user=
solr_hostname=localhost
solr_port=8983
rsyncd_port=18983
data_dir=
webapp_name=solr
master_host=
master_data_dir=
master_status_dir=
(deleted file)
@@ -1,938 +0,0 @@
<?xml version="1.0" encoding="UTF-8"?>
<!--
 Licensed to the Apache Software Foundation (ASF) under one or more
 contributor license agreements. See the NOTICE file distributed with
 this work for additional information regarding copyright ownership.
 The ASF licenses this file to You under the Apache License, Version 2.0
 (the "License"); you may not use this file except in compliance with
 the License. You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
-->
<!--
 For more details about configurations options that may appear in this
 file, see http://wiki.apache.org/solr/SolrConfigXml.

 Specifically, the Solr Config can support XInclude, which may make it easier to manage
 the configuration. See https://issues.apache.org/jira/browse/SOLR-1167
-->
<config>
  <!-- Set this to 'false' if you want solr to continue working after it has
       encountered a severe configuration error. In a production environment,
       you may want solr to keep working even if one handler is mis-configured.

       You may also set this to false by setting the system property:
         -Dsolr.abortOnConfigurationError=false
  -->
  <abortOnConfigurationError>${solr.abortOnConfigurationError:true}</abortOnConfigurationError>
  <!-- lib directives can be used to instruct Solr to load any Jars identified
       and use them to resolve any "plugins" specified in your solrconfig.xml or
       schema.xml (ie: Analyzers, Request Handlers, etc...).

       All directories and paths are resolved relative to the instanceDir.

       If a "./lib" directory exists in your instanceDir, all files found in it
       are included as if you had used the following syntax...

         <lib dir="./lib" />
  -->
  <!-- A dir option by itself adds any files found in the directory to the
       classpath, this is useful for including all jars in a directory.
  -->
  <lib dir="../../contrib/extraction/lib"/>
  <!-- When a regex is specified in addition to a directory, only the files in that
       directory which completely match the regex (anchored on both ends)
       will be included.
  -->
  <lib dir="../../dist/" regex="apache-solr-cell-\d.*\.jar"/>
  <lib dir="../../dist/" regex="apache-solr-clustering-\d.*\.jar"/>
  <!-- If a dir option (with or without a regex) is used and nothing is found
       that matches, it will be ignored
  -->
  <lib dir="../../contrib/clustering/lib/downloads/"/>
  <lib dir="../../contrib/clustering/lib/"/>
  <lib dir="/total/crap/dir/ignored"/>
  <!-- an exact path can be used to specify a specific file. This will cause
       a serious error to be logged if it can't be loaded.
       <lib path="../a-jar-that-does-not-exist.jar" />
  -->
  <!-- Used to specify an alternate directory to hold all index data
       other than the default ./data under the Solr home.
       If replication is in use, this should match the replication configuration. -->
  <dataDir>${solr.data.dir:./solr/data}</dataDir>
  <!-- WARNING: this <indexDefaults> section only provides defaults for index writers
       in general. See also the <mainIndex> section after that when changing parameters
       for Solr's main Lucene index. -->
  <indexDefaults>
    <!-- Values here affect all index writers and act as a default unless overridden. -->
    <useCompoundFile>false</useCompoundFile>
    <mergeFactor>10</mergeFactor>
    <!-- If both ramBufferSizeMB and maxBufferedDocs is set, then Lucene will flush
         based on whichever limit is hit first. -->
    <!--<maxBufferedDocs>1000</maxBufferedDocs>-->
    <!-- Sets the amount of RAM that may be used by Lucene indexing
         for buffering added documents and deletions before they are
         flushed to the Directory. -->
    <ramBufferSizeMB>32</ramBufferSizeMB>
    <!-- <maxMergeDocs>2147483647</maxMergeDocs> -->
    <maxFieldLength>10000</maxFieldLength>
    <writeLockTimeout>1000</writeLockTimeout>
    <commitLockTimeout>10000</commitLockTimeout>
    <!--
      Expert: Turn on Lucene's auto commit capability. This causes intermediate
      segment flushes to write a new lucene index descriptor, enabling it to be
      opened by an external IndexReader. This can greatly slow down indexing
      speed. NOTE: Despite the name, this value does not have any relation to
      Solr's autoCommit functionality
    -->
    <!--<luceneAutoCommit>false</luceneAutoCommit>-->
    <!--
      Expert: The Merge Policy in Lucene controls how merging is handled by
      Lucene. The default in 2.3 is the LogByteSizeMergePolicy, previous
      versions used LogDocMergePolicy.

      LogByteSizeMergePolicy chooses segments to merge based on their size. The
      Lucene 2.2 default, LogDocMergePolicy chose when to merge based on number
      of documents

      Other implementations of MergePolicy must have a no-argument constructor
    -->
    <!--<mergePolicy class="org.apache.lucene.index.LogByteSizeMergePolicy"/>-->
    <!--
      Expert:
      The Merge Scheduler in Lucene controls how merges are performed. The
      ConcurrentMergeScheduler (Lucene 2.3 default) can perform merges in the
      background using separate threads. The SerialMergeScheduler (Lucene 2.2
      default) does not.
    -->
    <!--<mergeScheduler class="org.apache.lucene.index.ConcurrentMergeScheduler"/>-->
    <!--
      This option specifies which Lucene LockFactory implementation to use.

      single = SingleInstanceLockFactory - suggested for a read-only index
               or when there is no possibility of another process trying
               to modify the index.
      native = NativeFSLockFactory - uses OS native file locking
      simple = SimpleFSLockFactory - uses a plain file for locking

      (For backwards compatibility with Solr 1.2, 'simple' is the default
       if not specified.)
    -->
    <lockType>native</lockType>
    <!--
      Expert:
      Controls how often Lucene loads terms into memory -->
    <!--<termIndexInterval>256</termIndexInterval>-->
  </indexDefaults>
  <mainIndex>
    <!-- options specific to the main on-disk lucene index -->
    <useCompoundFile>false</useCompoundFile>
    <ramBufferSizeMB>32</ramBufferSizeMB>
    <mergeFactor>10</mergeFactor>
    <!-- Deprecated -->
    <!--<maxBufferedDocs>1000</maxBufferedDocs>-->
    <!--<maxMergeDocs>2147483647</maxMergeDocs>-->
    <!-- inherit from indexDefaults <maxFieldLength>10000</maxFieldLength> -->
    <!-- If true, unlock any held write or commit locks on startup.
         This defeats the locking mechanism that allows multiple
         processes to safely access a lucene index, and should be
         used with care.
         This is not needed if lock type is 'none' or 'single'
    -->
    <unlockOnStartup>false</unlockOnStartup>
    <!-- If true, IndexReaders will be reopened (often more efficient) instead
         of closed and then opened. -->
    <reopenReaders>true</reopenReaders>
    <!--
      Expert:
      Controls how often Lucene loads terms into memory. Default is 128 and is likely good for most everyone. -->
    <!--<termIndexInterval>256</termIndexInterval>-->
    <!--
      Custom deletion policies can be specified here. The class must
      implement org.apache.lucene.index.IndexDeletionPolicy.

      http://lucene.apache.org/java/2_3_2/api/org/apache/lucene/index/IndexDeletionPolicy.html

      The standard Solr IndexDeletionPolicy implementation supports deleting
      index commit points on number of commits, age of commit point and
      optimized status.

      The latest commit point should always be preserved regardless
      of the criteria.
    -->
    <deletionPolicy class="solr.SolrDeletionPolicy">
      <!-- The number of commit points to be kept -->
      <str name="maxCommitsToKeep">1</str>
      <!-- The number of optimized commit points to be kept -->
      <str name="maxOptimizedCommitsToKeep">0</str>
      <!--
        Delete all commit points once they have reached the given age.
        Supports DateMathParser syntax e.g.

        <str name="maxCommitAge">30MINUTES</str>
        <str name="maxCommitAge">1DAY</str>
      -->
    </deletionPolicy>
    <!-- To aid in advanced debugging, you may turn on IndexWriter debug logging.
         Setting to true will set the file that the underlying Lucene IndexWriter
         will write its debug infostream to. -->
    <infoStream file="INFOSTREAM.txt">false</infoStream>
  </mainIndex>
  <!-- Enables JMX if and only if an existing MBeanServer is found, use this
       if you want to configure JMX through JVM parameters. Remove this to disable
       exposing Solr configuration and statistics to JMX.

       If you want to connect to a particular server, specify the agentId
       e.g. <jmx agentId="myAgent" />

       If you want to start a new MBeanServer, specify the serviceUrl
       e.g <jmx serviceUrl="service:jmx:rmi:///jndi/rmi://localhost:9999/solr"/>

       For more details see http://wiki.apache.org/solr/SolrJmx
  -->
  <jmx/>
  <!-- the default high-performance update handler -->
  <updateHandler class="solr.DirectUpdateHandler2">
    <!-- A prefix of "solr." for class names is an alias that
         causes solr to search appropriate packages, including
         org.apache.solr.(search|update|request|core|analysis)
    -->
    <!-- Perform a <commit/> automatically under certain conditions:
         maxDocs - number of updates since last commit is greater than this
         maxTime - oldest uncommitted update (in ms) is this long ago
         Instead of enabling autoCommit, consider using "commitWithin"
         when adding documents. http://wiki.apache.org/solr/UpdateXmlMessages
         <autoCommit>
           <maxDocs>10000</maxDocs>
           <maxTime>1000</maxTime>
         </autoCommit>
    -->
    <!-- The RunExecutableListener executes an external command from a
         hook such as postCommit or postOptimize.
         exe - the name of the executable to run
         dir - dir to use as the current working directory. default="."
         wait - the calling thread waits until the executable returns. default="true"
         args - the arguments to pass to the program. default=nothing
         env - environment variables to set. default=nothing
    -->
    <!-- A postCommit event is fired after every commit or optimize command
         <listener event="postCommit" class="solr.RunExecutableListener">
           <str name="exe">solr/bin/snapshooter</str>
           <str name="dir">.</str>
           <bool name="wait">true</bool>
           <arr name="args"> <str>arg1</str> <str>arg2</str> </arr>
           <arr name="env"> <str>MYVAR=val1</str> </arr>
         </listener>
    -->
    <!-- A postOptimize event is fired only after every optimize command
         <listener event="postOptimize" class="solr.RunExecutableListener">
           <str name="exe">snapshooter</str>
           <str name="dir">solr/bin</str>
           <bool name="wait">true</bool>
         </listener>
    -->
  </updateHandler>
  <!-- Use the following format to specify a custom IndexReaderFactory - allows for alternate
       IndexReader implementations.

       ** Experimental Feature **
       Please note - Using a custom IndexReaderFactory may prevent certain other features
       from working. The API to IndexReaderFactory may change without warning or may even
       be removed from future releases if the problems cannot be resolved.

       ** Features that may not work with custom IndexReaderFactory **
       The ReplicationHandler assumes a disk-resident index. Using a custom
       IndexReader implementation may cause incompatibility with ReplicationHandler and
       may cause replication to not work correctly. See SOLR-1366 for details.

       <indexReaderFactory name="IndexReaderFactory" class="package.class">
         Parameters as required by the implementation
       </indexReaderFactory >
  -->
  <!-- To set the termInfosIndexDivisor, do this: -->
  <!--<indexReaderFactory name="IndexReaderFactory" class="org.apache.solr.core.StandardIndexReaderFactory">
    <int name="termInfosIndexDivisor">12</int>
  </indexReaderFactory >-->
  <query>
    <!-- Maximum number of clauses in a boolean query... in the past, this affected
         range or prefix queries that expanded to big boolean queries - built in Solr
         query parsers no longer create queries with this limitation.
         An exception is thrown if exceeded. -->
    <maxBooleanClauses>1024</maxBooleanClauses>
    <!-- There are two implementations of cache available for Solr,
         LRUCache, based on a synchronized LinkedHashMap, and
         FastLRUCache, based on a ConcurrentHashMap. FastLRUCache has faster gets
         and slower puts in single threaded operation and thus is generally faster
         than LRUCache when the hit ratio of the cache is high (> 75%), and may be
         faster under other scenarios on multi-cpu systems. -->
    <!-- Cache used by SolrIndexSearcher for filters (DocSets),
         unordered sets of *all* documents that match a query.
         When a new searcher is opened, its caches may be prepopulated
         or "autowarmed" using data from caches in the old searcher.
         autowarmCount is the number of items to prepopulate. For LRUCache,
         the autowarmed items will be the most recently accessed items.
         Parameters:
           class - the SolrCache implementation LRUCache or FastLRUCache
           size - the maximum number of entries in the cache
           initialSize - the initial capacity (number of entries) of
             the cache. (see java.util.HashMap)
           autowarmCount - the number of entries to prepopulate from
             an old cache.
    -->
    <filterCache class="solr.FastLRUCache" size="512" initialSize="512" autowarmCount="0"/>
    <!-- Cache used to hold field values that are quickly accessible
         by document id. The fieldValueCache is created by default
         even if not configured here.
         <fieldValueCache
           class="solr.FastLRUCache"
           size="512"
           autowarmCount="128"
           showItems="32"
         />
    -->
    <!-- queryResultCache caches results of searches - ordered lists of
         document ids (DocList) based on a query, a sort, and the range
         of documents requested. -->
    <queryResultCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
    <!-- documentCache caches Lucene Document objects (the stored fields for each document).
         Since Lucene internal document ids are transient, this cache will not be autowarmed. -->
    <documentCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
    <!-- If true, stored fields that are not requested will be loaded lazily.
         This can result in a significant speed improvement if the usual case is to
         not load all stored fields, especially if the skipped fields are large
         compressed text fields.
    -->
    <enableLazyFieldLoading>true</enableLazyFieldLoading>
    <!-- Example of a generic cache. These caches may be accessed by name
         through SolrIndexSearcher.getCache(),cacheLookup(), and cacheInsert().
         The purpose is to enable easy caching of user/application level data.
         The regenerator argument should be specified as an implementation
         of solr.search.CacheRegenerator if autowarming is desired. -->
    <!--
      <cache name="myUserCache"
        class="solr.LRUCache"
        size="4096"
        initialSize="1024"
        autowarmCount="1024"
        regenerator="org.mycompany.mypackage.MyRegenerator"
      />
    -->
    <!-- An optimization that attempts to use a filter to satisfy a search.
         If the requested sort does not include score, then the filterCache
         will be checked for a filter matching the query. If found, the filter
         will be used as the source of document ids, and then the sort will be
         applied to that.
         <useFilterForSortedQuery>true</useFilterForSortedQuery>
    -->
    <!-- An optimization for use with the queryResultCache. When a search
         is requested, a superset of the requested number of document ids
         are collected. For example, if a search for a particular query
         requests matching documents 10 through 19, and queryWindowSize is 50,
         then documents 0 through 49 will be collected and cached. Any further
         requests in that range can be satisfied via the cache. -->
    <queryResultWindowSize>20</queryResultWindowSize>
    <!-- Maximum number of documents to cache for any entry in the
         queryResultCache. -->
    <queryResultMaxDocsCached>200</queryResultMaxDocsCached>
    <!-- a newSearcher event is fired whenever a new searcher is being prepared
         and there is a current searcher handling requests (aka registered).
         It can be used to prime certain caches to prevent long request times for
         certain requests.
    -->
    <!-- QuerySenderListener takes an array of NamedList and executes a
         local query request for each NamedList in sequence. -->
    <listener event="newSearcher" class="solr.QuerySenderListener">
      <arr name="queries">
        <!--
          <lst> <str name="q">solr</str> <str name="start">0</str> <str name="rows">10</str> </lst>
          <lst> <str name="q">rocks</str> <str name="start">0</str> <str name="rows">10</str> </lst>
          <lst><str name="q">static newSearcher warming query from solrconfig.xml</str></lst>
        -->
      </arr>
    </listener>
    <!-- a firstSearcher event is fired whenever a new searcher is being
         prepared but there is no current registered searcher to handle
         requests or to gain autowarming data from. -->
    <listener event="firstSearcher" class="solr.QuerySenderListener">
      <arr name="queries">
        <lst>
          <str name="q">solr rocks</str>
          <str name="start">0</str>
          <str name="rows">10</str>
        </lst>
        <lst>
          <str name="q">static firstSearcher warming query from solrconfig.xml</str>
        </lst>
      </arr>
    </listener>
    <!-- If a search request comes in and there is no current registered searcher,
         then immediately register the still warming searcher and use it. If
         "false" then all requests will block until the first searcher is done
         warming. -->
    <useColdSearcher>false</useColdSearcher>
    <!-- Maximum number of searchers that may be warming in the background
         concurrently. An error is returned if this limit is exceeded. Recommend
         1-2 for read-only slaves, higher for masters w/o cache warming. -->
    <maxWarmingSearchers>2</maxWarmingSearchers>
  </query>
  <!--
    Let the dispatch filter handle /select?qt=XXX
    handleSelect=true will use consistent error handling for /select and /update
    handleSelect=false will use solr1.1 style error formatting
  -->
  <requestDispatcher handleSelect="true">
    <!--Make sure your system has some authentication before enabling remote streaming! -->
    <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000"/>
    <!-- Set HTTP caching related parameters (for proxy caches and clients).

         To get the behaviour of Solr 1.2 (ie: no caching related headers)
         use the never304="true" option and do not specify a value for
         <cacheControl>
    -->
    <!-- <httpCaching never304="true"> -->
    <httpCaching lastModifiedFrom="openTime" etagSeed="Solr">
      <!-- lastModFrom="openTime" is the default, the Last-Modified value
           (and validation against If-Modified-Since requests) will all be
           relative to when the current Searcher was opened.
           You can change it to lastModFrom="dirLastMod" if you want the
           value to exactly correspond to when the physical index was last
           modified.

           etagSeed="..." is an option you can change to force the ETag
           header (and validation against If-None-Match requests) to be
           different even if the index has not changed (ie: when making
           significant changes to your config file)

           lastModifiedFrom and etagSeed are both ignored if you use the
           never304="true" option.
      -->
      <!-- If you include a <cacheControl> directive, it will be used to
           generate a Cache-Control header, as well as an Expires header
           if the value contains "max-age="

           By default, no Cache-Control header is generated.

           You can use the <cacheControl> option even if you have set
           never304="true"
      -->
      <!-- <cacheControl>max-age=30, public</cacheControl> -->
    </httpCaching>
  </requestDispatcher>
  <!-- requestHandler plugins... incoming queries will be dispatched to the
       correct handler based on the path or the qt (query type) param.
       Names starting with a '/' are accessed with a path equal to the
       registered name. Names without a leading '/' are accessed with:
         http://host/app/select?qt=name
       If no qt is defined, the requestHandler that declares default="true"
       will be used.
  -->
  <requestHandler name="standard" class="solr.SearchHandler" default="true">
    <!-- default values for query parameters -->
    <lst name="defaults">
      <str name="echoParams">explicit</str>
      <!--
        <int name="rows">10</int>
        <str name="fl">*</str>
        <str name="version">2.1</str>
      -->
    </lst>
  </requestHandler>
  <!-- Please refer to http://wiki.apache.org/solr/SolrReplication for details on configuring replication -->
  <!-- remove the <lst name="master"> section if this is just a slave -->
  <!-- remove the <lst name="slave"> section if this is just a master -->
  <!--
  <requestHandler name="/replication" class="solr.ReplicationHandler" >
    <lst name="master">
      <str name="replicateAfter">commit</str>
      <str name="replicateAfter">startup</str>
      <str name="confFiles">schema.xml,stopwords.txt</str>
    </lst>
    <lst name="slave">
      <str name="masterUrl">http://localhost:8983/solr/replication</str>
      <str name="pollInterval">00:00:60</str>
    </lst>
  </requestHandler>-->
  <!-- DisMaxRequestHandler allows easy searching across multiple fields
       for simple user-entered phrases. Its implementation is now
       just the standard SearchHandler with a default query type
       of "dismax".
       see http://wiki.apache.org/solr/DisMaxRequestHandler
  -->
  <requestHandler name="dismax" class="solr.SearchHandler">
    <lst name="defaults">
      <str name="defType">dismax</str>
      <str name="echoParams">explicit</str>
      <float name="tie">0.01</float>
      <str name="qf">
        text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 manu^1.1 cat^1.4
      </str>
      <str name="pf">
        text^0.2 features^1.1 name^1.5 manu^1.4 manu_exact^1.9
      </str>
      <str name="bf">
        popularity^0.5 recip(price,1,1000,1000)^0.3
      </str>
      <str name="fl">
        id,name,price,score
      </str>
      <str name="mm">
        2<-1 5<-2 6<90%
      </str>
      <int name="ps">100</int>
      <str name="q.alt">*:*</str>
      <!-- example highlighter config, enable per-query with hl=true -->
      <str name="hl.fl">text features name</str>
      <!-- for this field, we want no fragmenting, just highlighting -->
      <str name="f.name.hl.fragsize">0</str>
      <!-- instructs Solr to return the field itself if no query terms are
           found -->
      <str name="f.name.hl.alternateField">name</str>
      <str name="f.text.hl.fragmenter">regex</str>
      <!-- defined below -->
    </lst>
  </requestHandler>
  <!-- Note how you can register the same handler multiple times with
       different names (and different init parameters)
  -->
  <requestHandler name="partitioned" class="solr.SearchHandler">
    <lst name="defaults">
      <str name="defType">dismax</str>
      <str name="echoParams">explicit</str>
      <str name="qf">text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0</str>
      <str name="mm">2<-1 5<-2 6<90%</str>
      <!-- This is an example of using Date Math to specify a constantly
           moving date range in a config...
      -->
      <str name="bq">incubationdate_dt:[* TO NOW/DAY-1MONTH]^2.2</str>
    </lst>
    <!-- In addition to defaults, "appends" params can be specified
         to identify values which should be appended to the list of
         multi-val params from the query (or the existing "defaults").

         In this example, the param "fq=instock:true" will be appended to
         any query time fq params the user may specify, as a mechanism for
         partitioning the index, independent of any user selected filtering
         that may also be desired (perhaps as a result of faceted searching).

         NOTE: there is *absolutely* nothing a client can do to prevent these
         "appends" values from being used, so don't use this mechanism
         unless you are sure you always want it.
    -->
    <lst name="appends">
      <str name="fq">inStock:true</str>
    </lst>
    <!-- "invariants" are a way of letting the Solr maintainer lock down
         the options available to Solr clients. Any params values
         specified here are used regardless of what values may be specified
         in either the query, the "defaults", or the "appends" params.

         In this example, the facet.field and facet.query params are fixed,
         limiting the facets clients can use. Faceting is not turned on by
         default - but if the client does specify facet=true in the request,
         these are the only facets they will be able to see counts for;
         regardless of what other facet.field or facet.query params they
         may specify.

         NOTE: there is *absolutely* nothing a client can do to prevent these
         "invariants" values from being used, so don't use this mechanism
         unless you are sure you always want it.
    -->
    <lst name="invariants">
      <str name="facet.field">cat</str>
      <str name="facet.field">manu_exact</str>
      <str name="facet.query">price:[* TO 500]</str>
      <str name="facet.query">price:[500 TO *]</str>
    </lst>
  </requestHandler>

  <searchComponent name="query" class="org.apache.solr.handler.component.QueryComponent" />

  <searchComponent name="debug" class="org.apache.solr.handler.component.DebugComponent" />
  <!--
    Search components are registered to SolrCore and used by Search Handlers

    By default, the following components are available:

    <searchComponent name="query" class="org.apache.solr.handler.component.QueryComponent" />
    <searchComponent name="facet" class="org.apache.solr.handler.component.FacetComponent" />
    <searchComponent name="mlt" class="org.apache.solr.handler.component.MoreLikeThisComponent" />
    <searchComponent name="highlight" class="org.apache.solr.handler.component.HighlightComponent" />
    <searchComponent name="stats" class="org.apache.solr.handler.component.StatsComponent" />
    <searchComponent name="debug" class="org.apache.solr.handler.component.DebugComponent" />

    Default configuration in a requestHandler would look like:
    <arr name="components">
      <str>query</str>
      <str>facet</str>
      <str>mlt</str>
      <str>highlight</str>
      <str>stats</str>
      <str>debug</str>
    </arr>

    If you register a searchComponent to one of the standard names, that will be used instead.
    To insert components before or after the 'standard' components, use:

    <arr name="first-components">
      <str>myFirstComponentName</str>
    </arr>

    <arr name="last-components">
      <str>myLastComponentName</str>
    </arr>
  -->
  <!-- The spell check component can return a list of alternative spelling
       suggestions. -->
  <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
    <str name="queryAnalyzerFieldType">textSpell</str>
    <lst name="spellchecker">
      <str name="name">default</str>
      <str name="field">name</str>
      <str name="spellcheckIndexDir">./spellchecker</str>
    </lst>
    <!-- a spellchecker that uses a different distance measure
      <lst name="spellchecker">
        <str name="name">jarowinkler</str>
        <str name="field">spell</str>
        <str name="distanceMeasure">org.apache.lucene.search.spell.JaroWinklerDistance</str>
        <str name="spellcheckIndexDir">./spellchecker2</str>
      </lst>
    -->
    <!-- a file based spell checker
      <lst name="spellchecker">
        <str name="classname">solr.FileBasedSpellChecker</str>
        <str name="name">file</str>
        <str name="sourceLocation">spellings.txt</str>
<str name="characterEncoding">UTF-8</str>
|
||||
<str name="spellcheckIndexDir">./spellcheckerFile</str>
|
||||
</lst>
|
||||
-->
|
||||
</searchComponent>
|
||||
<!-- A request handler utilizing the spellcheck component.
|
||||
#############################################################################
|
||||
NOTE: This is purely as an example. The whole purpose of the
|
||||
SpellCheckComponent is to hook it into the request handler that handles (i.e.
|
||||
the standard or dismax SearchHandler) queries such that a separate request is
|
||||
not needed to get suggestions.
|
||||
|
||||
IN OTHER WORDS, THERE IS REALLY GOOD CHANCE THE SETUP BELOW IS NOT WHAT YOU
|
||||
WANT FOR YOUR PRODUCTION SYSTEM!
|
||||
#############################################################################
|
||||
-->
|
||||
<requestHandler name="/spell" class="solr.SearchHandler" lazy="true">
|
||||
<lst name="defaults">
|
||||
<!-- omp = Only More Popular -->
|
||||
<str name="spellcheck.onlyMorePopular">false</str>
|
||||
<!-- exr = Extended Results -->
|
||||
<str name="spellcheck.extendedResults">false</str>
|
||||
<!-- The number of suggestions to return -->
|
||||
<str name="spellcheck.count">1</str>
|
||||
</lst>
|
||||
<arr name="last-components">
|
||||
<str>spellcheck</str>
|
||||
</arr>
|
||||
</requestHandler>
|
||||
<searchComponent name="tvComponent" class="org.apache.solr.handler.component.TermVectorComponent"/>
|
||||
<!-- A Req Handler for working with the tvComponent. This is purely as an example.
|
||||
You will likely want to add the component to your already specified request handlers. -->
|
||||
<requestHandler name="tvrh" class="org.apache.solr.handler.component.SearchHandler">
|
||||
<lst name="defaults">
|
||||
<bool name="tv">true</bool>
|
||||
</lst>
|
||||
<arr name="last-components">
|
||||
<str>tvComponent</str>
|
||||
</arr>
|
||||
</requestHandler>
|
||||
<!-- Clustering Component
|
||||
http://wiki.apache.org/solr/ClusteringComponent
|
||||
This relies on third party jars which are not included in the release.
|
||||
To use this component (and the "/clustering" handler)
|
||||
Those jars will need to be downloaded, and you'll need to set the
|
||||
solr.cluster.enabled system property when running solr...
|
||||
java -Dsolr.clustering.enabled=true -jar start.jar
|
||||
-->
|
||||
<searchComponent name="clusteringComponent" enable="${solr.clustering.enabled:false}" class="org.apache.solr.handler.clustering.ClusteringComponent">
|
||||
<!-- Declare an engine -->
|
||||
<lst name="engine">
|
||||
<!-- The name, only one can be named "default" -->
|
||||
<str name="name">default</str>
|
||||
<!--
|
||||
Class name of Carrot2 clustering algorithm. Currently available algorithms are:
|
||||
|
||||
* org.carrot2.clustering.lingo.LingoClusteringAlgorithm
|
||||
* org.carrot2.clustering.stc.STCClusteringAlgorithm
|
||||
|
||||
See http://project.carrot2.org/algorithms.html for the algorithm's characteristics.
|
||||
-->
|
||||
<str name="carrot.algorithm">org.carrot2.clustering.lingo.LingoClusteringAlgorithm</str>
|
||||
<!--
|
||||
Overriding values for Carrot2 default algorithm attributes. For a description
|
||||
of all available attributes, see: http://download.carrot2.org/stable/manual/#chapter.components.
|
||||
Use attribute key as name attribute of str elements below. These can be further
|
||||
overridden for individual requests by specifying attribute key as request
|
||||
parameter name and attribute value as parameter value.
|
||||
-->
|
||||
<str name="LingoClusteringAlgorithm.desiredClusterCountBase">20</str>
|
||||
</lst>
|
||||
<lst name="engine">
|
||||
<str name="name">stc</str>
|
||||
<str name="carrot.algorithm">org.carrot2.clustering.stc.STCClusteringAlgorithm</str>
|
||||
</lst>
|
||||
</searchComponent>
|
||||
<requestHandler name="/clustering" enable="${solr.clustering.enabled:false}" class="solr.SearchHandler">
|
||||
<lst name="defaults">
|
||||
<bool name="clustering">true</bool>
|
||||
<str name="clustering.engine">default</str>
|
||||
<bool name="clustering.results">true</bool>
|
||||
<!-- The title field -->
|
||||
<str name="carrot.title">name</str>
|
||||
<str name="carrot.url">id</str>
|
||||
<!-- The field to cluster on -->
|
||||
<str name="carrot.snippet">features</str>
|
||||
<!-- produce summaries -->
|
||||
<bool name="carrot.produceSummary">true</bool>
|
||||
<!-- the maximum number of labels per cluster -->
|
||||
<!--<int name="carrot.numDescriptions">5</int>-->
|
||||
<!-- produce sub clusters -->
|
||||
<bool name="carrot.outputSubClusters">false</bool>
|
||||
</lst>
|
||||
<arr name="last-components">
|
||||
<str>clusteringComponent</str>
|
||||
</arr>
|
||||
</requestHandler>
|
||||
<!-- Solr Cell: http://wiki.apache.org/solr/ExtractingRequestHandler -->
|
||||
<requestHandler name="/update/extract" class="org.apache.solr.handler.extraction.ExtractingRequestHandler" startup="lazy">
|
||||
<lst name="defaults">
|
||||
<!-- All the main content goes into "text"... if you need to return
|
||||
the extracted text or do highlighting, use a stored field. -->
|
||||
<str name="fmap.content">text</str>
|
||||
<str name="lowernames">true</str>
|
||||
<str name="uprefix">ignored_</str>
|
||||
<!-- capture link hrefs but ignore div attributes -->
|
||||
<str name="captureAttr">true</str>
|
||||
<str name="fmap.a">links</str>
|
||||
<str name="fmap.div">ignored_</str>
|
||||
</lst>
|
||||
</requestHandler>
|
||||
<!-- A component to return terms and document frequency of those terms.
|
||||
This component does not yet support distributed search. -->
|
||||
<searchComponent name="termsComponent" class="org.apache.solr.handler.component.TermsComponent"/>
|
||||
<requestHandler name="/terms" class="org.apache.solr.handler.component.SearchHandler">
|
||||
<lst name="defaults">
|
||||
<bool name="terms">true</bool>
|
||||
</lst>
|
||||
<arr name="components">
|
||||
<str>termsComponent</str>
|
||||
</arr>
|
||||
</requestHandler>
|
||||
<!-- a search component that enables you to configure the top results for
|
||||
a given query regardless of the normal lucene scoring.-->
|
||||
<searchComponent name="elevator" class="solr.QueryElevationComponent">
|
||||
<!-- pick a fieldType to analyze queries -->
|
||||
<str name="queryFieldType">string</str>
|
||||
<str name="config-file">elevate.xml</str>
|
||||
</searchComponent>
|
||||
<!-- a request handler utilizing the elevator component -->
|
||||
<requestHandler name="/elevate" class="solr.SearchHandler" startup="lazy">
|
||||
<lst name="defaults">
|
||||
<str name="echoParams">explicit</str>
|
||||
</lst>
|
||||
<arr name="last-components">
|
||||
<str>elevator</str>
|
||||
</arr>
|
||||
</requestHandler>
|
||||
<!-- Update request handler.
|
||||
|
||||
Note: Since solr1.1 requestHandlers requires a valid content type header if posted in
|
||||
the body. For example, curl now requires: -H 'Content-type:text/xml; charset=utf-8'
|
||||
The response format differs from solr1.1 formatting and returns a standard error code.
|
||||
To enable solr1.1 behavior, remove the /update handler or change its path
|
||||
-->
|
||||
<requestHandler name="/update" class="solr.XmlUpdateRequestHandler"/>
|
||||
<requestHandler name="/update/javabin" class="solr.BinaryUpdateRequestHandler"/>
|
||||
<!--
|
||||
Analysis request handler. Since Solr 1.3. Use to return how a document is analyzed. Useful
|
||||
for debugging and as a token server for other types of applications.
|
||||
|
||||
This is deprecated in favor of the improved DocumentAnalysisRequestHandler and FieldAnalysisRequestHandler
|
||||
|
||||
<requestHandler name="/analysis" class="solr.AnalysisRequestHandler" />
|
||||
-->
|
||||
<!--
|
||||
An analysis handler that provides a breakdown of the analysis process of provided docuemnts. This handler expects a
|
||||
(single) content stream with the following format:
|
||||
|
||||
<docs>
|
||||
<doc>
|
||||
<field name="id">1</field>
|
||||
<field name="name">The Name</field>
|
||||
<field name="text">The Text Value</field>
|
||||
<doc>
|
||||
<doc>...</doc>
|
||||
<doc>...</doc>
|
||||
...
|
||||
</docs>
|
||||
|
||||
Note: Each document must contain a field which serves as the unique key. This key is used in the returned
|
||||
response to assoicate an analysis breakdown to the analyzed document.
|
||||
|
||||
Like the FieldAnalysisRequestHandler, this handler also supports query analysis by
|
||||
sending either an "analysis.query" or "q" request paraemter that holds the query text to be analyized. It also
|
||||
supports the "analysis.showmatch" parameter which when set to true, all field tokens that match the query
|
||||
tokens will be marked as a "match".
|
||||
-->
|
||||
<requestHandler name="/analysis/document" class="solr.DocumentAnalysisRequestHandler"/>
|
||||
<!--
|
||||
RequestHandler that provides much the same functionality as analysis.jsp. Provides the ability
|
||||
to specify multiple field types and field names in the same request and outputs index-time and
|
||||
query-time analysis for each of them.
|
||||
|
||||
Request parameters are:
|
||||
analysis.fieldname - The field name whose analyzers are to be used
|
||||
analysis.fieldtype - The field type whose analyzers are to be used
|
||||
analysis.fieldvalue - The text for index-time analysis
|
||||
q (or analysis.q) - The text for query time analysis
|
||||
analysis.showmatch (true|false) - When set to true and when query analysis is performed, the produced
|
||||
tokens of the field value analysis will be marked as "matched" for every
|
||||
token that is produces by the query analysis
|
||||
-->
|
||||
<requestHandler name="/analysis/field" class="solr.FieldAnalysisRequestHandler"/>
|
||||
<!-- CSV update handler, loaded on demand -->
|
||||
<requestHandler name="/update/csv" class="solr.CSVRequestHandler" startup="lazy"/>
|
||||
<!--
|
||||
Admin Handlers - This will register all the standard admin RequestHandlers. Adding
|
||||
this single handler is equivalent to registering:
|
||||
|
||||
<requestHandler name="/admin/luke" class="org.apache.solr.handler.admin.LukeRequestHandler" />
|
||||
<requestHandler name="/admin/system" class="org.apache.solr.handler.admin.SystemInfoHandler" />
|
||||
<requestHandler name="/admin/plugins" class="org.apache.solr.handler.admin.PluginInfoHandler" />
|
||||
<requestHandler name="/admin/threads" class="org.apache.solr.handler.admin.ThreadDumpHandler" />
|
||||
<requestHandler name="/admin/properties" class="org.apache.solr.handler.admin.PropertiesRequestHandler" />
|
||||
<requestHandler name="/admin/file" class="org.apache.solr.handler.admin.ShowFileRequestHandler" >
|
||||
|
||||
If you wish to hide files under ${solr.home}/conf, explicitly register the ShowFileRequestHandler using:
|
||||
<requestHandler name="/admin/file" class="org.apache.solr.handler.admin.ShowFileRequestHandler" >
|
||||
<lst name="invariants">
|
||||
<str name="hidden">synonyms.txt</str>
|
||||
<str name="hidden">anotherfile.txt</str>
|
||||
</lst>
|
||||
</requestHandler>
|
||||
-->
|
||||
<requestHandler name="/admin/" class="org.apache.solr.handler.admin.AdminHandlers"/>
|
||||
<!-- ping/healthcheck -->
|
||||
<requestHandler name="/admin/ping" class="PingRequestHandler">
|
||||
<lst name="defaults">
|
||||
<str name="qt">standard</str>
|
||||
<str name="q">solrpingquery</str>
|
||||
<str name="echoParams">all</str>
|
||||
</lst>
|
||||
</requestHandler>
|
||||
<!-- Echo the request contents back to the client -->
|
||||
<requestHandler name="/debug/dump" class="solr.DumpRequestHandler">
|
||||
<lst name="defaults">
|
||||
<str name="echoParams">explicit</str>
|
||||
<!-- for all params (including the default etc) use: 'all' -->
|
||||
<str name="echoHandler">true</str>
|
||||
</lst>
|
||||
</requestHandler>
|
||||
<highlighting>
|
||||
<!-- Configure the standard fragmenter -->
|
||||
<!-- This could most likely be commented out in the "default" case -->
|
||||
<fragmenter name="gap" class="org.apache.solr.highlight.GapFragmenter" default="true">
|
||||
<lst name="defaults">
|
||||
<int name="hl.fragsize">100</int>
|
||||
</lst>
|
||||
</fragmenter>
|
||||
<!-- A regular-expression-based fragmenter (f.i., for sentence extraction) -->
|
||||
<fragmenter name="regex" class="org.apache.solr.highlight.RegexFragmenter">
|
||||
<lst name="defaults">
|
||||
<!-- slightly smaller fragsizes work better because of slop -->
|
||||
<int name="hl.fragsize">70</int>
|
||||
<!-- allow 50% slop on fragment sizes -->
|
||||
<float name="hl.regex.slop">0.5</float>
|
||||
<!-- a basic sentence pattern -->
|
||||
<str name="hl.regex.pattern">[-\w ,/\n\"']{20,200}</str>
|
||||
</lst>
|
||||
</fragmenter>
|
||||
<!-- Configure the standard formatter -->
|
||||
<formatter name="html" class="org.apache.solr.highlight.HtmlFormatter" default="true">
|
||||
<lst name="defaults">
|
||||
<str name="hl.simple.pre"><![CDATA[<em>]]></str>
|
||||
<str name="hl.simple.post"><![CDATA[</em>]]></str>
|
||||
</lst>
|
||||
</formatter>
|
||||
</highlighting>
|
||||
<!-- An example dedup update processor that creates the "id" field on the fly
|
||||
based on the hash code of some other fields. This example has overwriteDupes
|
||||
set to false since we are using the id field as the signatureField and Solr
|
||||
will maintain uniqueness based on that anyway.
|
||||
|
||||
You have to link the chain to an update handler above to use it ie:
|
||||
<requestHandler name="/update "class="solr.XmlUpdateRequestHandler">
|
||||
<lst name="defaults">
|
||||
<str name="update.processor">dedupe</str>
|
||||
</lst>
|
||||
</requestHandler>
|
||||
-->
|
||||
<!--
|
||||
<updateRequestProcessorChain name="dedupe">
|
||||
<processor class="org.apache.solr.update.processor.SignatureUpdateProcessorFactory">
|
||||
<bool name="enabled">true</bool>
|
||||
<str name="signatureField">id</str>
|
||||
<bool name="overwriteDupes">false</bool>
|
||||
<str name="fields">name,features,cat</str>
|
||||
<str name="signatureClass">org.apache.solr.update.processor.Lookup3Signature</str>
|
||||
</processor>
|
||||
<processor class="solr.LogUpdateProcessorFactory" />
|
||||
<processor class="solr.RunUpdateProcessorFactory" />
|
||||
</updateRequestProcessorChain>
|
||||
-->
|
||||
<!-- queryResponseWriter plugins... query responses will be written using the
|
||||
writer specified by the 'wt' request parameter matching the name of a registered
|
||||
writer.
|
||||
The "default" writer is the default and will be used if 'wt' is not specified
|
||||
in the request. XMLResponseWriter will be used if nothing is specified here.
|
||||
The json, python, and ruby writers are also available by default.
|
||||
|
||||
<queryResponseWriter name="xml" class="org.apache.solr.request.XMLResponseWriter" default="true"/>
|
||||
<queryResponseWriter name="json" class="org.apache.solr.request.JSONResponseWriter"/>
|
||||
<queryResponseWriter name="python" class="org.apache.solr.request.PythonResponseWriter"/>
|
||||
<queryResponseWriter name="ruby" class="org.apache.solr.request.RubyResponseWriter"/>
|
||||
<queryResponseWriter name="php" class="org.apache.solr.request.PHPResponseWriter"/>
|
||||
<queryResponseWriter name="phps" class="org.apache.solr.request.PHPSerializedResponseWriter"/>
|
||||
|
||||
<queryResponseWriter name="custom" class="com.example.MyResponseWriter"/>
|
||||
-->
|
||||
<!-- XSLT response writer transforms the XML output by any xslt file found
|
||||
in Solr's conf/xslt directory. Changes to xslt files are checked for
|
||||
every xsltCacheLifetimeSeconds.
|
||||
-->
|
||||
<queryResponseWriter name="xslt" class="org.apache.solr.request.XSLTResponseWriter">
|
||||
<int name="xsltCacheLifetimeSeconds">5</int>
|
||||
</queryResponseWriter>
|
||||
<!-- example of registering a query parser
|
||||
<queryParser name="lucene" class="org.apache.solr.search.LuceneQParserPlugin"/>
|
||||
-->
|
||||
<!-- example of registering a custom function parser
|
||||
<valueSourceParser name="myfunc" class="com.mycompany.MyValueSourceParser" />
|
||||
-->
|
||||
<!-- config for the admin interface -->
|
||||
<admin>
|
||||
<defaultQuery>solr</defaultQuery>
|
||||
<!-- configure a healthcheck file for servers behind a loadbalancer
|
||||
<healthcheck type="file">server-enabled</healthcheck>
|
||||
-->
|
||||
</admin>
|
||||
<requestHandler class="solr.MoreLikeThisHandler" name="/mlt">
|
||||
<lst name="defaults">
|
||||
<str name="mlt.mintf">1</str>
|
||||
<str name="mlt.mindf">2</str>
|
||||
</lst>
|
||||
</requestHandler>
|
||||
</config>
@ -1,2 +0,0 @@
pizza
history
@ -1,58 +0,0 @@
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

#-----------------------------------------------------------------------
# a couple of test stopwords to test that the words are really being
# configured from this file:
stopworda
stopwordb

#Standard english stop words taken from Lucene's StopAnalyzer
a
an
and
are
as
at
be
but
by
for
if
in
into
is
it
no
not
of
on
or
s
such
t
that
the
their
then
there
these
they
this
to
was
will
with
@ -1,31 +0,0 @@
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

#-----------------------------------------------------------------------
#some test synonym mappings unlikely to appear in real input text
aaa => aaaa
bbb => bbbb1 bbbb2
ccc => cccc1,cccc2
a\=>a => b\=>b
a\,a => b\,b
fooaaa,baraaa,bazaaa

# Some synonym groups specific to this example
GB,gib,gigabyte,gigabytes
MB,mib,megabyte,megabytes
Television, Televisions, TV, TVs
#notice we use "gib" instead of "GiB" so any WordDelimiterFilter coming
#after us won't split it into two words.

# Synonym mappings can be used for spelling correction too
pixima => pixma
@ -0,0 +1,885 @@
# encoding: UTF-8
#
# **Tire** provides a rich and comfortable Ruby API for the
# [_ElasticSearch_](http://www.elasticsearch.org/) search engine/database.
#
# _ElasticSearch_ is a scalable, distributed, cloud-ready, highly-available
# full-text search engine and database, communicating by JSON over RESTful HTTP,
# based on [Lucene](http://lucene.apache.org/), written in Java.
#
# <img src="http://github.com/favicon.ico" style="position:relative; top:2px">
# _Tire_ is open source, and you can download or clone the source code
# from <https://github.com/karmi/tire>.
#
# By following these instructions you should have the search running
# on a sane operating system in less than 10 minutes.

# Note that this file can be executed directly:
#
#     ruby -I lib examples/tire-dsl.rb
#


#### Installation

# Install _Tire_ with _Rubygems_:
#
#     gem install tire
#
require 'rubygems'
require 'colorize'

# _Tire_ uses the [_multi_json_](https://github.com/intridea/multi_json) gem as a generic JSON library.
# We want to use the [_yajl-ruby_](https://github.com/brianmario/yajl-ruby) gem in its full-on mode here.
#
require 'yajl/json_gem'

# Now, let's require the _Tire_ gem itself, and we're ready to go.
#
require 'tire'

#### Prerequisites

# We'll need a working and running _ElasticSearch_ server, of course. Thankfully, that's easy.
( puts <<-"INSTALL" ; exit(1) ) unless (RestClient.get('http://localhost:9200') rescue false)

[ERROR] You don’t appear to have ElasticSearch installed. Please install and launch it with the following commands:

curl -k -L -o elasticsearch-0.19.0.tar.gz http://github.com/downloads/elasticsearch/elasticsearch/elasticsearch-0.19.0.tar.gz
tar -zxvf elasticsearch-0.19.0.tar.gz
./elasticsearch-0.19.0/bin/elasticsearch -f
INSTALL

### Storing and indexing documents

# Let's initialize an index named “articles”.
#
Tire.index 'articles' do
  # To make sure it's fresh, let's delete any existing index with the same name.
  #
  delete
  # And then, let's create it.
  #
  create

  # We want to store and index some articles with `title`, `tags` and `published_on` properties.
  # Simple Hashes are OK. The default type is „document”.
  #
  store :title => '復興「校球」 政大男足決戰UFA足球聯賽', :tags => ['足球'], :published_on => '2011-01-01'
  store :title => '社科院舉辦碩博士班畢業生撥穗典禮', :tags => ['博士班', '畢業'], :published_on => '2011-01-02'

  # We usually want to set a specific _type_ for the document in _ElasticSearch_.
  # Simply setting a `type` property is OK.
  #
  store :type => 'article',
        :title => '支持政大學子 羅家倫之女設立獎學金',
        :tags => ['獎學金'],
        :published_on => '2011-01-02'

  # We may want to wrap our data in a Ruby class, and use it when storing data.
  # The contract required of such a class is very simple.
  #
  class Article

    #
    attr_reader :title, :tags, :published_on
    def initialize(attributes={})
      @attributes = attributes
      @attributes.each_pair { |name,value| instance_variable_set :"@#{name}", value }
    end

    # It must provide a `type`, `_type` or `document_type` method for proper mapping.
    #
    def type
      'article'
    end

    # And it must provide a `to_indexed_json` method for conversion to JSON.
    #
    def to_indexed_json
      @attributes.to_json
    end
  end

  # Note: Since our class takes a Hash of attributes on initialization, we may even
  # wrap the results in instances of this class; we'll see how to do that further below.
  #
  article = Article.new :title => '親身感受臺灣特色 日本田野研究團政大學習',
                        :tags => ['臺灣特色', '日本'],
                        :published_on => '2011-01-03'

  # Let's store the `article`, now.
  #
  store article

  # And let's „force refresh“ the index, so we can query it immediately.
  #
  refresh
end

# We may want to define a specific [mapping](http://www.elasticsearch.org/guide/reference/api/admin-indices-create-index.html)
# for the index.

Tire.index 'articles' do
  # To do so, let's just pass a Hash containing the specified mapping to the `Index#create` method.
  #
  create :mappings => {

    # Let's specify for which _type_ of documents this mapping should be used:
    # „article”, in our case.
    #
    :article => {
      :properties => {

        # Let's specify the type of the field, whether it should be analyzed, ...
        #
        :id => { :type => 'string', :index => 'not_analyzed', :include_in_all => false },

        # ... set the boost or analyzer settings for the field, etc. The _ElasticSearch_ guide
        # has [more information](http://elasticsearch.org/guide/reference/mapping/index.html).
        # Don't forget that proper mapping is key to efficient and effective search.
        # But don't fret about getting the mapping right the first time, you won't.
        # In most cases, the default, dynamic mapping is just fine for prototyping.
        #
        :title   => { :type => 'string', :analyzer => 'cjk', :boost => 2.0 },
        :tags    => { :type => 'string', :analyzer => 'keyword' },
        :content => { :type => 'string', :analyzer => 'cjk' }
      }
    }
  }
end
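
# As a quick sanity check — a minimal sketch, assuming the server and the
# “articles” index from above — we can read the mapping back from _ElasticSearch_
# (`Index#mapping` here is an assumption based on Tire 0.4.x):
#
puts Tire.index('articles').mapping.inspect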

#### Bulk Indexing

# Of course, we may have large amounts of data, and adding them to the index one by one really isn't the best idea.
# We can use _ElasticSearch's_ [bulk API](http://www.elasticsearch.org/guide/reference/api/bulk.html)
# for importing the data.

# So, for demonstration purposes, let's suppose we have a simple collection of hashes to store.
#
articles = [

  # Notice that such objects must have an `id` property!
  #
  { :id => '1', :type => 'article', :title => '復興「校球」 政大男足決戰UFA足球聯賽', :tags => ['足球'], :published_on => '2011-01-01' },

  # And, of course, they should contain the `type` property for the mapping to work!
  #
  { :id => '2', :type => 'article', :title => '社科院舉辦碩博士班畢業生撥穗典禮', :tags => ['博士班', '畢業','社科院'], :published_on => '2011-01-02' },
  { :id => '3', :type => 'article', :title => '支持政大學子 羅家倫之女設立獎學金', :tags => ['獎學金'], :published_on => '2011-01-02' },
  { :id => '4', :type => 'article', :title => '親身感受臺灣特色 日本田野研究團政大學習', :tags => ['臺灣特色', '日本'], :published_on => '2011-01-03' }
]

# We can just push them into the index in one go.
#
Tire.index 'articles' do
  import articles
end

# Of course, we can easily manipulate the documents before storing them in the index.
#
Tire.index 'articles' do
  delete

  # ... by passing a block to the `import` method. The collection will
  # be available in the block argument.
  #
  import articles do |documents|

    # We will capitalize every _title_ and return the manipulated collection
    # back to the `import` method.
    #
    documents.map { |document| document.update(:title => document[:title].capitalize) }
  end

  refresh
end

### Searching

# With the documents indexed and stored in the _ElasticSearch_ database, we can search them, finally.
#
# _Tire_ exposes the search interface via a simple domain-specific language.

#### Simple Query String Searches

# We can do simple searches, like searching for documents containing “政大” in their title.
#
s = Tire.search('news_bulletins') do
  query do
    string "title:政大"
  end
end

# The results:
# * One [tags: ruby]
#
puts "Test1==============================Has results: #{s.results.count}".yellow
s.results.each do |document|
  puts "* #{ document.title } [tags: ]"
end

# Or, we can search for articles published between January 1st and January 2nd.
#
s = Tire.search('articles') do
  query do
    string "published_on:[2011-01-01 TO 2011-01-02]"
  end
end
puts "Test2==Or, we can search for articles published between January, 1st and January, 2nd.=Has results: #{s.results.count}".yellow

# The results:
# * One [published: 2011-01-01]
# * Two [published: 2011-01-02]
# * Three [published: 2011-01-02]
#
s.results.each do |document|
  puts "* #{ document.title } [published: #{document.published_on}]"
end

# Notice that we can access local variables from the _enclosing scope_.
# (Of course, we may write the blocks in shorter notation.)

# We will define the query in a local variable named `q`...
#
q = "title:T*"
# ... and we can use it inside the `query` block.
#
s = Tire.search('articles') { query { string q } }

# The results:
# * Two [tags: ruby, python]
# * Three [tags: java]
#
puts "Test3==and we can use it inside the `query` block..[ #{q} ]=Has results: #{s.results.count}".yellow
s.results.each do |document|
  puts "* #{ document.title } [tags:]"
end

# Often, we need to access variables or methods defined in the _outer scope_.
# To do that, we have to use a slight variation of the DSL.
#

# Let's assume we have a plain Ruby class, named `Article`.
#
class Article

  # We will define the query in a class method...
  #
  def self.q
    "title:T*"
  end

  # ... and wrap the _Tire_ search method in another one.
  def self.search

    # Notice how we pass the `search` object around as a block argument.
    #
    Tire.search('articles') do |search|

      # And we pass the query object in a similar manner.
      #
      search.query do |query|

        # Which means we can access the `q` class method.
        #
        query.string self.q
      end
    end.results
  end
end

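# A minimal usage sketch of the wrapper method defined above:
#
Article.search.each do |document|
  puts "* #{ document.title }"
end
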
# We may use any valid [Lucene query syntax](http://lucene.apache.org/java/3_0_3/queryparsersyntax.html)
# for the `query_string` queries.

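# For instance — a hypothetical query, purely to illustrate the syntax — we can
# combine field grouping, boolean operators and a date range in one query string:
#
lucene_example = Tire.search('articles') do
  query { string 'title:(政大 OR 足球) AND published_on:[2011-01-01 TO 2011-01-31]' }
end
puts "Lucene syntax example has results: #{lucene_example.results.count}".yellow
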
# For debugging our queries, we can display the JSON which is being sent to _ElasticSearch_.
#
#     {"query":{"query_string":{"query":"title:T*"}}}
#
puts "", "Query:", "-"*80
puts s.to_json.green

# Or better yet, we may display a complete `curl` command to recreate the request in the terminal,
# so we can see the naked response, tweak request parameters and meditate on problems.
#
#     curl -X POST "http://localhost:9200/articles/_search?pretty=true" \
#          -d '{"query":{"query_string":{"query":"title:T*"}}}'
#
puts "", "Try the query in Curl:", "-"*80
puts s.to_curl.green


### Logging

# For debugging more complex situations, we can enable logging, so requests and responses
# will be logged using this `curl`-friendly format.

Tire.configure do

  # By default, at the _info_ level, only the `curl`-format of the request and
  # basic information about the response will be logged:
  #
  #     # 2011-04-24 11:34:01:150 [CREATE] ("articles")
  #     #
  #     curl -X POST "http://localhost:9200/articles"
  #
  #     # 2011-04-24 11:34:01:152 [200]
  #
  logger 'elasticsearch.log'

  # For debugging, we can switch to the _debug_ level, which will log the complete JSON responses.
  #
  # That's very convenient if we want to post a recreation of some problem or solution
  # to the mailing list, IRC channel, etc.
  #
  logger 'elasticsearch.log', :level => 'debug'

  # Note that we can pass any [`IO`](http://www.ruby-doc.org/core/classes/IO.html)-compatible Ruby object as a logging device.
  #
  logger STDERR
end

### Configuration

# As we have just seen with logging, we can configure various parts of _Tire_.
#
Tire.configure do

  # First of all, we can configure the URL for _ElasticSearch_.
  #
  url "http://search.example.com"

  # Second, we may want to wrap the result items in our own class, for instance
  # the `Article` class set above.
  #
  wrapper Article

  # Finally, we can reset one or all configuration settings to their defaults.
  #
  reset :url
  reset

end


### Complex Searching

# Query strings are convenient for simple searches, but we may want to define our queries more expressively,
# using the _ElasticSearch_ [Query DSL](http://www.elasticsearch.org/guide/reference/query-dsl/index.html).
#
s = Tire.search('articles') do

  # Let's suppose we want to search for articles with specific _tags_, in our case “ruby” _or_ “python”.
  #
  query do

    # That's a great excuse to use a [_terms_](http://elasticsearch.org/guide/reference/query-dsl/terms-query.html)
    # query.
    #
    terms :tags, ['ruby', 'python']
  end
end

# The search, as expected, returns three articles, all tagged “ruby” — among other tags:
#
# * Two [tags: ruby, python]
# * One [tags: ruby]
# * Four [tags: ruby, php]
#
puts "Test4==The search, as expected, returns three articles, all tagged “STHs” — among other tags.Has results: #{s.results.count}".yellow
s.results.each do |document|
  puts "* #{ document.title } [tags: ]"
end

# What if we wanted to search for articles tagged both “ruby” _and_ “python”?
#
s = Tire.search('articles') do
  query do

    # That's a great excuse to specify `minimum_match` for the query.
    #
    terms :tags, ['ruby', 'python'], :minimum_match => 2
  end
end

# The search, as expected, returns one article, tagged with _both_ “ruby” and “python”:
#
# * Two [tags: ruby, python]
#
puts "Test5==The search, as expected, returns one article, tagged with _both_ 'ruby' and 'python'.Has results: #{s.results.count}".yellow
s.results.each do |document|
  puts "* #{ document.title } [tags: ]"
end

#### Boolean Queries

# Quite often, we need complex queries with boolean logic.
# Instead of composing long query strings such as `tags:ruby OR tags:java AND NOT tags:python`,
# we can use the [_bool_](http://www.elasticsearch.org/guide/reference/query-dsl/bool-query.html)
# query.

s = Tire.search('news_bulletins') do
  query do

    # In _Tire_, we can build `bool` queries declaratively, as usual.
    boolean do

      # Let's define a `should` (`OR`) query for “政大” in the title,
      #
      should { string 'title:政大' }

      # as well as a `must_not` (`AND NOT`) query for “復興”,
      must_not { string 'title:復興' }

      # while keeping the original `must_not` query for _python_ commented out.
      # must_not { string 'tags:python' }
    end
  end
end

# The search returns these documents:
#
# * One [tags: ruby]
# * Three [tags: java]
# * Four [tags: ruby, php]
puts "Test6==Boolean Queries.Has results: #{s.results.count}".yellow
s.results.each do |document|
  puts "* #{ document.title } [tags: ]"
end

puts "Test7== mix and reuse Boolean Queries: #{s.results.count}".yellow
# The best thing about `boolean` queries is that we can very easily save these partial queries as Ruby blocks,
# to mix and reuse them later, since we can call the `boolean` method multiple times.
#

# Let's define the query for the _tags_ property,
#
tags_query = lambda do |boolean|
  boolean.should { string 'tags:ruby' }
  boolean.should { string 'tags:java' }
end

# ... and a query for the _published_on_ property.
published_on_query = lambda do |boolean|
  boolean.must { string 'published_on:[2011-01-01 TO 2011-01-02]' }
end

# Now, we can use the `tags_query` on its own.
#
Tire.search('articles') { query { boolean &tags_query } }

# Or, we can combine it with the `published_on` query.
#
Tire.search('articles') do
  query do
    boolean &tags_query
    boolean &published_on_query
  end
end

# _ElasticSearch_ supports many types of [queries](http://www.elasticsearch.org/guide/reference/query-dsl/).
#
# Eventually, _Tire_ will support all of them. So far, only these are supported
# (a short example follows the list):
#
# * [string](http://www.elasticsearch.org/guide/reference/query-dsl/query-string-query.html)
# * [text](http://www.elasticsearch.org/guide/reference/query-dsl/text-query.html)
# * [term](http://elasticsearch.org/guide/reference/query-dsl/term-query.html)
# * [terms](http://elasticsearch.org/guide/reference/query-dsl/terms-query.html)
# * [bool](http://www.elasticsearch.org/guide/reference/query-dsl/bool-query.html)
# * [custom_score](http://www.elasticsearch.org/guide/reference/query-dsl/custom-score-query.html)
# * [fuzzy](http://www.elasticsearch.org/guide/reference/query-dsl/fuzzy-query.html)
# * [all](http://www.elasticsearch.org/guide/reference/query-dsl/match-all-query.html)
# * [ids](http://www.elasticsearch.org/guide/reference/query-dsl/ids-query.html)

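# As a quick illustration of one of these — a sketch against the sample data
# above — here is a single-term `term` query via the DSL:
#
term_example = Tire.search('articles') { query { term :tags, '足球' } }
puts "Articles tagged 足球: #{term_example.results.count}".yellow
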
puts "Topic#### Faceted Search ==> SKIP".yellow
|
||||
|
||||
|
||||
|
||||
# # _ElasticSearch_ makes it trivial to retrieve complex aggregated data from our index/database,
|
||||
# # so called [_facets_](http://www.elasticsearch.org/guide/reference/api/search/facets/index.html).
|
||||
|
||||
# # Let's say we want to display article counts for every tag in the database.
|
||||
# # For that, we'll use a _terms_ facet.
|
||||
|
||||
# #
|
||||
# s = Tire.search 'articles' do
|
||||
|
||||
# # We will search for articles whose title begins with letter “T”,
|
||||
# #
|
||||
# query { string 'title:T*' }
|
||||
|
||||
# # and retrieve the counts “bucketed” by `tags`.
|
||||
# #
|
||||
# facet 'tags' do
|
||||
# terms :tags
|
||||
# end
|
||||
# end
|
||||
|
||||
# # As we see, our query has found two articles, and if you recall our articles from above,
|
||||
# # _Two_ is tagged with “ruby” and “python”, while _Three_ is tagged with “java”.
|
||||
# #
|
||||
# # Found 2 articles: Three, Two
|
||||
# #
|
||||
# # The counts shouldn't surprise us:
|
||||
# #
|
||||
# # Counts by tag:
|
||||
# # -------------------------
|
||||
# # ruby 1
|
||||
# # python 1
|
||||
# # java 1
|
||||
# #
|
||||
# puts "Found #{s.results.count} articles: #{s.results.map(&:title).join(', ')}"
|
||||
# puts "Counts by tag:", "-"*25
|
||||
# s.results.facets['tags']['terms'].each do |f|
|
||||
# puts "#{f['term'].ljust(10)} #{f['count']}"
|
||||
# end
|
||||
|
||||
# # These counts are based on the scope of our current query.
|
||||
# # What if we wanted to display aggregated counts by `tags` across the whole database?
|
||||
|
||||
# #
|
||||
# s = Tire.search 'articles' do
|
||||
|
||||
# # Let's repeat the search for “T”...
|
||||
# #
|
||||
# query { string 'title:T*' }
|
||||
|
||||
# facet 'global-tags', :global => true do
|
||||
|
||||
# # ...but set the `global` scope for the facet in this case.
|
||||
# #
|
||||
# terms :tags
|
||||
# end
|
||||
|
||||
# # We can even _combine_ facets scoped to the current query
|
||||
# # with globally scoped facets — we'll just use a different name.
|
||||
# #
|
||||
# facet 'current-tags' do
|
||||
# terms :tags
|
||||
# end
|
||||
# end
|
||||
|
||||
# # Aggregated results for the current query are the same as previously:
|
||||
# #
|
||||
# # Current query facets:
|
||||
# # -------------------------
|
||||
# # ruby 1
|
||||
# # python 1
|
||||
# # java 1
|
||||
# #
|
||||
# puts "Current query facets:", "-"*25
|
||||
# s.results.facets['current-tags']['terms'].each do |f|
|
||||
# puts "#{f['term'].ljust(10)} #{f['count']}"
|
||||
# end
|
||||
|
||||
# # On the other hand, aggregated results for the global scope include also
|
||||
# # tags for articles not matched by the query, such as “java” or “php”:
|
||||
# #
|
||||
# # Global facets:
|
||||
# # -------------------------
|
||||
# # ruby 3
|
||||
# # python 1
|
||||
# # php 1
|
||||
# # java 1
|
||||
# #
|
||||
# puts "Global facets:", "-"*25
|
||||
# s.results.facets['global-tags']['terms'].each do |f|
|
||||
# puts "#{f['term'].ljust(10)} #{f['count']}"
|
||||
# end
|
||||
|
||||
# # _ElasticSearch_ supports many advanced types of facets, such as those for computing statistics or geographical distance.
|
||||
# #
|
||||
# # Eventually, _Tire_ will support all of them. So far, only these are supported:
|
||||
# #
|
||||
# # * [terms](http://www.elasticsearch.org/guide/reference/api/search/facets/terms-facet.html)
|
||||
# # * [date](http://www.elasticsearch.org/guide/reference/api/search/facets/date-histogram-facet.html)
|
||||
# # * [range](http://www.elasticsearch.org/guide/reference/api/search/facets/range-facet.html)
|
||||
# # * [histogram](http://www.elasticsearch.org/guide/reference/api/search/facets/histogram-facet.html)
|
||||
# # * [statistical](http://www.elasticsearch.org/guide/reference/api/search/facets/statistical-facet.html)
|
||||
# # * [terms_stats](http://www.elasticsearch.org/guide/reference/api/search/facets/terms-stats-facet.html)
|
||||
# # * [query](http://www.elasticsearch.org/guide/reference/api/search/facets/query-facet.html)
|
||||
|
||||
# # We have seen that _ElasticSearch_ facets enable us to fetch complex aggregations from our data.
|
||||
# #
|
||||
# # They are frequently used for another feature, „faceted navigation“.
|
||||
# # We can be combine query and facets with
|
||||
# # [filters](http://elasticsearch.org/guide/reference/api/search/filter.html),
|
||||
# # so the returned documents are restricted by certain criteria — for example to a specific category —,
|
||||
# # but the aggregation calculations are still based on the original query.
|
||||
|
||||
|
||||
# #### Filtered Search
|
||||
|
||||
# # So, let's make our search a bit more complex. Let's search for articles whose titles begin
|
||||
# # with letter “T”, again, but filter the results, so only the articles tagged “ruby”
|
||||
# # are returned.
|
||||
# #
|
||||
# s = Tire.search 'articles' do
|
||||
|
||||
# # We will use just the same **query** as before.
|
||||
# #
|
||||
# query { string 'title:T*' }
|
||||
|
||||
# # But we will add a _terms_ **filter** based on tags.
|
||||
# #
|
||||
# filter :terms, :tags => ['ruby']
|
||||
|
||||
# # And, of course, our facet definition.
|
||||
# #
|
||||
# facet('tags') { terms :tags }
|
||||
|
||||
# end
|
||||
|
||||
# # We see that only the article _Two_ (tagged “ruby” and “python”) is returned,
|
||||
# # _not_ the article _Three_ (tagged “java”):
|
||||
# #
|
||||
# # * Two [tags: ruby, python]
|
||||
# #
|
||||
# s.results.each do |document|
|
||||
# puts "* #{ document.title } [tags: ]"
|
||||
# end
|
||||
|
||||
# # The _count_ for article _Three_'s tags, “java”, on the other hand, _is_ in fact included:
|
||||
# #
|
||||
# # Counts by tag:
|
||||
# # -------------------------
|
||||
# # ruby 1
|
||||
# # python 1
|
||||
# # java 1
|
||||
# #
|
||||
# puts "Counts by tag:", "-"*25
|
||||
# s.results.facets['tags']['terms'].each do |f|
|
||||
# puts "#{f['term'].ljust(10)} #{f['count']}"
|
||||
# end
|
||||
|
||||
# #### Sorting
|
||||
|
||||
# # By default, the results are sorted according to their relevancy.
|
||||
# #
|
||||
# s = Tire.search('articles') { query { string 'tags:ruby' } }
|
||||
|
||||
# s.results.each do |document|
|
||||
# puts "* #{ document.title } " +
|
||||
# "[tags: ; " +
|
||||
|
||||
# # The score is available as the `_score` property.
|
||||
# #
|
||||
# "score: #{document._score}]"
|
||||
# end
|
||||
|
||||
# # The results:
|
||||
# #
|
||||
# # * One [tags: ruby; score: 0.30685282]
|
||||
# # * Four [tags: ruby, php; score: 0.19178301]
|
||||
# # * Two [tags: ruby, python; score: 0.19178301]
|
||||
|
||||
# # But, what if we want to sort the results based on some other criteria,
|
||||
# # such as published date or product price? We can do that.
|
||||
# #
|
||||
# s = Tire.search 'articles' do
|
||||
|
||||
# # We will search for articles tagged “ruby”, again, ...
|
||||
# #
|
||||
# query { string 'tags:ruby' }
|
||||
|
||||
# # ... but will sort them by their `title`, in descending order.
|
||||
# #
|
||||
# sort { by :title, 'desc' }
|
||||
# end
|
||||
|
||||
# # The results:
|
||||
# #
|
||||
# # * Two
|
||||
# # * One
|
||||
# # * Four
|
||||
# #
|
||||
# s.results.each do |document|
|
||||
# puts "* #{ document.title }"
|
||||
# end
|
||||
|
||||
# # Of course, it's possible to combine more fields in the sorting definition.
|
||||
|
||||
# s = Tire.search 'articles' do
|
||||
|
||||
# # We will just get all articles in this case.
|
||||
# #
|
||||
# query { all }
|
||||
|
||||
# sort do
|
||||
|
||||
# # We will sort the results by their `published_on` property in _ascending_ order (the default),
|
||||
# #
|
||||
# by :published_on
|
||||
|
||||
# # and by their `title` property, in _descending_ order.
|
||||
# #
|
||||
# by :title, 'desc'
|
||||
# end
|
||||
# end
|
||||
|
||||
# # The results:
|
||||
# # * One (Published on: 2011-01-01)
|
||||
# # * Two (Published on: 2011-01-02)
|
||||
# # * Three (Published on: 2011-01-02)
|
||||
# # * Four (Published on: 2011-01-03)
|
||||
# #
|
||||
# s.results.each do |document|
|
||||
# puts "* #{ document.title.ljust(10) } (Published on: #{ document.published_on })"
|
||||
# end
|
||||
|
||||
# #### Highlighting
|
||||
|
||||
# # Often, we want to highlight the snippets matching our query in the displayed results.
|
||||
# # _ElasticSearch_ provides rich
|
||||
# # [highlighting](http://www.elasticsearch.org/guide/reference/api/search/highlighting.html)
|
||||
# # features, and _Tire_ makes them trivial to use.
|
||||
# #
|
||||
# s = Tire.search 'articles' do
|
||||
|
||||
# # Let's search for documents containing word “Two” in their titles,
|
||||
# query { string 'title:Two' }
|
||||
|
||||
# # and instruct _ElasticSearch_ to highlight relevant snippets.
|
||||
# #
|
||||
# highlight :title
|
||||
# end
|
||||
|
||||
# # The results:
|
||||
# # Title: Two; Highlighted: <em>Two</em>
|
||||
# #
|
||||
# s.results.each do |document|
|
||||
# puts "Title: #{ document.title }; Highlighted: #{document.highlight.title}"
|
||||
# end
|
||||
|
||||
# # We can configure many options for highlighting, such as:
|
||||
# #
|
||||
# s = Tire.search 'articles' do
|
||||
# query { string 'title:Two' }
|
||||
|
||||
# # • specify the fields to highlight
|
||||
# #
|
||||
# highlight :title, :body
|
||||
|
||||
# # • specify their individual options
|
||||
# #
|
||||
# highlight :title, :body => { :number_of_fragments => 0 }
|
||||
|
||||
# # • or specify global highlighting options, such as the wrapper tag
|
||||
# #
|
||||
# highlight :title, :body, :options => { :tag => '<strong class="highlight">' }
|
||||
# end
|
||||
|
||||
# #### Percolation
|
||||
|
||||
# # _ElasticSearch_ comes with one very interesting, and rather unique feature:
|
||||
# # [_percolation_](http://www.elasticsearch.org/guide/reference/api/percolate.html).
|
||||
|
||||
# # It works in a „reverse search“ manner to regular search workflow of adding
|
||||
# # documents to the index and then querying them.
|
||||
# # Percolation allows us to register a query, and ask if a specific document
|
||||
# # matches it, either on demand, or immediately as the document is being indexed.
|
||||
|
||||
# # Let's review an example for an index named _weather_.
|
||||
# # We will register three queries for percolation against this index.
|
||||
# #
|
||||
# index = Tire.index('weather') do
|
||||
# delete
|
||||
# create
|
||||
|
||||
# # First, a query named _warning_,
|
||||
# #
|
||||
# register_percolator_query('warning', :tags => ['warning']) { string 'warning OR severe OR extreme' }
|
||||
|
||||
# # a query named _tsunami_,
|
||||
# #
|
||||
# register_percolator_query('tsunami', :tags => ['tsunami']) { string 'tsunami' }
|
||||
|
||||
# # and a query named _floods_.
|
||||
# #
|
||||
# register_percolator_query('floods', :tags => ['floods']) { string 'flood*' }
|
||||
|
||||
# end
|
||||
|
||||
# # Notice, that we have added a _tags_ field to the query document, because it behaves
|
||||
# # just like any other document in _ElasticSearch_.
|
||||
|
||||
# # We will refresh the `_percolator` index for immediate access.
|
||||
# #
|
||||
# Tire.index('_percolator').refresh
|
||||
|
||||
# # Now, let's _percolate_ a document containing some trigger words against all registered queries.
|
||||
# #
|
||||
# matches = index.percolate(:message => '[Warning] Extreme flooding expected after tsunami wave.')
|
||||
|
||||
# # The result will contain, unsurprisingly, names of all the three registered queries:
|
||||
# #
|
||||
# # Matching queries: ["floods", "tsunami", "warning"]
|
||||
# #
|
||||
# puts "Matching queries: " + matches.inspect
|
||||
|
||||
# # We can filter the executed queries with a regular _ElasticSearch_ query passed as a block to
|
||||
# # the `percolate` method.
|
||||
# #
|
||||
# matches = index.percolate(:message => '[Warning] Extreme flooding expected after tsunami wave.') do
|
||||
# # Let's use a _terms_ query against the `tags` field.
|
||||
# term :tags, 'tsunami'
|
||||
# end
|
||||
|
||||
# # In this case, the result will contain only the name of the “tsunami” query.
|
||||
# #
|
||||
# # Matching queries: ["tsunami"]
|
||||
# #
|
||||
# puts "Matching queries: " + matches.inspect
|
||||
|
||||
# # What if we percolate another document, without the “tsunami” trigger word?
|
||||
# #
|
||||
# matches = index.percolate(:message => '[Warning] Extreme temperatures expected.') { term :tags, 'tsunami' }
|
||||
|
||||
# # As expected, we will get an empty array:
|
||||
# #
|
||||
# # Matching queries: []
|
||||
# #
|
||||
# puts "Matching queries: " + matches.inspect
|
||||
|
||||
# # Well, that's of course immensely useful for real-time search systems. But, there's more.
|
||||
# # We can _percolate_ a document _at the same time_ it is being stored in the index,
|
||||
# # getting back a list of matching queries.
|
||||
|
||||
# # Let's store a document with some trigger words in the index, and mark it for percolation.
|
||||
# #
|
||||
# response = index.store :message => '[Warning] Severe floods expected after tsunami wave.', :percolate => true
|
||||
|
||||
# # We will get the names of all matching queries in response.
|
||||
# #
|
||||
# # Matching queries: ["floods", "tsunami", "warning"]
|
||||
# #
|
||||
# puts "Matching queries: " + response['matches'].inspect
|
||||
|
||||
# # As with the _percolate_ example, we can filter the executed queries.
|
||||
# #
|
||||
# response = index.store :message => '[Warning] Severe floods expected after tsunami wave.',
|
||||
# # Let's use a simple string query for the “tsunami” tag.
|
||||
# :percolate => 'tags:tsunami'
|
||||
|
||||
# # Unsurprisingly, the response will contain just the name of the “tsunami” query.
|
||||
# #
|
||||
# # Matching queries: ["tsunami"]
|
||||
# #
|
||||
# puts "Matching queries: " + response['matches'].inspect
|
||||
|
||||
# ### ActiveModel Integration
|
||||
|
||||
# # As you can see, [_Tire_](https://github.com/karmi/tire) supports the
|
||||
# # main features of _ElasticSearch_ in Ruby.
|
||||
# #
|
||||
# # It allows you to create and delete indices, add documents, search them, retrieve the facets, highlight the results,
|
||||
# # and comes with a usable logging facility.
|
||||
# #
|
||||
# # Of course, the holy grail of any search library is easy, painless integration with your Ruby classes, and,
|
||||
# # most importantly, with ActiveRecord/ActiveModel classes.
|
||||
# #
|
||||
# # Please, check out the [README](https://github.com/karmi/tire/tree/master#readme) file for instructions
|
||||
# # how to include _Tire_-based search in your models..
|
||||
# #
|
||||
# # Send any feedback via Github issues, or ask questions in the [#elasticsearch](irc://irc.freenode.net/#elasticsearch) IRC channel.
|
|
@ -10,12 +10,22 @@ class Panel::News::FrontEnd::NewsBulletinsController < OrbitWidgetController

  def index
    if !params[:search_query].blank?
      @news_bulletins = NewsBulletin.solr_search do
        fulltext params[:search_query] do
          fields(:text, :title => 2.0)
        end
      end.each_hit_with_result
      search_query = params[:search_query].gsub(/"/, "").split(" ")

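      # Build one boolean "should" clause per search word, so each word widens
      # the match (a logical OR across the title field).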
      words_query = lambda do |boolean|
        search_query.each do |word|
          boolean.should { string "title:#{word}" }
          # boolean.should { string "sub_title:#{word}" }
          # boolean.should { string "text:#{word}" }
        end
      end

search_result=Tire.search('news_bulletins') do
|
||||
query {boolean &words_query }
|
||||
#raise to_curl
|
||||
end.results.collect{|t| t.id}
|
||||
|
||||
@news_bulletins = NewsBulletin.can_display.any_in(_id:search_result).page( params[:page_main]).per(10)
|
||||
else
|
||||
date_now = Time.now
|
||||
if !params[:category_id].blank?
|
||||
|
|
|
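# Aside: a self-contained sketch of the word-by-word boolean query pattern used
# above (it assumes a running ElasticSearch node with a populated
# 'news_bulletins' index; the word list is illustrative):
#
#   require 'tire'
#
#   words = %w[campus library]
#   words_query = lambda do |boolean|
#     words.each { |word| boolean.should { string "title:#{word}" } }
#   end
#
#   ids = Tire.search('news_bulletins') do
#     query { boolean &words_query }
#   end.results.map(&:id)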
@ -5,16 +5,13 @@ class NewsBulletin
include Mongoid::Timestamps
include Mongoid::MultiParameterAttributes
include Impressionist::Impressionable
# include OrbitBasis::BaseModel
# include OrbitSearchLib::ObjectSearchable
# include NccuSearch
include Tire::Model::Search
include Tire::Model::Callbacks
# include Redis::Objects
include Mongoid::BaseModel

include Sunspot::Mongoid

# scope :searchable, where(:is_checked => true, :is_hidden => false, :is_pending => false)

scope :searchable, where(:is_checked => true, :is_hidden => false, :is_pending => false)

is_impressionable :counter_cache => { :column_name => :view_count }
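# Note: Tire::Model::Callbacks keeps the index in sync with the model
# lifecycle; it is roughly equivalent to declaring (a sketch, not project code):
#
#   after_save    { tire.update_index }
#   after_destroy { tire.update_index }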
@ -64,61 +61,43 @@ class NewsBulletin
after_save :save_news_bulletin_links
after_save :save_news_bulletin_files
# include OrbitBasis::ClassMethods

searchable do
  text :title do
    titles = ""
    titles << (self.title.zh_tw.nil? ? '' : self.title.zh_tw)
    titles << (self.title.en.nil? ? '' : self.title.en)
    # (titles << self.title.en) unless self.title.nil?
    doc = Nokogiri::HTML(titles)
    doc.text
    # VALID_LOCALES
  end

  text :text do
    texts = ""
    texts << (self.text.zh_tw.nil? ? '' : self.text.zh_tw)
    texts << (self.text.en.nil? ? '' : self.text.en)
    # (texts << self.text.en) unless self.text.en.nil?
    doc = Nokogiri::HTML(texts)
    doc.text
    # VALID_LOCALES
  end
  # text :sub_titles do
  #   self.subtitle.zh_tw
  #   # VALID_LOCALES
  # end
  # Tire.index 'news_bulletin' do
  #   delete
  #   create :mappings => {
  #     :news_bulletin_by_title => {
  #       :properties => {
  #         :title => { :type => 'string', :index => 'not_analyzed', :include_in_all => false },
  #         :body  => {}
  #       }
  #     },
  #     :news_bulletin_by_body => {
  #       :properties => {
  #         :body => { :type => 'string', :index => 'not_analyzed', :include_in_all => false }
  #       }
  #     }
  #   }
  # end
  # text :text do
  #   self.text.zh_tw
  #   # VALID_LOCALES
  # end
  # text :content, :publish_month
  # text :comments do
  #   comments.map(&:content)
  # end
  # time :published_at
  # string :publish_month
end
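# A possible refactoring, as a sketch only (`plain_text_of` is hypothetical,
# not part of this model): both fields above concatenate the locales and strip
# HTML, so a shared helper would remove the duplication:
#
#   def plain_text_of(localized)
#     html = [localized.zh_tw, localized.en].compact.join
#     Nokogiri::HTML(html).text
#   end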
# mapping do
#   indexes :title, :analyzer => 'cjk', :boost => 10
#   indexes :sub_titles, :analyzer => 'cjk', :boost => 5
#   indexes :text, :analyzer => 'cjk'
# end

def type
  "news_bulletin"
end

# def to_indexed_json
#   titles     = title.zh_tw + title.en
#   sub_titles = subtitle.zh_tw + subtitle.en
#   texts      = text.zh_tw + text.en
#   {
#     :id => id,
#     :title => titles,
#     :sub_titles => sub_titles,
#     :text => texts
#   }.to_json
# end
# Tire serializes the document with this JSON when indexing it.
def to_indexed_json
  titles     = title.zh_tw    # + title.en
  sub_titles = subtitle.zh_tw # + subtitle.en
  texts      = text.zh_tw     # + text.en
  {
    :_id       => _id,
    :title     => Nokogiri::HTML(titles).text,
    :sub_title => Nokogiri::HTML(sub_titles).text,
    :text      => Nokogiri::HTML(texts).text
  }.to_json
end
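# With documents serialized as above, a query against the index could look
# like this (illustrative usage only, not part of this commit):
#
#   NewsBulletin.tire.search { query { string "title:campus" } }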
def self.search(search = nil, category_id = nil)
  if category_id.to_s.size > 0 and search.to_s.size > 0