fauna / ultrasphinx

Ruby on Rails configurator and client to the Sphinx full text search engine

This URL has Read+Write access

Matt Gleeson (author)
Thu Jun 18 12:40:45 -0700 2009
fauna (committer)
Sat Jun 27 11:04:12 -0700 2009
ultrasphinx / examples / default.base
100644 91 lines (77 sloc) 3.013 kb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
 
#
# Sphinx/Ultrasphinx user-configurable options.
#
# Copy this file to RAILS_ROOT/config/ultrasphinx. You can use individual
# namespaces if you want (e.g. development.base, production.base,
# test.base). Note that ERb is also allowed.
#
# This file should not be handed directly to Sphinx. Use the rake task
#
# rake ultrasphinx::configure
#
# to generate a parallel default.conf file. This is the file that Sphinx itself will
# use. The Ultrasphinx rake tasks automatically pass the correct file to
# to Sphinx.
#
# It is safe to edit .base files by hand. It is not safe to edit the generated
# .conf files. Do not symlink the .conf file to the .base file; it's wrong.
#
 
<% path = "/opt/local/var/db/sphinx/" %>
 
# Indexing options
indexer
{
  mem_limit = 256M
 
  # Ultrasphinx-specific key
  delta = <%= 1.day + 30.minutes %>
}
 
# Daemon options
searchd
{
  # What interface the search daemon should listen on and where to store its logs
  address = 0.0.0.0
  port = 3313
  seamless_rotate = 1
  log = <%= path %>log/searchd.log
  query_log = <%= path %>log/query.log
  read_timeout = 5
  max_children = 300
  pid_file = <%= path %>log/searchd.pid
  max_matches = 100000
}
 
# Client options
client
{
  # Name of the Aspell dictionary (two letters max)
  dictionary_name = ap
  
  # How your application connects to the search daemon (not necessarily the same as above)
  server_host = localhost
  server_port = 3313
}
 
# Individual SQL source options
source
{
  sql_ranged_throttle = 0
  sql_range_step = 5000
  sql_query_post =
}
 
# Index building options
index
{
  path = <%= path %>
  docinfo = extern # Just leave this alone
  morphology = stem_en
  stopwords = # <%= path %>/ap-stopwords.txt
  min_word_len = 1
 
  # HTML-specific options
  html_strip = 0
  html_index_attrs =
  
  # Enable these if you need wildcard searching. They will slow down indexing significantly.
  # min_infix_len = 1
  # enable_star = 1
 
  # # URL search options
  # # add " @, /, :," before " a-z," in the charset_table and uncomment prefix_fields
  # to seach URL and email addresses
  # prefix_fields = url, domain
    
  charset_type = utf-8 # or sbcs (Single Byte Character Set)
  charset_table = 0..9, A..Z->a..z, -, _, ., &, a..z, U+410..U+42F->U+430..U+44F, U+430..U+44F,U+C5->U+E5, U+E5, U+C4->U+E4, U+E4, U+D6->U+F6, U+F6, U+16B, U+0c1->a, U+0c4->a, U+0c9->e, U+0cd->i, U+0d3->o, U+0d4->o, U+0da->u, U+0dd->y, U+0e1->a, U+0e4->a, U+0e9->e, U+0ed->i, U+0f3->o, U+0f4->o, U+0fa->u, U+0fd->y, U+104->U+105, U+105, U+106->U+107, U+10c->c, U+10d->c, U+10e->d, U+10f->d, U+116->U+117, U+117, U+118->U+119, U+11a->e, U+11b->e, U+12E->U+12F, U+12F, U+139->l, U+13a->l, U+13d->l, U+13e->l, U+141->U+142, U+142, U+143->U+144, U+144,U+147->n, U+148->n, U+154->r, U+155->r, U+158->r, U+159->r, U+15A->U+15B, U+15B, U+160->s, U+160->U+161, U+161->s, U+164->t, U+165->t, U+16A->U+16B, U+16B, U+16e->u, U+16f->u, U+172->U+173, U+173, U+179->U+17A, U+17A, U+17B->U+17C, U+17C, U+17d->z, U+17e->z,
}