<?xml version="1.0" encoding="UTF-8"?>
<commit>
  <added type="array"/>
  <modified type="array">
    <modified>
      <diff>@@ -79,6 +79,11 @@ index
   # Enable these if you need wildcard searching. They will slow down indexing significantly.
   #   min_infix_len = 1    
   #   enable_star = 1 
+
+  # # URL search options
+  # # add &quot; @, /, :,&quot; before &quot; a-z,&quot; in the charset_table and uncomment prefix_fields
+  # to search URLs and email addresses
+  # prefix_fields = url, domain
     
   charset_type = utf-8 # or sbcs (Single Byte Character Set)
   charset_table = 0..9, A..Z-&gt;a..z, -, _, ., &amp;, a..z, U+410..U+42F-&gt;U+430..U+44F, U+430..U+44F,U+C5-&gt;U+E5, U+E5, U+C4-&gt;U+E4, U+E4, U+D6-&gt;U+F6, U+F6, U+16B, U+0c1-&gt;a, U+0c4-&gt;a, U+0c9-&gt;e, U+0cd-&gt;i, U+0d3-&gt;o, U+0d4-&gt;o, U+0da-&gt;u, U+0dd-&gt;y, U+0e1-&gt;a, U+0e4-&gt;a, U+0e9-&gt;e, U+0ed-&gt;i, U+0f3-&gt;o, U+0f4-&gt;o, U+0fa-&gt;u, U+0fd-&gt;y, U+104-&gt;U+105, U+105, U+106-&gt;U+107, U+10c-&gt;c, U+10d-&gt;c, U+10e-&gt;d, U+10f-&gt;d, U+116-&gt;U+117, U+117, U+118-&gt;U+119, U+11a-&gt;e, U+11b-&gt;e, U+12E-&gt;U+12F, U+12F, U+139-&gt;l, U+13a-&gt;l, U+13d-&gt;l, U+13e-&gt;l, U+141-&gt;U+142, U+142, U+143-&gt;U+144, U+144,U+147-&gt;n, U+148-&gt;n, U+154-&gt;r, U+155-&gt;r, U+158-&gt;r, U+159-&gt;r, U+15A-&gt;U+15B, U+15B, U+160-&gt;s, U+160-&gt;U+161, U+161-&gt;s, U+164-&gt;t, U+165-&gt;t, U+16A-&gt;U+16B, U+16B, U+16e-&gt;u, U+16f-&gt;u, U+172-&gt;U+173, U+173, U+179-&gt;U+17A, U+17A, U+17B-&gt;U+17C, U+17C, U+17d-&gt;z, U+17e-&gt;z,</diff>
      <filename>examples/default.base</filename>
    </modified>
    <modified>
      <diff>@@ -131,7 +131,14 @@ module Ultrasphinx
           # Remove some spaces
           content.gsub!(/^&quot;\s+|\s+&quot;$/, '&quot;')
           # Convert fields into sphinx style, reformat the stream object
-          if content =~ /(.*?):(.*)/
+          if content =~ /(^(http|https):\/\/[a-z0-9]+([-.]{1}[a-z0-9]*)+. [a-z]{2,5}(([0-9]{1,5})?\/.*)?$)/ix
+            # XXX hack, it's somewhat common to search for URLs.  Be sure to add
+            # &quot; @, /,&quot; in the charset_table of the US config to search on all
+            # URLs and email addresses, and add:
+            # prefix_fields = url, domain
+            # to your US config
+            token_hash[nil] += [[operator, content]]
+          elsif content =~ /(.*?):(.*)/
             token_hash[$1] += [[operator, $2]]
           else
             token_hash[nil] += [[operator, content]]
@@ -143,4 +150,4 @@ module Ultrasphinx
 
     end
   end
-end
\ No newline at end of file
+end</diff>
      <filename>lib/ultrasphinx/search/parser.rb</filename>
    </modified>
  </modified>
  <removed type="array"/>
  <parents type="array">
    <parent>
      <id>518c24765c6f2baa6cdc90831949af1dc5bb97cf</id>
    </parent>
  </parents>
  <author>
    <name>Mike Mondragon</name>
    <email>mikemondragon@gmail.com</email>
  </author>
  <url>http://github.com/fauna/ultrasphinx/commit/053ab3a8e8f4b5b4a1a3dc2cb6ef2d5599268582</url>
  <id>053ab3a8e8f4b5b4a1a3dc2cb6ef2d5599268582</id>
  <committed-date>2009-02-02T01:14:00-08:00</committed-date>
  <authored-date>2008-09-08T17:01:04-07:00</authored-date>
  <message>Hack on the token_stream_to_hash to account for searching for URL
strings.  Also notes in the default.base on enabling URL searching from
the Sphinx side.

Signed-off-by: Snax Fauna &lt;evan+fauna@cloudbur.st&gt;</message>
  <tree>d64d42358ee4ec2230346218a861482f4301d901</tree>
  <committer>
    <name>Snax Fauna</name>
    <email>evan+fauna@cloudbur.st</email>
  </committer>
</commit>
