# = Picky Applications
#
# A Picky Application is where you configure the whole search engine.
#
# This is a step-by-step description on how to configure your Picky app.
#
# Start by subclassing Application:
# class MyGreatSearch < Application
# # Your configuration goes here.
# end
# The generator
# $ picky project project_name
# will generate an example project_name/app/application.rb file for you
# with some example code inside.
#
# == index(name, source)
#
# Next, define where your data comes from. You use the index method for that:
# my_index = index :some_index_name, some_source
# You give the index a name (or identifier), and a source (see Sources), where its data comes from. Let's do that:
# class MyGreatSearch < Application
#
# books = index :books, Sources::CSV.new(:title, :author, :isbn, file:'app/library.csv')
#
# end
# Now we have an index books.
#
# That on its own won't do much good.
#
# == index.define_category(identifier, options = {})
#
# Picky needs us to define categories on the data.
#
# Categories help your user find data.
# It's best if you look at an example yourself: http://floere.github.com/picky/examples.html
#
# Let's go ahead and define a category:
# class MyGreatSearch < Application
#
# books = index :books, Sources::CSV.new(:title, :author, :isbn, file:'app/library.csv')
# books.define_category :title
#
# end
# Now we could already run the indexer:
# $ rake index
#
# (You can define similarity or partial search capabilities on a category, see http://github.com/floere/picky/wiki/Categories-configuration for info)
#
# So now we have indexed data (the title), but nobody to ask the index anything.
#
# == Query::Full.new(*indexes, options = {})
#
# We need somebody who asks the index (a Query object, also see http://github.com/floere/picky/wiki/Queries-Configuration). That works like this:
# full_books_query = Query::Full.new books
# Full just means that the ids are returned with the results.
# Picky also offers a Query that returns live results, Query::Live. But that's not important right now.
#
# Now we have somebody we can ask about the index. But no external interface.
#
# == route(/regexp1/ => query1, /regexp2/ => query2, ...)
#
# Let's add a URL path (a Route, see http://github.com/floere/picky/wiki/Routing-configuration) to which we can send our queries. We do that with the route method:
# route %r{^/books/full$} => full_books_query
# In full glory:
# class MyGreatSearch < Application
#
# books = index :books, Sources::CSV.new(:title, :author, :isbn, file:'app/library.csv')
# books.define_category :title
#
# full_books_query = Query::Full.new books
#
# route %r{^/books/full$} => full_books_query
#
# end
# That's it!
#
# Now run the indexer and server:
# $ rake index
# $ rake start
# Run your first query:
# $ curl 'localhost:8080/books/full?query=hello server'
#
# Nice, right? Your first query!
#
# Maybe you don't find everything. We need to process the data before it goes into the index.
#
# == default_indexing(options = {})
#
# That's what the default_indexing method is for:
# default_indexing options
# Read more about the options here: http://github.com/floere/picky/wiki/Indexing-configuration
#
# Same thing with the search text – we need to process that as well.
#
# == default_querying(options = {})
#
# Analogous to the default_indexing method, we use the default_querying method:
# default_querying options
# Read more about the options here: http://github.com/floere/picky/wiki/Querying-Configuration
#
# And that's all there is. It's incredibly powerful though, as you can combine, weigh, refine to the max.
#
# == Wiki
#
# Read more in the Wiki: http://github.com/floere/picky/wiki
#
# Have fun!
#
# == Full example
#
# Our example, fully fleshed out with indexing, querying, and weights:
# class MyGreatSearch < Application
#
# default_indexing removes_characters: /[^a-zA-Z0-9\.]/,
# stopwords: /\b(and|or|in|on|is|has)\b/,
# splits_text_on: /\s/,
# removes_characters_after_splitting: /\./,
# substitutes_characters_with: CharacterSubstituters::WestEuropean.new,
# normalizes_words: [
# [/(.*)hausen/, 'hn'],
# [/\b(\w*)str(eet)?/, 'st']
# ]
#
# default_querying removes_characters: /[^a-zA-Z0-9\s\/\-\,\&\"\~\*\:]/,
# stopwords: /\b(and|the|of|it|in|for)\b/,
# splits_text_on: /[\s\/\-\,\&]+/,
# removes_characters_after_splitting: /\./,
# substitutes_characters_with: CharacterSubstituters::WestEuropean.new,
# maximum_tokens: 4
#
# books = index :books, Sources::CSV.new(:title, :author, :isbn, file:'app/library.csv')
# books.define_category :title,
# qualifiers: [:t, :title, :titre],
# partial: Partial::Substring.new(:from => 1),
# similarity: Similarity::Phonetic.new(2)
# books.define_category :author,
# partial: Partial::Substring.new(:from => -2)
# books.define_category :isbn
#
# query_options = { :weights => { [:title, :author] => +3, [:author, :title] => -1 } }
#
# full_books_query = Query::Full.new books, query_options
# live_books_query = Query::Live.new books, query_options
#
# route %r{^/books/full$} => full_books_query
# route %r{^/books/live$} => live_books_query
#
# end
# That's actually already a full-blown Picky App!
#
class Application
  class << self
    # API
    #
    # Configures the tokenizer that is used for indexing by default.
    #
    # Builds a Tokenizers::Index from the given options, installs it as
    # Tokenizers::Index.default and returns it.
    #
    # Parameters:
    # * options: Passed on unchanged to Tokenizers::Index.new.
    #
    def default_indexing(options = {})
      Tokenizers::Index.default = Tokenizers::Index.new(options)
    end

    # Configures the tokenizer that is used for querying by default.
    #
    # Builds a Tokenizers::Query from the given options, installs it as
    # Tokenizers::Query.default and returns it.
    #
    # Parameters:
    # * options: Passed on unchanged to Tokenizers::Query.new.
    #
    def default_querying(options = {})
      Tokenizers::Query.default = Tokenizers::Query.new(options)
    end

    # Create a new index for indexing and for querying.
    #
    # Parameters:
    # * name: The identifier of the index. Used:
    #   - to identify an index (e.g. by you in Rake tasks).
    #   - in the frontend to describe which index a result came from.
    #   - index directory naming (index/development/the_identifier/)
    # * source: The source the data comes from. See Sources::Base. # TODO Sources (all).
    #
    # Options:
    # * result_type: # TODO Rename.
    #
    # Returns the newly created IndexAPI instance.
    #
    def index(name, source, options = {})
      IndexAPI.new(name, source, options)
    end

    # Routes.
    #
    # route and root are forwarded to the object returned by #routing.
    #
    delegate :route, :root, to: :routing

    #
    # API

    # A Picky application implements the Rack interface.
    #
    # Delegates to its routing to handle a request.
    #
    # Parameters:
    # * env: The Rack environment, handed to routing.call as is.
    #
    def call(env)
      routing.call(env)
    end

    # The routing of this application. Created on first access and
    # reused afterwards.
    #
    def routing # :nodoc:
      @routing ||= Routing.new
    end

    # Bookkeeping of the subclasses, so that all of them can be
    # finalized in one go through finalize_apps.
    #
    # NOTE(review): @apps is stored on the class that receives the
    # inherited hook, so a subclass of a subclass is registered on its
    # direct parent, not on Application. Confirm this is intended.
    #
    attr_reader :apps # :nodoc:

    # Makes sure the list of registered apps exists and returns it.
    #
    def initialize_apps # :nodoc:
      @apps ||= []
    end

    # Ruby hook, called whenever this class is subclassed.
    # Remembers the new subclass in apps.
    #
    def inherited(app) # :nodoc:
      # Keep the hook chain intact for anything else hooking into inherited.
      super
      initialize_apps
      apps << app
    end

    # Calls finalize on every registered app.
    #
    def finalize_apps # :nodoc:
      initialize_apps
      apps.each(&:finalize)
    end

    # Finalizes the routes by freezing the routing.
    #
    def finalize # :nodoc:
      routing.freeze
    end

    # The class name, followed by the routing on a new line.
    #
    # TODO Add more info if possible.
    #
    def to_s # :nodoc:
      "#{name}:\n#{routing}"
    end
  end
end