# NewsBlur-viq/apps/search/models.py


import time
import datetime
import pyes
import redis
import mongoengine as mongo
from pyes.query import MatchQuery
from django.conf import settings
from django.contrib.auth.models import User
from apps.search.tasks import IndexSubscriptionsForSearch
from utils import log as logging


class MUserSearch(mongo.Document):
    '''Search index state of a user's subscriptions.'''
    user_id = mongo.IntField(unique=True)
    last_search_date = mongo.DateTimeField()
    subscriptions_indexed = mongo.BooleanField()
    subscriptions_indexing = mongo.BooleanField()

    meta = {
        'collection': 'user_search',
        'indexes': ['user_id'],
        'index_drop_dups': True,
        'allow_inheritance': False,
    }

    @classmethod
    def get_user(cls, user_id):
        try:
            user_search = cls.objects.get(user_id=user_id)
        except cls.DoesNotExist:
            user_search = cls.objects.create(user_id=user_id)
        return user_search

    def touch_search_date(self):
        '''Record the search and schedule a one-time indexing of subscriptions.'''
        if not self.subscriptions_indexed and not self.subscriptions_indexing:
            self.schedule_index_subscriptions_for_search()
            self.subscriptions_indexing = True

        self.last_search_date = datetime.datetime.now()
        self.save()
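
    # Usage sketch (hypothetical caller, not part of this module): the first
    # search a user runs flips the indexing flags and enqueues the Celery task.
    #
    #   user_search = MUserSearch.get_user(request.user.pk)
    #   user_search.touch_search_date()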

    def schedule_index_subscriptions_for_search(self):
        IndexSubscriptionsForSearch.apply_async(kwargs=dict(user_id=self.user_id))

    # Should be run as a background task
    def index_subscriptions_for_search(self):
        from apps.rss_feeds.models import Feed
        from apps.reader.models import UserSubscription

        SearchStory.create_elasticsearch_mapping()

        start = time.time()
        not_found = 0
        processed = 0
        user = User.objects.get(pk=self.user_id)
        r = redis.Redis(connection_pool=settings.REDIS_PUBSUB_POOL)
        r.publish(user.username, 'search_index_complete:start')
        throttle = time.time()
        subscriptions = UserSubscription.objects.filter(user=user)
        total = subscriptions.count()
        logging.user(user, "~FCIndexing ~SB%s feeds~SN for ~SB~FB%s~FC~SN..." %
                     (total, user.username))

        for sub in subscriptions:
            try:
                feed = sub.feed
            except Feed.DoesNotExist:
                not_found += 1
                continue
            feed.index_stories_for_search()
            processed += 1

            # Throttle progress notifications so as not to flood the client.
            if time.time() - throttle > 0.05:
                r.publish(user.username, 'search_index_complete:%.4s' % (float(processed) / total))
                throttle = time.time()

        duration = time.time() - start
        logging.user(user, "~FCIndexed ~SB%s/%s feeds~SN for ~SB~FB%s~FC~SN in ~FM~SB%s~FC~SN sec." %
                     (processed, total, user.username, round(duration, 2)))
        r.publish(user.username, 'search_index_complete:done')

        self.subscriptions_indexed = True
        self.subscriptions_indexing = False
        self.save()
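
    # A minimal sketch of the task side, assuming IndexSubscriptionsForSearch in
    # apps/search/tasks.py simply delegates back here (an assumption, not a copy):
    #
    #   class IndexSubscriptionsForSearch(Task):
    #       def run(self, user_id):
    #           MUserSearch.get_user(user_id).index_subscriptions_for_search()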


class SearchStory:

    ES = pyes.ES(settings.ELASTICSEARCH_HOSTS)
    name = "stories"

    @classmethod
    def index_name(cls):
        return "%s-index" % cls.name

    @classmethod
    def type_name(cls):
        return "%s-type" % cls.name

    @classmethod
    def create_elasticsearch_mapping(cls, delete=False):
        if delete:
            cls.ES.indices.delete_index_if_exists(cls.index_name())
        cls.ES.indices.create_index_if_missing(cls.index_name())
        mapping = {
            'title': {
                'boost': 3.0,
                'index': 'analyzed',
                'store': 'no',
                'type': 'string',
                'analyzer': 'snowball',
            },
            'content': {
                'boost': 1.0,
                'index': 'analyzed',
                'store': 'no',
                'type': 'string',
                'analyzer': 'snowball',
            },
            'author': {
                'boost': 1.0,
                'index': 'analyzed',
                'store': 'no',
                'type': 'string',
                'analyzer': 'keyword',
            },
            'feed_id': {
                'store': 'no',
                'type': 'integer',
            },
            'date': {
                'store': 'no',
                'type': 'date',
            },
        }
        # _source is a type-level setting, not a field property (it previously sat
        # inside the 'content' field, where ES ignores it). Stories are only ever
        # fetched by ID, so the original documents need not be stored.
        cls.ES.indices.put_mapping(cls.type_name(),
                                   {'_source': {'enabled': False}, 'properties': mapping},
                                   [cls.index_name()])
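
    # Note: the snowball analyzer stems English tokens ("running" -> "run"), so
    # titles and content match across word forms, while the keyword analyzer
    # keeps author names as single unstemmed tokens.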

    @classmethod
    def index(cls, story_hash, story_title, story_content, story_author, story_feed_id,
              story_date):
        doc = {
            "content": story_content,
            "title": story_title,
            "author": story_author,
            "feed_id": story_feed_id,
            "date": story_date,
        }
        cls.ES.index(doc, cls.index_name(), cls.type_name(), story_hash)
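
    # Usage sketch (hypothetical values; NewsBlur story hashes look like
    # "feed_id:hash"):
    #
    #   SearchStory.index(story_hash="42:deadbeef", story_title="Hello",
    #                     story_content="<p>Body</p>", story_author="Sam",
    #                     story_feed_id=42, story_date=datetime.datetime.now())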

    @classmethod
    def remove(cls, story_hash):
        cls.ES.delete(cls.index_name(), cls.type_name(), story_hash)

    @classmethod
    def query(cls, feed_ids, query, order, offset, limit):
        cls.ES.indices.refresh()

        sort = "date:desc" if order == "newest" else "date:asc"
        string_q = pyes.query.StringQuery(query, default_operator="AND")
        feed_q = pyes.query.TermsQuery('feed_id', feed_ids)
        q = pyes.query.BoolQuery(must=[string_q, feed_q])
        results = cls.ES.search(q, indices=cls.index_name(), doc_types=[cls.type_name()],
                                partial_fields={}, sort=sort, start=offset, size=limit)
        logging.info("~FGSearch ~FCstories~FG for: ~SB%s (across %s feed%s)" %
                     (query, len(feed_ids), 's' if len(feed_ids) != 1 else ''))
        return [r.get_id() for r in results]
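
    # Usage sketch: query() returns story hashes only (documents are not
    # stored), which callers resolve against MongoDB (hypothetical values):
    #
    #   story_hashes = SearchStory.query(feed_ids=[42, 43], query="python",
    #                                    order="newest", offset=0, limit=25)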


class SearchFeed:

    ES = pyes.ES(settings.ELASTICSEARCH_HOSTS)
    name = "feeds"

    @classmethod
    def index_name(cls):
        return "%s-index" % cls.name

    @classmethod
    def type_name(cls):
        return "%s-type" % cls.name

    @classmethod
    def create_elasticsearch_mapping(cls, delete=False):
        if delete:
            cls.ES.indices.delete_index_if_exists(cls.index_name())

        # Named index_settings so it doesn't shadow django.conf.settings above.
        index_settings = {
            "index": {
                "analysis": {
                    "analyzer": {
                        "edgengram_analyzer": {
                            "filter": ["edgengram"],
                            "tokenizer": "lowercase",
                            "type": "custom"
                        },
                        "ngram_analyzer": {
                            "filter": ["ngram"],
                            "tokenizer": "lowercase",
                            "type": "custom"
                        }
                    },
                    "filter": {
                        "edgengram": {
                            "max_gram": "15",
                            "min_gram": "2",
                            "type": "edgeNGram"
                        },
                        "ngram": {
                            "max_gram": "15",
                            "min_gram": "3",
                            "type": "nGram"
                        }
                    },
                    "tokenizer": {
                        "edgengram_tokenizer": {
                            "max_gram": "15",
                            "min_gram": "2",
                            "side": "front",
                            "type": "edgeNGram"
                        },
                        "ngram_tokenizer": {
                            "max_gram": "15",
                            "min_gram": "3",
                            "type": "nGram"
                        }
                    }
                }
            }
        }
        cls.ES.indices.create_index_if_missing(cls.index_name(), index_settings)
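
        # The edgengram filter expands "newsblur" into the prefixes "ne", "new",
        # "news", ... so partially typed addresses and titles still match. The
        # *_tokenizer entries are defined but not referenced by either analyzer.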

        mapping = {
            "address": {
                "analyzer": "edgengram_analyzer",
                "store": True,
                "term_vector": "with_positions_offsets",
                "type": "string"
            },
            "feed_id": {
                "store": True,
                "type": "string"
            },
            "num_subscribers": {
                # Numeric fields are never analyzed, so no analyzer setting is
                # needed here; the field is only used for sorting.
                "store": True,
                "type": "long"
            },
            "title": {
                "analyzer": "edgengram_analyzer",
                "store": True,
                "term_vector": "with_positions_offsets",
                "type": "string"
            }
        }
        cls.ES.indices.put_mapping(cls.type_name(), {'properties': mapping}, [cls.index_name()])

    @classmethod
    def index(cls, feed_id, title, address, link, num_subscribers):
        doc = {
            "feed_id": feed_id,
            "title": title,
            "address": address,
            # "link" has no explicit mapping above; it relies on ES dynamic mapping.
            "link": link,
            "num_subscribers": num_subscribers,
        }
        cls.ES.index(doc, cls.index_name(), cls.type_name(), feed_id)
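
    # Usage sketch (hypothetical values):
    #
    #   SearchFeed.index(feed_id=42, title="Daring Fireball",
    #                    address="https://daringfireball.net/feeds/main",
    #                    link="https://daringfireball.net/", num_subscribers=1000)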

    @classmethod
    def query(cls, text):
        '''Search feeds by address, falling back to title, then link.'''
        cls.ES.default_indices = cls.index_name()
        cls.ES.indices.refresh()

        logging.info("~FGSearch ~FCfeeds~FG by address: ~SB%s" % text)
        q = MatchQuery('address', text, operator="and", type="phrase")
        results = cls.ES.search(query=q, sort="num_subscribers:desc", size=5,
                                doc_types=[cls.type_name()])

        if not results.total:
            logging.info("~FGSearch ~FCfeeds~FG by title: ~SB%s" % text)
            q = MatchQuery('title', text, operator="and")
            results = cls.ES.search(query=q, sort="num_subscribers:desc", size=5,
                                    doc_types=[cls.type_name()])

        if not results.total:
            logging.info("~FGSearch ~FCfeeds~FG by link: ~SB%s" % text)
            q = MatchQuery('link', text, operator="and")
            results = cls.ES.search(query=q, sort="num_subscribers:desc", size=5,
                                    doc_types=[cls.type_name()])

        return results
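
    # Usage sketch: returns a pyes result set of up to five feeds, most
    # subscribed first, which callers can iterate directly (hypothetical value):
    #
    #   results = SearchFeed.query("daringfireball")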