2010-07-06 16:37:49 -04:00
|
|
|
import datetime
|
2010-08-21 20:42:38 -04:00
|
|
|
import mongoengine as mongo
|
2010-08-16 15:45:35 -04:00
|
|
|
from utils import log as logging
|
2010-09-16 10:35:36 -04:00
|
|
|
from utils import json
|
2009-06-16 03:08:55 +00:00
|
|
|
from django.db import models
|
2010-09-19 11:30:18 -04:00
|
|
|
from django.conf import settings
|
2009-06-16 03:08:55 +00:00
|
|
|
from django.contrib.auth.models import User
|
2009-07-25 15:24:27 +00:00
|
|
|
from django.core.cache import cache
|
2010-08-21 23:49:36 -04:00
|
|
|
from apps.rss_feeds.models import Feed, Story, MStory
|
2010-08-22 18:34:40 -04:00
|
|
|
from apps.analyzer.models import MClassifierFeed, MClassifierAuthor, MClassifierTag, MClassifierTitle
|
2010-01-21 13:12:29 -05:00
|
|
|
from apps.analyzer.models import apply_classifier_titles, apply_classifier_feeds, apply_classifier_authors, apply_classifier_tags
|
|
|
|
|
|
|
|
# Module-level day count, presumably the unread window in days.
# NOTE(review): UNREAD_CUTOFF below is derived from settings.DAYS_OF_UNREAD,
# not from this value, and nothing in the visible part of this module reads
# this constant -- confirm whether it is still needed or should mirror settings.
DAYS_OF_UNREAD = 14
|
2010-09-19 11:30:18 -04:00
|
|
|
# Naive UTC timestamp lying settings.DAYS_OF_UNREAD days before "now".
# NOTE: this expression is evaluated once, when the module is imported, so in
# a long-running process the value does not advance with the clock. It is also
# used as a fixed (non-callable) default for date fields declared below.
UNREAD_CUTOFF = datetime.datetime.utcnow() - datetime.timedelta(days=settings.DAYS_OF_UNREAD)
|
2009-06-16 03:08:55 +00:00
|
|
|
|
|
|
|
class UserSubscription(models.Model):
    """
    A feed which a user has subscribed to. Carries all of the cached information
    about the subscription, including unread counts of the three primary scores.

    Also has a dirty flag (needs_unread_recalc) which means that the unread counts
    are not accurate and need to be calculated with `self.calculate_feed_scores()`.
    """
    user = models.ForeignKey(User, related_name='subscriptions')
    feed = models.ForeignKey(Feed, related_name='subscribers')
    # NOTE: UNREAD_CUTOFF is a value fixed at import time, not a callable, so
    # every row created by this process gets the same default timestamp.
    last_read_date = models.DateTimeField(default=UNREAD_CUTOFF)
    mark_read_date = models.DateTimeField(default=UNREAD_CUTOFF)
    unread_count_neutral = models.IntegerField(default=0)
    unread_count_positive = models.IntegerField(default=0)
    unread_count_negative = models.IntegerField(default=0)
    unread_count_updated = models.DateTimeField(auto_now=True)
    needs_unread_recalc = models.BooleanField(default=False)
    feed_opens = models.IntegerField(default=0)
    is_trained = models.BooleanField(default=False)

    def __unicode__(self):
        return '[' + self.feed.feed_title + '] '

    def mark_feed_read(self):
        """
        Mark every story of this feed as read for this user.

        Moves the read markers to the later of "now" (UTC) and one minute past
        the newest stored story's date, zeroes all three unread counters,
        clears the dirty flag and saves the subscription.
        """
        now = datetime.datetime.utcnow()

        # One ordered query answers both "is there any story?" and
        # "what is the newest story date?".
        latest_story = MStory.objects(story_feed_id=self.feed.pk).order_by('-story_date').first()
        if latest_story is not None:
            latest_story_date = latest_story.story_date + datetime.timedelta(minutes=1)
        else:
            latest_story_date = now
        read_marker = max(now, latest_story_date)

        self.last_read_date = read_marker
        self.mark_read_date = read_marker
        self.unread_count_negative = 0
        self.unread_count_positive = 0
        self.unread_count_neutral = 0
        self.unread_count_updated = read_marker
        self.needs_unread_recalc = False
        self.save()

    def calculate_feed_scores(self, silent=False, stories_db=None):
        """
        Recompute the cached positive/neutral/negative unread counts.

        Parameters:
            silent     -- when true, suppress the progress/timing log lines.
            stories_db -- optional pre-fetched iterable of stories for this
                          feed; when falsy the stories are queried from MStory.

        Returns None. Does nothing when the user has not been seen since the
        unread cutoff. When the feed has never been fetched, only the dirty
        flag is cleared. Otherwise the counters are saved, the feed is marked
        read if no positive or neutral unread stories remain, and the user's
        'usersub:<id>' cache entry is deleted.
        """
        # Computed per call so that long-running processes do not keep
        # comparing against a cutoff frozen at import time.
        unread_cutoff = datetime.datetime.utcnow() - datetime.timedelta(days=settings.DAYS_OF_UNREAD)

        if self.user.profile.last_seen_on < unread_cutoff:
            if not silent:
                logging.info(' ---> [%s] SKIPPING Computing scores: %s (1 week+)' % (self.user, self.feed))
            return

        if not self.feed.fetched_once:
            if not silent:
                logging.info(' ---> [%s] NOT Computing scores: %s' % (self.user, self.feed))
            self.needs_unread_recalc = False
            self.save()
            return

        # Only used to report elapsed time in the log lines below.
        started = datetime.datetime.now()
        if not silent:
            logging.info(' ---> [%s] Computing scores: %s' % (self.user, self.feed))
        feed_scores = dict(negative=0, neutral=0, positive=0)

        # Stories older than the cutoff never count as unread. If
        # mark_read_date is older than the cutoff, pull it forward.
        date_delta = unread_cutoff
        if date_delta < self.mark_read_date:
            date_delta = self.mark_read_date
        else:
            self.mark_read_date = date_delta

        read_stories = MUserStory.objects(user_id=self.user.pk,
                                          feed_id=self.feed.pk,
                                          read_date__gte=self.mark_read_date)
        if not silent:
            logging.info(' ---> [%s] Read stories: %s' % (self.user, datetime.datetime.now() - started))

        # A set keeps the membership tests in the story loop below O(1).
        read_stories_ids = set()
        for us in read_stories:
            read_story = us.story
            if hasattr(read_story, 'story_guid') and isinstance(read_story.story_guid, unicode):
                read_stories_ids.add(read_story.story_guid)
            elif hasattr(read_story, 'id') and isinstance(read_story.id, unicode):
                read_stories_ids.add(read_story.id) # TODO: Remove me after migration from story.id->guid

        stories_db = stories_db or MStory.objects(story_feed_id=self.feed.pk,
                                                  story_date__gte=date_delta)
        if not silent:
            logging.info(' ---> [%s] MStory: %s' % (self.user, datetime.datetime.now() - started))

        unread_stories_db = []
        for story in stories_db:
            # A caller-supplied stories_db may contain stories that are too old.
            if story.story_date < date_delta:
                continue
            if hasattr(story, 'story_guid') and story.story_guid not in read_stories_ids:
                unread_stories_db.append(story)
            elif isinstance(story.id, unicode) and story.id not in read_stories_ids:
                unread_stories_db.append(story)
        stories = self.feed.format_stories(unread_stories_db)
        if not silent:
            logging.info(' ---> [%s] Format stories: %s' % (self.user, datetime.datetime.now() - started))

        classifier_feeds = MClassifierFeed.objects(user_id=self.user.pk, feed_id=self.feed.pk)
        classifier_authors = MClassifierAuthor.objects(user_id=self.user.pk, feed_id=self.feed.pk)
        classifier_titles = MClassifierTitle.objects(user_id=self.user.pk, feed_id=self.feed.pk)
        classifier_tags = MClassifierTag.objects(user_id=self.user.pk, feed_id=self.feed.pk)

        if not silent:
            logging.info(' ---> [%s] Classifiers: %s (%s)' % (self.user, datetime.datetime.now() - started, classifier_feeds.count() + classifier_authors.count() + classifier_tags.count() + classifier_titles.count()))

        # The feed-level score is the same for every story, so compute it once.
        scores = {
            'feed': apply_classifier_feeds(classifier_feeds, self.feed),
        }

        for story in stories:
            # The classifier querysets are re-iterated for each story.
            classifier_authors.rewind()
            classifier_tags.rewind()
            classifier_titles.rewind()
            scores.update({
                'author': apply_classifier_authors(classifier_authors, story),
                'tags': apply_classifier_tags(classifier_tags, story),
                'title': apply_classifier_titles(classifier_titles, story),
            })

            max_score = max(scores['feed'], scores['author'], scores['tags'], scores['title'])
            min_score = min(scores['feed'], scores['author'], scores['tags'], scores['title'])
            # A story with both a positive and a negative classifier hit is
            # counted in both buckets.
            if max_score > 0:
                feed_scores['positive'] += 1
            if min_score < 0:
                feed_scores['negative'] += 1
            if max_score == 0 and min_score == 0:
                feed_scores['neutral'] += 1

        if not silent:
            logging.info(' ---> [%s] End classifiers: %s' % (self.user, datetime.datetime.now() - started))

        self.unread_count_positive = feed_scores['positive']
        self.unread_count_neutral = feed_scores['neutral']
        self.unread_count_negative = feed_scores['negative']
        self.needs_unread_recalc = False

        self.save()

        # Nothing left that is positive or neutral: treat the feed as read.
        if (self.unread_count_positive == 0 and
            self.unread_count_neutral == 0):
            self.mark_feed_read()

        cache.delete('usersub:%s' % self.user.id)

        return

    class Meta:
        unique_together = ("user", "feed")
|
|
|
|
|
|
|
|
|
2009-07-28 02:27:27 +00:00
|
|
|
class UserStory(models.Model):
    """
    A record that a user has read one story of one feed.

    Per the original note, these rows are meant to be deleted once the
    UserSubscription's mark_read_date passes the row's read date.
    """
    user = models.ForeignKey(User)
    feed = models.ForeignKey(Feed)
    story = models.ForeignKey(Story)
    read_date = models.DateTimeField(auto_now=True)
    opinion = models.IntegerField(default=0)

    class Meta:
        unique_together = ("user", "feed", "story")
        verbose_name = "user story"
        verbose_name_plural = "user stories"

    def __unicode__(self):
        # "[<feed title>] <story title>"
        feed_label = '[' + self.feed.feed_title + '] '
        return feed_label + self.story.story_title
|
2009-07-05 21:45:46 +00:00
|
|
|
|
2010-08-21 23:49:36 -04:00
|
|
|
|
2010-08-21 20:42:38 -04:00
|
|
|
class MUserStory(mongo.Document):
    """
    Stories read by the user. These are deleted as the mark_read_date for the
    UserSubscription passes the UserStory date.
    """
    user_id = mongo.IntField()
    feed_id = mongo.IntField()
    read_date = mongo.DateTimeField()
    story = mongo.ReferenceField(MStory, unique_with=('user_id', 'feed_id'))

    meta = {
        'collection': 'userstories',
        'indexes': [('user_id', 'feed_id')],
        'allow_inheritance': False,
    }

    @classmethod
    def delete_old_stories(cls):
        """
        Delete every read-story record whose read_date is at or before the
        unread cutoff (settings.DAYS_OF_UNREAD days before the current UTC time).
        """
        # Computed at call time so that a long-running process does not keep
        # using a cutoff frozen at import time.
        cutoff = datetime.datetime.utcnow() - datetime.timedelta(days=settings.DAYS_OF_UNREAD)
        cls.objects(read_date__lte=cutoff).delete()
|
|
|
|
|
2010-08-21 20:42:38 -04:00
|
|
|
|
2009-06-16 03:08:55 +00:00
|
|
|
class UserSubscriptionFolders(models.Model):
    """
    A JSON list of folders and feeds to which a user has subscribed. The list
    is a recursive descent of feeds and folders in folders. Used to lay out
    the feeds and folders in the Reader's feed navigation pane.

    In the decoded structure an int is a feed id and a dict maps a folder
    name to the nested list of that folder's contents.
    """
    user = models.ForeignKey(User)
    folders = models.TextField(default="[]")

    def __unicode__(self):
        # NOTE: `folders` is the raw JSON text, so this len() is the length of
        # the string in characters, not the number of folders.
        return "[%s]: %s" % (self.user, len(self.folders),)

    class Meta:
        verbose_name_plural = "folders"
        verbose_name = "folder"

    def delete_feed(self, feed_id, in_folder):
        """
        Remove one occurrence of `feed_id` from the folder named `in_folder`
        ('' is the top level) and save the updated folder structure.

        If the feed was removed and no other occurrence of it was found
        anywhere in the structure, the user's subscription to the feed and
        the user's read-story records for it are deleted as well.
        """
        def _find_feed_in_folders(old_folders, folder_name='', multiples_found=False, deleted=False):
            # Rebuild `old_folders` without the first matching feed entry and
            # report whether other copies of the feed were seen.
            new_folders = []
            for k, folder in enumerate(old_folders):
                if isinstance(folder, int):
                    is_target_feed = folder == feed_id
                    in_target_folder = folder_name == in_folder
                    # Another copy of the feed: either in a different folder,
                    # or in the same folder after one was already removed.
                    if is_target_feed and (not in_target_folder or deleted):
                        multiples_found = True
                        logging.info(" ---> [%s] Deleting feed, and a multiple has been found in '%s'" % (self.user, folder_name))
                    if is_target_feed and in_target_folder and not deleted:
                        logging.info(" ---> [%s] Delete feed: %s'th item: %s folders/feeds" % (
                            self.user, k, len(old_folders)
                        ))
                        deleted = True
                    else:
                        new_folders.append(folder)
                elif isinstance(folder, dict):
                    for f_k, f_v in folder.items():
                        nf, multiples_found, deleted = _find_feed_in_folders(f_v, f_k, multiples_found, deleted)
                        new_folders.append({f_k: nf})

            return new_folders, multiples_found, deleted

        user_sub_folders = json.decode(self.folders)
        user_sub_folders, multiples_found, deleted = _find_feed_in_folders(user_sub_folders)
        self.folders = json.encode(user_sub_folders)
        self.save()

        if not multiples_found and deleted:
            # filter().delete() rather than get().delete(): a missing
            # subscription row must not raise after the folders have already
            # been saved, and must not skip the read-story cleanup below.
            UserSubscription.objects.filter(user=self.user, feed=feed_id).delete()
            MUserStory.objects(user_id=self.user.pk, feed_id=feed_id).delete()

    def delete_folder(self, folder_to_delete, in_folder, feed_ids_in_folder):
        """
        Remove the folder named `folder_to_delete` that sits directly inside
        the folder named `in_folder` ('' is the top level), then save.

        `feed_ids_in_folder` lists the feed ids contained in the removed
        folder. Any of those ids that still appears elsewhere in the remaining
        structure is kept; the user's subscriptions to the rest are deleted.
        The caller's list is not modified.
        """
        def _find_folder_in_folders(old_folders, folder_name, feeds_to_delete):
            # Rebuild `old_folders` without the target folder, dropping from
            # `feeds_to_delete` every feed that survives somewhere else.
            new_folders = []
            for folder in old_folders:
                if isinstance(folder, int):
                    new_folders.append(folder)
                    if folder in feeds_to_delete:
                        feeds_to_delete.remove(folder)
                elif isinstance(folder, dict):
                    for f_k, f_v in folder.items():
                        if f_k == folder_to_delete and folder_name == in_folder:
                            # Not appended, and not descended into, so its
                            # feeds stay in feeds_to_delete.
                            logging.info(" ---> [%s] Deleting folder '%s' in '%s': %s" % (self.user, f_k, folder_name, folder))
                        else:
                            nf, feeds_to_delete = _find_folder_in_folders(f_v, f_k, feeds_to_delete)
                            new_folders.append({f_k: nf})

            return new_folders, feeds_to_delete

        # Work on a private copy: the helper removes entries in place and the
        # caller's list must not be modified as a side effect.
        candidate_feed_ids = list(feed_ids_in_folder or [])

        user_sub_folders = json.decode(self.folders)
        user_sub_folders, feeds_to_delete = _find_folder_in_folders(user_sub_folders, '', candidate_feed_ids)
        self.folders = json.encode(user_sub_folders)
        self.save()

        # NOTE(review): unlike delete_feed, this does not remove the MUserStory
        # records of the deleted feeds -- confirm whether that is intended.
        UserSubscription.objects.filter(user=self.user, feed__in=feeds_to_delete).delete()
|
2010-07-20 20:23:49 -04:00
|
|
|
|
2010-06-12 21:20:06 -04:00
|
|
|
class Feature(models.Model):
    """
    One entry of a simple, blog-like feature board: a free-text description
    with a date, listed newest first.
    """
    description = models.TextField(default="")
    date = models.DateTimeField(default=datetime.datetime.now)

    class Meta:
        ordering = ["-date"]

    def __unicode__(self):
        # Show only the first 50 characters of the description.
        summary = self.description[:50]
        return "[%s] %s" % (self.date, summary)
|
|
|
|
|