2009-08-14 01:48:21 +00:00
|
|
|
from django.core.management.base import BaseCommand
|
2010-08-16 12:52:39 -04:00
|
|
|
from django.conf import settings
|
2010-12-14 23:10:13 -05:00
|
|
|
from django.contrib.auth.models import User
|
2010-08-16 12:52:39 -04:00
|
|
|
from apps.rss_feeds.models import Feed
|
|
|
|
from optparse import make_option
|
2009-08-29 19:34:42 +00:00
|
|
|
from utils import feed_fetcher
|
2009-08-30 00:43:13 +00:00
|
|
|
from utils.management_functions import daemonize
|
2011-11-27 02:41:12 -05:00
|
|
|
import django
|
2009-08-20 02:43:01 +00:00
|
|
|
import socket
|
2010-04-19 12:09:04 -04:00
|
|
|
import datetime
|
2011-11-05 17:08:31 -07:00
|
|
|
import redis
|
2009-08-14 01:48:21 +00:00
|
|
|
|
2009-08-21 13:14:44 +00:00
|
|
|
|
2009-08-14 01:48:21 +00:00
|
|
|
class Command(BaseCommand):
|
|
|
|
option_list = BaseCommand.option_list + (
|
2009-08-23 00:00:55 +00:00
|
|
|
make_option("-f", "--feed", default=None),
|
2009-08-14 01:48:21 +00:00
|
|
|
make_option("-d", "--daemon", dest="daemonize", action="store_true"),
|
2010-08-21 20:42:38 -04:00
|
|
|
make_option("-F", "--force", dest="force", action="store_true"),
|
2010-04-09 16:37:19 -04:00
|
|
|
make_option("-s", "--single_threaded", dest="single_threaded", action="store_true"),
|
2009-08-20 02:43:01 +00:00
|
|
|
make_option('-t', '--timeout', type='int', default=10,
|
|
|
|
help='Wait timeout in seconds when connecting to feeds.'),
|
2010-12-14 23:10:13 -05:00
|
|
|
make_option('-u', '--username', type='str', dest='username'),
|
2009-08-21 13:14:44 +00:00
|
|
|
make_option('-V', '--verbose', action='store_true',
|
|
|
|
dest='verbose', default=False, help='Verbose output.'),
|
2010-08-16 13:21:32 -04:00
|
|
|
make_option('-S', '--skip', type='int',
|
|
|
|
dest='skip', default=0, help='Skip stories per month < #.'),
|
2010-03-02 17:04:54 +00:00
|
|
|
make_option('-w', '--workerthreads', type='int', default=4,
|
2009-08-20 02:43:01 +00:00
|
|
|
help='Worker threads that will fetch feeds in parallel.'),
|
2009-08-14 01:48:21 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
def handle(self, *args, **options):
|
|
|
|
if options['daemonize']:
|
|
|
|
daemonize()
|
2010-04-19 12:09:04 -04:00
|
|
|
|
2010-08-16 12:52:39 -04:00
|
|
|
settings.LOG_TO_STREAM = True
|
2010-10-10 23:55:00 -04:00
|
|
|
now = datetime.datetime.utcnow()
|
2010-08-16 13:21:32 -04:00
|
|
|
|
|
|
|
if options['skip']:
|
|
|
|
feeds = Feed.objects.filter(next_scheduled_update__lte=now,
|
2010-08-18 20:35:45 -04:00
|
|
|
average_stories_per_month__lt=options['skip'],
|
2010-08-18 21:54:33 -04:00
|
|
|
active=True)
|
2010-08-16 13:21:32 -04:00
|
|
|
print " ---> Skipping %s feeds" % feeds.count()
|
|
|
|
for feed in feeds:
|
|
|
|
feed.set_next_scheduled_update()
|
|
|
|
print '.',
|
2010-08-30 13:33:29 -04:00
|
|
|
return
|
2010-08-16 12:52:39 -04:00
|
|
|
|
2010-04-19 12:09:04 -04:00
|
|
|
socket.setdefaulttimeout(options['timeout'])
|
2010-08-21 20:42:38 -04:00
|
|
|
if options['force']:
|
|
|
|
feeds = Feed.objects.all()
|
2010-12-14 23:10:13 -05:00
|
|
|
elif options['username']:
|
|
|
|
feeds = Feed.objects.filter(subscribers__user=User.objects.get(username=options['username']))
|
|
|
|
else:
|
|
|
|
feeds = Feed.objects.filter(next_scheduled_update__lte=now, active=True)
|
|
|
|
|
|
|
|
feeds = feeds.order_by('?')
|
|
|
|
|
2010-12-23 13:29:31 -05:00
|
|
|
for f in feeds:
|
|
|
|
f.queued_date = datetime.datetime.utcnow()
|
|
|
|
f.set_next_scheduled_update()
|
2010-09-08 18:30:46 -07:00
|
|
|
|
2009-09-16 03:54:33 +00:00
|
|
|
num_workers = min(len(feeds), options['workerthreads'])
|
2010-04-09 16:37:19 -04:00
|
|
|
if options['single_threaded']:
|
|
|
|
num_workers = 1
|
2009-08-21 13:14:44 +00:00
|
|
|
|
2010-11-10 18:04:17 -05:00
|
|
|
options['compute_scores'] = True
|
|
|
|
|
2009-09-16 03:54:33 +00:00
|
|
|
disp = feed_fetcher.Dispatcher(options, num_workers)
|
2009-08-20 02:43:01 +00:00
|
|
|
|
2009-09-16 03:54:33 +00:00
|
|
|
feeds_queue = []
|
|
|
|
for _ in range(num_workers):
|
|
|
|
feeds_queue.append([])
|
2011-11-27 02:41:12 -05:00
|
|
|
|
2009-09-16 03:54:33 +00:00
|
|
|
i = 0
|
2009-08-14 01:48:21 +00:00
|
|
|
for feed in feeds:
|
2010-10-03 18:04:40 -04:00
|
|
|
feeds_queue[i%num_workers].append(feed.pk)
|
2009-09-16 03:54:33 +00:00
|
|
|
i += 1
|
2010-04-23 21:19:19 -04:00
|
|
|
disp.add_jobs(feeds_queue, i)
|
2009-08-20 02:43:01 +00:00
|
|
|
|
2011-11-27 02:41:12 -05:00
|
|
|
django.db.connection.close()
|
|
|
|
|
2010-08-16 12:52:39 -04:00
|
|
|
print " ---> Fetching %s feeds..." % feeds.count()
|
2009-09-10 03:48:22 +00:00
|
|
|
disp.run_jobs()
|