mirror of
				https://github.com/viq/NewsBlur.git
				synced 2025-09-18 21:43:31 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			174 lines
		
	
	
	
		
			5.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			174 lines
		
	
	
	
		
			5.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| import datetime
 | |
| import os
 | |
| import shutil
 | |
| import time
 | |
| from celery.task import Task
 | |
| from utils import log as logging
 | |
| from utils import s3_utils as s3
 | |
| from django.conf import settings
 | |
| 
 | |
| class TaskFeeds(Task):
 | |
|     name = 'task-feeds'
 | |
| 
 | |
|     def run(self, **kwargs):
 | |
|         from apps.rss_feeds.models import Feed        
 | |
|         settings.LOG_TO_STREAM = True
 | |
|         now = datetime.datetime.utcnow()
 | |
|         
 | |
|         # Active feeds
 | |
|         feeds = Feed.objects.filter(
 | |
|             next_scheduled_update__lte=now,
 | |
|             active=True
 | |
|         ).exclude(
 | |
|             active_subscribers=0
 | |
|         ).order_by('?')
 | |
|         active_count = feeds.count()
 | |
|         
 | |
|         # Mistakenly inactive feeds
 | |
|         day = now - datetime.timedelta(days=1)
 | |
|         inactive_feeds = Feed.objects.filter(
 | |
|             last_update__lte=day, 
 | |
|             queued_date__lte=day,
 | |
|             min_to_decay__lte=60*24,
 | |
|             active_subscribers__gte=1
 | |
|         ).order_by('?')[:20]
 | |
|         inactive_count = inactive_feeds.count()
 | |
|         
 | |
|         week = now - datetime.timedelta(days=7)
 | |
|         old_feeds = Feed.objects.filter(
 | |
|             last_update__lte=week, 
 | |
|             queued_date__lte=day,
 | |
|             active_subscribers__gte=1
 | |
|         ).order_by('?')[:20]
 | |
|         old_count = old_feeds.count()
 | |
|         
 | |
|         logging.debug(" ---> ~FBTasking ~SB~FC%s~SN~FB/~FC%s~FB/~FC%s~SN~FB feeds..." % (
 | |
|             active_count,
 | |
|             inactive_count,
 | |
|             old_count,
 | |
|         ))        
 | |
|         
 | |
|         Feed.task_feeds(feeds, verbose=False)
 | |
|         if inactive_feeds: Feed.task_feeds(inactive_feeds, verbose=False)
 | |
|         if old_feeds: Feed.task_feeds(old_feeds, verbose=False)
 | |
|         
 | |
|         
 | |
| class UpdateFeeds(Task):
 | |
|     name = 'update-feeds'
 | |
|     max_retries = 0
 | |
|     ignore_result = True
 | |
| 
 | |
|     def run(self, feed_pks, **kwargs):
 | |
|         from apps.rss_feeds.models import Feed
 | |
|         from apps.statistics.models import MStatistics
 | |
|         
 | |
|         mongodb_replication_lag = int(MStatistics.get('mongodb_replication_lag', 0))
 | |
|         compute_scores = bool(mongodb_replication_lag < 10)
 | |
|         
 | |
|         options = {
 | |
|             'fake': bool(MStatistics.get('fake_fetch')),
 | |
|             'quick': float(MStatistics.get('quick_fetch', 0)),
 | |
|             'compute_scores': compute_scores,
 | |
|             'mongodb_replication_lag': mongodb_replication_lag,
 | |
|         }
 | |
|         
 | |
|         if not isinstance(feed_pks, list):
 | |
|             feed_pks = [feed_pks]
 | |
|             
 | |
|         for feed_pk in feed_pks:
 | |
|             try:
 | |
|                 feed = Feed.get_by_id(feed_pk)
 | |
|                 feed.update(**options)
 | |
|             except Feed.DoesNotExist:
 | |
|                 logging.info(" ---> Feed doesn't exist: [%s]" % feed_pk)
 | |
|             # logging.debug(' Updating: [%s] %s' % (feed_pks, feed))
 | |
| 
 | |
| class NewFeeds(Task):
 | |
|     name = 'new-feeds'
 | |
|     max_retries = 0
 | |
|     ignore_result = True
 | |
| 
 | |
|     def run(self, feed_pks, **kwargs):
 | |
|         from apps.rss_feeds.models import Feed
 | |
|         if not isinstance(feed_pks, list):
 | |
|             feed_pks = [feed_pks]
 | |
|         
 | |
|         options = {
 | |
|             'force': True,
 | |
|         }
 | |
|         for feed_pk in feed_pks:
 | |
|             feed = Feed.get_by_id(feed_pk)
 | |
|             feed.update(options=options)
 | |
| 
 | |
| class PushFeeds(Task):
 | |
|     name = 'push-feeds'
 | |
|     max_retries = 0
 | |
|     ignore_result = True
 | |
| 
 | |
|     def run(self, feed_id, xml, **kwargs):
 | |
|         from apps.rss_feeds.models import Feed
 | |
|         from apps.statistics.models import MStatistics
 | |
|         
 | |
|         mongodb_replication_lag = int(MStatistics.get('mongodb_replication_lag', 0))
 | |
|         compute_scores = bool(mongodb_replication_lag < 60)
 | |
|         
 | |
|         options = {
 | |
|             'feed_xml': xml,
 | |
|             'compute_scores': compute_scores,
 | |
|             'mongodb_replication_lag': mongodb_replication_lag,
 | |
|         }
 | |
|         feed = Feed.get_by_id(feed_id)
 | |
|         feed.update(options=options)
 | |
| 
 | |
| class BackupMongo(Task):
 | |
|     name = 'backup-mongo'
 | |
|     max_retries = 0
 | |
|     ignore_result = True
 | |
|     
 | |
|     def run(self, **kwargs):
 | |
|         COLLECTIONS = "classifier_tag classifier_author classifier_feed classifier_title userstories starred_stories shared_stories category category_site sent_emails social_profile social_subscription social_services statistics feedback"
 | |
| 
 | |
|         date = time.strftime('%Y-%m-%d-%H-%M')
 | |
|         collections = COLLECTIONS.split(' ')
 | |
|         db_name = 'newsblur'
 | |
|         dir_name = 'backup_mongo_%s' % date
 | |
|         filename = '%s.tgz' % dir_name
 | |
| 
 | |
|         os.mkdir(dir_name)
 | |
| 
 | |
|         for collection in collections:
 | |
|             cmd = 'mongodump  --db %s --collection %s -o %s' % (db_name, collection, dir_name)
 | |
|             logging.debug(' ---> ~FMDumping ~SB%s~SN: %s' % (collection, cmd))
 | |
|             os.system(cmd)
 | |
| 
 | |
|         cmd = 'tar -jcf %s %s' % (filename, dir_name)
 | |
|         os.system(cmd)
 | |
| 
 | |
|         logging.debug(' ---> ~FRUploading ~SB~FM%s~SN~FR to S3...' % filename)
 | |
|         s3.save_file_in_s3(filename)
 | |
|         shutil.rmtree(dir_name)
 | |
|         os.remove(filename)
 | |
|         logging.debug(' ---> ~FRFinished uploading ~SB~FM%s~SN~FR to S3.' % filename)
 | |
| 
 | |
| 
 | |
| class ScheduleImmediateFetches(Task):
 | |
|     
 | |
|     def run(self, feed_ids, **kwargs):
 | |
|         from apps.rss_feeds.models import Feed
 | |
|         
 | |
|         if not isinstance(feed_ids, list):
 | |
|             feed_ids = [feed_ids]
 | |
|         
 | |
|         Feed.schedule_feed_fetches_immediately(feed_ids)
 | |
| 
 | |
| 
 | |
| class SchedulePremiumSetup(Task):
 | |
|     
 | |
|     def run(self, feed_ids, **kwargs):
 | |
|         from apps.rss_feeds.models import Feed
 | |
|         
 | |
|         if not isinstance(feed_ids, list):
 | |
|             feed_ids = [feed_ids]
 | |
|         
 | |
|         Feed.setup_feeds_for_premium_subscribers(feed_ids)
 | |
|         
 | 
