88 lines
2.4 KiB
Python
88 lines
2.4 KiB
Python
# -*- coding: utf-8 -*-
|
|
import os
|
|
import logging
|
|
import feedparser
|
|
|
|
from urllib.request import urlretrieve
|
|
from django.core.files import File
|
|
from django.utils.timezone import make_aware
|
|
from stdimage.utils import render_variations
|
|
|
|
# from scaffold.readers.rss_reader import feed_reader
|
|
|
|
from mhackspace.feeds.models import Feed, Article, image_variations
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
def feed_reader(feeds):
|
|
for feed in feeds:
|
|
print(feed)
|
|
yield feedparser.parse(feed['url'])
|
|
|
|
|
|
def import_feeds(feed=False):
|
|
remove_old_articles()
|
|
rss_articles = feed_reader(get_active_feeds(feed))
|
|
|
|
articles = []
|
|
for article in rss_articles:
|
|
print(article)
|
|
articles.append(
|
|
Article(
|
|
url=article["url"].decode(),
|
|
feed=Feed.objects.get(pk=article["id"]),
|
|
title=article["title"].decode(),
|
|
original_image=article["image"],
|
|
description=article["description"].decode(),
|
|
date=make_aware(article["date"]),
|
|
)
|
|
)
|
|
|
|
articles = Article.objects.bulk_create(articles)
|
|
download_remote_images()
|
|
return articles
|
|
|
|
|
|
def remove_old_articles():
|
|
for article in Article.objects.all():
|
|
article.image.delete(save=False)
|
|
Article.objects.all().delete()
|
|
|
|
|
|
def download_remote_images():
|
|
for article in Article.objects.all():
|
|
if not article.original_image:
|
|
continue
|
|
try:
|
|
result = urlretrieve(article.original_image.__str__())
|
|
article.image.save(
|
|
os.path.basename(article.original_image.__str__()),
|
|
File(open(result[0], "rb")),
|
|
)
|
|
render_variations(result[0], image_variations, replace=True)
|
|
article.save()
|
|
except Exception as e:
|
|
logger.exception(result)
|
|
logger.exception(result[0])
|
|
logger.exception(
|
|
"Unable to download remote image for %s"
|
|
% article.original_image
|
|
)
|
|
|
|
|
|
def get_active_feeds(feed=False):
|
|
if feed is not False:
|
|
feeds = Feed.objects.filter(pk__in=feed)
|
|
else:
|
|
feeds = Feed.objects.all()
|
|
|
|
rss_feeds = []
|
|
for feed in feeds:
|
|
if feed.enabled is False:
|
|
continue
|
|
rss_feeds.append(
|
|
{"id": feed.id, "author": feed.author, "url": feed.feed_url}
|
|
)
|
|
return rss_feeds
|