forked from getpelican/pelican-plugins
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrepresentative_image.py
63 lines (53 loc) · 2.42 KB
/
representative_image.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
import six
from bs4 import BeautifulSoup
from pelican import signals
from pelican.contents import Article, Page
from pelican.generators import ArticlesGenerator, PagesGenerator
def images_extraction(instance):
representativeImage = None
if type(instance) in (Article, Page):
if 'image' in instance.metadata:
representativeImage = instance.metadata['image']
# Process Summary:
# If summary contains images, extract one to be the representativeImage
# and remove images from summary
soup = BeautifulSoup(instance.summary, 'html.parser')
images = soup.find_all('img')
for i in images:
if not representativeImage:
representativeImage = i['src']
i.extract()
if len(images) > 0:
# set _summary field which is based on metadata. summary field is
# only based on article's content and not settable
instance._summary = six.text_type(soup)
# If there are no image in summary, look for it in the content body
if not representativeImage:
soup = BeautifulSoup(instance._content, 'html.parser')
imageTag = soup.find('img')
if imageTag:
representativeImage = imageTag['src']
# Set the attribute to content instance
instance.featured_image = representativeImage
instance.featured_alt = instance.metadata.get('alt', None)
instance.featured_link = instance.metadata.get('link', None)
instance.featured_caption = instance.metadata.get('caption', None)
def run_plugin(generators):
for generator in generators:
if isinstance(generator, ArticlesGenerator):
for article in generator.articles:
images_extraction(article)
for translation in article.translations:
images_extraction(translation)
elif isinstance(generator, PagesGenerator):
for page in generator.pages:
images_extraction(page)
for translation in page.translations:
images_extraction(translation)
def register():
try:
signals.all_generators_finalized.connect(run_plugin)
except AttributeError:
# NOTE: This results in #314 so shouldn't really be relied on
# https://github.com/getpelican/pelican-plugins/issues/314
signals.content_object_init.connect(images_extraction)