better_figures_and_images.py 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138
  1. """
  2. Better Figures & Images
  3. ------------------------
  4. This plugin:
  5. - Adds a style="width: ???px; height: auto;" to each image in the content
  6. - Also adds the width of the contained image to any parent div.figure.
  7. - If RESPONSIVE_IMAGES == True, also adds style="max-width: 100%;"
  8. - Corrects alt text: if alt == image filename, set alt = ''
  9. TODO: Need to add a test.py for this plugin.
  10. """
  11. from __future__ import unicode_literals
  12. from os import path, access, R_OK
  13. import os
  14. from pelican import signals
  15. from bs4 import BeautifulSoup
  16. from PIL import Image
  17. import pysvg.parser
  18. import cssutils
  19. import logging
  20. logger = logging.getLogger(__name__)
  21. def content_object_init(instance):
  22. if instance._content is not None:
  23. content = instance._content
  24. soup = BeautifulSoup(content, 'html.parser')
  25. for img in soup(['img', 'object']):
  26. logger.debug('Better Fig. PATH: %s', instance.settings['PATH'])
  27. if img.name == 'img':
  28. logger.debug('Better Fig. img.src: %s', img['src'])
  29. img_path, img_filename = path.split(img['src'])
  30. else:
  31. logger.debug('Better Fig. img.data: %s', img['data'])
  32. img_path, img_filename = path.split(img['data'])
  33. logger.debug('Better Fig. img_path: %s', img_path)
  34. logger.debug('Better Fig. img_fname: %s', img_filename)
  35. # If the image already has attributes... then we can skip it. Assuming it's already optimised
  36. if 'style' in img.attrs:
  37. sheet = cssutils.parseStyle(img['style'])
  38. if len(sheet.width) > 0 or len(sheet.height) > 0:
  39. continue
  40. # Pelican 3.5+ supports {attach} macro for auto copy, in this use case the content does not exist in output
  41. # due to the fact it has not been copied, hence we take it from the source (same as current document)
  42. if img_filename.startswith('{attach}'):
  43. img_path = os.path.dirname(instance.source_path)
  44. img_filename = img_filename[8:]
  45. src = os.path.join(img_path, img_filename)
  46. elif img_path.startswith(('{filename}', '|filename|')):
  47. # Strip off {filename}, |filename| or /static
  48. img_path = img_path[10:]
  49. elif img_path.startswith('/static'):
  50. img_path = img_path[7:]
  51. elif img_path.startswith('data:image'):
  52. # Image is encoded in-line (not a file).
  53. continue
  54. else:
  55. # Check the location in the output as some plugins create them there.
  56. output_path = path.dirname(instance.save_as)
  57. image_output_location = path.join(instance.settings['OUTPUT_PATH'], output_path, img_filename)
  58. if path.isfile(image_output_location):
  59. src = image_output_location
  60. logger.info('{src} located in output, missing from content.'.format(src=img_filename))
  61. else:
  62. logger.warning('Better Fig. Error: img_path should start with either {attach}, {filename}, |filename| or /static')
  63. if src is None:
  64. # search src path list
  65. # 1. Build the source image filename from PATH
  66. # 2. Build the source image filename from STATIC_PATHS
  67. # if img_path start with '/', remove it.
  68. img_path = os.path.sep.join([el for el in img_path.split("/") if len(el) > 0])
  69. # style: {filename}/static/foo/bar.png
  70. src = os.path.join(instance.settings['PATH'], img_path, img_filename)
  71. src_candidates = [src]
  72. # style: {filename}../static/foo/bar.png
  73. src_candidates += [os.path.join(instance.settings['PATH'], static_path, img_path, img_filename) for static_path in instance.settings['STATIC_PATHS']]
  74. src_candidates = [f for f in src_candidates if path.isfile(f) and access(f, R_OK)]
  75. if not src_candidates:
  76. logger.error('Better Fig. Error: image not found: %s', src)
  77. logger.debug('Better Fig. Skip src: %s', img_path + '/' + img_filename)
  78. continue
  79. src = src_candidates[0]
  80. logger.debug('Better Fig. src: %s', src)
  81. # Open the source image and query dimensions; build style string
  82. try:
  83. if img.name == 'img':
  84. im = Image.open(src)
  85. extra_style = 'width: {}px; height: auto;'.format(im.size[0])
  86. else:
  87. svg = pysvg.parser.parse(src)
  88. extra_style = 'width: {}px; height: auto;'.format(svg.get_width())
  89. except IOError as e:
  90. logger.debug('Better Fig. Failed to open: %s', src)
  91. extra_style = 'width: 100%; height: auto;'
  92. if 'RESPONSIVE_IMAGES' in instance.settings and instance.settings['RESPONSIVE_IMAGES']:
  93. extra_style += ' max-width: 100%;'
  94. if img.get('style'):
  95. img['style'] += extra_style
  96. else:
  97. img['style'] = extra_style
  98. if img.name == 'img':
  99. if img['alt'] == img['src']:
  100. img['alt'] = ''
  101. fig = img.find_parent('div', 'figure')
  102. if fig:
  103. if fig.get('style'):
  104. fig['style'] += extra_style
  105. else:
  106. fig['style'] = extra_style
  107. instance._content = soup.decode()
  108. def register():
  109. signals.content_object_init.connect(content_object_init)