rmd_reader.py 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112
  1. # -*- coding: utf-8 -*-
  2. import os
  3. import warnings
  4. import logging
  5. logger = logging.getLogger('RMD_READER')
  6. from pelican import readers
  7. from pelican import signals
  8. from pelican import settings
  9. knitr = None
  10. rmd = False
  11. fig_path = None
  12. def initsignal(pelicanobj):
  13. global knitr, rmd, fig_path, robjects
  14. try:
  15. with warnings.catch_warnings():
  16. warnings.simplefilter("ignore")
  17. import rpy2.rinterface
  18. rpy2.rinterface.set_initoptions((b'rpy2', b'--no-save', b'--vanilla', b'--quiet'))
  19. from rpy2.robjects.packages import importr
  20. import rpy2.robjects as robjects
  21. robjects.r('Sys.setlocale("LC_ALL", "C")')
  22. robjects.r('Sys.setlocale("LC_NUMERIC", "C")')
  23. robjects.r('Sys.setlocale("LC_MESSAGES", "C")')
  24. knitr = importr('knitr')
  25. idx = knitr.opts_knit.names.index('set')
  26. PATH = pelicanobj.settings.get('PATH','%s/content' % settings.DEFAULT_CONFIG.get('PATH'))
  27. logger.debug("RMD_READER PATH = %s", PATH)
  28. knitr.opts_knit[idx](**{'base.dir': PATH})
  29. knitroptsknit = pelicanobj.settings.get('RMD_READER_KNITR_OPTS_KNIT', None)
  30. if knitroptsknit:
  31. knitr.opts_knit[idx](**{str(k): v for k,v in knitroptsknit.items()})
  32. idx = knitr.opts_chunk.names.index('set')
  33. knitroptschunk = pelicanobj.settings.get('RMD_READER_KNITR_OPTS_CHUNK', None)
  34. if knitroptschunk:
  35. fig_path = knitroptschunk['fig.path'] if 'fig.path' in knitroptschunk else 'figure/'
  36. knitr.opts_chunk[idx](**{str(k): v for k,v in knitroptschunk.items()})
  37. rmd = True
  38. except ImportError as ex:
  39. rmd = False
  40. class RmdReader(readers.BaseReader):
  41. file_extensions = ['Rmd', 'rmd']
  42. @property
  43. def enabled():
  44. return rmd
  45. # You need to have a read method, which takes a filename and returns
  46. # some content and the associated metadata.
  47. def read(self, filename):
  48. """Parse content and metadata of markdown files"""
  49. QUIET = self.settings.get('RMD_READER_KNITR_QUIET', True)
  50. ENCODING = self.settings.get('RMD_READER_KNITR_ENCODING', 'UTF-8')
  51. CLEANUP = self.settings.get('RMD_READER_CLEANUP', True)
  52. RENAME_PLOT = self.settings.get('RMD_READER_RENAME_PLOT', 'chunklabel')
  53. if type(RENAME_PLOT) is bool:
  54. logger.error("RMD_READER_RENAME_PLOT takes a string value (either chunklabel or directory), please see the readme.")
  55. if RENAME_PLOT:
  56. RENAME_PLOT = 'chunklabel'
  57. logger.error("Defaulting to chunklabel")
  58. else:
  59. RENAME_PLOT = 'disabled'
  60. logger.error("Disabling plot renaming")
  61. logger.debug("RMD_READER_KNITR_QUIET = %s", QUIET)
  62. logger.debug("RMD_READER_KNITR_ENCODING = %s", ENCODING)
  63. logger.debug("RMD_READER_CLEANUP = %s", CLEANUP)
  64. logger.debug("RMD_READER_RENAME_PLOT = %s", RENAME_PLOT)
  65. # replace single backslashes with double backslashes
  66. filename = filename.replace('\\', '\\\\')
  67. # parse Rmd file - generate md file
  68. md_filename = filename.replace('.Rmd', '.aux').replace('.rmd', '.aux')
  69. if RENAME_PLOT == 'chunklabel' or RENAME_PLOT == 'directory':
  70. if RENAME_PLOT == 'chunklabel':
  71. chunk_label = os.path.splitext(os.path.basename(filename))[0]
  72. logger.debug('Chunk label: %s', chunk_label)
  73. elif RENAME_PLOT == 'directory':
  74. chunk_label = 'unnamed-chunk'
  75. PATH = self.settings.get('PATH','%s/content' % settings.DEFAULT_CONFIG.get('PATH'))
  76. src_name = os.path.splitext(os.path.relpath(filename, PATH))[0]
  77. idx = knitr.opts_chunk.names.index('set')
  78. knitroptschunk = { 'fig.path': '%s-' % os.path.join(fig_path, src_name) }
  79. knitr.opts_chunk[idx](**{str(k): v for k,v in knitroptschunk.items()})
  80. logger.debug('Figures path: %s, chunk label: %s', knitroptschunk['fig.path'], chunk_label)
  81. robjects.r('''
  82. opts_knit$set(unnamed.chunk.label="{unnamed_chunk_label}")
  83. render_markdown()
  84. hook_plot <- knit_hooks$get('plot')
  85. knit_hooks$set(plot=function(x, options) hook_plot(paste0("{{filename}}/", x), options))
  86. '''.format(unnamed_chunk_label=chunk_label))
  87. with warnings.catch_warnings():
  88. warnings.simplefilter("ignore")
  89. knitr.knit(filename, md_filename, quiet=QUIET, encoding=ENCODING)
  90. # read md file - create a MarkdownReader
  91. md_reader = readers.MarkdownReader(self.settings)
  92. content, metadata = md_reader.read(md_filename)
  93. # remove md file
  94. if CLEANUP:
  95. os.remove(md_filename)
  96. return content, metadata
  97. def add_reader(readers):
  98. readers.reader_classes['rmd'] = RmdReader
  99. def register():
  100. signals.readers_init.connect(add_reader)
  101. signals.initialized.connect(initsignal)