devscripts/prepare_manpage.py

   1 #!/usr/bin/env python3
   2 from __future__ import unicode_literals
   3
   4 import io
   5 import optparse
   6 import os.path
   7 import re
   8
# Parent of the directory that contains this script.
ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
# The README.md inside ROOT_DIR; main() reads it as the input document.
README_FILE = os.path.join(ROOT_DIR, 'README.md')

# Fixed Markdown header that main() writes in front of the processed README.
# It is a raw string, so the backslash escapes below reach the output file
# verbatim.
PREFIX = r'''%yt-dlp(1)

# NAME

yt\-dlp \- A youtube-dl fork with additional features and patches

# SYNOPSIS

**yt-dlp** \[OPTIONS\] URL [URL...]

# DESCRIPTION

'''
  25
  26
  27 def main():
  28     parser = optparse.OptionParser(usage='%prog OUTFILE.md')
  29     options, args = parser.parse_args()
  30     if len(args) != 1:
  31         parser.error('Expected an output filename')
  32
  33     outfile, = args
  34
  35     with io.open(README_FILE, encoding='utf-8') as f:
  36         readme = f.read()
  37
  38     readme = filter_excluded_sections(readme)
  39     readme = move_sections(readme)
  40     readme = filter_options(readme)
  41
  42     with io.open(outfile, 'w', encoding='utf-8') as outf:
  43         outf.write(PREFIX + readme)
  44
  45
  46 def filter_excluded_sections(readme):
  47     EXCLUDED_SECTION_BEGIN_STRING = re.escape('<!-- MANPAGE: BEGIN EXCLUDED SECTION -->')
  48     EXCLUDED_SECTION_END_STRING = re.escape('<!-- MANPAGE: END EXCLUDED SECTION -->')
  49     return re.sub(
  50         rf'(?s){EXCLUDED_SECTION_BEGIN_STRING}.+?{EXCLUDED_SECTION_END_STRING}\n',
  51         '', readme)
  52
  53
  54 def move_sections(readme):
  55     MOVE_TAG_TEMPLATE = '<!-- MANPAGE: MOVE "%s" SECTION HERE -->'
  56     sections = re.findall(r'(?m)^%s$' % (
  57         re.escape(MOVE_TAG_TEMPLATE).replace(r'\%', '%') % '(.+)'), readme)
  58
  59     for section_name in sections:
  60         move_tag = MOVE_TAG_TEMPLATE % section_name
  61         if readme.count(move_tag) > 1:
  62             raise Exception(f'There is more than one occurrence of "{move_tag}". This is unexpected')
  63
  64         sections = re.findall(rf'(?sm)(^# {re.escape(section_name)}.+?)(?=^# )', readme)
  65         if len(sections) < 1:
  66             raise Exception(f'The section {section_name} does not exist')
  67         elif len(sections) > 1:
  68             raise Exception(f'There are multiple occurrences of section {section_name}, this is unhandled')
  69
  70         readme = readme.replace(sections[0], '', 1).replace(move_tag, sections[0], 1)
  71     return readme
  72
  73
  74 def filter_options(readme):
  75     section = re.search(r'(?sm)^# USAGE AND OPTIONS\n.+?(?=^# )', readme).group(0)
  76     options = '# OPTIONS\n'
  77     for line in section.split('\n')[1:]:
  78         mobj = re.fullmatch(r'\s{4}(?P<opt>-(?:,\s|[^\s])+)(?:\s(?P<meta>([^\s]|\s(?!\s))+))?(\s{2,}(?P<desc>.+))?', line)
  79         if not mobj:
  80             options += f'{line.lstrip()}\n'
  81             continue
  82         option, metavar, description = mobj.group('opt', 'meta', 'desc')
  83
  84         # Pandoc's definition_lists. See http://pandoc.org/README.html
  85         option = f'{option} *{metavar}*' if metavar else option
  86         description = f'{description}\n' if description else ''
  87         options += f'\n{option}\n:   {description}'
  88         continue
  89
  90     return readme.replace(section, options, 1)
  91
  92
# Run the conversion only when executed as a script, not when imported.
if __name__ == '__main__':
    main()