]> jfr.im git - yt-dlp.git/blob - devscripts/prepare_manpage.py
[devscripts] Improve `prepare_manpage`
[yt-dlp.git] / devscripts / prepare_manpage.py
1 #!/usr/bin/env python3
2 from __future__ import unicode_literals
3
4 import io
5 import optparse
6 import os.path
7 import re
8
# Repository root: the parent of the directory that contains this script.
ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
# The README whose text is converted by main().
README_FILE = os.path.join(ROOT_DIR, 'README.md')

# Fixed header that main() writes in front of the filtered README text.
# It is a raw string, so the backslash escapes below reach the output file
# unchanged.
PREFIX = r'''%yt-dlp(1)

# NAME

yt\-dlp \- A youtube-dl fork with additional features and patches

# SYNOPSIS

**yt-dlp** \[OPTIONS\] URL [URL...]

# DESCRIPTION

'''
25
26
def main():
    """Read the README, run it through the filters and write the result.

    Expects exactly one positional command-line argument: the path of the
    markdown file to create. The file receives PREFIX followed by the
    README text after filter_excluded_sections, move_sections and
    filter_options have been applied, in that order.
    """
    arg_parser = optparse.OptionParser(usage='%prog OUTFILE.md')
    _, positional = arg_parser.parse_args()
    if len(positional) != 1:
        # OptionParser.error() prints the message and exits the process.
        arg_parser.error('Expected an output filename')

    [destination] = positional

    with io.open(README_FILE, encoding='utf-8') as source:
        text = source.read()

    text = filter_options(move_sections(filter_excluded_sections(text)))

    with io.open(destination, 'w', encoding='utf-8') as sink:
        sink.write(PREFIX + text)
44
45
def filter_excluded_sections(readme):
    """Remove every block fenced by the MANPAGE excluded-section markers.

    Everything from a ``<!-- MANPAGE: BEGIN EXCLUDED SECTION -->`` marker up
    to and including the next ``<!-- MANPAGE: END EXCLUDED SECTION -->``
    marker is dropped, together with the newline that follows the end
    marker (if any).

    Args:
        readme: The README text to filter.

    Returns:
        The text with all excluded sections removed.
    """
    EXCLUDED_SECTION_BEGIN_STRING = re.escape('<!-- MANPAGE: BEGIN EXCLUDED SECTION -->')
    EXCLUDED_SECTION_END_STRING = re.escape('<!-- MANPAGE: END EXCLUDED SECTION -->')
    # `.*?` rather than `.+?`: an empty section must stop at its own end
    # marker instead of running on to a later one and deleting the text in
    # between. `(?:\n|\Z)`: an end marker that closes the file without a
    # trailing newline still terminates the section.
    return re.sub(
        rf'(?s){EXCLUDED_SECTION_BEGIN_STRING}.*?{EXCLUDED_SECTION_END_STRING}(?:\n|\Z)',
        '', readme)
52
53
def move_sections(readme):
    """Relocate top-level sections to where their MOVE tags are.

    For every line of the form
    ``<!-- MANPAGE: MOVE "NAME" SECTION HERE -->`` the section starting at
    the heading ``# NAME`` is cut from its current position and pasted in
    place of the tag. A section runs from its heading up to the next
    ``# `` heading, or to the end of the text when it is the last section.

    Args:
        readme: The README text to process.

    Returns:
        The text with all tagged sections moved.

    Raises:
        Exception: If a tag occurs more than once, or the section it names
            is missing or matches more than once.
    """
    MOVE_TAG_TEMPLATE = '<!-- MANPAGE: MOVE "%s" SECTION HERE -->'
    # Older versions of re.escape() also escape "%"; undo that so the
    # placeholder can still be filled in with the capture group.
    tag_pattern = re.escape(MOVE_TAG_TEMPLATE).replace(r'\%', '%') % '(.+)'
    section_names = re.findall(rf'(?m)^{tag_pattern}$', readme)

    for section_name in section_names:
        move_tag = MOVE_TAG_TEMPLATE % section_name
        if readme.count(move_tag) > 1:
            raise Exception(f'There is more than one occurrence of "{move_tag}". This is unexpected')

        # `\Z` lets the section be the last one in the file; without it a
        # trailing section would be reported as missing.
        matches = re.findall(rf'(?sm)(^# {re.escape(section_name)}.+?)(?=^# |\Z)', readme)
        if len(matches) < 1:
            raise Exception(f'The section {section_name} does not exist')
        elif len(matches) > 1:
            raise Exception(f'There are multiple occurrences of section {section_name}, this is unhandled')

        section_text = matches[0]
        # Cut first, then paste: the tag itself is consumed by the paste.
        readme = readme.replace(section_text, '', 1).replace(move_tag, section_text, 1)
    return readme
72
73
def filter_options(readme):
    """Rewrite the "USAGE AND OPTIONS" section as a Pandoc definition list.

    The section heading becomes ``# OPTIONS``. Every line that looks like
    an option entry (four leading whitespace characters, an option string
    starting with ``-``, an optional metavar after a single space and an
    optional description after two or more spaces) is turned into a
    definition-list term. All other lines are kept with their leading
    whitespace removed.

    Args:
        readme: The README text to process.

    Returns:
        The text with the section replaced by its converted form.

    Raises:
        Exception: If there is no "# USAGE AND OPTIONS" heading.
    """
    # `.*?` keeps an empty section from swallowing the following one, and
    # `\Z` allows the section to be the last one in the file.
    section_match = re.search(r'(?sm)^# USAGE AND OPTIONS\n.*?(?=^# |\Z)', readme)
    if section_match is None:
        raise Exception('The section USAGE AND OPTIONS does not exist')
    section = section_match.group(0)

    # The metavar must start with a non-space character. Otherwise an
    # option followed by exactly two spaces and its description would have
    # the description captured as the metavar.
    option_line = re.compile(
        r'\s{4}(?P<opt>-(?:,\s|[^\s])+)'
        r'(?:\s(?P<meta>[^\s](?:[^\s]|\s(?!\s))*))?'
        r'(?:\s{2,}(?P<desc>.+))?')

    parts = ['# OPTIONS\n']
    # The first line is the original heading, which has just been replaced.
    for line in section.split('\n')[1:]:
        mobj = option_line.fullmatch(line)
        if not mobj:
            parts.append(f'{line.lstrip()}\n')
            continue
        option, metavar, description = mobj.group('opt', 'meta', 'desc')

        # Pandoc's definition_lists. See http://pandoc.org/README.html
        option = f'{option} *{metavar}*' if metavar else option
        description = f'{description}\n' if description else ''
        parts.append(f'\n{option}\n: {description}')

    return readme.replace(section, ''.join(parts), 1)
91
92
# Run the conversion only when this file is executed as a script, so that
# importing the module has no side effects.
if __name__ == '__main__':
    main()