[yt-dlp.git] / devscripts / prepare_manpage.py

#!/usr/bin/env python3

import optparse
import os.path
import re

# Parent of the directory that contains this script (two dirname() steps up
# from this file's absolute path).
ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
# The README.md located directly in ROOT_DIR; main() reads it as its input.
README_FILE = os.path.join(ROOT_DIR, 'README.md')

# Fixed Markdown header that main() writes in front of the processed README
# text. It supplies the title line plus the NAME and SYNOPSIS sections and
# opens DESCRIPTION, so the README content that follows lands under it.
# NOTE(review): the leading "%yt-dlp(1)" line looks like a Pandoc title
# block - confirm against the build step that consumes the output file.
PREFIX = r'''%yt-dlp(1)

# NAME

yt\-dlp \- A youtube-dl fork with additional features and patches

# SYNOPSIS

**yt-dlp** \[OPTIONS\] URL [URL...]

# DESCRIPTION

'''


def main():
    """Convert README.md into the Markdown source of the man page.

    Expects exactly one positional command-line argument: the path of the
    file to write. The README is read from README_FILE, passed through the
    three filters in order (excluded sections, moved sections, options),
    and written to that path with PREFIX prepended.

    Exits through ``OptionParser.error`` when the number of positional
    arguments is not exactly one.
    """
    cli = optparse.OptionParser(usage='%prog OUTFILE.md')
    positional = cli.parse_args()[1]
    if len(positional) != 1:
        cli.error('Expected an output filename')
    [target_path] = positional

    with open(README_FILE, encoding='utf-8') as source:
        text = source.read()

    # Order matters: excluded regions are dropped first, then sections are
    # relocated, and only then is the options section reformatted.
    for transform in (filter_excluded_sections, move_sections, filter_options):
        text = transform(text)

    with open(target_path, 'w', encoding='utf-8') as sink:
        sink.write(PREFIX + text)


def filter_excluded_sections(readme):
    """Return *readme* with every marker-fenced excluded region removed.

    A region starts at the ``BEGIN EXCLUDED SECTION`` comment and runs up to
    the nearest following ``END EXCLUDED SECTION`` comment that is directly
    followed by a newline; that newline is removed as well. At least one
    character must sit between the two markers for a region to match.
    """
    opening = re.escape('<!-- MANPAGE: BEGIN EXCLUDED SECTION -->')
    closing = re.escape('<!-- MANPAGE: END EXCLUDED SECTION -->')
    # (?s) lets "." span newlines; the lazy ".+?" stops at the first closing
    # marker instead of swallowing everything up to the last one.
    fenced_region = re.compile(rf'(?s){opening}.+?{closing}\n')
    return fenced_region.sub('', readme)


def move_sections(readme):
    """Relocate top-level README sections to their ``MOVE`` placeholder tags.

    Every line of the form ``<!-- MANPAGE: MOVE "NAME" SECTION HERE -->`` is
    treated as a placeholder. The top-level section whose heading starts with
    ``# NAME`` is cut from its current position and pasted in place of the
    placeholder. A section extends from its heading up to the next line that
    starts with ``# `` or, if there is none, to the end of the text.

    Args:
        readme: The README text to process.

    Returns:
        The text with every referenced section moved; unchanged when it
        contains no placeholder.

    Raises:
        Exception: If a placeholder occurs more than once, or if the section
            it names is missing or matches more than one heading.
    """
    MOVE_TAG_TEMPLATE = '<!-- MANPAGE: MOVE "%s" SECTION HERE -->'
    # Turn the tag template into a regex whose "%s" slot captures the name.
    section_names = re.findall(r'(?m)^%s$' % (
        re.escape(MOVE_TAG_TEMPLATE).replace(r'\%', '%') % '(.+)'), readme)

    for section_name in section_names:
        move_tag = MOVE_TAG_TEMPLATE % section_name
        if readme.count(move_tag) > 1:
            raise Exception(f'There is more than one occurrence of "{move_tag}". This is unexpected')

        # "\Z" lets the section be the last one in the file; without it a
        # trailing section has no following heading and is never found.
        matches = re.findall(
            rf'(?sm)(^# {re.escape(section_name)}.+?)(?=^# |\Z)', readme)
        if len(matches) < 1:
            raise Exception(f'The section {section_name} does not exist')
        elif len(matches) > 1:
            raise Exception(f'There are multiple occurrences of section {section_name}, this is unhandled')

        # Cut the section out first, then drop it where the placeholder is.
        section_text = matches[0]
        readme = readme.replace(section_text, '', 1).replace(move_tag, section_text, 1)
    return readme


def filter_options(readme):
    """Rewrite the "USAGE AND OPTIONS" section as a Pandoc definition list.

    The section runs from the ``# USAGE AND OPTIONS`` heading up to the next
    line starting with ``# `` (or the end of the text). Its heading is
    replaced by ``# OPTIONS``. Each following line that looks like an option
    entry (four spaces, then text starting with ``-``, optionally followed by
    a metavar and a description separated by two or more spaces) becomes a
    definition-list item with the metavar emphasised. Every other line is
    kept with its leading whitespace stripped.

    Args:
        readme: The README text to process.

    Returns:
        The text with the first occurrence of the section replaced.

    Raises:
        Exception: If the text has no "USAGE AND OPTIONS" section.
    """
    # "\Z" allows the section to be the last one in the file.
    found = re.search(r'(?sm)^# USAGE AND OPTIONS\n.+?(?=^# |\Z)', readme)
    if found is None:
        raise Exception('The section USAGE AND OPTIONS does not exist')
    section = found.group(0)

    # Compiled once here instead of being looked up again for every line.
    option_line = re.compile(r'''(?x)
                \s{4}(?P<opt>-(?:,\s|[^\s])+)
                (?:\s(?P<meta>(?:[^\s]|\s(?!\s))+))?
                (\s{2,}(?P<desc>.+))?
            ''')

    parts = ['# OPTIONS\n']
    # [1:] skips the original heading line, which '# OPTIONS' replaces.
    for line in section.split('\n')[1:]:
        mobj = option_line.fullmatch(line)
        if not mobj:
            # Not an option entry (sub-heading, blank line, wrapped text).
            parts.append(f'{line.lstrip()}\n')
            continue
        option, metavar, description = mobj.group('opt', 'meta', 'desc')

        # Pandoc's definition_lists. See http://pandoc.org/README.html
        option = f'{option} *{metavar}*' if metavar else option
        description = f'{description}\n' if description else ''
        parts.append(f'\n{option}\n:   {description}')

    return readme.replace(section, ''.join(parts), 1)


# Run the conversion only when this file is executed as a script, not when
# it is imported as a module.
if __name__ == '__main__':
    main()
Commit	Line	Data
cc52de43	1	#!/usr/bin/env python3
54007a45	2
44c88923	3	import optparse
1800eeef	4	import os.path
1800eeef PH	5	import re
	6
	7	ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
	8	README_FILE = os.path.join(ROOT_DIR, 'README.md')
	9
7a5c1cfe	10	PREFIX = r'''%yt-dlp(1)
44c88923 S	11
	12	# NAME
	13
ec2e44fc	14	yt\-dlp \- A youtube-dl fork with additional features and patches
44c88923 S	15
	16	# SYNOPSIS
	17
7a5c1cfe	18	yt-dlp \[OPTIONS\] URL [URL...]
44c88923	19
ec2e44fc	20	# DESCRIPTION
ec2e44fc	21
44c88923 S	22	'''
	23
	24
	25	def main():
	26	parser = optparse.OptionParser(usage='%prog OUTFILE.md')
54007a45	27	_, args = parser.parse_args()
44c88923 S	28	if len(args) != 1:
	29	parser.error('Expected an output filename')
	30
	31	outfile, = args
	32
86e5f3ed	33	with open(README_FILE, encoding='utf-8') as f:
44c88923 S	34	readme = f.read()
44c88923 S	35
ec2e44fc	36	readme = filter_excluded_sections(readme)
ec2e44fc	37	readme = move_sections(readme)
44c88923 S	38	readme = filter_options(readme)
44c88923 S	39
86e5f3ed	40	with open(outfile, 'w', encoding='utf-8') as outf:
ec2e44fc	41	outf.write(PREFIX + readme)
	42
	43
	44	def filter_excluded_sections(readme):
	45	EXCLUDED_SECTION_BEGIN_STRING = re.escape('<!-- MANPAGE: BEGIN EXCLUDED SECTION -->')
	46	EXCLUDED_SECTION_END_STRING = re.escape('<!-- MANPAGE: END EXCLUDED SECTION -->')
	47	return re.sub(
	48	rf'(?s){EXCLUDED_SECTION_BEGIN_STRING}.+?{EXCLUDED_SECTION_END_STRING}\n',
	49	'', readme)
	50
	51
	52	def move_sections(readme):
	53	MOVE_TAG_TEMPLATE = '<!-- MANPAGE: MOVE "%s" SECTION HERE -->'
0fcba15d	54	sections = re.findall(r'(?m)^%s$' % (
0fcba15d	55	re.escape(MOVE_TAG_TEMPLATE).replace(r'\%', '%') % '(.+)'), readme)
ec2e44fc	56
	57	for section_name in sections:
	58	move_tag = MOVE_TAG_TEMPLATE % section_name
	59	if readme.count(move_tag) > 1:
	60	raise Exception(f'There is more than one occurrence of "{move_tag}". This is unexpected')
	61
	62	sections = re.findall(rf'(?sm)(^# {re.escape(section_name)}.+?)(?=^# )', readme)
	63	if len(sections) < 1:
	64	raise Exception(f'The section {section_name} does not exist')
	65	elif len(sections) > 1:
	66	raise Exception(f'There are multiple occurrences of section {section_name}, this is unhandled')
	67
	68	readme = readme.replace(sections[0], '', 1).replace(move_tag, sections[0], 1)
	69	return readme
44c88923	70
bad84757 YCH	71
bad84757 YCH	72	def filter_options(readme):
ec2e44fc	73	section = re.search(r'(?sm)^# USAGE AND OPTIONS\n.+?(?=^# )', readme).group(0)
	74	options = '# OPTIONS\n'
	75	for line in section.split('\n')[1:]:
08d30158	76	mobj = re.fullmatch(r'''(?x)
	77	\s{4}(?P<opt>-(?:,\s\|[^\s])+)
	78	(?:\s(?P<meta>(?:[^\s]\|\s(?!\s))+))?
	79	(\s{2,}(?P<desc>.+))?
	80	''', line)
b440e1bb	81	if not mobj:
	82	options += f'{line.lstrip()}\n'
	83	continue
	84	option, metavar, description = mobj.group('opt', 'meta', 'desc')
	85
	86	# Pandoc's definition_lists. See http://pandoc.org/README.html
	87	option = f'{option} {metavar}' if metavar else option
	88	description = f'{description}\n' if description else ''
	89	options += f'\n{option}\n: {description}'
	90	continue
ec2e44fc	91
ec2e44fc	92	return readme.replace(section, options, 1)
bad84757	93
582be358	94
44c88923 S	95	if __name__ == '__main__':
44c88923 S	96	main()