yt-dlp/devscripts/prepare_manpage.py

#!/usr/bin/env python3

# Allow direct execution
import os
import sys

sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))


import os.path
import re

from devscripts.utils import (
    compose_functions,
    get_filename_args,
    read_file,
    write_file,
)

# Parent of the directory that contains this script.
ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
# README.md directly under ROOT_DIR; main() reads it as the input document.
README_FILE = os.path.join(ROOT_DIR, 'README.md')

# Fixed header that main() prepends to the transformed README.
# Raw string: the backslashes are written to the output verbatim.
# NOTE(review): the leading "%yt-dlp(1)" line looks like a pandoc title line - confirm.
PREFIX = r'''%yt-dlp(1)

# NAME

yt\-dlp \- A feature\-rich command\-line audio/video downloader

# SYNOPSIS

**yt-dlp** \[OPTIONS\] URL [URL...]

# DESCRIPTION

'''


def filter_excluded_sections(readme):
    """Return *readme* with every marked "excluded section" removed.

    A span is removed when it starts at the BEGIN marker comment, contains at
    least one character, and ends at the nearest END marker comment that is
    immediately followed by a newline. That newline is removed as well. Text
    without such a span is returned unchanged.
    """
    begin_marker = '<!-- MANPAGE: BEGIN EXCLUDED SECTION -->'
    end_marker = '<!-- MANPAGE: END EXCLUDED SECTION -->'
    # (?s) lets "." cross line breaks; ".+?" is lazy so each BEGIN pairs with
    # the closest END instead of swallowing everything up to the last one.
    excluded_span = re.compile(
        '(?s)' + re.escape(begin_marker) + '.+?' + re.escape(end_marker) + r'\n')
    return excluded_span.sub('', readme)


def _convert_code_blocks(readme):
    """Yield the lines of *readme* with fenced code blocks turned into indented ones.

    A line starting with three or more backticks opens a block. The block is
    closed by a line consisting of the same number of backticks, ignoring
    trailing whitespace and the line ending. Both fence lines are replaced by
    a blank line and every line in between is prefixed with four spaces.
    Lines outside a block are yielded unchanged.
    """
    fence = None  # backtick run of the block currently open, or None

    for line in readme.splitlines(True):
        if fence is not None:
            # Compare without the line ending so a closing fence is also
            # recognised on the last line of the text (no trailing newline),
            # with CRLF line endings, or with trailing spaces.
            if line.rstrip() == fence:
                fence = None
                yield '\n'
            else:
                yield f'    {line}'
        elif line.startswith('```'):
            # Only the leading run of backticks defines the fence; anything
            # after it (such as a language name) is ignored.
            fence = '`' * (len(line) - len(line.lstrip('`')))
            yield '\n'
        else:
            yield line


def convert_code_blocks(readme):
    """Return *readme* with fenced code blocks rewritten as four-space-indented blocks."""
    return ''.join(_convert_code_blocks(readme))


def move_sections(readme):
    """Move top-level sections to the position of their "MOVE ... SECTION HERE" tag.

    For every line of the form ``<!-- MANPAGE: MOVE "NAME" SECTION HERE -->``
    the section whose heading starts with ``# NAME`` is cut from its current
    position and pasted in place of the tag. A section extends up to the next
    line starting with ``# ``, or to the end of the text when it is the last
    section.

    Returns the rearranged text.

    Raises:
        Exception: if a move tag occurs more than once, or if the section it
            names is missing or matches more than once.
    """
    MOVE_TAG_TEMPLATE = '<!-- MANPAGE: MOVE "%s" SECTION HERE -->'
    # Escape the template for use as a regex, then put a capture group where
    # the section name goes. Older Pythons escape "%" as well, hence the
    # replace() before the %-formatting.
    section_names = re.findall(r'(?m)^%s$' % (
        re.escape(MOVE_TAG_TEMPLATE).replace(r'\%', '%') % '(.+)'), readme)

    for section_name in section_names:
        move_tag = MOVE_TAG_TEMPLATE % section_name
        if readme.count(move_tag) > 1:
            raise Exception(f'There is more than one occurrence of "{move_tag}". This is unexpected')

        # Lazy match from the heading to the next top-level heading; "\Z"
        # additionally lets the last section of the document be moved.
        matches = re.findall(rf'(?sm)(^# {re.escape(section_name)}.+?)(?=^# |\Z)', readme)
        if len(matches) < 1:
            raise Exception(f'The section {section_name} does not exist')
        elif len(matches) > 1:
            raise Exception(f'There are multiple occurrences of section {section_name}, this is unhandled')

        section_text = matches[0]
        # Cut the section out first, then paste it over the tag.
        readme = readme.replace(section_text, '', 1).replace(move_tag, section_text, 1)
    return readme


def filter_options(readme):
    """Rewrite the "USAGE AND OPTIONS" section as an "OPTIONS" definition list.

    The section starts at the ``# USAGE AND OPTIONS`` heading and runs up to
    the next line starting with ``# ``, or to the end of the text when it is
    the last section. Inside it:

    * every ``*`` is escaped with a backslash;
    * a line made of four spaces, an option spec starting with ``-``, an
      optional metavar and an optional description (separated by two or more
      whitespace characters) becomes a definition-list entry, with the
      metavar wrapped in ``*``;
    * any other line is kept with its leading whitespace removed.

    Returns *readme* with the section replaced by the rewritten text.

    Raises:
        Exception: if the "USAGE AND OPTIONS" section cannot be found.
    """
    section_match = re.search(r'(?sm)^# USAGE AND OPTIONS\n.+?(?=^# |\Z)', readme)
    if section_match is None:
        # Fail with a clear message instead of an AttributeError on None.
        raise Exception('The section USAGE AND OPTIONS does not exist')
    section = section_match.group(0)

    # Compiled once, outside the per-line loop.
    option_line = re.compile(r'''(?x)
            \s{4}(?P<opt>-(?:,\s|[^\s])+)
            (?:\s(?P<meta>(?:[^\s]|\s(?!\s))+))?
            (\s{2,}(?P<desc>.+))?
        ''')

    parts = ['# OPTIONS\n']
    # [1:] drops the original heading line, which the new heading replaces.
    for line in section.replace('*', r'\*').split('\n')[1:]:
        mobj = option_line.fullmatch(line)
        if not mobj:
            parts.append(f'{line.lstrip()}\n')
            continue
        option, metavar, description = mobj.group('opt', 'meta', 'desc')

        # Pandoc's definition_lists. See http://pandoc.org/README.html
        if metavar:
            option = f'{option} *{metavar}*'
        description = f'{description}\n' if description else ''
        parts.append(f'\n{option}\n:   {description}')

    return readme.replace(section, ''.join(parts), 1)


# Single callable that main() applies to the README text, built from the four
# transformations defined above.
# NOTE(review): presumably compose_functions applies them in the listed order - confirm in devscripts.utils.
TRANSFORM = compose_functions(filter_excluded_sections, convert_code_blocks, move_sections, filter_options)


def main():
    """Generate the manpage source from README_FILE and write it out.

    The output is PREFIX followed by the README text passed through
    TRANSFORM; the destination is whatever get_filename_args() returns.
    """
    # Resolve the destination first, matching the original evaluation order.
    destination = get_filename_args()
    manpage_source = PREFIX + TRANSFORM(read_file(README_FILE))
    write_file(destination, manpage_source)


# Run the generator only when this file is executed as a script, not when imported.
if __name__ == '__main__':
    main()
[cleanup] Point all shebang to `python3` (#372) Authored by: fstirlitz 2021-06-03 09:43:42 +00:00			`#!/usr/bin/env python3`
[cleanup] Consistent style for file heads 2022-06-24 11:06:16 +00:00
[devscripts] Create `utils` and refactor 2022-08-08 19:38:47 +00:00			`# Allow direct execution`
			`import os`
			`import sys`

			`sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))`


add prepare_manpage 2014-05-13 12:21:21 +00:00			`import os.path`
			`import re`

[devscripts] Create `utils` and refactor 2022-08-08 19:38:47 +00:00			`from devscripts.utils import (`
			`compose_functions,`
			`get_filename_args,`
			`read_file,`
			`write_file,`
			`)`

add prepare_manpage 2014-05-13 12:21:21 +00:00			`ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))`
			`README_FILE = os.path.join(ROOT_DIR, 'README.md')`

Completely change project name to yt-dlp (#85) * All modules and binary names are changed * All documentation references changed * yt-dlp no longer loads youtube-dlc config files * All URLs changed to point to organization account Co-authored-by: Pccode66 Co-authored-by: pukkandan 2021-02-24 18:45:56 +00:00			`PREFIX = r'''%yt-dlp(1)`
[devscripts/prepare_manpage] Fix manpage generation on Windows 2016-05-29 03:06:10 +00:00
			`# NAME`

[docs] Update yt-dlp tagline (#9481) Authored by: seproDev, bashonly, coletdjnz, Grub4K, pukkandan 2024-03-19 17:14:04 +00:00			`yt\-dlp \- A feature\-rich command\-line audio/video downloader`
[devscripts/prepare_manpage] Fix manpage generation on Windows 2016-05-29 03:06:10 +00:00
			`# SYNOPSIS`

Completely change project name to yt-dlp (#85) * All modules and binary names are changed * All documentation references changed * yt-dlp no longer loads youtube-dlc config files * All URLs changed to point to organization account Co-authored-by: Pccode66 Co-authored-by: pukkandan 2021-02-24 18:45:56 +00:00			`yt-dlp \[OPTIONS\] URL [URL...]`
[devscripts/prepare_manpage] Fix manpage generation on Windows 2016-05-29 03:06:10 +00:00
[docs] Improve manpage format (#2003) Closes #1448 Authored by: iw0nderhow, pukkandan 2021-12-17 01:23:04 +00:00			`# DESCRIPTION`

[devscripts/prepare_manpage] Fix manpage generation on Windows 2016-05-29 03:06:10 +00:00			`'''`


[docs] Improve manpage format (#2003) Closes #1448 Authored by: iw0nderhow, pukkandan 2021-12-17 01:23:04 +00:00			`def filter_excluded_sections(readme):`
			`EXCLUDED_SECTION_BEGIN_STRING = re.escape('<!-- MANPAGE: BEGIN EXCLUDED SECTION -->')`
			`EXCLUDED_SECTION_END_STRING = re.escape('<!-- MANPAGE: END EXCLUDED SECTION -->')`
			`return re.sub(`
			`rf'(?s){EXCLUDED_SECTION_BEGIN_STRING}.+?{EXCLUDED_SECTION_END_STRING}\n',`
			`'', readme)`


[docs] Various manpage fixes Authored by: leoheitmannruiz 2024-04-08 19:18:04 +00:00			`def _convert_code_blocks(readme):`
			`current_code_block = None`

			`for line in readme.splitlines(True):`
			`if current_code_block:`
			`if line == current_code_block:`
			`current_code_block = None`
			`yield '\n'`
			`else:`
			`yield f' {line}'`
			elif line.startswith('```'):
			current_code_block = line.count('`') * '`' + '\n'
			`yield '\n'`
			`else:`
			`yield line`


			`def convert_code_blocks(readme):`
			`return ''.join(_convert_code_blocks(readme))`


[docs] Improve manpage format (#2003) Closes #1448 Authored by: iw0nderhow, pukkandan 2021-12-17 01:23:04 +00:00			`def move_sections(readme):`
			`MOVE_TAG_TEMPLATE = '<!-- MANPAGE: MOVE "%s" SECTION HERE -->'`
[docs] Fix bug in regex escape in python 3.6 Bug in ec2e44fc5752ca15fb7ce2e31994453226507f8b Closes #2060 2021-12-20 13:13:33 +00:00			`sections = re.findall(r'(?m)^%s$' % (`
			`re.escape(MOVE_TAG_TEMPLATE).replace(r'\%', '%') % '(.+)'), readme)`
[docs] Improve manpage format (#2003) Closes #1448 Authored by: iw0nderhow, pukkandan 2021-12-17 01:23:04 +00:00
			`for section_name in sections:`
			`move_tag = MOVE_TAG_TEMPLATE % section_name`
			`if readme.count(move_tag) > 1:`
			`raise Exception(f'There is more than one occurrence of "{move_tag}". This is unexpected')`

			`sections = re.findall(rf'(?sm)(^# {re.escape(section_name)}.+?)(?=^# )', readme)`
			`if len(sections) < 1:`
			`raise Exception(f'The section {section_name} does not exist')`
			`elif len(sections) > 1:`
			`raise Exception(f'There are multiple occurrences of section {section_name}, this is unhandled')`

			`readme = readme.replace(sections[0], '', 1).replace(move_tag, sections[0], 1)`
			`return readme`
[devscripts/prepare_manpage] Fix manpage generation on Windows 2016-05-29 03:06:10 +00:00
[doc] Better formatting of youtube-dl.1 (closes #6510) 2015-09-13 12:10:23 +00:00
			`def filter_options(readme):`
[docs] Improve manpage format (#2003) Closes #1448 Authored by: iw0nderhow, pukkandan 2021-12-17 01:23:04 +00:00			`section = re.search(r'(?sm)^# USAGE AND OPTIONS\n.+?(?=^# )', readme).group(0)`
[docs] Various manpage fixes Authored by: leoheitmannruiz 2024-04-08 19:18:04 +00:00			`section_new = section.replace('*', R'\*')`

[docs] Improve manpage format (#2003) Closes #1448 Authored by: iw0nderhow, pukkandan 2021-12-17 01:23:04 +00:00			`options = '# OPTIONS\n'`
[docs] Various manpage fixes Authored by: leoheitmannruiz 2024-04-08 19:18:04 +00:00			`for line in section_new.split('\n')[1:]:`
[cleanup, docs] Misc cleanup Closes #2828, closes #2734, closes #2802, closes #2937 2022-03-04 14:08:55 +00:00			`mobj = re.fullmatch(r'''(?x)`
			`\s{4}(?P<opt>-(?:,\s\|[^\s])+)`
			`(?:\s(?P<meta>(?:[^\s]\|\s(?!\s))+))?`
			`(\s{2,}(?P<desc>.+))?`
			`''', line)`
[devscripts] Improve `prepare_manpage` Closes #2873 2022-02-24 11:32:19 +00:00			`if not mobj:`
			`options += f'{line.lstrip()}\n'`
			`continue`
			`option, metavar, description = mobj.group('opt', 'meta', 'desc')`

			`# Pandoc's definition_lists. See http://pandoc.org/README.html`
			`option = f'{option} *{metavar}*' if metavar else option`
			`description = f'{description}\n' if description else ''`
			`options += f'\n{option}\n: {description}'`
			`continue`
[docs] Improve manpage format (#2003) Closes #1448 Authored by: iw0nderhow, pukkandan 2021-12-17 01:23:04 +00:00
			`return readme.replace(section, options, 1)`
[doc] Better formatting of youtube-dl.1 (closes #6510) 2015-09-13 12:10:23 +00:00
Update coding style after pycodestyle 2.1.0 In pycodestyle 2.1.0, E305 was introduced, which requires two blank lines after top level declarations, too. See https://github.com/PyCQA/pycodestyle/issues/400 See also #10689; thanks @stepshal for first mentioning this issue and initial patches 2016-11-17 11:42:56 +00:00
[docs] Various manpage fixes Authored by: leoheitmannruiz 2024-04-08 19:18:04 +00:00			`TRANSFORM = compose_functions(filter_excluded_sections, convert_code_blocks, move_sections, filter_options)`
[devscripts] Create `utils` and refactor 2022-08-08 19:38:47 +00:00

			`def main():`
			`write_file(get_filename_args(), PREFIX + TRANSFORM(read_file(README_FILE)))`


[devscripts/prepare_manpage] Fix manpage generation on Windows 2016-05-29 03:06:10 +00:00			`if __name__ == '__main__':`
			`main()`