#!/usr/bin/env python import argparse import sys from markdownify import markdownify, ATX, ATX_CLOSED, UNDERLINED, \ SPACES, BACKSLASH, ASTERISK, UNDERSCORE def main(argv=sys.argv[1:]): parser = argparse.ArgumentParser( prog='markdownify', description='Converts html to markdown.', ) parser.add_argument('html', nargs='?', type=argparse.FileType('r'), default=sys.stdin, help="The html file to convert. Defaults to STDIN if not " "provided.") parser.add_argument('-s', '--strip', nargs='*', help="A list of tags to strip. This option can't be used with " "the --convert option.") parser.add_argument('-c', '--convert', nargs='*', help="A list of tags to convert. This option can't be used with " "the --strip option.") parser.add_argument('-a', '--autolinks', action='store_true', help="A boolean indicating whether the 'automatic link' style " "should be used when a 'a' tag's contents match its href.") parser.add_argument('--default-title', action='store_false', help="A boolean to enable setting the title of a link to its " "href, if no title is given.") parser.add_argument('--heading-style', default=UNDERLINED, choices=(ATX, ATX_CLOSED, UNDERLINED), help="Defines how headings should be converted.") parser.add_argument('-b', '--bullets', default='*+-', help="A string of bullet styles to use; the bullet will " "alternate based on nesting level.") parser.add_argument('--strong-em-symbol', default=ASTERISK, choices=(ASTERISK, UNDERSCORE), help="Use * or _ to convert strong and italics text"), parser.add_argument('--sub-symbol', default='', help="Define the chars that surround ''.") parser.add_argument('--sup-symbol', default='', help="Define the chars that surround ''.") parser.add_argument('--newline-style', default=SPACES, choices=(SPACES, BACKSLASH), help="Defines the style of
conversions: two spaces " "or backslash at the and of the line thet should break.") parser.add_argument('--code-language', default='', help="Defines the language that should be assumed for all " "'
' sections.")
    parser.add_argument('--no-escape-asterisks', dest='escape_asterisks',
                        action='store_false',
                        help="Do not escape '*' to '\\*' in text.")
    parser.add_argument('--no-escape-underscores', dest='escape_underscores',
                        action='store_false',
                        help="Do not escape '_' to '\\_' in text.")
    parser.add_argument('-i', '--keep-inline-images-in',
                        default=[],
                        nargs='*',
                        help="Images are converted to their alt-text when the images are "
                        "located inside headlines or table cells. If some inline images "
                        "should be converted to markdown images instead, this option can "
                        "be set to a list of parent tags that should be allowed to "
                        "contain inline images.")
    parser.add_argument('--table-infer-header', dest='table_infer_header',
                        action='store_true',
                        help="When a table has no header row (as indicated by '' "
                        "or ''), use the first body row as the header row.")
    parser.add_argument('-w', '--wrap', action='store_true',
                        help="Wrap all text paragraphs at --wrap-width characters.")
    parser.add_argument('--wrap-width', type=int, default=80)
    parser.add_argument('--bs4-options',
                        default='html.parser',
                        help="Specifies the parser that BeautifulSoup should use to parse "
                             "the HTML markup. Examples include 'html5.parser', 'lxml', and "
                             "'html5lib'.")

    args = parser.parse_args(argv)
    print(markdownify(**vars(args)))


if __name__ == '__main__':
    main()