{
    "content": [
        {
            "type": "text",
            "text": "# pdftohtml (man)\n\n## NAME\n\npdftohtml - program to convert PDF files into HTML, XML and PNG images\n\n## SYNOPSIS\n\npdftohtml [options] <PDF-file> [<HTML-file> <XML-file>]\n\n## DESCRIPTION\n\nThis  manual  page documents briefly the pdftohtml command.  This manual page was written for\nthe Debian GNU/Linux distribution because the original program does not have a manual page.\n\n## TLDR\n\n> Convert PDF files into HTML, XML, and PNG images.\n\n- Convert a PDF file to an HTML file:\n  `pdftohtml {{path/to/file.pdf}} {{path/to/output_file.html}}`\n- Ignore images in the PDF file:\n  `pdftohtml -i {{path/to/file.pdf}} {{path/to/output_file.html}}`\n- Generate a single HTML file that includes all PDF pages:\n  `pdftohtml -s {{path/to/file.pdf}} {{path/to/output_file.html}}`\n- Convert a PDF file to an XML file:\n  `pdftohtml -xml {{path/to/file.pdf}} {{path/to/output_file.xml}}`\n\n*Source: tldr-pages*\n\n## Sections\n\n- **NAME**\n- **SYNOPSIS**\n- **DESCRIPTION**\n- **OPTIONS** (24 subsections)\n- **AUTHOR**\n- **SEE ALSO**\n\nUse structuredContent.sections for detailed options, examples, and full documentation.\n"
        }
    ],
    "structuredContent": {
        "command": "pdftohtml",
        "section": "",
        "mode": "man",
        "summary": "pdftohtml - program to convert PDF files into HTML, XML and PNG images",
        "synopsis": "pdftohtml [options] <PDF-file> [<HTML-file> <XML-file>]",
        "tldr_summary": "Convert PDF files into HTML, XML, and PNG images.",
        "tldr_examples": [
            {
                "description": "Convert a PDF file to an HTML file",
                "command": "pdftohtml {{path/to/file.pdf}} {{path/to/output_file.html}}"
            },
            {
                "description": "Ignore images in the PDF file",
                "command": "pdftohtml -i {{path/to/file.pdf}} {{path/to/output_file.html}}"
            },
            {
                "description": "Generate a single HTML file that includes all PDF pages",
                "command": "pdftohtml -s {{path/to/file.pdf}} {{path/to/output_file.html}}"
            },
            {
                "description": "Convert a PDF file to an XML file",
                "command": "pdftohtml -xml {{path/to/file.pdf}} {{path/to/output_file.xml}}"
            }
        ],
        "tldr_source": "official",
        "flags": [
            {
                "flag": "-h",
                "long": null,
                "arg": null,
                "description": "Show summary of options."
            },
            {
                "flag": "-f",
                "long": null,
                "arg": "<int>",
                "description": "first page to print"
            },
            {
                "flag": "-l",
                "long": null,
                "arg": "<int>",
                "description": "last page to print"
            },
            {
                "flag": "-q",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "-v",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "-p",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "-c",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "-s",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "use data URLs instead of external images in HTML. No available in all platforms"
            },
            {
                "flag": "-i",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "generate no frames. Not supported in complex output mode."
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "use standard output"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "zoom the PDF document (default 1.5) (1 means 72 DPI)"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "do not round coordinates (with XML output only)"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "output text encoding name"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "owner password (for encrypted files)"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "user password (for encrypted files)"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "force hidden text extraction"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "not specified, -fmt png will be assumed"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "do not merge paragraphs"
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": ""
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "adjust the word break threshold percent. Default is 10. Word break occurs when dis‐ tance between two adjacent characters is greater than this percent of character height."
            },
            {
                "flag": "",
                "long": null,
                "arg": null,
                "description": "outputs the font name without any substitutions."
            }
        ],
        "examples": [],
        "see_also": [
            {
                "name": "pdfdetach",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdfdetach/1/json"
            },
            {
                "name": "pdffonts",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdffonts/1/json"
            },
            {
                "name": "pdfimages",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdfimages/1/json"
            },
            {
                "name": "pdfinfo",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdfinfo/1/json"
            },
            {
                "name": "pdftocairo",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdftocairo/1/json"
            },
            {
                "name": "pdftoppm",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdftoppm/1/json"
            },
            {
                "name": "pdftops",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdftops/1/json"
            },
            {
                "name": "pdftotext",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdftotext/1/json"
            },
            {
                "name": "pdfseparate",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdfseparate/1/json"
            },
            {
                "name": "pdfsig",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdfsig/1/json"
            },
            {
                "name": "pdfunite",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/pdfunite/1/json"
            },
            {
                "name": "PDFTOHTML",
                "section": "1",
                "url": "https://www.chedong.com/phpMan.php/man/PDFTOHTML/1/json"
            }
        ],
        "section_outline": [
            {
                "name": "NAME",
                "lines": 2,
                "subsections": []
            },
            {
                "name": "SYNOPSIS",
                "lines": 2,
                "subsections": []
            },
            {
                "name": "DESCRIPTION",
                "lines": 6,
                "subsections": []
            },
            {
                "name": "OPTIONS",
                "lines": 2,
                "subsections": [
                    {
                        "name": "-h, -help",
                        "lines": 2,
                        "flag": "-h"
                    },
                    {
                        "name": "-f <int>",
                        "lines": 2,
                        "flag": "-f",
                        "arg": "<int>"
                    },
                    {
                        "name": "-l <int>",
                        "lines": 2,
                        "flag": "-l",
                        "arg": "<int>"
                    },
                    {
                        "name": "-q",
                        "lines": 1,
                        "flag": "-q"
                    },
                    {
                        "name": "-v",
                        "lines": 1,
                        "flag": "-v"
                    },
                    {
                        "name": "-p",
                        "lines": 1,
                        "flag": "-p"
                    },
                    {
                        "name": "-c",
                        "lines": 1,
                        "flag": "-c"
                    },
                    {
                        "name": "-s",
                        "lines": 1,
                        "flag": "-s"
                    },
                    {
                        "name": "-dataurls",
                        "lines": 2
                    },
                    {
                        "name": "-i",
                        "lines": 1,
                        "flag": "-i"
                    },
                    {
                        "name": "-noframes",
                        "lines": 2
                    },
                    {
                        "name": "-stdout",
                        "lines": 2
                    },
                    {
                        "name": "-zoom <fp>",
                        "lines": 2
                    },
                    {
                        "name": "-xml",
                        "lines": 1
                    },
                    {
                        "name": "-noroundcoord",
                        "lines": 2
                    },
                    {
                        "name": "-enc <string>",
                        "lines": 2
                    },
                    {
                        "name": "-opw <string>",
                        "lines": 2
                    },
                    {
                        "name": "-upw <string>",
                        "lines": 2
                    },
                    {
                        "name": "-hidden",
                        "lines": 2
                    },
                    {
                        "name": "-fmt",
                        "lines": 2
                    },
                    {
                        "name": "-nomerge",
                        "lines": 2
                    },
                    {
                        "name": "-nodrm",
                        "lines": 1
                    },
                    {
                        "name": "-wbt <fp>",
                        "lines": 4
                    },
                    {
                        "name": "-fontfullname",
                        "lines": 3
                    }
                ]
            },
            {
                "name": "AUTHOR",
                "lines": 6,
                "subsections": []
            },
            {
                "name": "SEE ALSO",
                "lines": 6,
                "subsections": []
            }
        ],
        "sections": {
            "NAME": {
                "content": "pdftohtml - program to convert PDF files into HTML, XML and PNG images\n",
                "subsections": []
            },
            "SYNOPSIS": {
                "content": "pdftohtml [options] <PDF-file> [<HTML-file> <XML-file>]\n",
                "subsections": []
            },
            "DESCRIPTION": {
                "content": "This  manual  page documents briefly the pdftohtml command.  This manual page was written for\nthe Debian GNU/Linux distribution because the original program does not have a manual page.\n\npdftohtml is a program that converts PDF documents into HTML. It generates its output in  the\ncurrent working directory.  If PDF-file is ´-', it reads the PDF file from stdin.\n",
                "subsections": []
            },
            "OPTIONS": {
                "content": "A summary of options are included below.\n",
                "subsections": [
                    {
                        "name": "-h, -help",
                        "content": "Show summary of options.\n",
                        "flag": "-h"
                    },
                    {
                        "name": "-f <int>",
                        "content": "first page to print\n",
                        "flag": "-f",
                        "arg": "<int>"
                    },
                    {
                        "name": "-l <int>",
                        "content": "last page to print\n",
                        "flag": "-l",
                        "arg": "<int>"
                    },
                    {
                        "name": "-q",
                        "content": "",
                        "flag": "-q"
                    },
                    {
                        "name": "-v",
                        "content": "",
                        "flag": "-v"
                    },
                    {
                        "name": "-p",
                        "content": "",
                        "flag": "-p"
                    },
                    {
                        "name": "-c",
                        "content": "",
                        "flag": "-c"
                    },
                    {
                        "name": "-s",
                        "content": "",
                        "flag": "-s"
                    },
                    {
                        "name": "-dataurls",
                        "content": "use data URLs instead of external images in HTML. No available in all platforms\n"
                    },
                    {
                        "name": "-i",
                        "content": "",
                        "flag": "-i"
                    },
                    {
                        "name": "-noframes",
                        "content": "generate no frames. Not supported in complex output mode.\n"
                    },
                    {
                        "name": "-stdout",
                        "content": "use standard output\n"
                    },
                    {
                        "name": "-zoom <fp>",
                        "content": "zoom the PDF document (default 1.5) (1 means 72 DPI)\n"
                    },
                    {
                        "name": "-xml",
                        "content": ""
                    },
                    {
                        "name": "-noroundcoord",
                        "content": "do not round coordinates (with XML output only)\n"
                    },
                    {
                        "name": "-enc <string>",
                        "content": "output text encoding name\n"
                    },
                    {
                        "name": "-opw <string>",
                        "content": "owner password (for encrypted files)\n"
                    },
                    {
                        "name": "-upw <string>",
                        "content": "user password (for encrypted files)\n"
                    },
                    {
                        "name": "-hidden",
                        "content": "force hidden text extraction\n"
                    },
                    {
                        "name": "-fmt",
                        "content": "not specified, -fmt png will be assumed\n"
                    },
                    {
                        "name": "-nomerge",
                        "content": "do not merge paragraphs\n"
                    },
                    {
                        "name": "-nodrm",
                        "content": ""
                    },
                    {
                        "name": "-wbt <fp>",
                        "content": "adjust the word break threshold percent. Default is 10.  Word break occurs  when  dis‐\ntance  between  two  adjacent  characters  is  greater  than this percent of character\nheight.\n"
                    },
                    {
                        "name": "-fontfullname",
                        "content": "outputs the font name without any substitutions.\n\n"
                    }
                ]
            },
            "AUTHOR": {
                "content": "Pdftohtml was developed by Gueorgui Ovtcharov and Rainer Dorsch. It is based and  benefits  a\nlot from Derek Noonburg's xpdf package.\n\nThis  manual  page  was  written  by  Søren  Boll Overgaard <boll@debian.org>, for the Debian\nGNU/Linux system (but may be used by others).\n",
                "subsections": []
            },
            "SEE ALSO": {
                "content": "pdfdetach(1), pdffonts(1), pdfimages(1), pdfinfo(1), pdftocairo(1), pdftoppm(1),  pdftops(1),\npdftotext(1) pdfseparate(1), pdfsig(1), pdfunite(1)\n\n\n\nPDFTOHTML(1)",
                "subsections": []
            }
        }
    }
}