{toc_full_title}

Documentation path: {file_path.replace(chr(92),'/').replace('.mdx', '').replace(repo_dir + '/' + docs_dir,'')}

Description: {data.get('description', 'No description')}

Related:

Title: {data.get('related', {}).get('title', 'Related')}

Related Description: {data.get('related', {}).get('description', 'No related description')}

Links:

{link}

{toc}

""" html_all_content = toc_html + html_all_pages_content html_all_pages_content = html_header + html_all_pages_content + "" toc_html = html_header + toc_html + "" html_all_content = html_header + html_all_content + "" return(html_all_content, toc_html, html_all_pages_content) def find_latest_version(html_content): version_pattern = re.compile(r"v(\d+\.\d+\.\d+)") versions = version_pattern.findall(html_content) unique_versions = sorted(set(versions), key=lambda v: version.parse(v), reverse=True) return unique_versions[0] if unique_versions else None def generate_pdf(html_content, output_pdf, format_options=None): """ Generate PDF from HTML content using Playwright """ default_format = { 'format': 'A4', 'margin': { 'top': '50px', 'right': '50px', 'bottom': '50px', 'left': '50px' }, 'print_background': True, 'display_header_footer': True, 'header_template': '

', 'footer_template': '

' } format_options = format_options or default_format with sync_playwright() as p: browser = p.chromium.launch() page = browser.new_page() # Set viewport size to ensure consistent rendering page.set_viewport_size({"width": 1280, "height": 1024}) # Set content and wait for network idle page.set_content(html_content, wait_until='networkidle') # Wait for any images and fonts to load page.wait_for_load_state('networkidle') page.wait_for_load_state('domcontentloaded') # Generate PDF page.pdf(path=output_pdf, **format_options) browser.close() if __name__ == "__main__": export_html = False repo_dir = "nextjs-docs" repo_url = "https://github.com/vercel/next.js.git" branch = "canary" docs_dir = "docs" Change_img_url = True base_path = "https://nextjs.org/_next/image?url=" path_args = "&w=1920&q=75" clone_repo(repo_url, branch, docs_dir, repo_dir) print("Converting the Documentation to HTML...") docs_dir_full_path = os.path.join(repo_dir, docs_dir) files_to_process = get_files_sorted(docs_dir_full_path) html_all_content, _, _ = process_files(files_to_process, repo_dir, docs_dir) print("Converted all MDX to HTML.") if export_html: with open('output.html', 'w', encoding='utf8') as f: f.write(html_all_content) print("HTML Content exported.") latest_version = find_latest_version(html_all_content) if latest_version: project_title = f"""Next.js Documentation v{latest_version}""" output_pdf = f"""Next.js_Docs_v{latest_version}_{datetime.now().strftime("%Y-%m-%d")}.pdf""" else: project_title = "Next.js Documentation" output_pdf = "Next.js_Documentation.pdf" cover_html = f"""

{project_title}

Date: {datetime.now().strftime("%Y-%m-%d")}

""" format_options = { 'format': 'A4', 'margin': { 'top': '50px', 'right': '50px', 'bottom': '50px', 'left': '50px' }, 'print_background': True, 'display_header_footer': True, 'header_template': f'''

{project_title} Page of

''', 'footer_template': f'''

Generated on {datetime.now().strftime("%Y-%m-%d")}

''' } # Check if file is open if is_file_open(output_pdf): print("The output file is already open in another process. Please close it and try again.") else: try: print("Generating PDF...") # Generate PDF with cover page and content generate_pdf(cover_html + html_all_content, output_pdf, format_options) print("Created the PDF file successfully.") except Exception as e: print(f"Error generating PDF: {str(e)}")

{toc_full_title}

Table of Contents