{toc_full_title}

Documentation path: {file_path.replace(chr(92),'/').replace('.mdx', '').replace(repo_dir + '/' + docs_dir,'')}

Description: {data.get('description', 'No description')}

Related:

Title: {data.get('related', {}).get('title', 'Related')}

Related Description: {data.get('related', {}).get('description', 'No related description')}

Links:

{link}

{toc}

""" html_all_content = toc_html + html_all_pages_content # Finalize html formatting html_all_pages_content = html_header + html_all_pages_content + "" toc_html = html_header + toc_html + "" html_all_content = html_header + html_all_content + "" return(html_all_content, toc_html, html_all_pages_content) def find_latest_version(html_content): # Regular expression to find versions like v14.2.0 version_pattern = re.compile(r"v(\d+\.\d+\.\d+)") versions = version_pattern.findall(html_content) # Remove duplicates and sort versions unique_versions = sorted(set(versions), key=lambda v: version.parse(v), reverse=True) return unique_versions[0] if unique_versions else None if __name__ == "__main__": # Define the output PDF file name # project_title = "Next.js v14 Documentation" # output_pdf = "Next.js_v14_Documentation.pdf" export_html = False # Clone the repository and checkout the canary branch repo_dir = "nextjs-docs" repo_url = "https://github.com/vercel/next.js.git" branch = "canary" docs_dir = "docs" # Define a base path and quality for the image URLs Change_img_url = True base_path = "https://nextjs.org/_next/image?url=" path_args = "&w=1920&q=75" # Clone the repository clone_repo(repo_url, branch, docs_dir, repo_dir) # Traverse the docs directory and convert each markdown file to HTML print ("Converting the Documentation to HTML...") docs_dir_full_path = os.path.join(repo_dir, docs_dir) files_to_process = get_files_sorted(docs_dir_full_path) html_all_content, _, _ = process_files(files_to_process, repo_dir, docs_dir) print("Converted all MDX to HTML.") # Save the HTML content to a file for inspection if export_html: with open('output.html', 'w', encoding='utf8') as f: f.write(html_all_content) print("HTML Content exported.") # Find the latest version in the HTML content latest_version = find_latest_version(html_all_content) if latest_version: project_title = f"""Next.js Documentation v{latest_version}""" output_pdf = f"""Next.js_Docs_v{latest_version}_{datetime.now().strftime("%Y-%m-%d")}.pdf""" else: project_title = "Next.js Documentation" output_pdf = "Next.js_Documentation.pdf" # Define the cover HTML with local CSS file cover_html = f"""

{project_title}

Date: {datetime.now().strftime("%Y-%m-%d")}

""" # Write the cover HTML to a temporary file with tempfile.NamedTemporaryFile(delete=False, suffix='.html') as cover_file: cover_file.write(cover_html.encode('utf-8')) print("HTML Cover exported.") # Convert the combined HTML content to PDF with a cover and a table of contents if is_file_open(output_pdf): print("The output file is already open in another process. Please close it and try again.") else: options = { 'encoding': 'UTF-8', 'page-size': 'A4', 'quiet': '', 'image-dpi': 150, # General reco.: printer - hq, 300 dpi| ebook - low quality, 150 dpi| screen-view-only quality, 72 dpi 'image-quality': 75, # 'no-outline': None, # 'no-images': None, } pdfkit.from_string(html_all_content, output_pdf, options=options, cover=cover_file.name, toc={}) print("Created the PDF file successfully.") # Delete the temporary file os.unlink(cover_file.name)

{toc_full_title}

Table of Contents