mezhgano · May 1, 2023 14:58 · lzy37ld · May 13, 2024
diff --git a/playwright_save_mhtml.py b/playwright_save_mhtml.py
 from playwright.sync_api import sync_playwright


 def save_mhtml(path: str, text: str):
    with open(path, mode='w', encoding='UTF-8', newline='\n') as file:
        file.write(text)

 def save_page(url: str, path: str):
    with sync_playwright() as playwright:
        browser = playwright.chromium.launch(headless=False)
        page = browser.new_page()
        page.goto(url)

        client = page.context.new_cdp_session(page)
        mhtml = client.send("Page.captureSnapshot")['data']
        save_mhtml(path, mhtml)
        browser.close()

 if __name__ == '__main__':
    save_page('https://example.com/', 'example.mhtml')
	from playwright.sync_api import sync_playwright


	def save_mhtml(path: str, text: str):
	with open(path, mode='w', encoding='UTF-8', newline='\n') as file:
	file.write(text)

	def save_page(url: str, path: str):
	with sync_playwright() as playwright:
	browser = playwright.chromium.launch(headless=False)
	page = browser.new_page()
	page.goto(url)

	client = page.context.new_cdp_session(page)
	mhtml = client.send("Page.captureSnapshot")['data']
	save_mhtml(path, mhtml)
	browser.close()

	if __name__ == '__main__':
	save_page('https://example.com/', 'example.mhtml')