from bs4 import BeautifulSoup from urllib.parse import urljoin import requests import os import re from pathlib import Path