Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- """
- Created on 2024
- @Creator: Juan Bautista Gonzalez
- @Position: Electronic engineering student and part-time programmer
- @Contact:
- - Email: contacto@juangonzalez.com.ar
- """
- import os
- import requests
- from bs4 import BeautifulSoup
- from urllib.parse import urljoin
# Script: download every file linked from the 4th column of an HTML table.
#
# The table markup is pasted into ``html_content``; relative links are
# resolved against ``url``. Each file is saved in ``download_folder`` as
# "<row number>_<sequence>_<original basename>", where the row number comes
# from the 2nd column (zero-padded to 3 digits) and the sequence restarts at 1
# whenever the row number changes from the previous row.

# Placeholder: paste the HTML of the table to scrape here.
html_content = """AQUI DATA
"""

# Base URL used to resolve relative hrefs found in the table.
url = "https://www.fceia.unr.edu.ar/tesys/html/"

# Seconds to wait for the server before giving up on one download. Without a
# timeout a single stalled connection would block the whole script forever.
REQUEST_TIMEOUT = 30

soup = BeautifulSoup(html_content, "html.parser")

download_folder = "descargas"
os.makedirs(download_folder, exist_ok=True)

file_number = 1
previous_number = None

for row in soup.find_all("tr"):
    columns = row.find_all("td")
    # Rows with fewer than 4 cells (headers, separators) carry no links.
    if len(columns) < 4:
        continue

    number = columns[1].text.strip().zfill(3)
    # Restart the per-row sequence when a new row number begins.
    if number != previous_number:
        file_number = 1

    for link in columns[3].find_all("a"):
        href = link.get("href")
        if not href:
            continue

        file_url = urljoin(url, href)
        file_name = os.path.join(
            download_folder,
            f"{number}_{file_number:03d}_{os.path.basename(href)}",
        )

        try:
            response = requests.get(file_url, timeout=REQUEST_TIMEOUT)
            # Treat 4xx/5xx as failures so an HTML error page is never saved
            # to disk under the name of the expected file.
            response.raise_for_status()
            with open(file_name, "wb") as file:
                file.write(response.content)
        except (requests.RequestException, OSError) as e:
            # Best effort: report the failure and carry on with the next link.
            print(f"Error al descargar {file_url}: {e}")
        else:
            print(f"Archivo descargado: {file_name}")

        # NOTE(review): the original indentation was lost in the paste; the
        # counter is assumed to advance once per link with an href, whether or
        # not the download succeeded - confirm against the author's intent.
        file_number += 1

    previous_number = number
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement