Advertisement
juanchixd

Untitled

Apr 19th, 2024 (edited)
689
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.41 KB | Source Code | 0 0
  1. """
  2. Created on 2024
  3. @Creator: Juan Bautista Gonzalez
  4. @Position: Student electronic engineering and programmer part-time
  5. @Contact:
  6.    - Email: contacto@juangonzalez.com.ar
  7. """
  8. import os
  9. import requests
  10. from bs4 import BeautifulSoup
  11. from urllib.parse import urljoin
  12.  
  13. html_content= """AQUI DATA
  14. """
  15.  
  16. url = "https://www.fceia.unr.edu.ar/tesys/html/"
  17. soup = BeautifulSoup(html_content, "html.parser")
  18.  
  19. download_folder = "descargas"
  20. os.makedirs(download_folder, exist_ok=True)
  21. file_number = 1
  22. previous_number = None
  23.  
  24. for row in soup.find_all("tr"):
  25.     columns = row.find_all("td")
  26.     if len(columns) >= 4:
  27.         number = columns[1].text.strip().zfill(3)
  28.         if number != previous_number:
  29.             file_number = 1
  30.         for link in columns[3].find_all("a"):
  31.             href = link.get("href")
  32.             if href:
  33.                 file_url = urljoin(url, href)
  34.                 file_name = os.path.join(download_folder, f"{number}_{file_number:03d}_{os.path.basename(href)}")
  35.                 try:
  36.                     response = requests.get(file_url)
  37.                     with open(file_name, "wb") as file:
  38.                         file.write(response.content)
  39.                     print(f"Archivo descargado: {file_name}")
  40.                 except Exception as e:
  41.                     print(f"Error al descargar {file_url}: {e}")
  42.             file_number += 1
  43.         previous_number = number
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement