1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30
import requests
from bs4 import BeautifulSoup
from csv import writer

# C2RP search - funder: Regional Council (Conseil Régional Hauts-de-France) /
# level: all except 1 / characteristics: certifying training courses.
url = "https://formations-en-hauts-de-france.c2rp.fr/recherche/resultats?size=20&type=FC&radius=100&financeurs=Conseil+R%C3%A9gional+Hauts-de-France%7CConseil%20R%C3%A9gional%20Hauts-de-France&niveaux=2%7C3%7C4%7C5%7C6%7C7%7C8%7C9%7C0&caracteristiques=FL_FOR_CER&query=&codePostal="

# Bound the wait so an unresponsive server cannot hang the script forever,
# and fail loudly on an HTTP error instead of parsing an error page.
page = requests.get(url, timeout=30)
page.raise_for_status()

#links_with_text = []
soup = BeautifulSoup(page.content, 'html.parser')

# Every <article class="Formation"> element found on the page
# (presumably one per search result - confirm against the site's markup).
listes = soup.find_all('article', class_="Formation")

# Disabled CSV export scaffolding, kept for later use:
#with open('housing.csv', 'w', encoding='utf8', newline='') as f:
#    thewriter = writer(f)
#    header = ['Intitule', 'OF', 'Session', 'Prochaine Session', 'Ville', 'Duree']

for liste in listes:
    # Disabled field extraction, kept for later use:
    # intitule = liste.find('a', href=True).text.replace('\n', '')
    # of = liste.find('div', class_='Formation-organism').text.replace('\n', '')
    # session = liste.find('div', class_='Formation-sessions').text.replace('\n', '')

    # find() returns None when the article has no such <div>, so the printed
    # list holds either the matching Tag or None.
    prochaine_session = liste.find('div', class_='Formation-nextsession')

    # ville = liste.find('div', class_="Formation-details")
    # duree = liste.find('div', class_="Formation-details")
    info = [prochaine_session]
    print(info)
Partager