Path: blob/main/modules/official_documents/dirigeants_bfmtv.py
235 views
from urllib.parse import urljoin

import bs4
import requests
from bs4 import BeautifulSoup

# Failures that mean "no usable result": network/URL errors, a missing HTML
# element (AttributeError on None), or markup that does not split as expected.
_LOOKUP_ERRORS = (
    requests.RequestException,
    AttributeError,
    IndexError,
    KeyError,
    TypeError,
    ValueError,
)


def bfmtv_search(name, pren, timeout=10):
    """Look up a company officer on verif.com and return their first match.

    Fetches the officer search page for ``name``/``pren``, reads the first
    result row, follows the link found in that row's ``verif_col4`` cell and
    scrapes the linked company page.

    Args:
        name: First value substituted into the search URL.
        pren: Second value substituted into the search URL.
        timeout: Seconds to wait for each HTTP request before giving up.

    Returns:
        A dict with the keys ``Capital``, ``Desc``, ``addr``, ``company``,
        ``link``, ``full_name``, ``naissance``, ``mandats`` and ``fonction``,
        or ``None`` when a request fails or an expected element is missing.
    """
    # NOTE(review): the digits after each "{}" placeholder look like they may
    # be extraction residue rather than part of the real URL - confirm against
    # the upstream file. Kept exactly as found.
    search_url = "https://www.verif.com/dirigeants/recherche/q/{}6+{}5".format(name, pren)

    try:
        response = requests.get(search_url, timeout=timeout)
        soup = BeautifulSoup(response.content, "html.parser")

        role_cell = soup.find('td', {'class': 'verif_col4'})
        full_name = (
            soup.find('a', {'class': 'nom'}).text
            + " "
            + soup.find('td', {'class': 'verif_col2'}).text
        )
        naissance = soup.find('td', {'class': 'verif_col3'}).text.replace('Né le ', '')
        mandats = soup.find('td', {'class': 'verif_col5'}).text
        fonction = role_cell.text

        # Read the href attribute directly instead of string-splitting the
        # rendered HTML, so entities such as "&amp;" are decoded properly.
        anchor = role_cell.find(href=True)
        if anchor is None:
            return None
        # Resolve site-relative links; an absolute href is returned unchanged.
        link = urljoin(response.url, anchor['href'])

        response = requests.get(link, timeout=timeout)
        soup = BeautifulSoup(response.content, "html.parser")

        desc = soup.find('p', {'class': 'mid hidden-smallDevice'}).text.strip()
        capital = soup.find('span', {'class': 'number'}).text.strip()
        entreprise = soup.find('h3', {'class': 'subtitle'}).text.strip()

        # The address anchor holds two parts separated by <br/>; slice them
        # out of the raw markup.
        address_html = str(
            soup.find('a', {'class': 'visible-smallDevice link'})
        ).split('"_blank">')[1]
        address_parts = address_html.split("<br/>")
        adresse = address_parts[0]
        cp = address_parts[1].split("</a>")[0]

        return {
            "Capital": capital,
            "Desc": desc,
            # NOTE(review): the two address parts are joined without a
            # separator, as in the original output format.
            "addr": adresse + cp,
            'company': entreprise,
            'link': link,
            'full_name': full_name,
            'naissance': naissance,
            'mandats': mandats,
            'fonction': fonction,
        }
    except _LOOKUP_ERRORS:
        # Best-effort lookup: any scrape failure yields "no result", while
        # KeyboardInterrupt/SystemExit still propagate.
        return None