import requests
from bs4 import BeautifulSoup
import pandas as pd
# Scheme and host of the site being scraped; site-relative paths are
# concatenated onto this value to form absolute URLs.
URL_BASE = 'https://www.mbi.com.br'
def open_url(url, timeout=30):
    """Issue an HTTP GET for a site-relative path.

    Args:
        url: Path that is appended verbatim to ``URL_BASE`` to form the
            request URL.
        timeout: Value forwarded to ``requests.get`` as ``timeout`` (seconds).
            Without a timeout, requests waits indefinitely on a stalled
            server, so a finite default is used.

    Returns:
        The response object returned by ``requests.get``. The HTTP status
        is not checked here; callers decide how to treat error responses.
    """
    return requests.get(f'{URL_BASE}{url}', timeout=timeout)
def soup_code(html):
    """Extract the index entries from a page's HTML.

    Args:
        html: Markup to parse, handed to BeautifulSoup with the
            ``html.parser`` backend.

    Returns:
        The result of ``find_all`` for ``div`` tags matching the CSS class
        ``simbolopedia-index-element``.
    """
    parsed = BeautifulSoup(html, 'html.parser')
    entry_filter = {'class': 'simbolopedia-index-element'}
    return parsed.find_all('div', attrs=entry_filter)
def get_links(limit=3):
    """Scrape the municipality index page and describe each listed city.

    Args:
        limit: Upper slice bound applied to the list of index entries, so
            only the first ``limit`` entries are processed. Defaults to 3,
            the value that used to be hard-coded; pass ``None`` to process
            every entry on the page.

    Returns:
        A list of dicts, one per processed entry, with the keys:
        ``name`` (the ``.string`` of the entry's ``h3``), ``img`` (the
        ``src`` of the entry's ``img``), ``brasao`` (that same ``src`` with
        ``-bandeira-mini-`` replaced by ``-brasao-simb-``) and ``city_url``
        (the ``href`` of the entry's ``a``). The image and link values are
        returned as found in the page; callers prefix ``URL_BASE``.
    """
    index_path = '/mbi/biblioteca/simbolopedia/municipios-estado-sao-paulo-br/'
    response = open_url(index_path)
    entries = soup_code(response.text)[:limit]

    links = []
    for city in entries:
        name = city.h3.string
        # Read the thumbnail path once; it is used both as-is and as the
        # basis for the derived "brasao" path.
        flag_src = city.img['src']
        links.append({
            "name": name,
            # NOTE(review): assumes the site stores the coat-of-arms image
            # under the same file name with only this marker swapped.
            "brasao": flag_src.replace("-bandeira-mini-", "-brasao-simb-"),
            "img": flag_src,
            "city_url": city.a['href'],
        })
    return links
# Print one line per scraped city: its name, then the absolute URLs of its
# flag image and of its derived "brasao" image.
for city in get_links():
    city_name = city['name']
    flag_url = URL_BASE + city['img']
    crest_url = URL_BASE + city['brasao']
    print(f"Nome: {city_name} -- Bandeira: {flag_url} -- Brasao: {crest_url}")