import re
from bs4 import BeautifulSoup
def parse_platforms(data):
    """Extract download links for Windows/Android platforms from HTML markup.

    The markup is parsed with BeautifulSoup's ``html.parser``. Every
    ``<span>`` whose ``style`` attribute is ``"font-size: 18px"`` is
    inspected: the text of its first ``<b>`` or ``<strong>`` descendant is
    taken as the platform label. Spans without such a descendant, or whose
    label does not contain ``win`` or ``android`` (case-insensitive
    substring match), are skipped.

    For each remaining span, every ``<a>`` found with the
    ``class_='link link--external'`` filter contributes one entry.

    Args:
        data: HTML markup to parse.

    Returns:
        A list of strings formatted as ``"{platform} ({url}) {host}"``, in
        document order, where ``url`` is the anchor's ``href`` and ``host``
        is the anchor's stripped text. Empty if nothing matches.
    """
    soup = BeautifulSoup(data, 'html.parser')
    results = []
    for span in soup.find_all('span', style="font-size: 18px"):
        platform_element = span.find(['b', 'strong'])
        if platform_element is None:
            continue
        platform = platform_element.text.strip()
        # Keep only platforms whose label contains 'win' or 'android'
        # (case-insensitive).
        if not re.search(r'win|android', platform, re.IGNORECASE):
            continue
        for link in span.find_all('a', class_='link link--external'):
            # An anchor without an href has no URL to report; skip it rather
            # than letting link['href'] raise KeyError and abort the parse.
            url = link.get('href')
            if url is None:
                continue
            host = link.text.strip()
            results.append(f"{platform} ({url}) {host}")
    return results
# Example usage
data = """[Win/Linux: GOFILE - MEGA - MIXDROP - PIXELDRAIN - UPLOADHAVEN
Mac , : GOFILE - MEGA - MIXDROP - UPLOADHAVEN
Android , : GOFILE - MEGA - MIXDROP - UPLOADHAVEN
Other: CMPRESSED*, "Bridg