Help using Python and Selenium

Hello,

I’m new to Python and Selenium, but I can’t extract company emails stored in a file via a French site which is: mappy + com

I would like the “On va ou ?” is automatically populated with names and addresses stored in a “Test extraction-mail-mappy.txt” file, examples:

SANI-CHAUFF 247 rue Félix Faure 76320 Caudebec les Elbeuf
Dyneff SA 27 avenue Léonard de Vinci 33600 Pessac
Cotib 11 avenue Vieux Moulins 74000 Annecy

When we validate or click OK, then the email is in the source code, but I cannot get there.
this with variable proxies that I have and also the random User-Agent on each search.
Examples of proxies:
IP Address
209.121.164.50
8.219.97.248

But I can’t do it, because the field is not populated with the attached code?
Can you help me ?
Here is my code:

from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.chrome.service import Service as ChromeService
from selenium.webdriver.chrome.options import Options as ChromeOptions
from webdriver_manager.chrome import ChromeDriverManager
from bs4 import BeautifulSoup
import random
import time
import re
import logging

# Configurer le logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

# Chemins des fichiers
url_file_path = 'D:/Test extraction-mail-mappy.txt'
output_file_path = 'D:/RecupMail.txt'

# User-Agent pour différents navigateurs
user_agents = [
     "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/126.0.0.0 Safari/537.36"
     "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:127.0) Gecko/20100101 Firefox/127.0"
     "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36 Edg/91.0.864.59",
     "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36",
     "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:89.0) Gecko/20100101 Firefox/89.0"
]

# Lecture des URL à scraper à partir du fichier
with open(url_file_path) as f:
    locations = f.read().splitlines()

# Initialisation du fichier de sortie
with open(output_file_path, 'w') as f:
    f.write("Location,Email\n")

# Fonction pour initialiser le driver avec un User-Agent aléatoire
def init_driver():
    user_agent = random.choice(user_agents)
    
    options = ChromeOptions()
    options.add_argument(f"user-agent={user_agent}")
    options.add_argument('--ignore-certificate-errors')
    options.add_argument('--ignore-ssl-errors')
    options.add_argument('--disable-web-security')
    
    logging.info(f"Initialising Chrome driver with User-Agent: {user_agent}")
    
    # Utiliser webdriver_manager pour installer et gérer chromedriver automatiquement
    service = ChromeService(ChromeDriverManager().install())
    driver = webdriver.Chrome(service=service, options=options)
    
    return driver

# Fonction pour extraire les emails de la page
def extract_emails(page_source):
    logging.info("Extracting emails from the page source")
    soup = BeautifulSoup(page_source, 'html.parser')
    emails = set(re.findall(r'"email":\s*"([a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,})"', soup.text))
    logging.info(f"Found emails: {emails}")
    return emails

# Boucle sur toutes les URL et extraction des emails
for location in locations:
    logging.info(f"Processing location: {location}")
    driver = init_driver()
    try:
        driver.get("flink of Mappy in France")
        time.sleep(4)  # Augmenter le délai pour s'assurer que la page est complètement chargée
        
        # Gestion de la fenêtre de consentement
        try:
            accept_button = driver.find_element(By.XPATH, "//button[text()='Accepter & fermer']")
            accept_button.click()
            logging.info("Accepted consent window")
            time.sleep(3)  # Augmenter le délai après acceptation
        except Exception as e:
            logging.warning("Consent window not found or could not be clicked")
        
        # Remplissage du champ de recherche
        search_field = driver.find_element(By.ID, "SearchHomePage withToaster withSuggest")
        search_field.clear()
        search_field.send_keys(location)
        search_field.send_keys(Keys.ENTER)
        logging.info(f"Search initiated for location: {location}")
        time.sleep(5)  # Augmenter le délai pour s'assurer que les résultats sont chargés
        
        # Extraction des emails
        emails = extract_emails(driver.page_source)
        
        # Enregistrement des résultats
        with open(output_file_path, 'a') as f:
            for email in emails:
                f.write(f"{location},{email}\n")
        
        logging.info(f"Emails found for {location}: {emails}")
    except Exception as e:
        logging.error(f"Error processing {location}: {e}")
    finally:
        driver.quit()
    
    time.sleep(random.randint(1, 3))  # Temporisation aléatoire entre les recherches

I can’t see the problem here , would recommend also trying something like the Scraping Browser instead of your proxies and user agent rotation (works with Selenium) and it might solve it