Welcome to WuJiGu Developer Q&A Community for programmer and developer-Open, Learning and Share
Welcome To Ask or Share your Answers For Others

Categories

0 votes
162 views
in Technique[技术] by (71.8m points)

Scraping followers list in Selenium python

import time
import random
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.common.action_chains import ActionChains
from selenium.webdriver.common.keys import Keys
PATH = r"C:Userswelcomechromedriver.exe"
driver = webdriver.Chrome(PATH)

driver.get("https://www.instagram.com/")
WebDriverWait(driver, 10).until(EC.element_to_be_clickable((By.XPATH, "//input[@name='username']"))).send_keys("username") #replace with your username
driver.find_element_by_xpath("//input[@name='password']").send_keys("some_password") #replace with your password

driver.find_element_by_xpath("//button/div[text()='Log In']").click()

#driver.find_element_by_class_name("_2dbep qNELH").click()

element = WebDriverWait(driver, 10).until(
                EC.presence_of_element_located((By.CLASS_NAME, "qNELH"))
            )
element.click()

driver.find_element_by_xpath("//div[text()='Profile']").click()
driver.implicitly_wait(5)
driver.find_element_by_xpath("//a[text() = ' followers']").click()
driver.implicitly_wait(3)


FList = driver.find_element_by_css_selector('div[role='dialog'] ul')
numberOfFollowersInList = len(FList.find_elements_by_css_selector('li'))
FList.click()
divL=driver.find_element_by_class_name("eiUFA")
actionChain = ActionChains(driver)
time.sleep(random.randint(2,4))

while (numberOfFollowersInList < 290):      
        actionChain.key_down(Keys.PAGE_DOWN,element=FList).key_up(Keys.PAGE_DOWN,element=FList).perform()        
        numberOfFollowersInList = len(FList.find_elements_by_css_selector('li'))
        time.sleep(0.4)
        print(numberOfFollowersInList)
        actionChain.key_down(Keys.PAGE_DOWN).key_up(Keys.PAGE_DOWN).perform()
        divL.click()
        time.sleep(2)

While executing this script, the page gets scrolled a few times but clicks on one of the follower's link and goes to his/her page. Someone, please suggest a change in the code to not click on the links.


与恶龙缠斗过久,自身亦成为恶龙;凝视深渊过久,深渊将回以凝视…
Welcome To Ask or Share your Answers For Others

1 Answer

0 votes
by (71.8m points)
import random
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
import time
from selenium.webdriver.common.action_chains import ActionChains

driver = webdriver.Firefox()


time.sleep(5)

driver.get("https://www.instagram.com/")
WebDriverWait(driver, 10).until(EC.element_to_be_clickable(
    (By.XPATH, "//input[@name='username']"))).send_keys("email")  # replace with your username
# replace with your password
driver.find_element_by_xpath(
    "//input[@name='password']").send_keys("pasword")

driver.find_element_by_xpath("//button/div[text()='Log In']").click()

#driver.find_element_by_class_name("_2dbep qNELH").click()

element = WebDriverWait(driver, 10).until(
    EC.presence_of_element_located((By.CSS_SELECTOR, "span._2dbep.qNELH"))
)
element.click()

driver.find_element_by_xpath("//div[text()='Profile']").click()
driver.implicitly_wait(5)
driver.find_element_by_xpath("//a[text() = ' followers']").click()
driver.implicitly_wait(3)


FList = driver.find_element_by_css_selector('div[role='dialog'] ul')
numberOfFollowersInList = len(FList.find_elements_by_css_selector('li'))
FList.click()
divL = driver.find_element_by_class_name("eiUFA")
actionChain = ActionChains(driver)
time.sleep(random.randint(2, 4))
frame = driver.find_element_by_css_selector("[class='isgrP']")
while (numberOfFollowersInList < 290):
    actionChain.key_down(Keys.PAGE_DOWN, element=FList).key_up(
        Keys.PAGE_DOWN, element=FList).perform()
    numberOfFollowersInList = len(
        FList.find_elements_by_css_selector('li'))
    time.sleep(0.4)
    print(numberOfFollowersInList)
    frame.send_keys(Keys.PAGE_DOWN)
    time.sleep(2)

you can send page_down key stroke to driver.find_element_by_css_selector("[class='isgrP']") (identifier frame in my code)

I am not sure why actionchain clicks the element


与恶龙缠斗过久,自身亦成为恶龙;凝视深渊过久,深渊将回以凝视…
Welcome to WuJiGu Developer Q&A Community for programmer and developer-Open, Learning and Share
...