crawler_instagram.py
2.25 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
import time
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.chrome.options import Options
from config.admin import ID, PW, LOCAL_PROJECT_PATH
from config.URLs import INSTAGRAM_URL
def get_description(driver):
element = driver.find_element_by_css_selector('.Igw0E .IwRSH .eGOV_ ._4EzTm')
data = element.get_attribute('innerHTML')
return str(data)
def check_people(driver):
result = []
navigations = driver.find_elements_by_class_name('-nal3')
navigations[1].click()
time.sleep(2)
elem = driver.find_elements_by_css_selector('.Jv7Aj ._0imsa')
for obj in elem:
result.append(obj.text)
return result
def login(driver):
elem = driver.find_elements_by_css_selector('._9GP1n .f0n8F ._2hvTZ')
time.sleep(1)
elem[0].send_keys(ID)
elem[1].send_keys(PW)
elem[1].send_keys(Keys.RETURN)
time.sleep(1)
def get_list(insta_id, driver):
desc = get_description(driver)
# check followers
followers_list = check_people(driver)
# close followers
driver.find_element_by_css_selector('.WaOAr .wpO6b').click()
time.sleep(1)
# update at firebase
data = {
"followers": followers_list,
"insta_id": insta_id,
"description": desc,
"follower_num": len(followers_list)
}
return data
def crawler_instagram(insta_id):
options = Options()
# options.add_argument("--headless")
options.add_argument("window-size=1920,1080")
driver = webdriver.Chrome(chrome_options=options, executable_path=LOCAL_PROJECT_PATH + '/crawler/chromedriver')
driver.get(url=INSTAGRAM_URL)
time.sleep(2)
print('hi')
login(driver)
print(insta_id)
time.sleep(2)
url = "%s/%s" % (INSTAGRAM_URL, insta_id)
driver.get(url=url)
time.sleep(2)
data = {}
try:
isPrivate = driver.find_element_by_class_name('rkEop').text
except Exception as e:
isPrivate = ""
pass
# account is private
if isPrivate:
print('private!!')
else:
data = get_list(insta_id, driver)
driver.close()
return data
if __name__ == "__main__":
print("-" * 60)
print(" crawler is start")
print("-" * 60)
crawler_instagram("__re.mind.er__")