enesmanan committed on
Commit
6b48b71
·
verified ·
1 Parent(s): 9cbdd01
Files changed (1) hide show
  1. scrape/trendyol_scraper.py +3 -12
scrape/trendyol_scraper.py CHANGED
@@ -7,8 +7,6 @@ from selenium.webdriver.chrome.options import Options
7
  import time
8
  import pandas as pd
9
  import os
10
- from webdriver_manager.chrome import ChromeDriverManager
11
- from selenium.webdriver.chrome.service import Service as ChromeService
12
 
13
  def scrape_reviews(url):
14
  # Create data directory if it doesn't exist
@@ -26,22 +24,15 @@ def scrape_reviews(url):
26
  break
27
  last_height = new_height
28
 
29
- # Chrome options for Linux/Space environment
30
  chrome_options = Options()
31
  chrome_options.add_argument('--headless')
32
  chrome_options.add_argument('--no-sandbox')
33
  chrome_options.add_argument('--disable-dev-shm-usage')
34
- chrome_options.add_argument("--disable-gpu")
35
- chrome_options.add_argument("--window-size=1920,1080")
36
- chrome_options.add_argument('--disable-blink-features=AutomationControlled')
37
 
38
  try:
39
- # Linux için Chrome ve ChromeDriver kurulumu
40
- os.system('apt-get update && apt-get install -y chromium-browser chromium-chromedriver')
41
-
42
- # ChromeDriver'ı otomatik yönet
43
- service = ChromeService()
44
- driver = webdriver.Chrome(service=service, options=chrome_options)
45
 
46
  driver.get(url)
47
 
 
7
  import time
8
  import pandas as pd
9
  import os
 
 
10
 
11
  def scrape_reviews(url):
12
  # Create data directory if it doesn't exist
 
24
  break
25
  last_height = new_height
26
 
27
+ # Space'in kendi Chrome ayarlarını kullan
28
  chrome_options = Options()
29
  chrome_options.add_argument('--headless')
30
  chrome_options.add_argument('--no-sandbox')
31
  chrome_options.add_argument('--disable-dev-shm-usage')
 
 
 
32
 
33
  try:
34
+ # Space'in ChromeDriver path'ini kullan
35
+ driver = webdriver.Chrome(options=chrome_options)
 
 
 
 
36
 
37
  driver.get(url)
38