Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -3,78 +3,72 @@ from bs4 import BeautifulSoup
|
|
| 3 |
import pandas as pd
|
| 4 |
import gradio as gr
|
| 5 |
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
def scrape_kosdaq_data():
|
| 10 |
-
print("๋๋ฒ๊น
: ๋ค์ด๋ฒ ์ฆ๊ถ ํ์ด์ง ์์ฒญ ์์...")
|
| 11 |
-
|
| 12 |
-
# ์์ฒญ ํค๋ ์ถ๊ฐ
|
| 13 |
headers = {
|
| 14 |
-
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/
|
| 15 |
}
|
| 16 |
-
|
| 17 |
-
# ํ์ด์ง ์์ฒญ
|
| 18 |
-
response = requests.get(KOSDAQ_URL, headers=headers)
|
| 19 |
-
if response.status_code == 200:
|
| 20 |
-
print("๋๋ฒ๊น
: ๋ค์ด๋ฒ ์ฆ๊ถ ํ์ด์ง ์์ฒญ ์ฑ๊ณต")
|
| 21 |
-
else:
|
| 22 |
-
print(f"๋๋ฒ๊น
: ์์ฒญ ์คํจ, ์ํ ์ฝ๋: {response.status_code}")
|
| 23 |
-
return pd.DataFrame() # ๋น DataFrame ๋ฐํ
|
| 24 |
|
| 25 |
-
|
| 26 |
-
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
|
| 38 |
-
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
# ๊ฐ ์ด์ ํ
์คํธ๋ฅผ ์ถ์ถ
|
| 46 |
-
row_data = [col.get_text(strip=True) for col in cols]
|
| 47 |
-
# ๋งํฌ๊ฐ ์๋ ๊ฒฝ์ฐ ์ข
๋ชฉ๋ช
์ ์ถ๊ฐ
|
| 48 |
-
link = row.find("a", class_="tltle")
|
| 49 |
-
if link:
|
| 50 |
-
row_data[1] = link.text.strip()
|
| 51 |
-
data.append(row_data)
|
| 52 |
-
print(f"๋๋ฒ๊น
: ์ถ์ถ๋ ๋ฐ์ดํฐ ํ ์ - {len(data)}")
|
| 53 |
-
|
| 54 |
-
if data:
|
| 55 |
-
print(f"๋๋ฒ๊น
: ์ฒซ ๋ฒ์งธ ๋ฐ์ดํฐ ํ - {data[0]}")
|
| 56 |
-
else:
|
| 57 |
-
print("๋๋ฒ๊น
: ๋ฐ์ดํฐ ์ถ์ถ ์คํจ")
|
| 58 |
-
return pd.DataFrame(columns=headers) # ๋น DataFrame ๋ฐํ
|
| 59 |
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 63 |
return df
|
| 64 |
|
| 65 |
-
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
|
|
|
|
|
|
|
|
|
| 72 |
|
| 73 |
-
|
| 74 |
-
|
| 75 |
-
fn=display_kosdaq_info,
|
| 76 |
-
inputs=None,
|
| 77 |
-
outputs="dataframe",
|
| 78 |
-
title="์ฝ์ค๋ฅ ์ข
๋ชฉ ์ ๋ณด ์คํฌ๋ํผ",
|
| 79 |
-
description="๋ค์ด๋ฒ ์ฆ๊ถ ์ฌ์ดํธ์์ ์ฝ์ค๋ฅ ์ข
๋ชฉ ์ ๋ณด๋ฅผ ์คํฌ๋ํํ์ฌ ํ์๏ฟฝ๏ฟฝ๋๋ค."
|
| 80 |
-
).launch()
|
|
|
|
| 3 |
import pandas as pd
|
| 4 |
import gradio as gr
|
| 5 |
|
| 6 |
+
def scrape_kosdaq():
    """Scrape the KOSDAQ top-risers table from Naver Finance.

    Fetches https://finance.naver.com/sise/sise_rise.naver?sosok=1 with a
    browser-like User-Agent, parses the ``type_2`` table, and collects one
    dict per stock row.

    Returns:
        pandas.DataFrame: columns Rank, Name, Price, Change, Change_Rate,
        Volume, Buy_Price, Sell_Price, Total_Buy_Quantity,
        Total_Sell_Quantity, PER, ROE. Empty DataFrame on any failure
        (network error, or the expected table is missing from the page).
    """
    url = "https://finance.naver.com/sise/sise_rise.naver?sosok=1"
    headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/89.0.4389.82 Safari/537.36"
    }

    try:
        # Request the webpage. A timeout prevents the UI from hanging
        # indefinitely if Naver does not respond.
        response = requests.get(url, headers=headers, timeout=10)
        response.raise_for_status()
        print("[INFO] Page fetched successfully.")

        # Parse the HTML
        soup = BeautifulSoup(response.content, "html.parser")

        # Locate the table; bail out gracefully if the page layout changed,
        # otherwise .find_all on None would raise AttributeError (which the
        # RequestException handler below would NOT catch).
        table = soup.find("table", class_="type_2")
        if table is None:
            print("[ERROR] Stock table not found on the page.")
            return pd.DataFrame()

        rows = table.find_all("tr")[2:]  # Skip the header rows

        data = []

        # Extract data row by row
        for row in rows:
            cols = row.find_all("td")
            if len(cols) < 12:  # Skip blank or irrelevant rows
                continue

            entry = {
                "Rank": cols[0].get_text(strip=True),
                "Name": cols[1].get_text(strip=True),
                "Price": cols[2].get_text(strip=True),
                "Change": cols[3].get_text(strip=True),
                "Change_Rate": cols[4].get_text(strip=True),
                "Volume": cols[5].get_text(strip=True),
                "Buy_Price": cols[6].get_text(strip=True),
                "Sell_Price": cols[7].get_text(strip=True),
                "Total_Buy_Quantity": cols[8].get_text(strip=True),
                "Total_Sell_Quantity": cols[9].get_text(strip=True),
                "PER": cols[10].get_text(strip=True),
                "ROE": cols[11].get_text(strip=True),
            }
            data.append(entry)

        print(f"[DEBUG] Extracted {len(data)} rows.")
        return pd.DataFrame(data)

    except requests.exceptions.RequestException as e:
        print(f"[ERROR] Failed to fetch page: {e}")
        return pd.DataFrame()
def display_data():
    """Fetch scraped KOSDAQ data for the UI.

    Returns:
        pandas.DataFrame with the scraped rows, or an error-message string
        when the scrape produced no data.
    """
    frame = scrape_kosdaq()
    return "Failed to fetch data or no data available." if frame.empty else frame
|
| 62 |
+
# Gradio Interface
|
| 63 |
+
def gradio_interface():
|
| 64 |
+
with gr.Blocks() as demo:
|
| 65 |
+
gr.Markdown("### Naver Kosdaq Stock Scraper")
|
| 66 |
+
output = gr.Dataframe()
|
| 67 |
+
fetch_button = gr.Button("Fetch Data")
|
| 68 |
+
|
| 69 |
+
fetch_button.click(display_data, inputs=[], outputs=output)
|
| 70 |
+
|
| 71 |
+
return demo
|
| 72 |
|
| 73 |
+
if __name__ == "__main__":
|
| 74 |
+
gradio_interface().launch()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|