openfree's picture
Update app.py
2d4a3da verified
raw
history blame
17.9 kB
import os
import random
import base64
import requests
from selenium import webdriver
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.common.by import By
from selenium.common.exceptions import WebDriverException, TimeoutException
from PIL import Image
from io import BytesIO
from datetime import datetime
import gradio as gr
from typing import Tuple
import time
from pathlib import Path # ์ถ”๊ฐ€
# ์Šคํฌ๋ฆฐ์ƒท ์บ์‹œ ๋””๋ ‰ํ† ๋ฆฌ ์„ค์ •
CACHE_DIR = Path("screenshot_cache")
CACHE_DIR.mkdir(exist_ok=True)
# ์ „์—ญ ๋ณ€์ˆ˜๋กœ ์Šคํฌ๋ฆฐ์ƒท ์บ์‹œ ์„ ์–ธ
SCREENSHOT_CACHE = {}
def get_cached_screenshot(url: str) -> str:
"""์บ์‹œ๋œ ์Šคํฌ๋ฆฐ์ƒท ๊ฐ€์ ธ์˜ค๊ธฐ ๋˜๋Š” ์ƒˆ๋กœ ์ƒ์„ฑ"""
cache_file = CACHE_DIR / f"{base64.b64encode(url.encode()).decode()}.png"
if cache_file.exists():
with open(cache_file, "rb") as f:
return base64.b64encode(f.read()).decode()
return take_screenshot(url)
def take_screenshot(url):
"""์›น์‚ฌ์ดํŠธ ์Šคํฌ๋ฆฐ์ƒท ์ดฌ์˜ ํ•จ์ˆ˜ (๋กœ๋”ฉ ๋Œ€๊ธฐ ์‹œ๊ฐ„ ์ถ”๊ฐ€)"""
if url in SCREENSHOT_CACHE:
return SCREENSHOT_CACHE[url]
if not url.startswith('http'):
url = f"https://{url}"
options = webdriver.ChromeOptions()
options.add_argument('--headless')
options.add_argument('--no-sandbox')
options.add_argument('--disable-dev-shm-usage')
options.add_argument('--window-size=1080,720')
try:
driver = webdriver.Chrome(options=options)
driver.get(url)
# ๋ช…์‹œ์  ๋Œ€๊ธฐ: body ์š”์†Œ๊ฐ€ ๋กœ๋“œ๋  ๋•Œ๊นŒ์ง€ ๋Œ€๊ธฐ (์ตœ๋Œ€ 10์ดˆ)
try:
WebDriverWait(driver, 10).until(
EC.presence_of_element_located((By.TAG_NAME, "body"))
)
except TimeoutException:
print(f"ํŽ˜์ด์ง€ ๋กœ๋”ฉ ํƒ€์ž„์•„์›ƒ: {url}")
# ์ถ”๊ฐ€ ๋Œ€๊ธฐ ์‹œ๊ฐ„์„ 2์ดˆ๋กœ ์ฆ๊ฐ€
time.sleep(2) # 1์ดˆ์—์„œ 2์ดˆ๋กœ ๋ณ€๊ฒฝ
# JavaScript ์‹คํ–‰ ์™„๋ฃŒ ๋Œ€๊ธฐ
driver.execute_script("return document.readyState") == "complete"
# ์Šคํฌ๋ฆฐ์ƒท ์ดฌ์˜
screenshot = driver.get_screenshot_as_png()
img = Image.open(BytesIO(screenshot))
buffered = BytesIO()
img.save(buffered, format="PNG")
base64_image = base64.b64encode(buffered.getvalue()).decode()
# ์บ์‹œ์— ์ €์žฅ
SCREENSHOT_CACHE[url] = base64_image
return base64_image
except WebDriverException as e:
print(f"์Šคํฌ๋ฆฐ์ƒท ์ดฌ์˜ ์‹คํŒจ: {str(e)} for URL: {url}")
return None
except Exception as e:
print(f"์˜ˆ์ƒ์น˜ ๋ชปํ•œ ์˜ค๋ฅ˜: {str(e)} for URL: {url}")
return None
finally:
if 'driver' in locals():
driver.quit()
def get_card(item: dict, index: int, card_type: str = "space") -> str:
"""ํ†ตํ•ฉ ์นด๋“œ HTML ์ƒ์„ฑ"""
item_id = item.get('id', '')
author, title = item_id.split('/', 1)
likes = format(item.get('likes', 0), ',')
created = item.get('createdAt', '').split('T')[0]
# URL ์ •์˜
if card_type == "space":
url = f"https://huggingface.co/spaces/{item_id}"
elif card_type == "model":
url = f"https://huggingface.co/{item_id}"
else: # dataset
url = f"https://huggingface.co/datasets/{item_id}"
# ๋ฉ”ํƒ€๋ฐ์ดํ„ฐ ์ฒ˜๋ฆฌ
tags = item.get('tags', [])
pipeline_tag = item.get('pipeline_tag', '')
license = item.get('license', '')
sdk = item.get('sdk', 'N/A')
# ํ•˜๋“œ์›จ์–ด ์š”๊ตฌ์‚ฌํ•ญ ์ฒ˜๋ฆฌ
hardware = item.get('hardware', {})
cpu_info = hardware.get('cpu', 'Standard')
gpu_info = hardware.get('gpu', 'None')
if isinstance(gpu_info, dict):
gpu_type = gpu_info.get('type', 'N/A')
gpu_memory = gpu_info.get('memory', 'N/A')
gpu_info = f"{gpu_type} ({gpu_memory}GB)"
# ์นด๋“œ ํƒ€์ž…๋ณ„ ๊ทธ๋ผ๋ฐ์ด์…˜ ์„ค์ •
if card_type == "space":
gradient_colors = """
rgba(255, 182, 193, 0.7), /* ํŒŒ์Šคํ…” ํ•‘ํฌ */
rgba(173, 216, 230, 0.7), /* ํŒŒ์Šคํ…” ๋ธ”๋ฃจ */
rgba(255, 218, 185, 0.7) /* ํŒŒ์Šคํ…” ํ”ผ์น˜ */
"""
bg_content = f"""
background-image: url(data:image/png;base64,{get_cached_screenshot(url) if get_cached_screenshot(url) else ''});
background-size: cover;
background-position: center;
"""
content_bg = f"""
background: linear-gradient(135deg, {gradient_colors});
backdrop-filter: blur(10px);
"""
type_icon = "๐ŸŽฏ"
type_label = "SPACE"
elif card_type == "model":
gradient_colors = """
rgba(110, 142, 251, 0.7), /* ๋ชจ๋ธ ๋ธ”๋ฃจ */
rgba(130, 158, 251, 0.7),
rgba(150, 174, 251, 0.7)
"""
bg_content = f"""
background: linear-gradient(135deg, #6e8efb, #4a6cf7);
padding: 15px;
"""
content_bg = f"""
background: linear-gradient(135deg, {gradient_colors});
backdrop-filter: blur(10px);
"""
type_icon = "๐Ÿค–"
type_label = "MODEL"
else: # dataset
gradient_colors = """
rgba(255, 107, 107, 0.7), /* ๋ฐ์ดํ„ฐ์…‹ ๋ ˆ๋“œ */
rgba(255, 127, 127, 0.7),
rgba(255, 147, 147, 0.7)
"""
bg_content = f"""
background: linear-gradient(135deg, #ff6b6b, #ff8787);
padding: 15px;
"""
content_bg = f"""
background: linear-gradient(135deg, {gradient_colors});
backdrop-filter: blur(10px);
"""
type_icon = "๐Ÿ“Š"
type_label = "DATASET"
# ํ•˜๋“œ์›จ์–ด ์ •๋ณด HTML
hardware_info = f"""
<div style='
margin-top: 15px;
padding: 10px;
background: rgba(255,255,255,0.3);
border-radius: 10px;
font-size: 0.9em;'>
<div style='
display: grid;
grid-template-columns: repeat(3, 1fr);
gap: 10px;'>
<div style='color: #444;'>
<span style='margin-right: 5px;'>๐Ÿ’ป</span> CPU: {cpu_info}
</div>
<div style='color: #444;'>
<span style='margin-right: 5px;'>๐ŸŽฎ</span> GPU: {gpu_info}
</div>
<div style='color: #444;'>
<span style='margin-right: 5px;'>๐Ÿ› ๏ธ</span> SDK: {sdk}
</div>
</div>
</div>
"""
# ํƒœ๊ทธ ํ‘œ์‹œ (models์™€ datasets์šฉ)
tags_html = ""
if card_type != "space":
tags_html = f"""
<div style='
position: absolute;
top: 50%;
left: 50%;
transform: translate(-50%, -50%);
display: flex;
flex-wrap: wrap;
gap: 5px;
justify-content: center;
width: 90%;'>
{' '.join([f'''
<span style='
background: rgba(255,255,255,0.2);
padding: 5px 10px;
border-radius: 15px;
color: white;
font-size: 0.8em;'>
#{tag}
</span>
''' for tag in tags[:5]])}
</div>
"""
# ์นด๋“œ HTML ๋ฐ˜ํ™˜
return f"""
<div class="card" style='
position: relative;
border: none;
padding: 0;
margin: 10px;
border-radius: 20px;
box-shadow: 0 10px 20px rgba(0,0,0,0.1);
background: white;
transition: all 0.3s ease;
overflow: hidden;
min-height: 400px;
cursor: pointer;
transform-origin: center;'
onmouseover="this.style.transform='scale(0.98) translateY(5px)'; this.style.boxShadow='0 5px 15px rgba(0,0,0,0.2)';"
onmouseout="this.style.transform='scale(1) translateY(0)'; this.style.boxShadow='0 10px 20px rgba(0,0,0,0.1)';"
onclick="window.open('{url}', '_blank')">
<!-- ์ƒ๋‹จ ์˜์—ญ -->
<div style='
width: 100%;
height: 200px;
{bg_content}
position: relative;'>
<!-- ์ˆœ์œ„ ๋ฑƒ์ง€ -->
<div style='
position: absolute;
top: 10px;
left: 10px;
background: rgba(0,0,0,0.7);
color: white;
padding: 5px 15px;
border-radius: 20px;
font-weight: bold;
font-size: 0.9em;
backdrop-filter: blur(5px);'>
#{index + 1}
</div>
<!-- ํƒ€์ž… ๋ฑƒ์ง€ -->
<div style='
position: absolute;
top: 10px;
right: 10px;
background: rgba(255,255,255,0.9);
padding: 5px 15px;
border-radius: 20px;
font-weight: bold;
font-size: 0.8em;'>
{type_icon} {type_label}
</div>
{tags_html}
</div>
<!-- ์ฝ˜ํ…์ธ  ์˜์—ญ -->
<div style='
padding: 20px;
{content_bg}
border-radius: 0 0 20px 20px;
border-top: 1px solid rgba(255,255,255,0.5);'>
<h3 style='
margin: 0 0 15px 0;
color: #333;
font-size: 1.3em;
line-height: 1.4;
display: -webkit-box;
-webkit-line-clamp: 2;
-webkit-box-orient: vertical;
overflow: hidden;
text-overflow: ellipsis;
text-shadow: 1px 1px 1px rgba(255,255,255,0.8);'>
{title}
</h3>
<div style='
display: grid;
grid-template-columns: repeat(2, 1fr);
gap: 10px;
font-size: 0.9em;
background: rgba(255,255,255,0.3);
padding: 10px;
border-radius: 10px;'>
<div style='color: #444;'>
<span style='margin-right: 5px;'>๐Ÿ‘ค</span> {author}
</div>
<div style='color: #444;'>
<span style='margin-right: 5px;'>โค๏ธ</span> {likes}
</div>
<div style='color: #444; grid-column: span 2;'>
<span style='margin-right: 5px;'>๐Ÿ“…</span> {created}
</div>
</div>
{hardware_info}
</div>
</div>
"""
def get_trending_spaces(progress=gr.Progress()) -> Tuple[str, str]:
"""ํŠธ๋ Œ๋”ฉ ์ŠคํŽ˜์ด์Šค ๊ฐ€์ ธ์˜ค๊ธฐ"""
url = "https://huggingface.co/api/spaces"
try:
progress(0, desc="Fetching spaces data...")
response = requests.get(url)
response.raise_for_status()
spaces = response.json()
# ์ƒ์œ„ 10๊ฐœ๋งŒ ์„ ํƒ (์›๋ณธ ์ˆœ์„œ ์œ ์ง€)
top_spaces = spaces[:10]
progress(0.1, desc="Creating gallery...")
html_content = """
<div style='padding: 20px; background: #f5f5f5;'>
<div style='display: grid; grid-template-columns: repeat(auto-fill, minmax(300px, 1fr)); gap: 20px;'>
"""
for idx, space in enumerate(top_spaces):
html_content += get_card(space, idx, "space")
progress((0.1 + 0.9 * idx/10), desc=f"Loading space {idx+1}/10...")
html_content += "</div></div>"
progress(1.0, desc="Complete!")
return html_content, "Gallery refresh complete!"
except Exception as e:
error_html = f'<div style="color: red; padding: 20px;">Error: {str(e)}</div>'
return error_html, f"Error: {str(e)}"
def get_models(progress=gr.Progress()) -> Tuple[str, str]:
"""์ธ๊ธฐ ๋ชจ๋ธ ๊ฐ€์ ธ์˜ค๊ธฐ"""
url = "https://huggingface.co/api/models"
try:
progress(0, desc="Fetching models data...")
response = requests.get(url)
response.raise_for_status()
models = response.json()
# ์ƒ์œ„ 10๊ฐœ๋งŒ ์„ ํƒ
top_models = models[:10]
progress(0.1, desc="Creating gallery...")
html_content = """
<div style='padding: 20px; background: #f5f5f5;'>
<div style='display: grid; grid-template-columns: repeat(auto-fill, minmax(300px, 1fr)); gap: 20px;'>
"""
for idx, model in enumerate(top_models):
model_id = model.get('id', '')
author = model_id.split('/')[0]
title = model_id.split('/')[-1]
likes = format(model.get('likes', 0), ',')
downloads = format(model.get('downloads', 0), ',')
created = model.get('createdAt', '').split('T')[0]
url = f"https://huggingface.co/{model_id}"
screenshot = get_cached_screenshot(url)
html_content += get_card(model, idx, "model")
progress((0.1 + 0.9 * idx/10), desc=f"Loading model {idx+1}/10...")
html_content += "</div></div>"
progress(1.0, desc="Complete!")
return html_content, "Models gallery refresh complete!"
except Exception as e:
error_html = f'<div style="color: red; padding: 20px;">Error: {str(e)}</div>'
return error_html, f"Error: {str(e)}"
def get_datasets(progress=gr.Progress()) -> Tuple[str, str]:
"""์ธ๊ธฐ ๋ฐ์ดํ„ฐ์…‹ ๊ฐ€์ ธ์˜ค๊ธฐ"""
url = "https://huggingface.co/api/datasets"
try:
progress(0, desc="Fetching datasets data...")
response = requests.get(url)
response.raise_for_status()
datasets = response.json()
# ์ƒ์œ„ 10๊ฐœ๋งŒ ์„ ํƒ
top_datasets = datasets[:10]
progress(0.1, desc="Creating gallery...")
html_content = """
<div style='padding: 20px; background: #f5f5f5;'>
<div style='display: grid; grid-template-columns: repeat(auto-fill, minmax(300px, 1fr)); gap: 20px;'>
"""
for idx, dataset in enumerate(top_datasets):
dataset_id = dataset.get('id', '')
author = dataset_id.split('/')[0]
title = dataset_id.split('/')[-1]
likes = format(dataset.get('likes', 0), ',')
downloads = format(dataset.get('downloads', 0), ',')
created = dataset.get('createdAt', '').split('T')[0]
url = f"https://huggingface.co/datasets/{dataset_id}"
screenshot = get_cached_screenshot(url)
html_content += get_card(dataset, idx, "dataset")
progress((0.1 + 0.9 * idx/10), desc=f"Loading dataset {idx+1}/10...")
html_content += "</div></div>"
progress(1.0, desc="Complete!")
return html_content, "Datasets gallery refresh complete!"
except Exception as e:
error_html = f'<div style="color: red; padding: 20px;">Error: {str(e)}</div>'
return error_html, f"Error: {str(e)}"
def create_interface():
"""Gradio ์ธํ„ฐํŽ˜์ด์Šค ์ƒ์„ฑ"""
with gr.Blocks(title="HuggingFace Trending Board") as interface:
gr.Markdown("# ๐Ÿค— HuggingFace Trending Board")
with gr.Tabs() as tabs:
# Spaces ํƒญ
with gr.Tab("๐ŸŽฏ Trending Spaces"):
gr.Markdown("Shows top 300 trending spaces on Hugging Face")
with gr.Row():
spaces_refresh_btn = gr.Button("Refresh Spaces", variant="primary")
spaces_gallery = gr.HTML()
spaces_status = gr.Markdown("Ready")
# Models ํƒญ
with gr.Tab("๐Ÿค– Trending Models"):
gr.Markdown("Shows top 10 trending models on Hugging Face")
with gr.Row():
models_refresh_btn = gr.Button("Refresh Models", variant="primary")
models_gallery = gr.HTML()
models_status = gr.Markdown("Ready")
# Datasets ํƒญ
with gr.Tab("๐Ÿ“Š Trending Datasets"):
gr.Markdown("Shows top 10 trending datasets on Hugging Face")
with gr.Row():
datasets_refresh_btn = gr.Button("Refresh Datasets", variant="primary")
datasets_gallery = gr.HTML()
datasets_status = gr.Markdown("Ready")
# Event handlers
spaces_refresh_btn.click(
fn=get_trending_spaces,
outputs=[spaces_gallery, spaces_status],
show_progress=True
)
models_refresh_btn.click(
fn=get_models,
outputs=[models_gallery, models_status],
show_progress=True
)
datasets_refresh_btn.click(
fn=get_datasets,
outputs=[datasets_gallery, datasets_status],
show_progress=True
)
# ์ดˆ๊ธฐ ๋กœ๋“œ
interface.load(
fn=get_trending_spaces,
outputs=[spaces_gallery, spaces_status]
)
interface.load(
fn=get_models,
outputs=[models_gallery, models_status]
)
interface.load(
fn=get_datasets,
outputs=[datasets_gallery, datasets_status]
)
return interface
if __name__ == "__main__":
try:
demo = create_interface()
demo.launch(
share=True,
inbrowser=True,
show_api=False
)
except Exception as e:
print(f"Error launching app: {e}")