Spaces:

dwb2023
/

hf_extractor

Runtime error

App Files Files Community

dwb2023 committed on Jun 1, 2024

Commit

c700267

verified ·

1 Parent(s): e361a15

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -9

app.py CHANGED Viewed

@@ -4,22 +4,28 @@ import gradio as gr
 from magika import Magika
 from huggingface_hub import login
-# Get the HF token from environment variables
 hf_token = os.getenv("HF_TOKEN")
-if hf_token:
-    login(token=hf_token, add_to_git_credential=True)
-else:
     raise ValueError("HF_TOKEN environment variable is not set")
 SUPPORTED_FILE_TYPES = ["txt", "python", "markdown", "yaml", "json", "csv", "tsv", "xml", "html"]
 def validate_url(url):
     return url.startswith('https://')
-def clone_repo(url, repo_dir, token):
     env = os.environ.copy()
     env['GIT_LFS_SKIP_SMUDGE'] = '1'
-    token_url = url.replace('https://', f'https://{token}:x-oauth-basic@')
     result = subprocess.run(["git", "clone", token_url, repo_dir], env=env, capture_output=True, text=True)
     if result.returncode != 0:
         return False, result.stderr
@@ -54,7 +60,7 @@ def validate_file_types(directory):
                 file_types[file_path] = f"Error: {str(e)}"
     return file_types
-def extract_repo_content(url, token):
     if not validate_url(url):
         return [{"header": {"name": "Error", "type": "error", "size": 0}, "content": "Invalid URL"}]
@@ -62,7 +68,7 @@ def extract_repo_content(url, token):
     if os.path.exists(repo_dir):
         subprocess.run(["rm", "-rf", repo_dir])
-    success, error = clone_repo(url, repo_dir, token)
     if not success:
         return [{"header": {"name": "Error", "type": "error", "size": 0}, "content": f"Failed to clone repository: {error}"}]
@@ -101,7 +107,7 @@ def format_output(extracted_content, repo_url):
     return formatted_output
 def extract_and_display(url):
-    extracted_content = extract_repo_content(url, hf_token)
     formatted_output = format_output(extracted_content, url)
     return formatted_output

 from magika import Magika
 from huggingface_hub import login
+# Get the HF token and space author name from environment variables
 hf_token = os.getenv("HF_TOKEN")
+hf_user = os.getenv("SPACE_AUTHOR_NAME")
+if not hf_token:
     raise ValueError("HF_TOKEN environment variable is not set")
+if not hf_user:
+    raise ValueError("SPACE_AUTHOR_NAME environment variable is not set")
+# Perform login using the token
+login(token=hf_token, add_to_git_credential=True)
 SUPPORTED_FILE_TYPES = ["txt", "python", "markdown", "yaml", "json", "csv", "tsv", "xml", "html"]
 def validate_url(url):
     return url.startswith('https://')
+def clone_repo(url, repo_dir, hf_token, hf_user):
     env = os.environ.copy()
     env['GIT_LFS_SKIP_SMUDGE'] = '1'
+    # Construct the Git URL with the token and author name for authentication
+    token_url = url.replace('https://', f'https://{hf_user}:{hf_token}@')
     result = subprocess.run(["git", "clone", token_url, repo_dir], env=env, capture_output=True, text=True)
     if result.returncode != 0:
         return False, result.stderr
                 file_types[file_path] = f"Error: {str(e)}"
     return file_types
+def extract_repo_content(url, hf_token, hf_user):
     if not validate_url(url):
         return [{"header": {"name": "Error", "type": "error", "size": 0}, "content": "Invalid URL"}]
     if os.path.exists(repo_dir):
         subprocess.run(["rm", "-rf", repo_dir])
+    success, error = clone_repo(url, repo_dir, hf_token, hf_user)
     if not success:
         return [{"header": {"name": "Error", "type": "error", "size": 0}, "content": f"Failed to clone repository: {error}"}]
     return formatted_output
 def extract_and_display(url):
+    extracted_content = extract_repo_content(url, hf_token, hf_user)
     formatted_output = format_output(extracted_content, url)
     return formatted_output