"""Helpers for building and updating Hugging Face Spaces from markdown input.

Provides API-token resolution (environment / UI textbox / KeyLock image),
a parser for the "### File: <path>" markdown format, and the three core
operations: create a Space, list its files, and update a single file.
"""

import logging
import os
import re
import tempfile
from pathlib import Path
from typing import Optional

import git
from huggingface_hub import (
    create_repo,
    upload_folder,
    list_repo_files,
    Repository,
    whoami,
)
from PIL import Image

# Configure logging BEFORE anything can emit a record. A module-level
# logging.warning() call on an unconfigured root logger installs a default
# handler, after which basicConfig() silently does nothing — so the optional
# import below must come after this call for the level/format to take effect.
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s - %(name)s - %(levelname)s - %(message)s"
)
logger = logging.getLogger(__name__)

try:
    from keylock_decode import decode_from_image_pil
    KEYLOCK_DECODE_AVAILABLE = True
except ImportError:
    KEYLOCK_DECODE_AVAILABLE = False
    decode_from_image_pil = None
    logger.warning("keylock-decode library not found. Image decoding feature will be disabled.")

# Substrings that mark a decoded key as sensitive (its value is masked in UI output).
_SENSITIVE_KEY_MARKERS = ('TOKEN', 'KEY', 'SECRET', 'PASS')


# --- API token resolution ---
def _get_api_token(ui_token_from_textbox=None):
    """Resolve the Hugging Face API token.

    The ``HF_TOKEN`` environment variable takes precedence over the value
    typed into the UI textbox.

    Returns:
        A ``(token, error_message)`` tuple; exactly one element is ``None``.
    """
    env_token = os.getenv('HF_TOKEN')
    if env_token:
        logger.info("Using HF_TOKEN from environment.")
        return env_token, None
    if ui_token_from_textbox:
        logger.info("Using API token from UI textbox.")
        return ui_token_from_textbox, None
    logger.warning("HF API token not found in environment or UI textbox.")
    return None, "Error: Hugging Face API token not provided. Please enter it in the textbox or load it from an image."


# --- Path safety helper ---
def _resolve_path_within(base_dir, relative_path) -> Optional[Path]:
    """Resolve ``relative_path`` under ``base_dir``, refusing escapes.

    Returns the resolved absolute path when it lies strictly inside
    ``base_dir``; returns ``None`` for absolute paths, ``..`` traversal,
    symlink escapes, or a path that resolves to ``base_dir`` itself.
    """
    base_resolved = Path(base_dir).resolve()
    candidate = (base_resolved / relative_path).resolve()
    if base_resolved not in candidate.parents:
        return None
    return candidate


# --- Token loading from a KeyLock image ---
def load_token_from_image_and_set_env(image_pil_object: Image.Image, password: str):
    """Decode key/value data from a KeyLock image and export it to the environment.

    Args:
        image_pil_object: PIL image carrying the encoded data.
        password: Password passed to the decoder.

    Returns:
        A newline-joined status report for display (sensitive values masked),
        or a single "Error: ..." string when a precondition fails.
    """
    if not KEYLOCK_DECODE_AVAILABLE:
        return "Error: KeyLock-Decode library is not installed. This feature is disabled."
    if image_pil_object is None:
        return "Error: No image provided for decoding."
    if not password:
        return "Error: Password cannot be empty for image decoding."

    status_messages_display = []
    debug_image_path_str = "Not saved (error or no image)."

    # Best-effort debug dump of the image exactly as received; a failure here
    # must not prevent the actual decode below.
    # NOTE(review): this writes the secret-bearing image to a fixed path in the
    # shared temp directory — consider removing once debugging is finished.
    try:
        original_mode = getattr(image_pil_object, 'mode', 'N/A')
        original_format = getattr(image_pil_object, 'format', 'N/A')
        original_size = getattr(image_pil_object, 'size', 'N/A')
        logger.info(f"Received PIL Image from Gradio. Mode: {original_mode}, Original Format: {original_format}, Size: {original_size}")
        status_messages_display.append(f"[DEBUG] Gradio provided PIL Image - Mode: {original_mode}, Original Format: {original_format}, Size: {original_size}")

        temp_dir = Path(tempfile.gettempdir()) / "gradio_image_debug"
        temp_dir.mkdir(parents=True, exist_ok=True)
        debug_image_path = temp_dir / "image_from_gradio.png"
        image_pil_object.save(debug_image_path, "PNG")
        debug_image_path_str = str(debug_image_path)
        status_messages_display.append(f"**[DEBUG ACTION REQUIRED]** Image from Gradio saved to: `{debug_image_path_str}`. Try decoding this file with the standalone `keylock-decode` CLI.")
        logger.info(f"Debug image from Gradio saved to: {debug_image_path_str}")
    except Exception as save_exc:
        logger.exception("Error during debug-saving of image from Gradio:")
        status_messages_display.append(f"[DEBUG] Error saving image for debugging: {str(save_exc)}. Path: {debug_image_path_str}")

    try:
        decoded_data, status_msgs_from_lib = decode_from_image_pil(
            image_pil_object, password, set_environment_variables=True
        )
        status_messages_display.extend(status_msgs_from_lib)
        if decoded_data:
            status_messages_display.append("\n**Decoded Data Summary (sensitive values masked):**")
            for key, value in decoded_data.items():
                is_sensitive = any(marker in key.upper() for marker in _SENSITIVE_KEY_MARKERS)
                display_value = '********' if is_sensitive else value
                status_messages_display.append(f"- {key}: {display_value}")
            # Only report on HF_TOKEN when something was actually decoded, so a
            # pre-existing environment value is never presented as a decode success
            # after an empty decode.
            if os.getenv('HF_TOKEN'):
                status_messages_display.append("\n**SUCCESS: HF_TOKEN was found and set in environment.**")
            elif 'HF_TOKEN' in decoded_data:
                status_messages_display.append("\nWarning: HF_TOKEN decoded but os.getenv('HF_TOKEN') not found.")
            else:
                status_messages_display.append("\nNote: HF_TOKEN not specifically found in decoded image data.")
    except ValueError as e:
        status_messages_display.append(f"**Decoding Error (e.g., bad password, corrupted data):** {e}")
    except Exception as e:
        status_messages_display.append(f"**An unexpected error occurred during decoding:** {str(e)}")

    return "\n".join(status_messages_display)


# --- Markdown parsing ---
def parse_markdown(markdown_input):
    """Parse markdown input to extract space details and file structure.

    Recognised constructs:
      * ``# Space: owner/name`` (or just ``name``) before the first file header.
      * ``### File: <path>`` starts a new file; every following line up to the
        next file header belongs to that file.

    Lines whose stripped form starts with ``` are treated as fences and are
    never included in file content (this also drops fences that appear inside
    a file's own content, e.g. code samples in a README).

    Args:
        markdown_input: The markdown text; ``None`` or empty yields no files.

    Returns:
        ``{"repo_name_md": str, "owner_md": str, "files": [{"path", "content"}]}``.
    """
    space_info = {"repo_name_md": "", "owner_md": "", "files": []}
    if not markdown_input:
        return space_info

    file_header = "### File:"
    space_header = "# Space:"

    current_file_path = None
    current_file_content_lines = []
    in_file_definition = False  # True once the first "### File:" header was seen.

    def _flush_current_file():
        # Entries with an empty path are dropped rather than stored.
        if current_file_path and in_file_definition:
            space_info["files"].append({
                "path": current_file_path,
                "content": "\n".join(current_file_content_lines),
            })

    for line_content_orig in markdown_input.strip().split("\n"):
        line_content_stripped = line_content_orig.strip()

        if line_content_stripped.startswith(file_header):
            _flush_current_file()
            current_file_content_lines = []
            # Slice off the prefix only; the path itself is left untouched.
            current_file_path = line_content_stripped[len(file_header):].strip()
            in_file_definition = True
            continue

        if not in_file_definition:
            # Preamble: only the "# Space:" line carries information.
            if line_content_stripped.startswith(space_header):
                full_space_name_md = line_content_stripped[len(space_header):].strip()
                if "/" in full_space_name_md:
                    space_info["owner_md"], space_info["repo_name_md"] = full_space_name_md.split("/", 1)
                else:
                    space_info["repo_name_md"] = full_space_name_md
            continue

        if line_content_stripped.startswith("```"):
            continue  # Fence lines are never part of the file content.

        # Keep the original line so indentation inside the file is preserved.
        current_file_content_lines.append(line_content_orig)

    _flush_current_file()
    return space_info


# --- Repository id resolution ---
def _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui):
    """Build the ``owner/space_name`` repo id.

    When ``owner_ui`` is empty, the owner is looked up via ``whoami`` using the
    resolved API token.

    Returns:
        A ``(repo_id, error_message)`` tuple; exactly one element is ``None``.
    """
    if not space_name_ui:
        return None, "Error: Space Name cannot be empty."
    if "/" in space_name_ui:
        return None, "Error: Space Name should not contain '/'. Use Owner field."

    final_owner = owner_ui
    if not final_owner:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return None, token_err
        if not resolved_api_token:
            return None, "Error: API token required for auto owner determination."
        try:
            user_info = whoami(token=resolved_api_token)
            if user_info and 'name' in user_info:
                final_owner = user_info['name']
            else:
                return None, "Error: Could not retrieve username. Check token/permissions or specify Owner."
        except Exception as e:
            return None, f"Error retrieving username: {str(e)}. Specify Owner."

    if not final_owner:
        return None, "Error: Owner could not be determined."
    return f"{final_owner}/{space_name_ui}", None


# --- Core operations ---
def create_space(ui_api_token_from_textbox, space_name_ui, owner_ui, sdk_ui, markdown_input):
    """Create (or update) a Space from files described in markdown.

    Files parsed from ``markdown_input`` are written to a temporary folder,
    the Space repo is created if needed, and the folder is uploaded.

    Returns:
        A human-readable success or "Error ..." message; never raises.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return err
        repo_id_for_error_logging = repo_id

        space_info = parse_markdown(markdown_input)
        if not space_info["files"]:
            return "Error: No files found in markdown. Use '### File: path/to/file.ext'."

        with tempfile.TemporaryDirectory() as temp_dir:
            repo_local_path = Path(temp_dir) / "repo_upload_content"
            repo_local_path.mkdir(exist_ok=True)

            for file_info in space_info["files"]:
                relative_path = file_info.get("path")
                if not relative_path:
                    continue
                # The path comes from user-supplied markdown: refuse anything
                # that would be written outside the staging folder.
                file_path_abs = _resolve_path_within(repo_local_path, relative_path)
                if file_path_abs is None:
                    return (
                        f"Error: Invalid file path '{relative_path}'. "
                        "Paths must be relative and stay inside the Space repository."
                    )
                file_path_abs.parent.mkdir(parents=True, exist_ok=True)
                with open(file_path_abs, "w", encoding="utf-8") as f:
                    f.write(file_info["content"])

            try:
                create_repo(repo_id=repo_id, token=resolved_api_token, repo_type="space", space_sdk=sdk_ui, private=False)
            except Exception as e:
                # An already-existing repo is fine: we simply upload into it.
                err_str = str(e).lower()
                if not ("you already created this repo" in err_str or "exists" in err_str):
                    return f"Error creating Space '{repo_id}': {str(e)}"

            upload_folder(
                repo_id=repo_id,
                folder_path=str(repo_local_path),
                path_in_repo=".",
                token=resolved_api_token,
                repo_type="space",
                commit_message=f"Initial Space setup of {repo_id} via Builder",
            )
            return f"Successfully created/updated Space: [{repo_id}](https://huggingface.co/spaces/{repo_id})"
    except Exception as e:
        logger.exception("Error in create_space for %s:", repo_id_for_error_logging)
        return f"Error during Space creation/update: {str(e)}"


def view_space_files(ui_api_token_from_textbox, space_name_ui, owner_ui):
    """List the files of a Space as a markdown bullet list.

    Returns:
        A human-readable listing or "Error ..." message; never raises.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return err
        repo_id_for_error_logging = repo_id

        files = list_repo_files(repo_id=repo_id, token=resolved_api_token, repo_type="space")
        if not files:
            return f"No files found in Space `{repo_id}`."
        return f"Files in `{repo_id}`:\n\n" + "\n".join([f"- `{f}`" for f in files])
    except Exception as e:
        logger.exception("Error in view_space_files for %s:", repo_id_for_error_logging)
        return f"Error listing files for `{repo_id_for_error_logging}`: {str(e)}"


def update_space_file(ui_api_token_from_textbox, space_name_ui, owner_ui, file_path_in_repo, file_content, commit_message_ui):
    """Overwrite (or add) one file in an existing Space and push the change.

    The Space is cloned into a temporary directory, the file is written, and
    the result is pushed with ``commit_message_ui`` (a default message is used
    when it is empty).

    Returns:
        A human-readable success or "Error ..." message; never raises.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return err
        repo_id_for_error_logging = repo_id

        if not file_path_in_repo:
            return "Error: File Path cannot be empty."
        commit_message_ui = commit_message_ui or f"Update {file_path_in_repo} via Space Builder"

        with tempfile.TemporaryDirectory() as temp_dir:
            repo_local_clone_path = Path(temp_dir) / "cloned_space_repo_for_update"
            cloned_repo = Repository(
                local_dir=str(repo_local_clone_path),
                clone_from=f"https://huggingface.co/spaces/{repo_id}",
                repo_type="space",
                use_auth_token=resolved_api_token,
                git_user="Space Builder Bot",
                git_email="space-builder@huggingface.co",
            )

            # The path is user input: refuse anything resolving outside the clone
            # (absolute paths, "..", or symlinks in the repo pointing elsewhere).
            full_local_file_path = _resolve_path_within(cloned_repo.local_dir, file_path_in_repo)
            if full_local_file_path is None:
                return (
                    f"Error: Invalid file path '{file_path_in_repo}'. "
                    "Paths must be relative and stay inside the Space repository."
                )
            full_local_file_path.parent.mkdir(parents=True, exist_ok=True)
            with open(full_local_file_path, "w", encoding="utf-8") as f:
                f.write(file_content)

            cloned_repo.push_to_hub(commit_message=commit_message_ui)
            return f"Successfully updated `{file_path_in_repo}` in Space [{repo_id}](https://huggingface.co/spaces/{repo_id})"
    except Exception as e:
        logger.exception("Error in update_space_file for %s:", repo_id_for_error_logging)
        return f"Error updating file for `{repo_id_for_error_logging}`: {str(e)}"