"""Helpers for building and editing Hugging Face Spaces from markdown.

The module resolves an API token (environment first, UI second), optionally
loads secrets from a KeyLock Wallet image, parses a markdown description of a
Space into files, and creates/updates/browses Spaces on the Hub.

Functions that talk to the Hub never raise to the caller: they return either
a status string or a ``(result, error_message)`` tuple, as documented on each.
"""

import logging
import os
import re  # noqa: F401 - kept; may be used by code outside this view
import shutil  # noqa: F401 - kept; may be used by code outside this view
import tempfile
from pathlib import Path

import git  # noqa: F401 - kept; may be used by code outside this view
from huggingface_hub import (
    Repository,
    create_repo,
    hf_hub_download,
    list_repo_files,
    upload_folder,
    whoami,
)
from PIL import Image

# Configure logging BEFORE anything can emit a record. Emitting through the
# root logger first would install a default handler and turn this call into a
# no-op, silently dropping the INFO level and the format below.
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s - %(name)s - %(levelname)s - %(message)s",
)
logger = logging.getLogger(__name__)

try:
    from keylock_decode import decode_from_image_pil

    KEYLOCK_DECODE_AVAILABLE = True
except ImportError:
    KEYLOCK_DECODE_AVAILABLE = False
    decode_from_image_pil = None
    logger.warning(
        "keylock-decode library not found. KeyLock Wallet image feature will be disabled."
    )

# Substrings that mark a decoded key as sensitive; matching values are masked.
_SENSITIVE_KEY_MARKERS = ("TOKEN", "KEY", "SECRET", "PASS")

_FILE_HEADER = "### File:"
_SPACE_HEADER = "# Space:"
_COMMENTED_SPACE_HEADER = "# # Space:"


def _safe_join(base_dir, relative_path):
    """Join *relative_path* onto *base_dir*, refusing to leave *base_dir*.

    Returns the resolved ``Path`` when it lies strictly inside *base_dir*,
    otherwise ``None`` (absolute paths, ``..`` escapes, or a path that
    resolves to *base_dir* itself).
    """
    base = Path(base_dir).resolve()
    candidate = (base / relative_path).resolve()
    if base not in candidate.parents:
        return None
    return candidate


# --- API token resolution ---
def _get_api_token(ui_token_from_textbox=None):
    """Resolve the Hugging Face API token.

    The ``HF_TOKEN`` environment variable takes precedence over the value
    typed in the UI.

    Returns:
        ``(token, None)`` on success, ``(None, error_message)`` otherwise.
    """
    env_token = os.getenv("HF_TOKEN")
    if env_token:
        return env_token, None
    if ui_token_from_textbox:
        return ui_token_from_textbox, None
    return None, "Error: Hugging Face API token not provided."


# --- KeyLock Wallet image decoding ---
def load_token_from_image_and_set_env(image_pil_object: Image.Image, password: str):
    """Decode a KeyLock Wallet image and export its contents to the environment.

    Args:
        image_pil_object: The wallet image as a PIL image.
        password: Password used to decode the image.

    Returns:
        A newline-joined, human-readable status report. Values whose key
        contains TOKEN/KEY/SECRET/PASS are masked. Errors are reported in the
        returned text rather than raised.
    """
    if not KEYLOCK_DECODE_AVAILABLE:
        return "Error: KeyLock-Decode library is not installed."
    if image_pil_object is None:
        return "Error: No KeyLock Wallet image provided."
    if not password:
        return "Error: Password cannot be empty."

    status_messages_display = []
    try:
        logger.info("Attempting to decode from KeyLock Wallet image...")
        decoded_data, status_msgs_from_lib = decode_from_image_pil(
            image_pil_object, password, set_environment_variables=True
        )
        # Tolerate a library that reports no messages as None.
        status_messages_display.extend(status_msgs_from_lib or [])
        if decoded_data:
            status_messages_display.append(
                "\n**Decoded Data Summary (sensitive values masked):**"
            )
            for key, value in decoded_data.items():
                is_sensitive = any(
                    marker in key.upper() for marker in _SENSITIVE_KEY_MARKERS
                )
                display_value = "********" if is_sensitive else value
                status_messages_display.append(f"- {key}: {display_value}")
            # Only claim success when something was actually decoded, so a
            # pre-existing HF_TOKEN is not attributed to an empty image.
            if os.getenv("HF_TOKEN"):
                status_messages_display.append(
                    "\n**SUCCESS: HF_TOKEN set from KeyLock Wallet image.**"
                )
    except ValueError as e:
        status_messages_display.append(f"**Decoding Error:** {e}")
    except Exception as e:
        status_messages_display.append(f"**Unexpected decoding error:** {str(e)}")
    return "\n".join(status_messages_display)


# --- Markdown parsing ---
def process_commented_markdown(commented_input):
    """Split markdown into lines, un-commenting it when it was '# '-prefixed.

    If any line contains ``# # Space:`` the whole input is treated as
    commented-out markdown and one leading ``"# "`` is removed from every line
    that has it. Otherwise the lines are returned unchanged.

    Args:
        commented_input: The raw markdown text (``None`` is treated as empty).

    Returns:
        A list of lines.
    """
    lines = (commented_input or "").strip().split("\n")
    if any(_COMMENTED_SPACE_HEADER in line for line in lines):
        logger.debug("Commented markdown detected; stripping leading '# '.")
        return [line[2:] if line.startswith("# ") else line for line in lines]
    return lines


def parse_markdown(markdown_input):
    """Parse a Space description written in markdown.

    Recognised structure:
      * ``# Space: owner/name`` (or ``# Space: name``) before the first file;
      * ``### File: path`` starts a file; following lines are its content.

    Every line starting with a code fence (three backticks) is dropped, both
    the fences wrapping a file and any fence inside its content. Lines before
    the first ``### File:`` header, other than the Space header, are ignored.

    Returns:
        ``{"repo_name_md": str, "owner_md": str, "files": [{"path", "content"}]}``
        with files that have an empty path removed.
    """
    space_info = {"repo_name_md": "", "owner_md": "", "files": []}
    current_file_path = None
    current_file_content_lines = []

    lines = process_commented_markdown(markdown_input)
    logger.debug("Parsing markdown input (%d lines).", len(lines))

    def _flush_current_file():
        if current_file_path is not None and current_file_path:
            space_info["files"].append(
                {
                    "path": current_file_path,
                    "content": "\n".join(current_file_content_lines),
                }
            )

    for line_content_orig in lines:
        line_content_stripped = line_content_orig.strip()

        if line_content_stripped.startswith(_FILE_HEADER):
            _flush_current_file()
            # Strip only the leading marker so a path that happens to contain
            # the marker text is preserved.
            current_file_path = line_content_stripped[len(_FILE_HEADER):].strip()
            current_file_content_lines = []
            continue

        if current_file_path is None:
            # Preamble: only the Space header carries information.
            if line_content_stripped.startswith(_SPACE_HEADER):
                full_space_name_md = line_content_stripped[len(_SPACE_HEADER):].strip()
                if "/" in full_space_name_md:
                    owner, repo_name = full_space_name_md.split("/", 1)
                    space_info["owner_md"] = owner
                    space_info["repo_name_md"] = repo_name
                else:
                    space_info["repo_name_md"] = full_space_name_md
            continue

        if line_content_stripped.startswith("```"):
            continue
        current_file_content_lines.append(line_content_orig)

    _flush_current_file()
    space_info["files"] = [f for f in space_info["files"] if f.get("path")]
    return space_info


# --- Repo id resolution ---
def _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui):
    """Build the ``owner/space`` repo id.

    When *owner_ui* is empty the owner is looked up with ``whoami`` using the
    resolved API token.

    Returns:
        ``(repo_id, None)`` on success, ``(None, error_message)`` otherwise.
    """
    if not space_name_ui:
        return None, "Error: Space Name cannot be empty."
    if "/" in space_name_ui:
        return None, "Error: Space Name should not contain '/'. Use Owner field."

    final_owner = owner_ui
    if not final_owner:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return None, token_err
        if not resolved_api_token:
            return None, "Error: API token required for auto owner determination."
        try:
            user_info = whoami(token=resolved_api_token)
            if user_info and "name" in user_info:
                final_owner = user_info["name"]
            else:
                return None, (
                    "Error: Could not retrieve username. "
                    "Check token/permissions or specify Owner."
                )
        except Exception as e:
            return None, f"Error retrieving username: {str(e)}. Specify Owner."

    if not final_owner:
        return None, "Error: Owner could not be determined."
    return f"{final_owner}/{space_name_ui}", None


# --- Fetch a single file from a Space ---
def get_space_file_content(ui_api_token_from_textbox, space_name_ui, owner_ui, file_path_in_repo):
    """Fetch the text content of one file from a Hugging Face Space.

    Returns:
        ``(content, None)`` on success, ``(None, error_message)`` otherwise.
        The file is read as UTF-8.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return None, token_err
        # Validate cheap input first so a doomed request makes no network call.
        if not file_path_in_repo:
            return None, "Error: File path cannot be empty."
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return None, err
        repo_id_for_error_logging = repo_id

        logger.info(f"Attempting to download file: {file_path_in_repo} from Space: {repo_id}")
        downloaded_file_path = hf_hub_download(
            repo_id=repo_id,
            filename=file_path_in_repo,
            repo_type="space",
            token=resolved_api_token,
        )
        content = Path(downloaded_file_path).read_text(encoding="utf-8")
        logger.info(f"Successfully downloaded and read file: {file_path_in_repo} from {repo_id}")
        return content, None
    except Exception as e:
        # The Hub client reports missing files through several exception
        # types; match on the message to give one friendly error for all.
        if "404" in str(e) or "not found" in str(e).lower():
            logger.warning(f"File not found {file_path_in_repo} in {repo_id_for_error_logging}: {e}")
            return None, (
                f"Error: File '{file_path_in_repo}' not found in Space "
                f"'{repo_id_for_error_logging}'."
            )
        logger.exception(
            f"Error fetching file content for {file_path_in_repo} from {repo_id_for_error_logging}:"
        )
        return None, f"Error fetching file content: {str(e)}"


# --- List the files of a Space ---
def list_space_files_for_browsing(ui_api_token_from_textbox, space_name_ui, owner_ui):
    """List the files of a Hugging Face Space.

    Returns:
        ``(files, None)`` on success; ``([], info_message)`` when the Space has
        no files; ``(None, error_message)`` on failure.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return None, token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return None, err
        repo_id_for_error_logging = repo_id

        files = list_repo_files(repo_id=repo_id, token=resolved_api_token, repo_type="space")
        if not files:
            return [], f"No files found in Space `{repo_id}`."
        return files, None
    except Exception as e:
        logger.exception(f"Error listing files for {repo_id_for_error_logging}:")
        return None, f"Error listing files for `{repo_id_for_error_logging}`: {str(e)}"


# --- Create / update Spaces ---
def create_space(ui_api_token_from_textbox, space_name_ui, owner_ui, sdk_ui, markdown_input):
    """Create a Space (or reuse an existing one) and upload the markdown's files.

    The files described by *markdown_input* are written to a temporary
    staging directory and uploaded in a single commit.

    Returns:
        A status string: a success message with a link, or an ``Error...``
        message. Never raises.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return err
        repo_id_for_error_logging = repo_id

        space_info = parse_markdown(markdown_input)
        if not space_info["files"]:
            return "Error: No files found in markdown."

        with tempfile.TemporaryDirectory() as temp_dir:
            repo_staging_path = Path(temp_dir) / "repo_staging_content"
            repo_staging_path.mkdir(exist_ok=True)

            for file_info in space_info["files"]:
                relative_path = file_info.get("path")
                if not relative_path:
                    continue
                # Paths come from user-supplied markdown: refuse anything that
                # would be written outside the staging directory.
                file_path_abs = _safe_join(repo_staging_path, relative_path)
                if file_path_abs is None:
                    return f"Error: Unsafe file path in markdown: '{relative_path}'."
                file_path_abs.parent.mkdir(parents=True, exist_ok=True)
                with open(file_path_abs, "w", encoding="utf-8") as f:
                    f.write(file_info["content"])

            try:
                create_repo(
                    repo_id=repo_id,
                    token=resolved_api_token,
                    repo_type="space",
                    space_sdk=sdk_ui,
                    private=False,
                )
            except Exception as e:
                # An already-existing Space is fine: we then just update it.
                err_str = str(e).lower()
                already_there = (
                    "exists" in err_str or "you already created this repo" in err_str
                )
                if not already_there:
                    return f"Error creating Space '{repo_id}': {str(e)}"

            upload_folder(
                repo_id=repo_id,
                folder_path=str(repo_staging_path),
                path_in_repo=".",
                token=resolved_api_token,
                repo_type="space",
                commit_message=f"Initial Space setup of {repo_id} via Builder",
            )
            return (
                f"Successfully created/updated Space: "
                f"[{repo_id}](https://huggingface.co/spaces/{repo_id})"
            )
    except Exception as e:
        logger.exception(f"Error in create_space for {repo_id_for_error_logging}:")
        return f"Error during Space creation/update: {str(e)}"


def update_space_file(ui_api_token_from_textbox, space_name_ui, owner_ui, file_path_in_repo, file_content, commit_message_ui):
    """Overwrite (or add) one file in an existing Space and push the commit.

    The Space is cloned into a temporary directory, the file is written as
    UTF-8, and the change is pushed with *commit_message_ui* (a default
    message is used when it is empty).

    Returns:
        A status string: a success message with a link, or an ``Error...``
        message. Never raises.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return err
        repo_id_for_error_logging = repo_id

        if not file_path_in_repo:
            return "Error: File Path to update cannot be empty."
        # Normalise separators first so leading backslashes are stripped too.
        file_path_in_repo = file_path_in_repo.replace(os.sep, "/").lstrip("/")
        if not file_path_in_repo:
            return "Error: File Path to update cannot be empty."
        # Refuse paths that would be written outside the cloned repository.
        if ".." in file_path_in_repo.split("/"):
            return f"Error: Unsafe file path: '{file_path_in_repo}'."
        commit_message_ui = commit_message_ui or f"Update {file_path_in_repo} via Space Builder"

        with tempfile.TemporaryDirectory() as temp_dir_for_update:
            repo_local_clone_path = Path(temp_dir_for_update) / "update_clone"
            # NOTE(review): `Repository` is a git-based helper that newer
            # huggingface_hub releases deprecate; confirm the pinned version
            # before upgrading the dependency.
            cloned_repo = Repository(
                local_dir=str(repo_local_clone_path),
                clone_from=f"https://huggingface.co/spaces/{repo_id}",
                repo_type="space",
                use_auth_token=resolved_api_token,
                git_user="Space Builder Bot",
                git_email="space-builder@huggingface.co",
            )
            full_local_file_path = Path(cloned_repo.local_dir) / file_path_in_repo
            full_local_file_path.parent.mkdir(parents=True, exist_ok=True)
            with open(full_local_file_path, "w", encoding="utf-8") as f:
                f.write(file_content)
            cloned_repo.push_to_hub(commit_message=commit_message_ui)
            return (
                f"Successfully updated `{file_path_in_repo}` in Space "
                f"[{repo_id}](https://huggingface.co/spaces/{repo_id})"
            )
    except Exception as e:
        logger.exception(
            f"Error in update_space_file for {repo_id_for_error_logging}, file {file_path_in_repo}:"
        )
        return f"Error updating file for `{repo_id_for_error_logging}`: {str(e)}"