Spaces:
Sleeping
Sleeping
import os | |
import json | |
import tempfile | |
import logging | |
from streamlit.delta_generator import DeltaGenerator | |
import streamlit as st | |
from huggingface_hub import HfApi, CommitInfo | |
# Module-wide logger shared by the functions in this file; LOG_LEVEL sets
# how verbose it is.
LOG_LEVEL = logging.DEBUG
g_logger = logging.getLogger(__name__)
g_logger.setLevel(level=LOG_LEVEL)
def push_observation(image_hash: str, api: HfApi, enable_push: bool = False) -> "CommitInfo | None":
    """
    Push one observation to the Hugging Face dataset.

    The observation is looked up by hash in
    `st.session_state.public_observations`, serialised to JSON, written to a
    temporary file and (optionally) uploaded from that file.

    Args:
        image_hash (str): key of the observation in
            `st.session_state.public_observations`.
        api (HfApi): API client used for the upload.
        enable_push (bool): when False (default) everything except the upload
            itself is performed, i.e. a dry run.

    Returns:
        The value returned by `api.upload_file` when the upload ran, or None
        when the observation was not found or `enable_push` is False.
    """
    # get the observation
    observation = st.session_state.public_observations.get(image_hash)
    if observation is None:
        msg = f"Could not find observation with hash {image_hash}"
        g_logger.error(msg)
        st.error(msg)
        return None

    # convert to json
    metadata_str = json.dumps(observation)  # doesn't work yet, TODO
    st.toast(f"Uploading observation: {metadata_str}", icon="🦭")
    g_logger.info(f"Uploading observation: {metadata_str}")

    # Build the destination path before touching the filesystem, so a missing
    # key cannot leave an orphaned temp file behind.
    path_in_repo = f"metadata/{observation['author_email']}/{observation['image_md5']}.json"

    # delete=False: the file has to outlive this handle because the upload
    # reads it back by name; it is removed explicitly in the `finally` below.
    with tempfile.NamedTemporaryFile(
        mode="w", suffix=".json", delete=False, encoding="utf-8"
    ) as f:
        f.write(metadata_str)

    try:
        msg = f"fname: {f.name} | path: {path_in_repo}"
        print(msg)
        st.warning(msg)

        if not enable_push:
            # dry run: don't send anything
            return None

        rv = api.upload_file(
            path_or_fileobj=f.name,
            path_in_repo=path_in_repo,
            repo_id="Saving-Willy/temp_dataset",
            repo_type="dataset",
        )
        print(rv)
        msg = f"observation attempted tx to repo happy walrus: {rv}"
        g_logger.info(msg)
        st.info(msg)
        return rv
    finally:
        # Always clean up the temp file, whether the upload ran, was skipped
        # or raised. A failed cleanup is logged rather than masking the result.
        try:
            os.remove(f.name)
        except OSError as err:
            g_logger.warning(f"Could not remove temp file {f.name}: {err}")
def push_all_observations(enable_push: bool = False) -> None:
    """
    Open an API connection to Hugging Face and push all observations one by one.

    Every key of `st.session_state.public_observations` is handed to
    `push_observation` together with a single shared `HfApi` client.

    Args:
        enable_push (bool): forwarded to `push_observation`; when False
            (default) nothing is uploaded.
    """
    # get huggingface api; the token is read from the HF_TOKEN environment
    # variable and is None when that variable is unset
    token = os.environ.get("HF_TOKEN", None)
    api = HfApi(token=token)

    # iterate over the stored observations (keyed by image hash)
    for image_hash in st.session_state.public_observations:
        push_observation(image_hash, api, enable_push=enable_push)
def push_observations(tab_log: "DeltaGenerator | None" = None):
    """
    Deprecated: push the observations to the Hugging Face dataset.

    This function always raises and performs no work; use
    push_all_observations instead. The previous implementation was placed
    after the unconditional raise and could never execute, so it has been
    removed.

    Args:
        tab_log (streamlit.container): The container to log messages to.
            Unused; kept so existing call sites keep the same signature.

    Raises:
        DeprecationWarning: always.
    """
    raise DeprecationWarning("This function is deprecated. Use push_all_observations instead.")