Spaces:

Saving-Willy
/

saving-willy-dev

Sleeping

saving-willy-dev / src /classifier /classifier_image.py

rmm

feat: first implementation of an FSM to keep track of phase

d7725f6 10 months ago

7.89 kB

	import streamlit as st
	import logging

	# Module-wide logger, named after this module via __name__.
	# LOG_LEVEL is the threshold applied to it below (currently DEBUG).
	LOG_LEVEL = logging.DEBUG
	g_logger = logging.getLogger(__name__)
	g_logger.setLevel(LOG_LEVEL)

	import whale_viewer as viewer
	from hf_push_observations import push_observations
	from utils.grid_maker import gridder
	from utils.metadata_handler import metadata2md

	# We need to divide this into two functions: one for the classification and one for the display.
	# The two concerns are currently somewhat interleaved, and it is not totally clear how to separate them.
	# Perhaps there are more stages than I realised:
	# ML started, ML completed, manual review completed, data uploaded.

	# for now, let's implement the division between ML classification, and display+manual review.

	def cetacean_classify_list(cetacean_classifier):
	    """Classify every uploaded image and persist the results in session state.

	    For each entry of ``st.session_state.files`` the image stored under the
	    file's name is passed to ``cetacean_classifier``. Per file name, the
	    function then:

	    * stores the first prediction in ``st.session_state.whale_prediction1``,
	    * sets the ``st.session_state.classify_whale_done`` flag to ``True``,
	    * hands a copy of all predictions to the matching observation through
	      ``set_top_predictions``,
	    * stores the observation's dict form in
	      ``st.session_state.public_observation``.

	    When the loop is finished ``st.balloons()`` is shown.

	    Args:
	        cetacean_classifier: callable invoked with a single image; its result
	            is indexed with ``'predictions'``.

	    Returns:
	        Always ``True``; no failure detection is implemented yet.
	    """
	    state = st.session_state
	    files = state.files
	    images = state.images
	    observations = state.observations

	    for file in files:
	        key = file.name
	        picture = images[key]

	        # The dict form is captured *before* set_top_predictions() is called
	        # below; whether it reflects the predictions depends on to_dict()
	        # -- TODO confirm.
	        observation = observations[key].to_dict()

	        # Run the model on this image and keep the output persistently.
	        predictions = cetacean_classifier(picture)['predictions']  # top matches
	        state.whale_prediction1[key] = predictions[0]
	        state.classify_whale_done[key] = True  # TODO 25.01 unclear what this is for;
	        g_logger.info(
	            f"[D]2 classify_whale_done: {st.session_state.classify_whale_done[key]}, whale_prediction1: {st.session_state.whale_prediction1[key]}"
	        )

	        observations[key].set_top_predictions(predictions[:])
	        state.public_observation[key] = observation

	        report = f"[D] full observation after inference: {observation}"
	        g_logger.debug(report)
	        print(report)

	    # TODO: add some mech to test if it was successful.
	    st.balloons()
	    return True

	def cetacean_show_classifications():
	    """Render the review grid for classification results already in session state.

	    Files are laid out across ``st.columns(row_size)``, where ``row_size`` is
	    the second value returned by ``gridder``. For each file the column shows:

	    * the image,
	    * a species selectbox, preselected to the stored first prediction when
	      the file's ``classify_whale_done`` flag is set, or disabled with a
	      placeholder otherwise,
	    * an upload button wired to ``push_observations``,
	    * the markdown returned by ``metadata2md()``,
	    * one ``viewer.display_whale`` call per entry of the observation's
	      ``top_predictions``.

	    The chosen species is written to the observation dict as
	    ``predicted_class``, and additionally as ``class_overriden`` when it
	    differs from the stored first prediction.

	    Returns:
	        Always ``True``.
	    """
	    st.write("TOP TEXT")
	    st.write("Reviewing the classifications :construction:")

	    state = st.session_state
	    files = state.files
	    images = state.images
	    observations = state.observations

	    # Only the row width from gridder() is needed here.
	    _, row_size, _ = gridder(files)
	    columns = st.columns(row_size)
	    slot = 0

	    for file in files:
	        key = file.name
	        picture = images[key]

	        with columns[slot]:
	            st.image(picture, use_column_width=True)
	            observation = observations[key].to_dict()

	            # Results are only fetched from session state here; the model is
	            # not run in this function.
	            g_logger.info(
	                f"[D]2b classify_whale_done ({file}): {st.session_state.classify_whale_done[key]}, whale_prediction1: {st.session_state.whale_prediction1[key]}"
	            )

	            # Dropdown for selecting/overriding the species prediction.
	            # TODO: the "it's done" flag seems to get reset when we re-load the tab. Not quite right.
	            if state.classify_whale_done[key]:
	                pred1 = state.whale_prediction1[key]
	                print(f"[D] pred1: {pred1}")
	                # Preselect the prediction when it is a known class,
	                # otherwise leave the box without a selection.
	                if pred1 in viewer.WHALE_CLASSES:
	                    preselect = viewer.WHALE_CLASSES.index(pred1)
	                else:
	                    preselect = None
	                choice = st.selectbox(
	                    f"Species for {file.name}",
	                    viewer.WHALE_CLASSES,
	                    index=preselect,
	                )
	            else:
	                # TODO: ask LV why it is in the sidebar, and not in the grid
	                choice = st.selectbox(
	                    "Species",
	                    viewer.WHALE_CLASSES,
	                    index=None,
	                    placeholder="Species not yet identified...",
	                    disabled=True,
	                    key=f"cldd_{key}",
	                )

	            observation['predicted_class'] = choice
	            if choice != state.whale_prediction1[key]:
	                observation['class_overriden'] = choice

	            # NOTE(review): this replaces the whole `public_observation` entry
	            # on every iteration, whereas cetacean_classify_list stores into
	            # it per file name -- confirm which shape the consumers expect.
	            state.public_observation = observation
	            st.button(
	                f"Upload observation for {file.name} to THE INTERNET!",
	                on_click=push_observations,
	            )
	            # TODO: the metadata only fills properly if `validate` was clicked.
	            st.markdown(metadata2md())

	            report = f"[D] full observation after inference: {observation}"
	            g_logger.debug(report)
	            print(report)
	            # TODO: add a link to more info on the model, next to the button.

	            # Render an image for each stored top prediction.
	            top_preds = observations[key].top_predictions
	            n = len(top_preds)
	            st.markdown(f"Top {n} Predictions for {file.name}")
	            for rank in range(n):
	                viewer.display_whale(top_preds, rank)

	        # Advance to the next column, wrapping at the row width.
	        slot = (slot + 1) % row_size

	    return True


	def cetacean_classify_and_review(cetacean_classifier):
	    """Classify each uploaded image and render its review widgets in one pass.

	    Files from ``st.session_state.files`` are laid out across
	    ``st.columns(row_size)``, where ``row_size`` is the second value returned
	    by ``gridder``. For each file the function shows the image, runs
	    ``cetacean_classifier`` on it, offers a species selectbox preselected to
	    the first prediction, adds an upload button wired to
	    ``push_observations``, prints the markdown from ``metadata2md()``, and
	    calls ``viewer.display_whale`` once per returned prediction.

	    The chosen species is written to the observation dict as
	    ``predicted_class``, and additionally as ``class_overriden`` when it
	    differs from the first prediction. The observation dict is then stored
	    in ``st.session_state.public_observation``.

	    Args:
	        cetacean_classifier: callable invoked with a single image; its result
	            is indexed with ``'predictions'``.

	    Returns:
	        None.
	    """
	    files = st.session_state.files
	    images = st.session_state.images
	    observations = st.session_state.observations

	    # Only the row width from gridder() is needed here.
	    _, row_size, _ = gridder(files)

	    grid = st.columns(row_size)
	    col = 0

	    for file in files:
	        image = images[file.name]

	        with grid[col]:
	            st.image(image, use_column_width=True)
	            observation = observations[file.name].to_dict()

	            # Run the classifier on `image` and persistently store the output.
	            out = cetacean_classifier(image)  # get top matches
	            pred1 = out['predictions'][0]
	            # NOTE(review): the other functions in this module index
	            # `whale_prediction1` / `classify_whale_done` by file name; here
	            # they are assigned as plain values and overwritten on every
	            # iteration -- confirm which shape the rest of the app expects.
	            st.session_state.whale_prediction1 = pred1
	            st.session_state.classify_whale_done = True
	            msg = f"[D]2 classify_whale_done: {st.session_state.classify_whale_done}, whale_prediction1: {st.session_state.whale_prediction1}"
	            g_logger.info(msg)

	            # Dropdown for selecting/overriding the species prediction.
	            # Classification has just completed for this image, so the
	            # prediction-backed dropdown is always the one to show.
	            print(f"[D] pred1: {pred1}")
	            # Preselect the prediction when it is a known class, else none.
	            ix = viewer.WHALE_CLASSES.index(pred1) if pred1 in viewer.WHALE_CLASSES else None
	            selected_class = st.selectbox(f"Species for {file.name}", viewer.WHALE_CLASSES, index=ix)

	            observation['predicted_class'] = selected_class
	            if selected_class != pred1:
	                observation['class_overriden'] = selected_class

	            st.session_state.public_observation = observation
	            st.button(f"Upload observation for {file.name} to THE INTERNET!", on_click=push_observations)
	            # TODO: the metadata only fills properly if `validate` was clicked.
	            st.markdown(metadata2md())

	            msg = f"[D] full observation after inference: {observation}"
	            g_logger.debug(msg)
	            print(msg)
	            # TODO: add a link to more info on the model, next to the button.

	            # Render an image for each returned prediction; the heading
	            # reports the actual count rather than assuming three.
	            whale_classes = out['predictions'][:]
	            n = len(whale_classes)
	            st.markdown(f"Top {n} Predictions for {file.name}")
	            for i in range(n):
	                viewer.display_whale(whale_classes, i)

	        # Advance to the next column, wrapping at the row width.
	        col = (col + 1) % row_size