import gradio as gr
import os
import io
import png
import tensorflow as tf
import tensorflow_text as tf_text  # noqa: F401 -- registers the custom ops required by the BERT preprocessor
import tensorflow_hub as tf_hub
import numpy as np
from PIL import Image
from huggingface_hub import snapshot_download
from sklearn.metrics.pairwise import cosine_similarity
import traceback
import time
# --- Configuration ---
MODEL_REPO_ID = "google/cxr-foundation"
MODEL_DOWNLOAD_DIR = './hf_cxr_foundation_space'
SIMILARITY_DIFFERENCE_THRESHOLD = 0.1
POSITIVE_SIMILARITY_THRESHOLD = 0.1
print(f"Usando umbrales: Comp Δ={SIMILARITY_DIFFERENCE_THRESHOLD}, Simp τ={POSITIVE_SIMILARITY_THRESHOLD}")
# Improved default prompts
criteria_list_positive = [
"optimal centering mediastinum",
"deep inspiration",
"adequate penetration",
"complete lung fields",
"scapulae retracted outside lungs",
"sharp contrast",
"artifact-free image"
]
criteria_list_negative = [
"poor centering",
"shallow inspiration",
"overexposed image",
"underexposed image",
"cropped lung fields",
"scapular overlay on lungs",
"blurred image with artifacts"
]
# --- Helper Functions ---
def bert_tokenize(text, preprocessor):
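    """Tokenize `text` with the BERT preprocessor into (ids, paddings), each shaped (1, 1, 128)."""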
if preprocessor is None:
raise ValueError("BERT preprocessor no está cargado.")
text = str(text).lower()
out = preprocessor(tf.constant([text]))
ids = out['input_word_ids'].numpy().astype(np.int32)
masks = out['input_mask'].numpy().astype(np.float32)
paddings = 1.0 - masks
    # Zero out the [SEP] end-of-sequence token (id 102) and mark it as padding
end_token_idx = (ids == 102)
ids[end_token_idx] = 0
paddings[end_token_idx] = 1.0
    # Ensure shape (1, 1, 128)
if ids.ndim == 2: ids = np.expand_dims(ids, 1)
if paddings.ndim == 2: paddings = np.expand_dims(paddings, 1)
return ids, paddings
def png_to_tfexample(image_array: np.ndarray) -> tf.train.Example:
    """Convert a 2-D NumPy array into a tf.train.Example holding a PNG-encoded image."""
if image_array.ndim == 3 and image_array.shape[2] == 1:
image_array = np.squeeze(image_array, axis=2)
elif image_array.ndim != 2:
        raise ValueError(f'Array must be 2-D. Got ndim={image_array.ndim}')
image = image_array.astype(np.float32)
    min_val, max_val = image.min(), image.max()
    if max_val <= min_val:
        # Constant image: keep it as-is at the matching bit depth
        if image_array.dtype == np.uint8 or (min_val >= 0 and max_val <= 255):
            pixel_array = image.astype(np.uint8)
            bitdepth = 8
        else:
            pixel_array = np.zeros_like(image, dtype=np.uint16)
            bitdepth = 16
    else:
        # Rescale to the full dynamic range of the target bit depth
        image -= min_val
        current_max = max_val - min_val
        if image_array.dtype != np.uint8:
            image *= 65535 / current_max
            pixel_array = image.astype(np.uint16)
            bitdepth = 16
        else:
            image *= 255 / current_max
            pixel_array = image.astype(np.uint8)
            bitdepth = 8
output = io.BytesIO()
png.Writer(width=pixel_array.shape[1], height=pixel_array.shape[0],
greyscale=True, bitdepth=bitdepth).write(output, pixel_array.tolist())
example = tf.train.Example()
features = example.features.feature
features['image/encoded'].bytes_list.value.append(output.getvalue())
features['image/format'].bytes_list.value.append(b'png')
return example
def generate_image_embedding(img_np, elixrc_infer, qformer_infer):
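    """Encode a grayscale image with ELIXR-C, then project it through the QFormer to a contrastive embedding."""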
if elixrc_infer is None or qformer_infer is None:
raise ValueError("Modelos ELIXR-C o QFormer no cargados.")
try:
serialized = png_to_tfexample(img_np).SerializeToString()
elixrc_out = elixrc_infer(input_example=tf.constant([serialized]))
elixr_emb = elixrc_out['feature_maps_0'].numpy()
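        # Query the QFormer with the ELIXR-C feature maps and a blank text
        # input to obtain the contrastive image embedding.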
q_in = {
'image_feature': elixr_emb.tolist(),
'ids': np.zeros((1,1,128),dtype=np.int32).tolist(),
'paddings': np.ones((1,1,128),dtype=np.float32).tolist(),
}
q_out = qformer_infer(**q_in)
img_emb = q_out['all_contrastive_img_emb'].numpy()
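        # Pool any extra token axes down to a single (1, D) vector for cosine similarity.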
if img_emb.ndim > 2:
img_emb = img_emb.mean(axis=tuple(range(1, img_emb.ndim-1)))
if img_emb.ndim == 1:
img_emb = img_emb[np.newaxis, :]
return img_emb
except Exception as e:
print(f"Error embedding imagen: {e}")
traceback.print_exc()
raise
def calculate_similarities_and_classify(image_embedding, bert_preprocessor, qformer_infer,
criteria_positive, criteria_negative):
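    """Embed each positive/negative prompt pair and score it against the image embedding.

    Returns a dict keyed by positive prompt with both similarities, their
    difference, and PASS/FAIL labels for the comparative (Comp) and simple
    (Simp) tests.
    """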
results = {}
for pos, neg in zip(criteria_positive, criteria_negative):
sim_pos = sim_neg = diff = None
comp = simp = "ERROR"
try:
            # Positive text embedding
ids_p, pad_p = bert_tokenize(pos, bert_preprocessor)
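            # Text-only query: pass a zeroed image_feature of the shape the
            # QFormer expects, (1, 8, 8, 1376).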
inp_p = {'image_feature': np.zeros([1,8,8,1376],dtype=np.float32).tolist(),
'ids': ids_p.tolist(), 'paddings': pad_p.tolist()}
txt_p = qformer_infer(**inp_p)['contrastive_txt_emb'].numpy()
            # Negative text embedding
ids_n, pad_n = bert_tokenize(neg, bert_preprocessor)
inp_n = {'image_feature': np.zeros([1,8,8,1376],dtype=np.float32).tolist(),
'ids': ids_n.tolist(), 'paddings': pad_n.tolist()}
txt_n = qformer_infer(**inp_n)['contrastive_txt_emb'].numpy()
sim_pos = float(cosine_similarity(image_embedding, txt_p.reshape(1,-1))[0][0])
sim_neg = float(cosine_similarity(image_embedding, txt_n.reshape(1,-1))[0][0])
diff = sim_pos - sim_neg
comp = "PASS" if diff > SIMILARITY_DIFFERENCE_THRESHOLD else "FAIL"
simp = "PASS" if sim_pos > POSITIVE_SIMILARITY_THRESHOLD else "FAIL"
except Exception as e:
print(f"Error en criterio '{pos}': {e}")
results[pos] = {
'positive_prompt': pos,
'negative_prompt': neg,
'sim_pos': sim_pos,
'sim_neg': sim_neg,
'difference': diff,
'comp': comp,
'simp': simp
}
return results
# --- Global Model Loading ---
print("--- Starting model load ---")
start_time = time.time()
models_loaded = False
bert_preproc = elixr = qformer = None
try:
hf_token = os.environ.get("HF_TOKEN")
os.makedirs(MODEL_DOWNLOAD_DIR, exist_ok=True)
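    # Fetch only the two SavedModels this app needs: the ELIXR-C image
    # encoder and the ELIXR-B text/QFormer model.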
snapshot_download(repo_id=MODEL_REPO_ID, local_dir=MODEL_DOWNLOAD_DIR,
allow_patterns=['elixr-c-v2-pooled/*','pax-elixr-b-text/*'],
local_dir_use_symlinks=False, token=hf_token)
bert_preproc = tf_hub.KerasLayer("https://tfhub.dev/tensorflow/bert_en_uncased_preprocess/3")
elixr = tf.saved_model.load(os.path.join(MODEL_DOWNLOAD_DIR,'elixr-c-v2-pooled')).signatures['serving_default']
qformer = tf.saved_model.load(os.path.join(MODEL_DOWNLOAD_DIR,'pax-elixr-b-text')).signatures['serving_default']
models_loaded = True
print(f"Modelos cargados en {time.time()-start_time:.2f}s")
except Exception as e:
print("ERROR cargando modelos:", e)
traceback.print_exc()
# --- Main Gradio Function ---
def assess_quality_and_update_ui(image_pil, pos_input, neg_input):
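    """Run the quality assessment and return updates for every output component."""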
if not models_loaded:
raise gr.Error("No se pudieron cargar los modelos.")
if image_pil is None:
        # Returns: welcome visible, results hidden, no image, "N/A" label, empty HTML, empty JSON
return (
gr.update(visible=True),
gr.update(visible=False),
None,
"N/A",
"",
{}
)
    # Parse the prompt lists
pos_list = [l.strip() for l in pos_input.splitlines() if l.strip()]
neg_list = [l.strip() for l in neg_input.splitlines() if l.strip()]
if len(pos_list) != len(neg_list):
raise gr.Error("El número de prompts positivos y negativos debe coincidir.")
    # Image embedding (the model works on a 2-D grayscale array)
img_np = np.array(image_pil.convert('L'))
emb = generate_image_embedding(img_np, elixr, qformer)
    # Compute similarities and classify each criterion
details = calculate_similarities_and_classify(emb, bert_preproc, qformer, pos_list, neg_list)
    # Build the results table HTML
    passed = total = 0
    rows = ""

    def fmt(v):
        # A criterion that errored leaves its scores as None
        return f"{v:.4f}" if v is not None else "N/A"

    for crit, d in details.items():
        total += 1
        if d['comp'] == "PASS":
            passed += 1
        c_style = "color:#22c55e;font-weight:bold;" if d['comp'] == "PASS" else "color:#ef4444;font-weight:bold;"
        s_style = "color:#22c55e;font-weight:bold;" if d['simp'] == "PASS" else "color:#ef4444;font-weight:bold;"
        rows += (
            f"<tr>"
            f"<td>{crit}</td>"
            f"<td>{fmt(d['sim_pos'])}</td>"
            f"<td>{fmt(d['sim_neg'])}</td>"
            f"<td>{fmt(d['difference'])}</td>"
            f"<td style='{c_style}'>{d['comp']}</td>"
            f"<td style='{s_style}'>{d['simp']}</td>"
            f"</tr>"
        )
html = f"""
<table style="width:100%;border-collapse:collapse;">
<thead style="background:#f2f2f2;">
<tr>
<th>Criterion</th><th>Sim (+)</th><th>Sim (-)</th><th>Diff</th>
<th>Assessment (Comp)</th><th>Assessment (Simp)</th>
</tr>
</thead>
<tbody>{rows}</tbody>
</table>
"""
    # Overall quality label
pass_rate = passed/total if total>0 else 0
if pass_rate>=0.85: overall="Excellent"
elif pass_rate>=0.70: overall="Good"
elif pass_rate>=0.50: overall="Fair"
else: overall="Poor"
quality_label = f"{overall} ({passed}/{total} passed)"
    # Return UI updates
return (
gr.update(visible=False),
gr.update(visible=True),
image_pil,
quality_label,
html,
details
)
def reset_ui():
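    """Restore the initial UI state: show the welcome block and clear all outputs."""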
return (
gr.update(visible=True),
gr.update(visible=False),
        None,   # clear input_image
        None,   # clear output_image
        "N/A",  # quality label
        "",     # HTML table
        {}      # JSON details
)
# --- Theme Definition ---
dark_theme = gr.themes.Default(
primary_hue=gr.themes.colors.blue,
secondary_hue=gr.themes.colors.blue,
neutral_hue=gr.themes.colors.gray,
font=[gr.themes.GoogleFont("Inter"), "ui-sans-serif", "system-ui", "sans-serif"],
font_mono=[gr.themes.GoogleFont("JetBrains Mono"), "ui-monospace", "Consolas", "monospace"],
).set(
body_background_fill="#111827",
background_fill_primary="#1f2937",
background_fill_secondary="#374151",
block_background_fill="#1f2937",
body_text_color="#d1d5db",
block_label_text_color="#d1d5db",
block_title_text_color="#ffffff",
border_color_accent="#374151",
border_color_primary="#4b5563",
button_primary_background_fill="*primary_600",
button_primary_text_color="#ffffff",
button_secondary_background_fill="*neutral_700",
button_secondary_text_color="#ffffff",
input_background_fill="#374151",
input_border_color="#4b5563",
shadow_drop="rgba(0,0,0,0.2) 0px 2px 4px",
block_shadow="rgba(0,0,0,0.2) 0px 2px 5px",
)
# --- Gradio Interface ---
with gr.Blocks(theme=dark_theme, title="CXR Quality Assessment") as demo:
    # Header
gr.Markdown("""
# <span style="color: #e5e7eb;">CXR Quality Assessment</span>
<p style="color: #9ca3af;">Evalúa la calidad técnica de radiografías de tórax con AI</p>
""")
    # Editable prompts
with gr.Row():
        positive_prompts_input = gr.Textbox(
            label="Positive Prompts (one per line)",
            value="\n".join(criteria_list_positive),
            lines=7
        )
        negative_prompts_input = gr.Textbox(
            label="Negative Prompts (one per line)",
            value="\n".join(criteria_list_negative),
            lines=7
        )
    # Main content
with gr.Row(equal_height=False):
with gr.Column(scale=1, min_width=300):
gr.Markdown("### 1. Carga de Imagen")
            input_image = gr.Image(type="pil", label="Upload your CXR", height=300)
with gr.Row():
analyze_btn = gr.Button("Analizar", variant="primary")
reset_btn = gr.Button("Reset", variant="secondary")
gr.Markdown("<p style='color:#9ca3af; font-size:0.9em;'>La carga de modelos tarda ~1 min; el análisis ~15–40 s.</p>")
with gr.Column(scale=2):
with gr.Column(visible=True) as welcome_block:
gr.Markdown("### ¡Bienvenido! Sube una radiografía y haz clic en «Analizar».")
with gr.Column(visible=False) as results_block:
gr.Markdown("### 2. Resultados")
with gr.Row():
                    output_image = gr.Image(type="pil", label="Analyzed Image", interactive=False)
with gr.Column():
gr.Markdown("#### Calidad Global")
output_label = gr.Label(value="N/A")
gr.Markdown("#### Evaluación Detallada")
output_html = gr.HTML()
with gr.Accordion("Ver JSON (debug)", open=False):
output_json = gr.JSON()
    # Event wiring
analyze_btn.click(
fn=assess_quality_and_update_ui,
inputs=[input_image, positive_prompts_input, negative_prompts_input],
outputs=[welcome_block, results_block, output_image, output_label, output_html, output_json]
)
reset_btn.click(
fn=reset_ui,
inputs=None,
outputs=[welcome_block, results_block, input_image, output_image, output_label, output_html, output_json]
)
if __name__ == "__main__":
demo.launch(server_name="0.0.0.0", server_port=7860)