# app.py — E.S.T.E.R Clinical Workstation (Hugging Face Space, commit 32126d0)
import streamlit as st
import pandas as pd
import numpy as np
from huggingface_hub import InferenceClient
from pypdf import PdfReader
import io
import time
# --- 1. PROFESSIONAL CONFIGURATION ---
# Wide layout with the sidebar expanded so the tools panel is visible on load.
st.set_page_config(
    page_title="E.S.T.E.R A Clinical Workstation",
    page_icon="๐Ÿฅ",
    layout="wide",
    initial_sidebar_state="expanded",
)
# --- 2. SIDEBAR (TOOLS & UPLOAD) ---
with st.sidebar:
    st.title("๐Ÿฅ Workstation")

    # --- SECURITY: SILENT AUTHENTICATION ---
    # Token comes exclusively from Space secrets; the app refuses to run without it.
    if "HF_TOKEN" in st.secrets:
        hf_token = st.secrets["HF_TOKEN"]
    else:
        st.error("๐Ÿšจ System Error: API Token is missing. Please add HF_TOKEN in Space Settings.")
        st.stop()
    client = InferenceClient(token=hf_token)

    # B. UPLOAD PATIENT FILES
    st.markdown("---")
    st.subheader("๐Ÿ“‚ Patient Records")
    uploaded_files = st.file_uploader(
        "Upload Labs/History (PDF/CSV)", type=["pdf", "csv"], accept_multiple_files=True
    )

    # C. QUICK CALCULATOR
    st.markdown("---")
    with st.expander("๐Ÿงฎ Quick BMI Calc"):
        weight = st.number_input("Weight (kg)", 0.0, 300.0, 70.0)
        height = st.number_input("Height (m)", 0.0, 2.5, 1.75)
        if st.button("Calc BMI"):
            # BUGFIX: the height widget allows 0.0, which previously raised
            # ZeroDivisionError. Validate before dividing.
            if height > 0:
                bmi = weight / (height ** 2)
                st.info(f"BMI: {bmi:.1f}")
            else:
                st.warning("Height must be greater than zero.")

    # D. EXPORT — turn the chat transcript into a SOAP note draft.
    st.markdown("---")
    st.subheader("๐Ÿ“ Documentation")
    if st.button("๐Ÿ“„ Generate SOAP Note", use_container_width=True):
        # Require at least one exchange beyond the initial greeting.
        if "messages" in st.session_state and len(st.session_state.messages) > 1:
            chat_history = "\n".join(f"{m['role']}: {m['content']}" for m in st.session_state.messages)
            prompt = f"""
Act as a Medical Scribe. Convert the following conversation into a professional SOAP Note.
Format:
- SUBJECTIVE: (Symptoms, History)
- OBJECTIVE: (Vitals, Labs - if mentioned)
- ASSESSMENT: (Potential Diagnosis)
- PLAN: (Treatment, Next Steps)
CONVERSATION:
{chat_history}
"""
            try:
                response = client.chat_completion(
                    model="Qwen/Qwen2.5-72B-Instruct",
                    messages=[{"role": "user", "content": prompt}],
                    max_tokens=600,
                    temperature=0.1,
                )
                st.session_state.soap_note = response.choices[0].message.content
            except Exception as e:
                st.error(f"Error generating note: {e}")
        else:
            # BUGFIX: the button previously did nothing at all on an empty
            # chat, leaving the clinician with no feedback.
            st.warning("No conversation to summarize yet.")

    # Show the generated note once available, with a plain-text download.
    if "soap_note" in st.session_state:
        st.text_area("SOAP Draft", st.session_state.soap_note, height=300)
        st.download_button("๐Ÿ’พ Save to EMR", st.session_state.soap_note, "soap_note.txt")

    # E. Reset — wipe the conversation and any drafted note.
    st.markdown("---")
    if st.button("๐Ÿ—‘๏ธ Clear Patient Data", use_container_width=True):
        st.session_state.messages = []
        st.session_state.pop("soap_note", None)
        st.rerun()
# --- 3. DATA PROCESSOR (UPDATED FOR NEW FILES) ---
@st.cache_resource(show_spinner=False)
def process_uploaded_files(uploaded_files):
    """Build the retrieval corpus from bundled CSVs plus user uploads.

    Returns a tuple ``(texts, embeddings, sources)`` — parallel lists of text
    chunks, their embedding matrix, and a human-readable source label per
    chunk — or ``(None, None, None)`` when nothing could be loaded/embedded.
    The corpus is capped at 1500 chunks to bound memory.
    """
    all_texts = []
    source_map = []
    # Internal knowledge base shipped alongside the app.
    base_files = [
        "Cleaned_Data_Lite.csv", "Medical_Terms_Wiki.csv", "Sample_Clinical_Dialogues.csv",
        "doctor_patient_1.csv", "symptoms_diagnosis.csv", "conversation_status.csv",
        "doctor_result.csv", "nurse_data.csv", "medical_intelligence.csv",
        "indian_medicines.csv", "internal_med_qa.csv",
    ]
    for fname in base_files:
        try:
            # Only the first 100 rows per file to keep startup fast.
            df = pd.read_csv(fname, nrows=100)
            # Flatten each row into one whitespace-joined string for retrieval.
            texts = df.astype(str).agg(' '.join, axis=1).tolist()
            all_texts.extend(texts)
            source_map.extend([f"๐Ÿ“š {fname}"] * len(texts))
        except Exception:
            # BUGFIX: was a bare `except:` (also caught SystemExit /
            # KeyboardInterrupt). Best-effort: a missing or corrupt bundled
            # file must not crash the app.
            pass

    # User-uploaded records: PDFs are chunked by character count, CSVs
    # flattened per row. Extension check is case-insensitive.
    if uploaded_files:
        for file in uploaded_files:
            if file.name.lower().endswith('.pdf'):
                try:
                    pdf_reader = PdfReader(file)
                    # BUGFIX: extract_text() can return None for image-only
                    # pages; coalesce to "" so concatenation never raises.
                    text = "".join(
                        (page.extract_text() or "") + "\n" for page in pdf_reader.pages
                    )
                    chunks = [text[i:i + 1000] for i in range(0, len(text), 1000)]
                    all_texts.extend(chunks)
                    source_map.extend([f"๐Ÿ“„ {file.name}"] * len(chunks))
                except Exception:
                    pass
            elif file.name.lower().endswith('.csv'):
                try:
                    df = pd.read_csv(file)
                    texts = df.astype(str).agg(' '.join, axis=1).tolist()
                    all_texts.extend(texts)
                    source_map.extend([f"๐Ÿ“Š {file.name}"] * len(texts))
                except Exception:
                    pass

    if not all_texts:
        return None, None, None
    try:
        # Vectorize remotely; truncate to 1500 chunks to prevent memory crash.
        embeddings = client.feature_extraction(
            all_texts[:1500], model="sentence-transformers/all-MiniLM-L6-v2"
        )
        return all_texts[:1500], np.array(embeddings), source_map[:1500]
    except Exception:
        # Embedding-service failure degrades gracefully to "no corpus".
        return None, None, None
# Build the retrieval corpus once per upload set (cached).
docs, doc_embeddings, doc_sources = process_uploaded_files(uploaded_files)

# --- 4. MAIN INTERFACE ---
st.title("๐Ÿฉบ E.S.T.E.R for Clinical Support")

# Seed the conversation with a greeting on first load.
if "messages" not in st.session_state:
    st.session_state.messages = [
        {"role": "assistant", "content": "Medical Systems Online. Accessing Global Database... Ready."}
    ]

# QUICK ACTION BUTTONS — each one injects a canned clinical query.
action = None
col1, col2, col3, col4 = st.columns(4)
if col1.button("๐Ÿ’Š Dosage"):
    action = "What is the standard dosage for this condition?"
if col2.button("โš ๏ธ Side Effects"):
    action = "List common side effects and contraindications."
if col3.button("๐Ÿ”„ Interactions"):
    action = "Are there any drug interactions I should know about?"
if col4.button("๐Ÿ“‹ Protocol"):
    action = "Outline the standard treatment protocol."

# Replay the conversation so far.
for msg in st.session_state.messages:
    with st.chat_message(msg["role"]):
        st.markdown(msg["content"])

# INPUT LOGIC — a pressed quick-action overrides the free-text box.
prompt = st.chat_input("Enter clinical query...")
if action:
    prompt = action
if prompt:
    # Record and echo the user turn.
    st.session_state.messages.append({"role": "user", "content": prompt})
    with st.chat_message("user"):
        st.markdown(prompt)

    # Retrieval: embed the query and pick the single best-matching chunk.
    context_text = "General medical guidelines."
    source_file = "AI Knowledge Base"
    if doc_embeddings is not None:
        try:
            query_vec = np.array(
                client.feature_extraction([prompt], model="sentence-transformers/all-MiniLM-L6-v2")
            )[0]
            scores = np.dot(doc_embeddings, query_vec)
            best_idx = int(np.argmax(scores))
            # Similarity threshold: below it, fall back to the generic context.
            if scores[best_idx] > 0.25:
                context_text = docs[best_idx]
                source_file = doc_sources[best_idx]
        except Exception:
            # BUGFIX: was a bare `except:`. Retrieval is best-effort; any
            # failure falls back to the generic context.
            pass

    # Generate the assistant reply as a token stream.
    with st.chat_message("assistant"):
        message_placeholder = st.empty()
        full_response = ""
        system_prompt = f"""
TASK: You are a strict Medical Assistant.
RULES:
1. ONLY answer clinical, pharmaceutical, or biological questions.
2. If the user asks for essays, poems, code, or general chat, REFUSE politely.
3. Say: "I am a Clinical AI. I cannot help with non-medical tasks."
4. your name is E.S.T.E.R : Electronic Specialist for Technical Examining & Reporting.
CONTEXT ({source_file}): {context_text}
"""
        try:
            stream = client.chat_completion(
                model="Qwen/Qwen2.5-72B-Instruct",
                messages=[
                    {"role": "system", "content": system_prompt},
                    {"role": "user", "content": prompt},
                ],
                max_tokens=400,
                stream=True,
                temperature=0.1,
            )
            for chunk in stream:
                if chunk.choices and chunk.choices[0].delta.content:
                    full_response += chunk.choices[0].delta.content
                    message_placeholder.markdown(full_response + "โ–Œ")
            message_placeholder.markdown(full_response)
            # Citation expander for retrieved context (skipped for the
            # generic fallback, which has no source document).
            if source_file != "AI Knowledge Base":
                with st.expander(f"๐Ÿ“š Source: {source_file}"):
                    st.info(context_text[:500] + "...")
        except Exception as e:
            st.error(f"Error: {e}")

    # BUGFIX: only record the assistant turn when something was generated;
    # previously a failed call appended an empty message to the history.
    if full_response:
        st.session_state.messages.append({"role": "assistant", "content": full_response})