Spaces:
Sleeping
Sleeping
File size: 7,608 Bytes
fabc124 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 |
import streamlit as st
from utils import get_data, diseases, metrics_table
from transformers import pipeline
import pandas as pd
import io
import json
from openai import OpenAI
import tensorflow as tf
from transformers import TFAutoModelForSequenceClassification, AutoTokenizer
# Load model
model_name = "Zabihin/Symptom_to_Diagnosis"


@st.cache_resource
def _load_model_and_tokenizer(name: str):
    """Load the sequence-classification model and its tokenizer once.

    Streamlit re-executes this script on every widget interaction; caching
    the loaded objects as a shared resource avoids reloading them on each
    rerun.

    Parameters:
        name (str): Model identifier passed to ``from_pretrained``.
    Returns:
        tuple: ``(model, tokenizer)`` loaded from ``name``.
    """
    loaded_model = TFAutoModelForSequenceClassification.from_pretrained(name)
    loaded_tokenizer = AutoTokenizer.from_pretrained(name)
    return loaded_model, loaded_tokenizer


model, tokenizer = _load_model_and_tokenizer(model_name)
def get_data(file: str):
    """
    Read a JSON file and return the parsed data.

    Parameters:
        file (str): The path to the JSON file to be read.
    Returns:
        dict: The data loaded from the specified JSON file (whatever
        ``json.load`` produces for the document's top-level value).
    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If the file does not contain valid JSON.
    """
    # Decode explicitly as UTF-8 instead of relying on the platform's default
    # encoding, which would misread non-ASCII text on non-UTF-8 locales.
    with open(file, encoding="utf-8") as handle:
        return json.load(handle)
def call_gpt3(api, prompt: str):
    """
    Send a prompt to the OpenAI chat completions endpoint and return the reply.

    Parameters:
        api: The OpenAI API key used to create the client.
        prompt (str): The user message sent after the fixed system message.
    Returns:
        The content of the first choice's message in the response.
    """
    conversation = [
        {"role": "system", "content": "You are a doctor expert in drugs and diseases."},
        {"role": "user", "content": prompt},
    ]
    completion = OpenAI(api_key=api).chat.completions.create(
        model="gpt-3.5-turbo",
        messages=conversation,
    )
    return completion.choices[0].message.content
# Define functions
def get_predictions(text):
    """
    Classify a symptom description and return a probability for every label.

    Parameters:
        text: The symptom description handed to the tokenizer (truncated to
            at most 512 tokens).
    Returns:
        list: ``(label, probability)`` tuples, one per class index, where the
        label comes from ``model.config.id2label`` and the probability is the
        softmax of the model's logits for the first row of the output.
    """
    encoded = tokenizer(text, return_tensors="tf", truncation=True, max_length=512)
    logits = model(encoded).logits
    # Softmax over the last axis turns the logits into per-class probabilities.
    class_probabilities = tf.nn.softmax(logits, axis=-1)[0]
    id_to_label = model.config.id2label
    return [
        (id_to_label[class_id], probability.numpy())
        for class_id, probability in enumerate(class_probabilities)
    ]
def analyze_probabilities(predictions):
    """
    Return the label with the highest probability together with that probability.

    Parameters:
        predictions: Iterable of ``(label, probability)`` pairs.
    Returns:
        tuple: ``(label, probability)`` of the most probable entry. When
        several entries share the highest probability, the first one wins.
    Raises:
        ValueError: If ``predictions`` is empty.
    """
    # A single pass keyed on the probability replaces the previous
    # "find the max, then search for a pair equal to it" approach, which
    # depended on float equality and needed to iterate the input twice.
    best_label, best_probability = max(predictions, key=lambda pair: pair[1])
    return best_label, best_probability
def _collect_symptom_text(symptoms_by_category):
    """Render one sidebar multiselect per category and build the symptom text.

    Parameters:
        symptoms_by_category: Mapping of category name to a sequence of
            entries; ``entry[0]`` is offered as the selectable option and
            ``entry[1]`` is the text appended when that option is selected.
    Returns:
        str: The ``entry[1]`` text of every selected symptom, each followed
        by a newline, in category and selection order.
    """
    lines = []
    for category, entries in symptoms_by_category.items():
        st.sidebar.write(f"### {category}")
        selected = st.sidebar.multiselect(
            f"Select Symptoms in {category}",
            [entry[0] for entry in entries],
        )
        for selected_symptom in selected:
            # First entry whose option matches; empty text if none does.
            description = next(
                (entry[1] for entry in entries if entry[0] == selected_symptom),
                "",
            )
            lines.append(f"{description}\n")
    return "".join(lines)


def _show_drug_information(api, predicted_label):
    """Ask the chat model about ``predicted_label`` and display its answer."""
    gpt3_prompt = f"Please provide a list of medications for {predicted_label}, along with a brief explanation of this disease."
    try:
        gpt3_response = call_gpt3(api, gpt3_prompt)
    except Exception:
        # Any failure of the API call is reported as a warning instead of
        # crashing the page. ``Exception`` (rather than a bare ``except``)
        # lets BaseException subclasses such as KeyboardInterrupt propagate.
        st.warning("Unable to retrieve information using the provided API key. Please try another API key if available.")
    else:
        st.header(f'Information about the **{predicted_label}**')
        st.info('Please note: This information is AI-generated and does not replace professional medical advice.')
        st.write(gpt3_response)


def _show_diagnosis(symptom_text, api):
    """Predict a diagnosis for ``symptom_text`` and display the outcome."""
    predictions = get_predictions(symptom_text)
    predicted_label, probability = analyze_probabilities(predictions)

    # Only report a diagnosis when the model is reasonably confident.
    if probability > 0.6:
        st.success(f"Based on your symptoms, there's a {100 * probability:.2f}% probability that you might have {predicted_label}.")
        if api:
            _show_drug_information(api, predicted_label)
        else:
            st.write('If you want to know more, please enter your api key')
        return

    st.warning("The symptoms you've described do not strongly indicate any of the 22 diseases in our database with a high probability. It's recommended to consult a healthcare professional for a more accurate diagnosis.")
    # Expander to show the list of diseases.
    # NOTE(review): the nesting level of this expander was reconstructed;
    # confirm it belongs in the low-confidence branch.
    with st.expander("Click here to view the list of diseases"):
        for disease in diseases:
            st.write(disease)


def _render_home(symptoms_by_category):
    """Render the "Home" tab: symptom selection, free text and diagnosis."""
    st.header("Symptom Checker and Diagnosis App", divider='violet')
    image_path = "symptom.webp"
    col1, col2 = st.columns(2)
    with col1:
        st.image(image_path, use_column_width='auto')
    with col2:
        # Woman-health-worker emoji written with escapes so the literal
        # survives re-encoding of this file (it was previously mojibake).
        st.subheader("\U0001F469\u200D\u2695\uFE0F Enter your symptoms:")
        st.subheader("get your diagnosis and useful advices")

    input_text = _collect_symptom_text(symptoms_by_category)

    # Show the collected descriptions in an editable text area.
    manual_input = st.text_area("Symptoms", value=input_text, height=200)
    st.warning("If you want to know more, please enter your api key and click on submit: ")
    with st.expander("Click here to enter your api"):
        api = st.text_input("API KEY", value="", type='password')

    # Button to submit and get the predicted label.
    if st.button("Submit"):
        _show_diagnosis(manual_input, api)


def _render_about():
    """Render the "About Us" tab."""
    st.title("GZ-Health")
    st.markdown("**[Zahra ZABIHINPOUR](https://www.linkedin.com/in/zahra-zabihinpour/)**")
    st.markdown("**[Kevin GOUPIL](https://www.linkedin.com/in/kevin-goupil/)**")
    st.markdown(" We are a dynamic duo of data scientists collaborating to enhance our skills and stay at the forefront of the latest developments. With backgrounds in science and experience working with health data, we bring a unique blend of expertise to our data science projects. Our shared passion and commitment drive us to showcase and elevate our capabilities through innovative and impactful initiatives. Join us on this journey of continuous improvement and exploration in the world of data science. ")
    st.markdown(" ")


def _render_model_details():
    """Render the "Model Details & Evaluations" tab."""
    st.subheader("Model Overview:")
    st.write("This model is a fine-tuned adaptation of the bert-base-cased architecture, specifically designed for text classification tasks associated with diagnosing diseases based on symptoms. The primary goal is to scrutinize natural language symptom descriptions and accurately predict one of 22 potential diagnoses.")
    st.subheader("Dataset Information:")
    st.write("The model was trained on the Gretel/symptom_to_diagnosis dataset, which consists of 1,065 symptom descriptions in English, each labeled with one of the 22 possible diagnoses. This dataset focuses on detailed, fine-grained, single-domain diagnosis, making it suitable for tasks requiring nuanced symptom classification. For those interested in utilizing the model, the Symptom Checker and Diagnosis App, or the Inference API, are accessible at [https://huggingface.co/Zabihin/Symptom_to_Diagnosis](https://huggingface.co/Zabihin/Symptom_to_Diagnosis).")
    st.subheader("Model Performance Metrics:")
    # The metrics are stored as a pipe-separated text table.
    metrics_data = pd.read_csv(io.StringIO(metrics_table), sep="|").dropna()
    st.table(metrics_data)


def main():
    """Build the Streamlit page: sidebar navigation plus the selected tab."""
    # Import symptoms data.
    symptoms = get_data('symptomes.json')

    # Create sidebar and pages content.
    tabs = ["Home", "About Us", "Model Details & Evaluations"]
    st.sidebar.header("Welcome to the Symptom checker app ! This app provide diagnosis based on your symptoms. Feel free to try it out !")
    st.sidebar.divider()
    active_tab = st.sidebar.radio("Select Tab", tabs)

    if active_tab == "Home":
        _render_home(symptoms)
    elif active_tab == "About Us":
        _render_about()
    elif active_tab == "Model Details & Evaluations":
        _render_model_details()
if __name__ == "__main__":
    # Build the page only when this file is run as the script entry point,
    # not when it is imported as a module.
    main()
|