Newer
Older
# Page bootstrap for the prediction page: star imports, Streamlit page
# configuration, header, column layout, file uploader and export constants.
from Packages import *
# Page configuration is issued between the star imports.
# NOTE(review): presumably kept here so it runs before any other Streamlit
# command triggered by the imports below - confirm before reordering.
st.set_page_config(page_title="NIRS Utils", page_icon=":goat:", layout="wide")
from Modules import *
from Class_Mod.DATA_HANDLING import *
# HTML for the "CEFE - CNRS" banner (disabled; the live code calls add_header() below)
# bandeau_html = """
# <div style="width: 100%; background-color: #4682B4; padding: 10px; margin-bottom: 10px;">
# <h1 style="text-align: center; color: white;">CEFE - CNRS</h1>
# </div>
# """
# # Inject the banner HTML
# st.markdown(bandeau_html, unsafe_allow_html=True)
# add_header is not defined in the visible lines (presumably provided by one
# of the star imports above).
add_header()
# Re-store the current 'interface' value (None when the key is absent) so the
# key exists in the session state.
st.session_state["interface"] = st.session_state.get('interface')
# Two rows of 2:1 columns: M1/M2 are created before the "Data preprocessing"
# header, M3/M4 after it.
M1, M2= st.columns([2, 1])
st.header('Data preprocessing', divider='blue')
M3, M4= st.columns([2, 1])
# Uploader for the spectra to predict; accepted extensions come from
# files_format, which is defined outside the visible lines.
file = M2.file_uploader("Select NIRS Data to predict", type = files_format, help=" :mushroom: select a csv matrix with samples as rows and lambdas as columns")
# Destination folder and file-name prefix of the exported predictions; the
# prefix is extended further down with the data file name and the model name.
export_folder = './data/predictions/'
export_name = 'Predictions_of_'
# NOTE(review): reg_algo is not used anywhere in the visible lines.
reg_algo = ["Interval-PLS"]
if file:
test = file.name[file.name.find('.'):]
export_name += file.name[:file.name.find('.')]
# Format-specific loading of the uploaded spectra.
# NOTE(review): chem_data, spectra and the `if` matching the `else` further
# down are not defined in the visible lines - the statements that read the
# file appear to be missing from this section.
if test == files_format[0]:
#
# CSV separator chooser. The label and the pre-selected option both come from
# find_delimiter() applied to 'data/' + the uploaded file name; list.index()
# raises ValueError when the detected value is neither ";" nor ",".
# NOTE(review): the helper is evaluated twice with the same argument.
qsep = M2.selectbox("Select csv separator - _detected_: " + str(find_delimiter('data/'+file.name)), options=[";", ","], index=[";", ","].index(str(find_delimiter('data/'+file.name))), key=2)
# Same pattern for the "is there an index column" choice, driven by
# find_col_index(); the detected value must be "no" or "yes".
qhdr = M2.selectbox("indexes column in csv? - _detected_: " + str(find_col_index('data/'+file.name)), options=["no", "yes"], index=["no", "yes"].index(str(find_col_index('data/'+file.name))), key=3)
elif test == files_format[1]:
# Copy the uploaded bytes into a named temporary ".dx" file and remember its
# path. delete=False keeps the file on disk after the `with` block; no
# removal of the file is visible in this section.
with NamedTemporaryFile(delete=False, suffix=".dx") as tmp:
tmp.write(file.read())
tmp_path = tmp.name
M2.success("The data have been loaded successfully", icon="✅")
# Target column chooser, then a boolean mask of the rows whose target value
# equals 0; y and pred_data keep only those rows.
# NOTE(review): the mask is named `measured` but selects values == 0 -
# confirm that 0 is the intended marker.
yname = M2.selectbox('Select target', options=chem_data.columns)
measured = chem_data.loc[:,yname] == 0
y = chem_data.loc[:,yname].loc[measured]
pred_data = spectra.loc[measured]
else:
# Fallback: predict on every spectrum.
pred_data = spectra
# Plot of the spectra selected for prediction.
# NOTE(review): yunits receives the literal text "meta_data.loc[:,'yunits'][0]"
# (a string, not the evaluated expression), and `fig` is not rendered in the
# visible lines.
fig = plot_spectra(pred_data, xunits = 'lab', yunits = "meta_data.loc[:,'yunits'][0]")
### preprocessing
# Applies the stored preprocessing to the spectra and plots the result.
# NOTE(review): this binds the DataFrame class itself, not an empty instance
# (no call parentheses) - confirm whether pd.DataFrame() was intended.
preprocessed = pd.DataFrame
if not pred_data.empty:
# Uploader for the JSON file holding the preprocessing parameters.
params = M4.file_uploader("Load preprocessings params", type = '.json', help=" .json file")
# NOTE(review): the four lines below are the trailing keyword arguments of a
# call whose opening is not visible in this section; `prep` is not defined
# here either. The argument names match scipy.signal.savgol_filter -
# presumably that call, producing x2; TODO confirm.
window_length = prep["window_length"],
polyorder = prep["polyorder"],
deriv=prep["deriv"],
delta=1.0, axis=-1, mode="interp", cval=0.0)
# Wrap the filtered values (x2, produced outside the visible lines) in a
# DataFrame that reuses the index and columns of pred_data.
preprocessed = pd.DataFrame(x2, index = pred_data.index, columns = pred_data.columns)
################################################################################################
# Plot the preprocessed spectra in column M3. As above, yunits is passed as a
# literal string rather than an evaluated expression.
fig2 = plot_spectra(preprocessed, xunits = 'lab', yunits = "meta_data.loc[:,'yunits'][0]")
M3.pyplot(fig2)
# Text summary of the applied preprocessing, written to column M4.
# The f-strings use double quotes as delimiters so that the single-quoted
# dictionary keys inside the replacement fields also parse on interpreters
# older than Python 3.12, where reusing the delimiter quote is a SyntaxError.
# The backslash before ':' is written as an explicit "\\" because "\:" is
# not a valid escape sequence; the emitted text is unchanged (backslash
# followed by a colon).
# NOTE(review): the backslash presumably stops the Markdown renderer from
# treating the colon specially - confirm.
SG = f"- Savitzky-Golay derivative parameters \\:(Window_length:{prep['window_length']}; polynomial order: {prep['polyorder']}; Derivative order : {prep['deriv']})"
Norm = f"- Spectral Normalization \\: {norm}"
M4.write('The spectra were preprocessed using:\n'+SG+"\n"+Norm)
################### Predictions making ##########################
# Lets the user pick a stored model, loads it and predicts on the spectra.
# M5 is not defined in the visible lines (presumably a column created in a
# part of the file not shown here).
if not pred_data.empty:# Load the model with joblib
#dir = os.listdir('data/models/')[1:]
# Every entry of data/models/ is offered as a candidate model.
# NOTE(review): `dir` shadows the built-in of the same name.
dir = os.listdir('data/models/')
model_name = M5.selectbox("Select your model from the dropdown list:", options = dir, key = 21)
if model_name and model_name !='':
# Append the model name, cut at its FIRST dot, to the export file name.
export_name += '_with_' + model_name[:model_name.find('.')]
# NOTE(review): joblib.load unpickles the file, which can execute arbitrary
# code - only trusted model files should be placed in data/models/.
with open('data/models/'+ model_name,'rb') as f:
loaded_model = joblib.load(f)
if loaded_model:
M5.success("The model has been loaded successfully", icon="✅")
# Checkbox telling whether the model was fitted on selected intervals only.
s = M5.checkbox('the model is of ipls type?')
# CSV of wavelength intervals: ';'-separated, first column used as index.
# NOTE(review): with the nesting lost in this section it cannot be told
# whether read_csv is guarded; the uploader yields no file until the user
# provides one - confirm this only runs once `index` is set.
index = M5.file_uploader("select wavelengths index file", type="csv")
intervalls = pd.read_csv(index, sep=';', index_col=0).to_numpy()
# Expand every row (start, end) into the inclusive range start..end and
# collect all resulting positions.
idx = []
for i in range(intervalls.shape[0]):
idx.extend(np.arange(intervalls[i,0], intervalls[i,1]+1))
if s:
# Interval model: predict on the selected column positions of the
# preprocessed spectra.
result = loaded_model.predict(preprocessed.iloc[:,idx])
else:
# use prediction function from application_functions.py to predict chemical values
# NOTE(review): the call below is the model's own predict() on x2.
result = loaded_model.predict(x2)
# Predictions as a DataFrame sharing the index of pred_data.
result = pd.DataFrame(result, index = pred_data.index)
#############################
# Histogram of the predicted values plus the table of predictions.
# NOTE(review): `axs`, `colors`, `plt` and `M6` are not defined in the visible
# lines; the figure/axes creation appears to be missing from this section.
axs.grid( color ='grey', linestyle ='-.', linewidth = 0.5, alpha = 0.6)
# Remove axes splines
# NOTE(review): this loop rebinds `s`, which held the checkbox value above.
for s in ['top', 'bottom', 'left', 'right']:
axs.spines[s].set_visible(False)
# Remove x, y ticks
axs.xaxis.set_ticks_position('none')
axs.yaxis.set_ticks_position('none')
# Add padding between axes and labels
axs.xaxis.set_tick_params(pad = 5)
axs.yaxis.set_tick_params(pad = 10)
# Creating histogram
# 12 bins; N holds the per-bin counts and patches the drawn bars.
N, bins, patches = axs.hist(result, bins = 12)
# Setting color
# Per-bin colour value: fifth root of the count divided by the largest count,
# rescaled to the observed min..max range and mapped through viridis.
fracs = ((N**(1 / 5)) / N.max())
norm = colors.Normalize(fracs.min(), fracs.max())
for thisfrac, thispatch in zip(fracs, patches):
color = plt.cm.viridis(norm(thisfrac))
thispatch.set_facecolor(color)
# NOTE(review): in the visible lines `fig` was last assigned by the first
# plot_spectra call; presumably it is re-created together with `axs` in the
# missing lines - confirm the histogram figure is the one rendered here.
M5.pyplot(fig)
M6.write('Predicted values table')
# The table is shown transposed.
M6.dataframe(result.T)
##################################
# Write the predictions to export_folder/export_name.csv using ';' as the
# field separator.
result.to_csv(export_folder + export_name + '.csv', sep = ';')
# export to local drive - Download
# download_results is not defined in the visible lines; it receives the path
# of the file just written and the file name to offer.
download_results(export_folder + export_name + '.csv', export_name + '.csv')
# create a report with information on the prediction