Dean
/
dvc-streamlit-example
mirror of https://github.com/sicara/dvc-streamlit-example.git


  
1

	
2

	
3

	
4

	
5

	
6

	
7

	
8

	
9

	
10

	
11

	
12

	
13

	
14

	
15

	
16

	
17

	
18

	
19

	
20

	
21

	
22

	
23

	
24

	
25

	
26

	
27

	
28

	
29

	
30

	
31

	
32

	
33

	
34

	
35

	
36

	
37

	
38

	
39

	
40

	
41

	
42

	
43

	
44

	
45

	
46

	
47

	
48

	
49

	
50

	
51

	
52

	
53

	
54

	
55

	
56

	
57

	
58

	
59

	
60

	
61

	
62

	
63

	
64

	
65

	
66

	
67

	
68

	
69

	
70

	
71

	
72

	
73

	
74

	
75

	
76

	
77

	
78

	
79

	
80

	
81

	
82

	
83

	
84

	
85

	
86

	
87

	
88

	
89

	
            import json

import dvc.api
import pandas as pd
import streamlit as st

from scripts.params import EVALUATION_DIR
from st_scripts.st_utils import st_model_selectbox, MODELS_PARAMETERS, REPO


# Load the Vega-Lite confusion-matrix definition once at import time; its
# "spec" entry is what gets passed to st.vega_lite_chart further down.
# NOTE: the path is relative to the current working directory, so the app has
# to be launched from the directory that contains ``st_scripts``.
# JSON is read explicitly as UTF-8 so parsing does not depend on the
# platform's default text encoding.
with open("./st_scripts/vega_graphs/confusion_matrix.json", encoding="utf-8") as file:
    VEGA_CONFUSION_MATRIX = json.load(file)


@st.cache
def load_predictions(model_rev: str) -> pd.DataFrame:
    """Return the predictions CSV stored for the given model revision.

    The file ``predictions.csv`` under ``EVALUATION_DIR`` is opened through
    ``dvc.api.open`` at revision ``model_rev`` and parsed with pandas. The
    function is wrapped in ``st.cache``.

    Args:
        model_rev: Revision passed to ``dvc.api.open`` as ``rev``.

    Returns:
        The parsed CSV content as a DataFrame.
    """
    predictions_path = EVALUATION_DIR / "predictions.csv"
    with dvc.api.open(predictions_path, rev=model_rev) as predictions_file:
        predictions = pd.read_csv(predictions_file)
    return predictions


def st_evaluate_single_model():
    """Render the Streamlit page that explores a single model's predictions.

    For the model revision chosen through ``st_model_selectbox`` the page shows:

    * the commit information and the model parameters,
    * the accuracy and a confusion-matrix chart computed at the threshold
      picked with the sidebar slider,
    * a gallery of the images listed in the predictions, filtered by the
      true / predicted label checkboxes.

    The function takes no arguments and returns nothing; its effect is the
    widgets and elements it writes to the Streamlit app.
    """
    st.markdown("### Explore Performance on the Test Set")

    selected_model_rev = st_model_selectbox()
    threshold = st.sidebar.slider("Choose model threshold", 0.0, 1.0, value=0.5)

    model_parameters = MODELS_PARAMETERS[selected_model_rev]
    model_commit = REPO.commit(selected_model_rev)

    st.write("Commit information:", model_commit)
    st.json({
        "message": model_commit.message,
        "committed_datetime": str(model_commit.committed_datetime),
        "committer": str(model_commit.committer),
    })

    st.text("Model parameters:")
    st.json(model_parameters)

    st.markdown("## Metrics")
    # Turn the raw score into a label: rows whose prediction is strictly below
    # the threshold are labelled "cats", every other row is labelled "dogs".
    predictions = (
        load_predictions(model_rev=selected_model_rev)
        .assign(predicted_label=lambda df: (
            pd.Series("cats", index=df.index).where(df.prediction < threshold, other="dogs")
        ))
    )

    accuracy = (predictions.true_label == predictions.predicted_label).mean()
    st.write("Accuracy (%):", round(100 * accuracy, 2))

    st.vega_lite_chart(predictions, VEGA_CONFUSION_MATRIX["spec"])

    st.markdown("## Images")

    # Selector layout: column 2 holds the row captions, columns 3 and 4 hold
    # the "cats" / "dogs" checkboxes for the true and predicted labels.
    images_selector_columns = st.columns(5)
    with images_selector_columns[2]:
        st.write("True label")
        st.write("Predicted label")
    with images_selector_columns[3]:
        show_true_cats_images = st.checkbox(label="cats", key="true_cats_images", value=False)
        show_predicted_cats_images = st.checkbox(label="cats", key="predicted_cats_images", value=True)
    with images_selector_columns[4]:
        show_true_dogs_images = st.checkbox(label="dogs", key="true_dogs_images", value=True)
        # Every widget needs its own key: reusing "predicted_cats_images" here
        # would clash with the predicted-cats checkbox above.
        show_predicted_dogs_images = st.checkbox(label="dogs", key="predicted_dogs_images", value=False)

    selected_true_labels = [
        label
        for label, is_shown in (("cats", show_true_cats_images), ("dogs", show_true_dogs_images))
        if is_shown
    ]
    selected_predicted_labels = [
        label
        for label, is_shown in (("cats", show_predicted_cats_images), ("dogs", show_predicted_dogs_images))
        if is_shown
    ]

    # Keep only the rows matching both the true-label and predicted-label picks.
    selected_predictions = predictions[
        predictions.true_label.isin(selected_true_labels)
        & predictions.predicted_label.isin(selected_predicted_labels)
    ]

    with images_selector_columns[0]:
        st.write("Selected images:", len(selected_predictions))

    images_columns = st.columns(4)

    # Distribute the selected images round-robin over the gallery columns.
    for idx, (_, row) in enumerate(selected_predictions.iterrows()):
        images_columns[idx % len(images_columns)].image(
            row["image_path"],
            caption=f"true={row['true_label']}, predicted={row['predicted_label']}, pred={row['prediction']:.3f}",
        )