Add statistics for model experiments. Fix dead link in documentation

2026-03-25 21:57:52 +00:00
parent a7f5978f64
commit 77cdd9a01c
2 changed files with 79 additions and 1 deletions
@@ -11,7 +11,7 @@ Final Dissertation Submission Repository
 [See RAGAS_Service](/supporting/RAGAS_Service/)
 ## Agent Refinement
-[See agent](/supporting/agent/)
+[See agent](/agent/)
 ## Generated Database Link and Usage Experiments
 -- todo --
@@ -0,0 +1,78 @@
 from collections import Counter
 from pathlib import Path
 import json
 import streamlit as st
 import pandas as pd
 import matplotlib.pyplot as plt
 THRESH = 0.4
 def page_title() -> str:
    """Return the title string of this page."""
    title = "Statistics 2"
    return title
 def render():
    """Render the "Statistics 2" page: one outcome pie chart per JSONL file.

    Scans ``../../data/refinement`` for ``*.jsonl`` files and, for each file,
    tallies outcome categories (see ``_tally_outcomes``), draws them as a pie
    chart and prints the share of "PERFECT" scores plus the crash count.

    Returns:
        None. All output goes to the Streamlit page.
    """
    st.header("Statistics 2")
    # NOTE: relative path, so it is resolved against the current working
    # directory of the process, not against this file's location.
    path = Path("../../data/refinement")
    if not path.exists() or not path.is_dir():
        st.error("Invalid folder path.")
        return
    jsonl_files = sorted(path.glob("*.jsonl"))
    if not jsonl_files:
        st.info("No .jsonl files found in this folder.")
        return
    for file_path in jsonl_files:
        st.subheader(f"File: {file_path.name}")
        with open(file_path, "r", encoding="utf-8") as f:
            confidence_counter = _tally_outcomes(f, THRESH)
        if not confidence_counter:
            st.info("No score data available in this file.")
            continue
        df_conf = pd.DataFrame(
            list(confidence_counter.items()),
            columns=["Category", "Count"],
        )
        fig, ax = plt.subplots()
        ax.pie(
            df_conf["Count"],
            labels=df_conf["Category"],
            autopct="%1.1f%%",
            startangle=90,
        )
        ax.axis("equal")
        ax.set_title(file_path.name)
        # "Crash" entries are part of the tally, so they count towards total.
        total = sum(confidence_counter.values())
        correct = confidence_counter["PERFECT"]
        crashes = confidence_counter["Crash"]
        corr_percent = (correct / total) * 100
        st.markdown(f"**Correct: {corr_percent:.2f}% ({correct}/{total})**")
        # Value is bound to a local first: reusing the enclosing quote type
        # inside an f-string is a SyntaxError before Python 3.12.
        st.markdown(f"**Crash: {crashes}**")
        # NOTE(review): an integer ``width`` is only accepted by recent
        # Streamlit releases - confirm against the installed version.
        st.pyplot(fig, width=500)
        # pyplot keeps every figure alive until closed; release it so figures
        # do not pile up across files and reruns.
        plt.close(fig)


 def _tally_outcomes(lines, thresh):
    """Count outcome categories over an iterable of JSONL text lines.

    Args:
        lines: Iterable of strings, each expected to hold one JSON object.
        thresh: Scores strictly above this value count as "PERFECT".

    Returns:
        Counter with the keys "Crash" (entries whose "status" is not
        "success"), "BAD-1" (score equal to -1), "PERFECT" and "BAD".
        Lines that are not valid JSON objects and events without a numeric
        "score" are skipped.
    """
    tally = Counter()
    for line in lines:
        try:
            entry = json.loads(line)
        except json.JSONDecodeError:
            continue
        if not isinstance(entry, dict):
            # Valid JSON but not an object (e.g. a list or number): skip it
            # like any other malformed line.
            continue
        if entry.get("status") != "success":
            tally["Crash"] += 1
        # ``or []`` also covers an explicit ``"events": null``.
        for event in entry.get("events") or []:
            if not isinstance(event, dict):
                continue
            score = event.get("score")
            if not isinstance(score, (int, float)):
                # Missing (None) or non-numeric score cannot be classified.
                continue
            if score == -1:
                tally["BAD-1"] += 1
            elif score > thresh:
                tally["PERFECT"] += 1
            else:
                tally["BAD"] += 1
    return tally