From 97fccd073b8e2da1b904e6d27898c7c5dfb9a4dc Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Mon, 16 Mar 2026 16:41:28 +0000 Subject: [PATCH 01/24] feat(emotional): add average emotion & dominant emotion stats --- server/analysis/emotional.py | 91 ++++++++++++++++++++++++++++-------- 1 file changed, 72 insertions(+), 19 deletions(-) diff --git a/server/analysis/emotional.py b/server/analysis/emotional.py index 150aa20..8f78809 100644 --- a/server/analysis/emotional.py +++ b/server/analysis/emotional.py @@ -1,33 +1,86 @@ import pandas as pd + class EmotionalAnalysis: - def avg_emotion_by_topic(self, df: pd.DataFrame) -> dict: - emotion_cols = [ - col for col in df.columns - if col.startswith("emotion_") - ] + def _emotion_cols(self, df: pd.DataFrame) -> list[str]: + return [col for col in df.columns if col.startswith("emotion_")] + + def avg_emotion_by_topic(self, df: pd.DataFrame) -> list[dict]: + emotion_cols = self._emotion_cols(df) + + if not emotion_cols: + return [] counts = ( - df[ - (df["topic"] != "Misc") - ] - .groupby("topic") - .size() - .rename("n") + df[(df["topic"] != "Misc")].groupby("topic").size().reset_index(name="n") ) avg_emotion_by_topic = ( - df[ - (df["topic"] != "Misc") - ] + df[(df["topic"] != "Misc")] .groupby("topic")[emotion_cols] .mean() .reset_index() ) - avg_emotion_by_topic = avg_emotion_by_topic.merge( - counts, - on="topic" - ) + avg_emotion_by_topic = avg_emotion_by_topic.merge(counts, on="topic") - return avg_emotion_by_topic.to_dict(orient='records') \ No newline at end of file + return avg_emotion_by_topic.to_dict(orient="records") + + def overall_emotion_average(self, df: pd.DataFrame) -> list[dict]: + emotion_cols = self._emotion_cols(df) + + if not emotion_cols: + return [] + + means = df[emotion_cols].mean() + return [ + { + "emotion": col.replace("emotion_", ""), + "score": float(means[col]), + } + for col in emotion_cols + ] + + def dominant_emotion_distribution(self, df: pd.DataFrame) -> list[dict]: + emotion_cols = self._emotion_cols(df) + + if not emotion_cols or df.empty: + return [] + + dominant_per_row = df[emotion_cols].idxmax(axis=1) + counts = dominant_per_row.value_counts() + total = max(len(dominant_per_row), 1) + + return [ + { + "emotion": col.replace("emotion_", ""), + "count": int(count), + "ratio": round(float(count / total), 4), + } + for col, count in counts.items() + ] + + def emotion_by_source(self, df: pd.DataFrame) -> list[dict]: + emotion_cols = self._emotion_cols(df) + + if not emotion_cols or "source" not in df.columns or df.empty: + return [] + + source_counts = df.groupby("source").size() + source_means = df.groupby("source")[emotion_cols].mean().reset_index() + rows = source_means.to_dict(orient="records") + output = [] + + for row in rows: + source = row["source"] + dominant_col = max(emotion_cols, key=lambda col: float(row.get(col, 0))) + output.append( + { + "source": str(source), + "dominant_emotion": dominant_col.replace("emotion_", ""), + "dominant_score": round(float(row.get(dominant_col, 0)), 4), + "event_count": int(source_counts.get(source, 0)), + } + ) + + return output From 09a4f9036f67b22a278ff0556a22a44d0093500e Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Mon, 16 Mar 2026 16:43:24 +0000 Subject: [PATCH 02/24] refactor(stats): add summary and user stat classes for consistency --- server/analysis/stat_gen.py | 96 +++++++++++++------------------------ server/analysis/summary.py | 64 +++++++++++++++++++++++++ server/analysis/user.py | 20 ++++++++ 3 files changed, 118 insertions(+), 62 
deletions(-) create mode 100644 server/analysis/summary.py create mode 100644 server/analysis/user.py diff --git a/server/analysis/stat_gen.py b/server/analysis/stat_gen.py index a9e9289..0d1ffc9 100644 --- a/server/analysis/stat_gen.py +++ b/server/analysis/stat_gen.py @@ -6,7 +6,9 @@ from server.analysis.cultural import CulturalAnalysis from server.analysis.emotional import EmotionalAnalysis from server.analysis.interactional import InteractionAnalysis from server.analysis.linguistic import LinguisticAnalysis +from server.analysis.summary import SummaryAnalysis from server.analysis.temporal import TemporalAnalysis +from server.analysis.user import UserAnalysis DOMAIN_STOPWORDS = { "www", @@ -36,12 +38,11 @@ class StatGen: self.interaction_analysis = InteractionAnalysis(EXCLUDE_WORDS) self.linguistic_analysis = LinguisticAnalysis(EXCLUDE_WORDS) self.cultural_analysis = CulturalAnalysis() + self.summary_analysis = SummaryAnalysis() + self.user_analysis = UserAnalysis(self.interaction_analysis) ## Private Methods - def _prepare_filtered_df(self, - df: pd.DataFrame, - filters: dict | None = None - ) -> pd.DataFrame: + def _prepare_filtered_df(self, df: pd.DataFrame, filters: dict | None = None) -> pd.DataFrame: filters = filters or {} filtered_df = df.copy() @@ -51,10 +52,9 @@ class StatGen: data_source_filter = filters.get("data_sources", None) if search_query: - mask = ( - filtered_df["content"].str.contains(search_query, case=False, na=False) - | filtered_df["author"].str.contains(search_query, case=False, na=False) - ) + mask = filtered_df["content"].str.contains( + search_query, case=False, na=False + ) | filtered_df["author"].str.contains(search_query, case=False, na=False) # Only include title if the column exists if "title" in filtered_df.columns: @@ -76,10 +76,10 @@ class StatGen: return filtered_df ## Public Methods - def filter_dataset(self, df: pd.DataFrame, filters: dict | None = None) -> dict: + def filter_dataset(self, df: pd.DataFrame, filters: dict | None = None) -> list[dict]: return self._prepare_filtered_df(df, filters).to_dict(orient="records") - def get_time_analysis(self, df: pd.DataFrame, filters: dict | None = None) -> dict: + def temporal(self, df: pd.DataFrame, filters: dict | None = None) -> dict: filtered_df = self._prepare_filtered_df(df, filters) return { @@ -87,40 +87,43 @@ class StatGen: "weekday_hour_heatmap": self.temporal_analysis.heatmap(filtered_df), } - def get_content_analysis(self, df: pd.DataFrame, filters: dict | None = None) -> dict: + def linguistic(self, df: pd.DataFrame, filters: dict | None = None) -> dict: filtered_df = self._prepare_filtered_df(df, filters) return { "word_frequencies": self.linguistic_analysis.word_frequencies(filtered_df), "common_two_phrases": self.linguistic_analysis.ngrams(filtered_df), "common_three_phrases": self.linguistic_analysis.ngrams(filtered_df, n=3), - "average_emotion_by_topic": self.emotional_analysis.avg_emotion_by_topic( - filtered_df - ) } - def get_user_analysis(self, df: pd.DataFrame, filters: dict | None = None) -> dict: + def emotional(self, df: pd.DataFrame, filters: dict | None = None) -> dict: filtered_df = self._prepare_filtered_df(df, filters) return { - "top_users": self.interaction_analysis.top_users(filtered_df), - "users": self.interaction_analysis.per_user_analysis(filtered_df), + "average_emotion_by_topic": self.emotional_analysis.avg_emotion_by_topic(filtered_df), + "overall_emotion_average": self.emotional_analysis.overall_emotion_average(filtered_df), + "dominant_emotion_distribution": 
self.emotional_analysis.dominant_emotion_distribution(filtered_df), + "emotion_by_source": self.emotional_analysis.emotion_by_source(filtered_df) + } + + def user(self, df: pd.DataFrame, filters: dict | None = None) -> dict: + filtered_df = self._prepare_filtered_df(df, filters) + + return { + "top_users": self.user_analysis.top_users(filtered_df), + "users": self.user_analysis.users(filtered_df) + } + + def interactional(self, df: pd.DataFrame, filters: dict | None = None) -> dict: + filtered_df = self._prepare_filtered_df(df, filters) + + return { + "average_thread_depth": self.interaction_analysis.average_thread_depth(filtered_df), + "average_thread_length_by_emotion": self.interaction_analysis.average_thread_length_by_emotion(filtered_df), "interaction_graph": self.interaction_analysis.interaction_graph(filtered_df) } - def get_interactional_analysis(self, df: pd.DataFrame, filters: dict | None = None) -> dict: - filtered_df = self._prepare_filtered_df(df, filters) - - return { - "average_thread_depth": self.interaction_analysis.average_thread_depth( - filtered_df - ), - "average_thread_length_by_emotion": self.interaction_analysis.average_thread_length_by_emotion( - filtered_df - ), - } - - def get_cultural_analysis(self, df: pd.DataFrame, filters: dict | None = None) -> dict: + def cultural(self, df: pd.DataFrame, filters: dict | None = None) -> dict: filtered_df = self._prepare_filtered_df(df, filters) return { @@ -136,35 +139,4 @@ class StatGen: def summary(self, df: pd.DataFrame, filters: dict | None = None) -> dict: filtered_df = self._prepare_filtered_df(df, filters) - total_posts = (filtered_df["type"] == "post").sum() - total_comments = (filtered_df["type"] == "comment").sum() - events_per_user = filtered_df.groupby("author").size() - - if filtered_df.empty: - return { - "total_events": 0, - "total_posts": 0, - "total_comments": 0, - "unique_users": 0, - "comments_per_post": 0, - "lurker_ratio": 0, - "time_range": { - "start": None, - "end": None, - }, - "sources": [], - } - - return { - "total_events": int(len(filtered_df)), - "total_posts": int(total_posts), - "total_comments": int(total_comments), - "unique_users": int(events_per_user.count()), - "comments_per_post": round(total_comments / max(total_posts, 1), 2), - "lurker_ratio": round((events_per_user == 1).mean(), 2), - "time_range": { - "start": int(filtered_df["dt"].min().timestamp()), - "end": int(filtered_df["dt"].max().timestamp()), - }, - "sources": filtered_df["source"].dropna().unique().tolist(), - } + return self.summary_analysis.summary(filtered_df) diff --git a/server/analysis/summary.py b/server/analysis/summary.py new file mode 100644 index 0000000..14cc8ca --- /dev/null +++ b/server/analysis/summary.py @@ -0,0 +1,64 @@ +import pandas as pd + + +class SummaryAnalysis: + def total_events(self, df: pd.DataFrame) -> int: + return int(len(df)) + + def total_posts(self, df: pd.DataFrame) -> int: + return int(len(df[df["type"] == "post"])) + + def total_comments(self, df: pd.DataFrame) -> int: + return int(len(df[df["type"] == "comment"])) + + def unique_users(self, df: pd.DataFrame) -> int: + return int(len(df["author"].dropna().unique())) + + def comments_per_post(self, total_comments: int, total_posts: int) -> float: + return round(total_comments / max(total_posts, 1), 2) + + def lurker_ratio(self, df: pd.DataFrame) -> float: + events_per_user = df.groupby("author").size() + return round((events_per_user == 1).mean(), 2) + + def time_range(self, df: pd.DataFrame) -> dict: + return { + "start": 
int(df["dt"].min().timestamp()), + "end": int(df["dt"].max().timestamp()), + } + + def sources(self, df: pd.DataFrame) -> list: + return df["source"].dropna().unique().tolist() + + def empty_summary(self) -> dict: + return { + "total_events": 0, + "total_posts": 0, + "total_comments": 0, + "unique_users": 0, + "comments_per_post": 0, + "lurker_ratio": 0, + "time_range": { + "start": None, + "end": None, + }, + "sources": [], + } + + def summary(self, df: pd.DataFrame) -> dict: + if df.empty: + return self.empty_summary() + + total_posts = self.total_posts(df) + total_comments = self.total_comments(df) + + return { + "total_events": self.total_events(df), + "total_posts": total_posts, + "total_comments": total_comments, + "unique_users": self.unique_users(df), + "comments_per_post": self.comments_per_post(total_comments, total_posts), + "lurker_ratio": self.lurker_ratio(df), + "time_range": self.time_range(df), + "sources": self.sources(df), + } diff --git a/server/analysis/user.py b/server/analysis/user.py new file mode 100644 index 0000000..57ddc1e --- /dev/null +++ b/server/analysis/user.py @@ -0,0 +1,20 @@ +import pandas as pd + +from server.analysis.interactional import InteractionAnalysis + + +class UserAnalysis: + def __init__(self, interaction_analysis: InteractionAnalysis): + self.interaction_analysis = interaction_analysis + + def top_users(self, df: pd.DataFrame) -> list: + return self.interaction_analysis.top_users(df) + + def users(self, df: pd.DataFrame) -> dict | list: + return self.interaction_analysis.per_user_analysis(df) + + def user(self, df: pd.DataFrame) -> dict: + return { + "top_users": self.top_users(df), + "users": self.users(df), + } From 3468fdc2ea35b870b3003108c9721b449ab80f62 Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Mon, 16 Mar 2026 16:45:11 +0000 Subject: [PATCH 03/24] feat(api): add new user and linguistic endpoints --- server/app.py | 121 +++++++++++++++++++++++++++++++++++++------------- 1 file changed, 90 insertions(+), 31 deletions(-) diff --git a/server/app.py b/server/app.py index f373843..3ba9295 100644 --- a/server/app.py +++ b/server/app.py @@ -186,7 +186,7 @@ def scrape_data(): dataset_manager.set_dataset_status( dataset_id, "fetching", - f"Data is being fetched from {', '.join(source['name'] for source in source_configs)}" + f"Data is being fetched from {', '.join(source['name'] for source in source_configs)}", ) fetch_and_process_dataset.delay( @@ -198,12 +198,14 @@ def scrape_data(): print(traceback.format_exc()) return jsonify({"error": "Failed to queue dataset processing"}), 500 + return jsonify( + { + "message": "Dataset queued for processing", + "dataset_id": dataset_id, + "status": "processing", + } + ), 202 - return jsonify({ - "message": "Dataset queued for processing", - "dataset_id": dataset_id, - "status": "processing" - }), 202 @app.route("/datasets/upload", methods=["POST"]) @jwt_required() @@ -233,7 +235,9 @@ def upload_data(): posts_df = pd.read_json(post_file, lines=True, convert_dates=False) topics = json.load(topic_file) - dataset_id = dataset_manager.save_dataset_info(current_user, dataset_name, topics) + dataset_id = dataset_manager.save_dataset_info( + current_user, dataset_name, topics + ) process_dataset.delay(dataset_id, posts_df.to_dict(orient="records"), topics) @@ -249,6 +253,7 @@ def upload_data(): except Exception as e: return jsonify({"error": f"An unexpected error occurred"}), 500 + @app.route("/dataset/", methods=["GET"]) @jwt_required() def get_dataset(dataset_id): @@ -256,7 +261,9 @@ def 
get_dataset(dataset_id): user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_info = dataset_manager.get_dataset_info(dataset_id) included_cols = {"id", "name", "created_at"} @@ -269,7 +276,8 @@ def get_dataset(dataset_id): except Exception: print(traceback.format_exc()) return jsonify({"error": "An unexpected error occured"}), 500 - + + @app.route("/dataset/", methods=["PATCH"]) @jwt_required() def update_dataset(dataset_id): @@ -277,7 +285,9 @@ def update_dataset(dataset_id): user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) body = request.get_json() new_name = body.get("name") @@ -286,7 +296,9 @@ def update_dataset(dataset_id): return jsonify({"error": "A valid name must be provided"}), 400 dataset_manager.update_dataset_name(dataset_id, new_name.strip()) - return jsonify({"message": f"Dataset {dataset_id} renamed to '{new_name.strip()}'"}), 200 + return jsonify( + {"message": f"Dataset {dataset_id} renamed to '{new_name.strip()}'"} + ), 200 except NotAuthorisedException: return jsonify({"error": "User is not authorised to access this content"}), 403 except NonExistentDatasetException: @@ -294,7 +306,8 @@ def update_dataset(dataset_id): except Exception: print(traceback.format_exc()) return jsonify({"error": "An unexpected error occurred"}), 500 - + + @app.route("/dataset/", methods=["DELETE"]) @jwt_required() def delete_dataset(dataset_id): @@ -302,11 +315,17 @@ def delete_dataset(dataset_id): user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_manager.delete_dataset_info(dataset_id) dataset_manager.delete_dataset_content(dataset_id) - return jsonify({"message": f"Dataset {dataset_id} metadata and content successfully deleted"}), 200 + return jsonify( + { + "message": f"Dataset {dataset_id} metadata and content successfully deleted" + } + ), 200 except NotAuthorisedException: return jsonify({"error": "User is not authorised to access this content"}), 403 except NonExistentDatasetException: @@ -315,6 +334,7 @@ def delete_dataset(dataset_id): print(traceback.format_exc()) return jsonify({"error": "An unexpected error occured"}), 500 + @app.route("/dataset//status", methods=["GET"]) @jwt_required() def get_dataset_status(dataset_id): @@ -322,7 +342,9 @@ def get_dataset_status(dataset_id): user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_status = dataset_manager.get_dataset_status(dataset_id) return jsonify(dataset_status), 200 @@ -334,17 +356,44 @@ def get_dataset_status(dataset_id): print(traceback.format_exc()) return jsonify({"error": "An unexpected error occured"}), 500 -@app.route("/dataset//content", methods=["GET"]) + +@app.route("/dataset//linguistic", 
methods=["GET"]) @jwt_required() -def content_endpoint(dataset_id): +def get_linguistic_analysis(dataset_id): try: user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_content = dataset_manager.get_dataset_content(dataset_id) filters = get_request_filters() - return jsonify(stat_gen.get_content_analysis(dataset_content, filters)), 200 + return jsonify(stat_gen.linguistic(dataset_content, filters)), 200 + except NotAuthorisedException: + return jsonify({"error": "User is not authorised to access this content"}), 403 + except NonExistentDatasetException: + return jsonify({"error": "Dataset does not exist"}), 404 + except ValueError as e: + return jsonify({"error": f"Malformed or missing data"}), 400 + except Exception as e: + print(traceback.format_exc()) + return jsonify({"error": f"An unexpected error occurred"}), 500 + + +@app.route("/dataset//emotional", methods=["GET"]) +@jwt_required() +def get_emotional_analysis(dataset_id): + try: + user_id = int(get_jwt_identity()) + if not dataset_manager.authorize_user_dataset(dataset_id, user_id): + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) + + dataset_content = dataset_manager.get_dataset_content(dataset_id) + filters = get_request_filters() + return jsonify(stat_gen.emotional(dataset_content, filters)), 200 except NotAuthorisedException: return jsonify({"error": "User is not authorised to access this content"}), 403 except NonExistentDatasetException: @@ -362,7 +411,9 @@ def get_summary(dataset_id): try: user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_content = dataset_manager.get_dataset_content(dataset_id) filters = get_request_filters() @@ -378,17 +429,19 @@ def get_summary(dataset_id): return jsonify({"error": f"An unexpected error occurred"}), 500 -@app.route("/dataset//time", methods=["GET"]) +@app.route("/dataset//temporal", methods=["GET"]) @jwt_required() -def get_time_analysis(dataset_id): +def get_temporal_analysis(dataset_id): try: user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_content = dataset_manager.get_dataset_content(dataset_id) filters = get_request_filters() - return jsonify(stat_gen.get_time_analysis(dataset_content, filters)), 200 + return jsonify(stat_gen.temporal(dataset_content, filters)), 200 except NotAuthorisedException: return jsonify({"error": "User is not authorised to access this content"}), 403 except NonExistentDatasetException: @@ -406,11 +459,13 @@ def get_user_analysis(dataset_id): try: user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_content = dataset_manager.get_dataset_content(dataset_id) filters = get_request_filters() - return 
jsonify(stat_gen.get_user_analysis(dataset_content, filters)), 200 + return jsonify(stat_gen.user(dataset_content, filters)), 200 except NotAuthorisedException: return jsonify({"error": "User is not authorised to access this content"}), 403 except NonExistentDatasetException: @@ -428,11 +483,13 @@ def get_cultural_analysis(dataset_id): try: user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_content = dataset_manager.get_dataset_content(dataset_id) filters = get_request_filters() - return jsonify(stat_gen.get_cultural_analysis(dataset_content, filters)), 200 + return jsonify(stat_gen.cultural(dataset_content, filters)), 200 except NotAuthorisedException: return jsonify({"error": "User is not authorised to access this content"}), 403 except NonExistentDatasetException: @@ -444,17 +501,19 @@ def get_cultural_analysis(dataset_id): return jsonify({"error": f"An unexpected error occurred"}), 500 -@app.route("/dataset//interaction", methods=["GET"]) +@app.route("/dataset//interactional", methods=["GET"]) @jwt_required() def get_interaction_analysis(dataset_id): try: user_id = int(get_jwt_identity()) if not dataset_manager.authorize_user_dataset(dataset_id, user_id): - raise NotAuthorisedException("This user is not authorised to access this dataset") + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) dataset_content = dataset_manager.get_dataset_content(dataset_id) filters = get_request_filters() - return jsonify(stat_gen.get_interactional_analysis(dataset_content, filters)), 200 + return jsonify(stat_gen.interactional(dataset_content, filters)), 200 except NotAuthorisedException: return jsonify({"error": "User is not authorised to access this content"}), 403 except NonExistentDatasetException: From 8a13444b16a6cafd35093ffacc530ba478fccf1e Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Mon, 16 Mar 2026 16:46:07 +0000 Subject: [PATCH 04/24] chore(frontend): add new API types --- frontend/src/types/ApiTypes.ts | 25 +++++++++++++++++++++++++ 1 file changed, 25 insertions(+) diff --git a/frontend/src/types/ApiTypes.ts b/frontend/src/types/ApiTypes.ts index 5feaddf..43b035b 100644 --- a/frontend/src/types/ApiTypes.ts +++ b/frontend/src/types/ApiTypes.ts @@ -71,6 +71,25 @@ type NGram = { type AverageEmotionByTopic = Emotion & { n: number; topic: string; + [key: string]: string | number; +}; + +type OverallEmotionAverage = { + emotion: string; + score: number; +}; + +type DominantEmotionDistribution = { + emotion: string; + count: number; + ratio: number; +}; + +type EmotionBySource = { + source: string; + dominant_emotion: string; + dominant_score: number; + event_count: number; }; @@ -79,6 +98,9 @@ type ContentAnalysisResponse = { average_emotion_by_topic: AverageEmotionByTopic[]; common_three_phrases: NGram[]; common_two_phrases: NGram[]; + overall_emotion_average?: OverallEmotionAverage[]; + dominant_emotion_distribution?: DominantEmotionDistribution[]; + emotion_by_source?: EmotionBySource[]; } // Summary @@ -110,6 +132,9 @@ export type { UserAnalysisResponse, FrequencyWord, AverageEmotionByTopic, + OverallEmotionAverage, + DominantEmotionDistribution, + EmotionBySource, SummaryResponse, TimeAnalysisResponse, ContentAnalysisResponse, From 9093059d05352ab9c039071fb7867bd861b7d97b Mon Sep 17 00:00:00 2001 From: Dylan De 
Faoite Date: Tue, 17 Mar 2026 12:23:03 +0000 Subject: [PATCH 05/24] refactor(stats): move user stats out of interactional into users --- server/analysis/interactional.py | 67 ---------------------------- server/analysis/stat_gen.py | 4 +- server/analysis/user.py | 76 ++++++++++++++++++++++++++------ 3 files changed, 65 insertions(+), 82 deletions(-) diff --git a/server/analysis/interactional.py b/server/analysis/interactional.py index 864980d..8220747 100644 --- a/server/analysis/interactional.py +++ b/server/analysis/interactional.py @@ -57,73 +57,6 @@ class InteractionAnalysis: return rows - def top_users(self, df: pd.DataFrame) -> list: - counts = df.groupby(["author", "source"]).size().sort_values(ascending=False) - - top_users = [ - {"author": author, "source": source, "count": int(count)} - for (author, source), count in counts.items() - ] - - return top_users - - def per_user_analysis(self, df: pd.DataFrame) -> dict: - per_user = df.groupby(["author", "type"]).size().unstack(fill_value=0) - - emotion_cols = [col for col in df.columns if col.startswith("emotion_")] - - avg_emotions_by_author = {} - if emotion_cols: - avg_emotions = df.groupby("author")[emotion_cols].mean().fillna(0.0) - avg_emotions_by_author = { - author: {emotion: float(score) for emotion, score in row.items()} - for author, row in avg_emotions.iterrows() - } - - # ensure columns always exist - for col in ("post", "comment"): - if col not in per_user.columns: - per_user[col] = 0 - - per_user["comment_post_ratio"] = per_user["comment"] / per_user["post"].replace( - 0, 1 - ) - per_user["comment_share"] = per_user["comment"] / ( - per_user["post"] + per_user["comment"] - ).replace(0, 1) - per_user = per_user.sort_values("comment_post_ratio", ascending=True) - per_user_records = per_user.reset_index().to_dict(orient="records") - - vocab_rows = self._vocab_richness_per_user(df) - vocab_by_author = {row["author"]: row for row in vocab_rows} - - # merge vocab richness + per_user information - merged_users = [] - for row in per_user_records: - author = row["author"] - merged_users.append( - { - "author": author, - "post": int(row.get("post", 0)), - "comment": int(row.get("comment", 0)), - "comment_post_ratio": float(row.get("comment_post_ratio", 0)), - "comment_share": float(row.get("comment_share", 0)), - "avg_emotions": avg_emotions_by_author.get(author, {}), - "vocab": vocab_by_author.get( - author, - { - "vocab_richness": 0, - "avg_words_per_event": 0, - "top_words": [], - }, - ), - } - ) - - merged_users.sort(key=lambda u: u["comment_post_ratio"]) - - return merged_users - def interaction_graph(self, df: pd.DataFrame): interactions = {a: {} for a in df["author"].dropna().unique()} diff --git a/server/analysis/stat_gen.py b/server/analysis/stat_gen.py index 0d1ffc9..bec7eeb 100644 --- a/server/analysis/stat_gen.py +++ b/server/analysis/stat_gen.py @@ -39,7 +39,7 @@ class StatGen: self.linguistic_analysis = LinguisticAnalysis(EXCLUDE_WORDS) self.cultural_analysis = CulturalAnalysis() self.summary_analysis = SummaryAnalysis() - self.user_analysis = UserAnalysis(self.interaction_analysis) + self.user_analysis = UserAnalysis() ## Private Methods def _prepare_filtered_df(self, df: pd.DataFrame, filters: dict | None = None) -> pd.DataFrame: @@ -111,7 +111,7 @@ class StatGen: return { "top_users": self.user_analysis.top_users(filtered_df), - "users": self.user_analysis.users(filtered_df) + "users": self.user_analysis.per_user_analysis(filtered_df) } def interactional(self, df: pd.DataFrame, filters: dict | None = None) -> 
dict: diff --git a/server/analysis/user.py b/server/analysis/user.py index 57ddc1e..d5e9917 100644 --- a/server/analysis/user.py +++ b/server/analysis/user.py @@ -1,20 +1,70 @@ import pandas as pd -from server.analysis.interactional import InteractionAnalysis - class UserAnalysis: - def __init__(self, interaction_analysis: InteractionAnalysis): - self.interaction_analysis = interaction_analysis - def top_users(self, df: pd.DataFrame) -> list: - return self.interaction_analysis.top_users(df) + counts = df.groupby(["author", "source"]).size().sort_values(ascending=False) - def users(self, df: pd.DataFrame) -> dict | list: - return self.interaction_analysis.per_user_analysis(df) + top_users = [ + {"author": author, "source": source, "count": int(count)} + for (author, source), count in counts.items() + ] - def user(self, df: pd.DataFrame) -> dict: - return { - "top_users": self.top_users(df), - "users": self.users(df), - } + return top_users + + def per_user_analysis(self, df: pd.DataFrame) -> dict: + per_user = df.groupby(["author", "type"]).size().unstack(fill_value=0) + + emotion_cols = [col for col in df.columns if col.startswith("emotion_")] + + avg_emotions_by_author = {} + if emotion_cols: + avg_emotions = df.groupby("author")[emotion_cols].mean().fillna(0.0) + avg_emotions_by_author = { + author: {emotion: float(score) for emotion, score in row.items()} + for author, row in avg_emotions.iterrows() + } + + # ensure columns always exist + for col in ("post", "comment"): + if col not in per_user.columns: + per_user[col] = 0 + + per_user["comment_post_ratio"] = per_user["comment"] / per_user["post"].replace( + 0, 1 + ) + per_user["comment_share"] = per_user["comment"] / ( + per_user["post"] + per_user["comment"] + ).replace(0, 1) + per_user = per_user.sort_values("comment_post_ratio", ascending=True) + per_user_records = per_user.reset_index().to_dict(orient="records") + + vocab_rows = self._vocab_richness_per_user(df) + vocab_by_author = {row["author"]: row for row in vocab_rows} + + # merge vocab richness + per_user information + merged_users = [] + for row in per_user_records: + author = row["author"] + merged_users.append( + { + "author": author, + "post": int(row.get("post", 0)), + "comment": int(row.get("comment", 0)), + "comment_post_ratio": float(row.get("comment_post_ratio", 0)), + "comment_share": float(row.get("comment_share", 0)), + "avg_emotions": avg_emotions_by_author.get(author, {}), + "vocab": vocab_by_author.get( + author, + { + "vocab_richness": 0, + "avg_words_per_event": 0, + "top_words": [], + }, + ), + } + ) + + merged_users.sort(key=lambda u: u["comment_post_ratio"]) + + return merged_users From 8a0f6e71e8aed5540111d9657da144b3b2fce921 Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Tue, 17 Mar 2026 12:31:53 +0000 Subject: [PATCH 06/24] chore(api): rename cultural entity emotion endpoint --- server/analysis/stat_gen.py | 8 ++------ 1 file changed, 2 insertions(+), 6 deletions(-) diff --git a/server/analysis/stat_gen.py b/server/analysis/stat_gen.py index bec7eeb..36ef9a9 100644 --- a/server/analysis/stat_gen.py +++ b/server/analysis/stat_gen.py @@ -127,13 +127,9 @@ class StatGen: filtered_df = self._prepare_filtered_df(df, filters) return { - "identity_markers": self.cultural_analysis.get_identity_markers( - filtered_df - ), + "identity_markers": self.cultural_analysis.get_identity_markers(filtered_df), "stance_markers": self.cultural_analysis.get_stance_markers(filtered_df), - "entity_salience": self.cultural_analysis.get_avg_emotions_per_entity( - 
filtered_df - ), + "avg_emotion_per_entity": self.cultural_analysis.get_avg_emotions_per_entity(filtered_df) } def summary(self, df: pd.DataFrame, filters: dict | None = None) -> dict: From 31fb275ee361a2c3cd2d5c6f7ab218c3377491cc Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Tue, 17 Mar 2026 12:53:30 +0000 Subject: [PATCH 07/24] fix(db): incorrect NER column being inserted --- server/core/datasets.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/server/core/datasets.py b/server/core/datasets.py index 4690454..a55445d 100644 --- a/server/core/datasets.py +++ b/server/core/datasets.py @@ -101,7 +101,7 @@ class DatasetManager: row["source"], row.get("topic"), row.get("topic_confidence"), - Json(row["ner_entities"]) if row.get("ner_entities") else None, + Json(row["entities"]) if row.get("entities") is not None else None, row.get("emotion_anger"), row.get("emotion_disgust"), row.get("emotion_fear"), From 2fa1dff4b70e42031191fed1284cf7b2f3958879 Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Tue, 17 Mar 2026 13:27:39 +0000 Subject: [PATCH 08/24] feat(stat): add lexical diversity stat --- server/analysis/linguistic.py | 16 ++++++++++++++++ server/analysis/stat_gen.py | 1 + 2 files changed, 17 insertions(+) diff --git a/server/analysis/linguistic.py b/server/analysis/linguistic.py index dc91faf..7546bbf 100644 --- a/server/analysis/linguistic.py +++ b/server/analysis/linguistic.py @@ -61,3 +61,19 @@ class LinguisticAnalysis: .head(limit) .to_dict(orient="records") ) + + def lexical_diversity(self, df: pd.DataFrame) -> dict: + tokens = ( + df["content"].fillna("").astype(str).str.lower() + .str.findall(r"\b[a-z]{2,}\b") + .explode() + ) + tokens = tokens[~tokens.isin(self.word_exclusions)] + total = max(len(tokens), 1) + unique = int(tokens.nunique()) + + return { + "total_tokens": total, + "unique_tokens": unique, + "ttr": round(unique / total, 4), + } diff --git a/server/analysis/stat_gen.py b/server/analysis/stat_gen.py index 36ef9a9..8435340 100644 --- a/server/analysis/stat_gen.py +++ b/server/analysis/stat_gen.py @@ -94,6 +94,7 @@ class StatGen: "word_frequencies": self.linguistic_analysis.word_frequencies(filtered_df), "common_two_phrases": self.linguistic_analysis.ngrams(filtered_df), "common_three_phrases": self.linguistic_analysis.ngrams(filtered_df, n=3), + "lexical_diversity": self.linguistic_analysis.lexical_diversity(filtered_df) } def emotional(self, df: pd.DataFrame, filters: dict | None = None) -> dict: From 7b5a9392715bf775d11949ff7b1074e1d1adf979 Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Tue, 17 Mar 2026 13:36:10 +0000 Subject: [PATCH 09/24] fix(stats): missing private methods in User obj --- server/analysis/interactional.py | 48 ---------------------------- server/analysis/stat_gen.py | 2 +- server/analysis/user.py | 54 ++++++++++++++++++++++++++++++++ 3 files changed, 55 insertions(+), 49 deletions(-) diff --git a/server/analysis/interactional.py b/server/analysis/interactional.py index 8220747..53d97dc 100644 --- a/server/analysis/interactional.py +++ b/server/analysis/interactional.py @@ -1,9 +1,6 @@ import pandas as pd import re -from collections import Counter - - class InteractionAnalysis: def __init__(self, word_exclusions: set[str]): self.word_exclusions = word_exclusions @@ -12,51 +9,6 @@ class InteractionAnalysis: tokens = re.findall(r"\b[a-z]{3,}\b", text) return [t for t in tokens if t not in self.word_exclusions] - def _vocab_richness_per_user( - self, df: pd.DataFrame, min_words: int = 20, top_most_used_words: int = 100 
- ) -> list: - df = df.copy() - df["content"] = df["content"].fillna("").astype(str).str.lower() - df["tokens"] = df["content"].apply(self._tokenize) - - rows = [] - for author, group in df.groupby("author"): - all_tokens = [t for tokens in group["tokens"] for t in tokens] - - total_words = len(all_tokens) - unique_words = len(set(all_tokens)) - events = len(group) - - # Min amount of words for a user, any less than this might give weird results - if total_words < min_words: - continue - - # 100% = they never reused a word (excluding stop words) - vocab_richness = unique_words / total_words - avg_words = total_words / max(events, 1) - - counts = Counter(all_tokens) - top_words = [ - {"word": w, "count": int(c)} - for w, c in counts.most_common(top_most_used_words) - ] - - rows.append( - { - "author": author, - "events": int(events), - "total_words": int(total_words), - "unique_words": int(unique_words), - "vocab_richness": round(vocab_richness, 3), - "avg_words_per_event": round(avg_words, 2), - "top_words": top_words, - } - ) - - rows = sorted(rows, key=lambda x: x["vocab_richness"], reverse=True) - - return rows - def interaction_graph(self, df: pd.DataFrame): interactions = {a: {} for a in df["author"].dropna().unique()} diff --git a/server/analysis/stat_gen.py b/server/analysis/stat_gen.py index 8435340..c2f09ed 100644 --- a/server/analysis/stat_gen.py +++ b/server/analysis/stat_gen.py @@ -39,7 +39,7 @@ class StatGen: self.linguistic_analysis = LinguisticAnalysis(EXCLUDE_WORDS) self.cultural_analysis = CulturalAnalysis() self.summary_analysis = SummaryAnalysis() - self.user_analysis = UserAnalysis() + self.user_analysis = UserAnalysis(EXCLUDE_WORDS) ## Private Methods def _prepare_filtered_df(self, df: pd.DataFrame, filters: dict | None = None) -> pd.DataFrame: diff --git a/server/analysis/user.py b/server/analysis/user.py index d5e9917..fc8e618 100644 --- a/server/analysis/user.py +++ b/server/analysis/user.py @@ -1,7 +1,61 @@ import pandas as pd +import re +from collections import Counter class UserAnalysis: + def __init__(self, word_exclusions: set[str]): + self.word_exclusions = word_exclusions + + def _tokenize(self, text: str): + tokens = re.findall(r"\b[a-z]{3,}\b", text) + return [t for t in tokens if t not in self.word_exclusions] + + def _vocab_richness_per_user( + self, df: pd.DataFrame, min_words: int = 20, top_most_used_words: int = 100 + ) -> list: + df = df.copy() + df["content"] = df["content"].fillna("").astype(str).str.lower() + df["tokens"] = df["content"].apply(self._tokenize) + + rows = [] + for author, group in df.groupby("author"): + all_tokens = [t for tokens in group["tokens"] for t in tokens] + + total_words = len(all_tokens) + unique_words = len(set(all_tokens)) + events = len(group) + + # Min amount of words for a user, any less than this might give weird results + if total_words < min_words: + continue + + # 100% = they never reused a word (excluding stop words) + vocab_richness = unique_words / total_words + avg_words = total_words / max(events, 1) + + counts = Counter(all_tokens) + top_words = [ + {"word": w, "count": int(c)} + for w, c in counts.most_common(top_most_used_words) + ] + + rows.append( + { + "author": author, + "events": int(events), + "total_words": int(total_words), + "unique_words": int(unique_words), + "vocab_richness": round(vocab_richness, 3), + "avg_words_per_event": round(avg_words, 2), + "top_words": top_words, + } + ) + + rows = sorted(rows, key=lambda x: x["vocab_richness"], reverse=True) + + return rows + def top_users(self, df: 
pd.DataFrame) -> list: counts = df.groupby(["author", "source"]).size().sort_values(ascending=False) From 8372aa727864a73db1a8f62228b3c539cbc37a29 Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Tue, 17 Mar 2026 13:36:41 +0000 Subject: [PATCH 10/24] feat(api): add endpoint to view entire dataset --- server/app.py | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/server/app.py b/server/app.py index 3ba9295..7a5dea0 100644 --- a/server/app.py +++ b/server/app.py @@ -523,7 +523,28 @@ def get_interaction_analysis(dataset_id): except Exception as e: print(traceback.format_exc()) return jsonify({"error": f"An unexpected error occurred"}), 500 + +@app.route("/dataset//all", methods=["GET"]) +@jwt_required() +def get_full_dataset(dataset_id: int): + try: + user_id = int(get_jwt_identity()) + if not dataset_manager.authorize_user_dataset(dataset_id, user_id): + raise NotAuthorisedException( + "This user is not authorised to access this dataset" + ) + dataset_content = dataset_manager.get_dataset_content(dataset_id) + return jsonify(dataset_content.to_dict(orient="records")), 200 + except NotAuthorisedException: + return jsonify({"error": "User is not authorised to access this content"}), 403 + except NonExistentDatasetException: + return jsonify({"error": "Dataset does not exist"}), 404 + except ValueError as e: + return jsonify({"error": f"Malformed or missing data"}), 400 + except Exception as e: + print(traceback.format_exc()) + return jsonify({"error": f"An unexpected error occurred"}), 500 if __name__ == "__main__": app.run(debug=True) From 2a00384a5557e51aab0e2b081f58a8f723ec1457 Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Tue, 17 Mar 2026 19:03:56 +0000 Subject: [PATCH 11/24] feat(interaction): add top interaction pairs and initiator ratio methods --- server/analysis/interactional.py | 77 +++++++------------------------- server/analysis/stat_gen.py | 3 +- 2 files changed, 18 insertions(+), 62 deletions(-) diff --git a/server/analysis/interactional.py b/server/analysis/interactional.py index 53d97dc..7e0c081 100644 --- a/server/analysis/interactional.py +++ b/server/analysis/interactional.py @@ -51,68 +51,23 @@ class InteractionAnalysis: return 0 return round(sum(depths) / len(depths), 2) + + def top_interaction_pairs(self, df: pd.DataFrame, top_n=10): + graph = self.interaction_graph(df) + pairs = [] - def average_thread_length_by_emotion(self, df: pd.DataFrame): - emotion_exclusions = {"emotion_neutral", "emotion_surprise"} + for a, targets in graph.items(): + for b, count in targets.items(): + pairs.append(((a, b), count)) - emotion_cols = [ - c - for c in df.columns - if c.startswith("emotion_") and c not in emotion_exclusions - ] + pairs.sort(key=lambda x: x[1], reverse=True) + return pairs[:top_n] + + def initiator_ratio(self, df: pd.DataFrame): + starters = df["reply_to"].isna().sum() + total = len(df) - id_to_reply = df.set_index("id")["reply_to"].to_dict() - length_cache = {} + if total == 0: + return 0 - def thread_length_from(start_id): - if start_id in length_cache: - return length_cache[start_id] - - seen = set() - length = 1 - current = start_id - - while True: - if current in seen: - # infinite loop shouldn't happen, but just in case - break - seen.add(current) - - reply_to = id_to_reply.get(current) - - if ( - reply_to is None - or (isinstance(reply_to, float) and pd.isna(reply_to)) - or reply_to == "" - ): - break - - length += 1 - current = reply_to - - if current in length_cache: - length += length_cache[current] - 1 - break - - 
length_cache[start_id] = length
-            return length
-
-        emotion_to_lengths = {}
-
-        # Fill NaNs in emotion cols to avoid max() issues
-        emo_df = df[["id"] + emotion_cols].copy()
-        emo_df[emotion_cols] = emo_df[emotion_cols].fillna(0)
-
-        for _, row in emo_df.iterrows():
-            msg_id = row["id"]
-            length = thread_length_from(msg_id)
-
-            emotions = {c: row[c] for c in emotion_cols}
-            dominant = max(emotions, key=emotions.get)
-
-            emotion_to_lengths.setdefault(dominant, []).append(length)
-
-        return {
-            emotion: round(sum(lengths) / len(lengths), 2)
-            for emotion, lengths in emotion_to_lengths.items()
-        }
+        return round(starters / total, 2)
diff --git a/server/analysis/stat_gen.py b/server/analysis/stat_gen.py
index c2f09ed..f5b328d 100644
--- a/server/analysis/stat_gen.py
+++ b/server/analysis/stat_gen.py
@@ -120,7 +120,8 @@ class StatGen:
 
         return {
             "average_thread_depth": self.interaction_analysis.average_thread_depth(filtered_df),
-            "average_thread_length_by_emotion": self.interaction_analysis.average_thread_length_by_emotion(filtered_df),
+            "top_interaction_pairs": self.interaction_analysis.top_interaction_pairs(filtered_df, top_n=100),
+            "initiator_ratio": self.interaction_analysis.initiator_ratio(filtered_df),
             "interaction_graph": self.interaction_analysis.interaction_graph(filtered_df)
         }

From 71998c450e13007d4e6254591415b467d9752661 Mon Sep 17 00:00:00 2001
From: Dylan De Faoite
Date: Tue, 17 Mar 2026 19:49:03 +0000
Subject: [PATCH 12/24] fix(db): change title type to text

Occasionally a Reddit post would have a title longer than 255 characters,
which broke the VARCHAR(255) column in the schema.
---
 server/db/schema.sql | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/server/db/schema.sql b/server/db/schema.sql
index 4550633..5bec116 100644
--- a/server/db/schema.sql
+++ b/server/db/schema.sql
@@ -43,7 +43,7 @@ CREATE TABLE events (
     weekday VARCHAR(255) NOT NULL,
 
     /* Posts Only */
-    title VARCHAR(255),
+    title TEXT,
 
     /* Comments Only*/
     parent_id VARCHAR(255),

From 3e78a54388e4bc3cd2d2637a443736d29910fb48 Mon Sep 17 00:00:00 2001
From: Dylan De Faoite
Date: Wed, 18 Mar 2026 18:36:05 +0000
Subject: [PATCH 13/24] feat(stat): add conversation concentration metric

Remove the old `initiator_ratio` metric, which wasn't working because every
event has a `reply_to` value. The new conversation-concentration metric was
suggested by AI, and turned out to give surprisingly useful insights.
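For reviewers, a rough usage sketch of the new metric (the data is
illustrative; the constructor's `word_exclusions` argument is required
but unused by this method):

```python
import pandas as pd

from server.analysis.interactional import InteractionAnalysis

# Illustrative only: six comments from three authors, one of whom dominates.
df = pd.DataFrame(
    {
        "type": ["comment"] * 6,
        "author": ["ann", "ann", "ann", "ann", "bob", "cat"],
    }
)

analysis = InteractionAnalysis(word_exclusions=set())
print(analysis.conversation_concentration(df))
# {'total_commenting_authors': 3, 'top_10pct_author_count': 1,
#  'top_10pct_comment_share': 0.6667, 'single_comment_authors': 2,
#  'single_comment_author_ratio': 0.6667}
```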
--- server/analysis/interactional.py | 26 ++++++++++++++++++++------ server/analysis/stat_gen.py | 4 ++-- 2 files changed, 22 insertions(+), 8 deletions(-) diff --git a/server/analysis/interactional.py b/server/analysis/interactional.py index 7e0c081..e15940e 100644 --- a/server/analysis/interactional.py +++ b/server/analysis/interactional.py @@ -63,11 +63,25 @@ class InteractionAnalysis: pairs.sort(key=lambda x: x[1], reverse=True) return pairs[:top_n] - def initiator_ratio(self, df: pd.DataFrame): - starters = df["reply_to"].isna().sum() - total = len(df) + def conversation_concentration(self, df: pd.DataFrame) -> dict: + if "type" not in df.columns: + return {} - if total == 0: - return 0 + comments = df[df["type"] == "comment"] + if comments.empty: + return {} - return round(starters / total, 2) + author_counts = comments["author"].value_counts() + total_comments = len(comments) + total_authors = len(author_counts) + + top_10_pct_n = max(1, int(total_authors * 0.1)) + top_10_pct_share = round(author_counts.head(top_10_pct_n).sum() / total_comments, 4) + + return { + "total_commenting_authors": total_authors, + "top_10pct_author_count": top_10_pct_n, + "top_10pct_comment_share": float(top_10_pct_share), + "single_comment_authors": int((author_counts == 1).sum()), + "single_comment_author_ratio": float(round((author_counts == 1).sum() / total_authors, 4)), + } \ No newline at end of file diff --git a/server/analysis/stat_gen.py b/server/analysis/stat_gen.py index f5b328d..4368841 100644 --- a/server/analysis/stat_gen.py +++ b/server/analysis/stat_gen.py @@ -121,8 +121,8 @@ class StatGen: return { "average_thread_depth": self.interaction_analysis.average_thread_depth(filtered_df), "top_interaction_pairs": self.interaction_analysis.top_interaction_pairs(filtered_df, top_n=100), - "initiator_ratio": self.interaction_analysis.initiator_ratio(filtered_df), - "interaction_graph": self.interaction_analysis.interaction_graph(filtered_df) + "interaction_graph": self.interaction_analysis.interaction_graph(filtered_df), + "conversation_concentration": self.interaction_analysis.conversation_concentration(filtered_df) } def cultural(self, df: pd.DataFrame, filters: dict | None = None) -> dict: From 436549641fede45e1217e2fc020fd517ccd9da3b Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Wed, 18 Mar 2026 18:37:39 +0000 Subject: [PATCH 14/24] chore(frontend): add api types for new backend data --- frontend/src/types/ApiTypes.ts | 82 ++++++++++++++++++++++++++++++++++ 1 file changed, 82 insertions(+) diff --git a/frontend/src/types/ApiTypes.ts b/frontend/src/types/ApiTypes.ts index 43b035b..f336fef 100644 --- a/frontend/src/types/ApiTypes.ts +++ b/frontend/src/types/ApiTypes.ts @@ -31,12 +31,25 @@ type User = { type InteractionGraph = Record>; +type ConversationConcentration = { + total_commenting_authors: number; + top_10pct_author_count: number; + top_10pct_comment_share: number; + single_comment_authors: number; + single_comment_author_ratio: number; +}; + type UserAnalysisResponse = { top_users: TopUser[]; users: User[]; interaction_graph: InteractionGraph; }; +type UserEndpointResponse = { + top_users: TopUser[]; + users: User[]; +}; + // Time Analysis type EventsPerDay = { date: Date; @@ -103,6 +116,65 @@ type ContentAnalysisResponse = { emotion_by_source?: EmotionBySource[]; } +type LinguisticAnalysisResponse = { + word_frequencies: FrequencyWord[]; + common_two_phrases: NGram[]; + common_three_phrases: NGram[]; + lexical_diversity?: Record; +}; + +type EmotionalAnalysisResponse = { + 
average_emotion_by_topic: AverageEmotionByTopic[]; + overall_emotion_average?: OverallEmotionAverage[]; + dominant_emotion_distribution?: DominantEmotionDistribution[]; + emotion_by_source?: EmotionBySource[]; +}; + +type InteractionAnalysisResponse = { + average_thread_depth?: number; + top_interaction_pairs?: [[string, string], number][]; + conversation_concentration?: ConversationConcentration; + interaction_graph: InteractionGraph; +}; + +type IdentityMarkers = { + in_group_usage: number; + out_group_usage: number; + in_group_ratio: number; + out_group_ratio: number; + in_group_posts: number; + out_group_posts: number; + tie_posts: number; + in_group_emotion_avg?: Record; + out_group_emotion_avg?: Record; +}; + +type StanceMarkers = { + hedge_total: number; + certainty_total: number; + deontic_total: number; + permission_total: number; + hedge_per_1k_tokens: number; + certainty_per_1k_tokens: number; + deontic_per_1k_tokens: number; + permission_per_1k_tokens: number; +}; + +type EntityEmotionAggregate = { + post_count: number; + emotion_avg: Record; +}; + +type AverageEmotionPerEntity = { + entity_emotion_avg: Record; +}; + +type CulturalAnalysisResponse = { + identity_markers?: IdentityMarkers; + stance_markers?: StanceMarkers; + avg_emotion_per_entity?: AverageEmotionPerEntity; +}; + // Summary type SummaryResponse = { total_events: number; @@ -129,7 +201,9 @@ export type { Vocab, User, InteractionGraph, + ConversationConcentration, UserAnalysisResponse, + UserEndpointResponse, FrequencyWord, AverageEmotionByTopic, OverallEmotionAverage, @@ -138,5 +212,13 @@ export type { SummaryResponse, TimeAnalysisResponse, ContentAnalysisResponse, + LinguisticAnalysisResponse, + EmotionalAnalysisResponse, + InteractionAnalysisResponse, + IdentityMarkers, + StanceMarkers, + EntityEmotionAggregate, + AverageEmotionPerEntity, + CulturalAnalysisResponse, FilterResponse } From 7e4a91bb5e92cef24e17b245b582650488ee6990 Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Wed, 18 Mar 2026 18:40:39 +0000 Subject: [PATCH 15/24] style(frontend): style api types to be in order of the endpoint --- frontend/src/types/ApiTypes.ts | 172 +++++++++++++++++---------------- 1 file changed, 88 insertions(+), 84 deletions(-) diff --git a/frontend/src/types/ApiTypes.ts b/frontend/src/types/ApiTypes.ts index f336fef..0e41386 100644 --- a/frontend/src/types/ApiTypes.ts +++ b/frontend/src/types/ApiTypes.ts @@ -1,14 +1,28 @@ -// User Responses -type TopUser = { - author: string; - source: string; - count: number +// Shared types +type FrequencyWord = { + word: string; + count: number; }; -type FrequencyWord = { - word: string; - count: number; -} +type NGram = { + count: number; + ngram: string; +}; + +type Emotion = { + emotion_anger: number; + emotion_disgust: number; + emotion_fear: number; + emotion_joy: number; + emotion_sadness: number; +}; + +// User +type TopUser = { + author: string; + source: string; + count: number; +}; type Vocab = { author: string; @@ -31,12 +45,9 @@ type User = { type InteractionGraph = Record>; -type ConversationConcentration = { - total_commenting_authors: number; - top_10pct_author_count: number; - top_10pct_comment_share: number; - single_comment_authors: number; - single_comment_author_ratio: number; +type UserEndpointResponse = { + top_users: TopUser[]; + users: User[]; }; type UserAnalysisResponse = { @@ -45,42 +56,24 @@ type UserAnalysisResponse = { interaction_graph: InteractionGraph; }; -type UserEndpointResponse = { - top_users: TopUser[]; - users: User[]; -}; - -// Time Analysis 
+// Time type EventsPerDay = { - date: Date; - count: number; -} + date: Date; + count: number; +}; type HeatmapCell = { - date: Date; - hour: number; - count: number; -} - -type TimeAnalysisResponse = { - events_per_day: EventsPerDay[]; - weekday_hour_heatmap: HeatmapCell[]; -} - -// Content Analysis -type Emotion = { - emotion_anger: number; - emotion_disgust: number; - emotion_fear: number; - emotion_joy: number; - emotion_sadness: number; + date: Date; + hour: number; + count: number; }; -type NGram = { - count: number; - ngram: string; -} +type TimeAnalysisResponse = { + events_per_day: EventsPerDay[]; + weekday_hour_heatmap: HeatmapCell[]; +}; +// Content (combines emotional and linguistic) type AverageEmotionByTopic = Emotion & { n: number; topic: string; @@ -105,17 +98,17 @@ type EmotionBySource = { event_count: number; }; - type ContentAnalysisResponse = { - word_frequencies: FrequencyWord[]; - average_emotion_by_topic: AverageEmotionByTopic[]; - common_three_phrases: NGram[]; - common_two_phrases: NGram[]; - overall_emotion_average?: OverallEmotionAverage[]; - dominant_emotion_distribution?: DominantEmotionDistribution[]; - emotion_by_source?: EmotionBySource[]; -} + word_frequencies: FrequencyWord[]; + average_emotion_by_topic: AverageEmotionByTopic[]; + common_three_phrases: NGram[]; + common_two_phrases: NGram[]; + overall_emotion_average?: OverallEmotionAverage[]; + dominant_emotion_distribution?: DominantEmotionDistribution[]; + emotion_by_source?: EmotionBySource[]; +}; +// Linguistic type LinguisticAnalysisResponse = { word_frequencies: FrequencyWord[]; common_two_phrases: NGram[]; @@ -123,6 +116,7 @@ type LinguisticAnalysisResponse = { lexical_diversity?: Record; }; +// Emotional type EmotionalAnalysisResponse = { average_emotion_by_topic: AverageEmotionByTopic[]; overall_emotion_average?: OverallEmotionAverage[]; @@ -130,6 +124,15 @@ type EmotionalAnalysisResponse = { emotion_by_source?: EmotionBySource[]; }; +// Interactional +type ConversationConcentration = { + total_commenting_authors: number; + top_10pct_author_count: number; + top_10pct_comment_share: number; + single_comment_authors: number; + single_comment_author_ratio: number; +}; + type InteractionAnalysisResponse = { average_thread_depth?: number; top_interaction_pairs?: [[string, string], number][]; @@ -137,6 +140,7 @@ type InteractionAnalysisResponse = { interaction_graph: InteractionGraph; }; +// Cultural type IdentityMarkers = { in_group_usage: number; out_group_usage: number; @@ -175,7 +179,7 @@ type CulturalAnalysisResponse = { avg_emotion_per_entity?: AverageEmotionPerEntity; }; -// Summary +// Summary type SummaryResponse = { total_events: number; total_posts: number; @@ -190,35 +194,35 @@ type SummaryResponse = { sources: string[]; }; -// Filtering Response +// Filter type FilterResponse = { - rows: number - data: any; -} + rows: number; + data: any; +}; export type { - TopUser, - Vocab, - User, - InteractionGraph, - ConversationConcentration, - UserAnalysisResponse, - UserEndpointResponse, - FrequencyWord, - AverageEmotionByTopic, - OverallEmotionAverage, - DominantEmotionDistribution, - EmotionBySource, - SummaryResponse, - TimeAnalysisResponse, - ContentAnalysisResponse, - LinguisticAnalysisResponse, - EmotionalAnalysisResponse, - InteractionAnalysisResponse, - IdentityMarkers, - StanceMarkers, - EntityEmotionAggregate, - AverageEmotionPerEntity, - CulturalAnalysisResponse, - FilterResponse -} + TopUser, + Vocab, + User, + InteractionGraph, + ConversationConcentration, + UserAnalysisResponse, + 
UserEndpointResponse, + FrequencyWord, + AverageEmotionByTopic, + OverallEmotionAverage, + DominantEmotionDistribution, + EmotionBySource, + SummaryResponse, + TimeAnalysisResponse, + ContentAnalysisResponse, + LinguisticAnalysisResponse, + EmotionalAnalysisResponse, + InteractionAnalysisResponse, + IdentityMarkers, + StanceMarkers, + EntityEmotionAggregate, + AverageEmotionPerEntity, + CulturalAnalysisResponse, + FilterResponse, +}; From 17ef42e5489142eb9009e30e3fe784a61d7742fc Mon Sep 17 00:00:00 2001 From: Dylan De Faoite Date: Wed, 18 Mar 2026 18:43:49 +0000 Subject: [PATCH 16/24] feat!(frontend): add cultural, interactional and linguistic stat pages --- frontend/src/components/CulturalStats.tsx | 119 +++++++++++ .../src/components/InteractionalStats.tsx | 198 ++++++++++++++++++ frontend/src/components/LinguisticStats.tsx | 86 ++++++++ frontend/src/pages/Stats.tsx | 100 ++++++++- 4 files changed, 495 insertions(+), 8 deletions(-) create mode 100644 frontend/src/components/CulturalStats.tsx create mode 100644 frontend/src/components/InteractionalStats.tsx create mode 100644 frontend/src/components/LinguisticStats.tsx diff --git a/frontend/src/components/CulturalStats.tsx b/frontend/src/components/CulturalStats.tsx new file mode 100644 index 0000000..7f3a775 --- /dev/null +++ b/frontend/src/components/CulturalStats.tsx @@ -0,0 +1,119 @@ +import Card from "./Card"; +import StatsStyling from "../styles/stats_styling"; +import type { CulturalAnalysisResponse } from "../types/ApiTypes"; + +const styles = StatsStyling; + +type CulturalStatsProps = { + data: CulturalAnalysisResponse; +}; + +const CulturalStats = ({ data }: CulturalStatsProps) => { + const identity = data.identity_markers; + const stance = data.stance_markers; + const rawEntities = data.avg_emotion_per_entity?.entity_emotion_avg ?? {}; + const entities = Object.entries(rawEntities) + .sort((a, b) => (b[1].post_count - a[1].post_count)) + .slice(0, 20); + + const topEmotion = (emotionAvg: Record | undefined) => { + const entries = Object.entries(emotionAvg ?? {}); + if (!entries.length) { + return "—"; + } + + entries.sort((a, b) => b[1] - a[1]); + const dominant = entries[0] ?? ["emotion_unknown", 0]; + const dominantLabel = dominant[0].replace("emotion_", ""); + return `${dominantLabel} (${dominant[1].toFixed(3)})`; + }; + + return ( +
+  return (
+    <div style={styles.page}>
+      <div style={styles.grid}>
+        <Card>
+          <div style={styles.cardTitle}>In-Group Emotion Profile</div>
+          <div style={styles.cardSubtitle}>
+            Dominant average emotion where in-group framing is stronger.
+          </div>
+          <div>{topEmotion(identity?.in_group_emotion_avg)}</div>
+        </Card>
+
+        <Card>
+          <div style={styles.cardTitle}>Out-Group Emotion Profile</div>
+          <div style={styles.cardSubtitle}>
+            Dominant average emotion where out-group framing is stronger.
+          </div>
+          <div>{topEmotion(identity?.out_group_emotion_avg)}</div>
+        </Card>
+
+        <Card>
+          <div style={styles.cardTitle}>Entity Emotion Averages</div>
+          <div style={styles.cardSubtitle}>
+            Most frequent entities and their dominant average emotion signature.
+          </div>
+          {!entities.length ? (
+            <div>No entity-level cultural data available.</div>
+          ) : (
+            <div>
+              {entities.map(([entity, aggregate]) => (
+                <div key={entity} style={styles.topUserItem}>
+                  <div>{entity}</div>
+                  <div>
+                    {aggregate.post_count.toLocaleString()} posts • Dominant emotion:{" "}
+                    {topEmotion(aggregate.emotion_avg)}
+                  </div>
+                </div>
+              ))}
+            </div>
+          )}
+        </Card>
+      </div>
+    </div>
+  );
+};
+
+export default CulturalStats;

diff --git a/frontend/src/components/InteractionalStats.tsx b/frontend/src/components/InteractionalStats.tsx
new file mode 100644
index 0000000..43567c5
--- /dev/null
+++ b/frontend/src/components/InteractionalStats.tsx
@@ -0,0 +1,198 @@
+import Card from "./Card";
+import StatsStyling from "../styles/stats_styling";
+import type { InteractionAnalysisResponse } from "../types/ApiTypes";
+import {
+  ResponsiveContainer,
+  BarChart,
+  Bar,
+  XAxis,
+  YAxis,
+  CartesianGrid,
+  Tooltip,
+  PieChart,
+  Pie,
+  Cell,
+  Legend,
+} from "recharts";
+
+const styles = StatsStyling;
+
+type InteractionalStatsProps = {
+  data: InteractionAnalysisResponse;
+};
+
+const InteractionalStats = ({ data }: InteractionalStatsProps) => {
+  const graph = data.interaction_graph ?? {};
+  const userCount = Object.keys(graph).length;
+  const edges = Object.values(graph).flatMap((targets) => Object.values(targets));
+  const edgeCount = edges.length;
+  const interactionVolume = edges.reduce((sum, value) => sum + value, 0);
+  const concentration = data.conversation_concentration;
+  const topTenCommentShare = typeof concentration?.top_10pct_comment_share === "number"
+    ? concentration.top_10pct_comment_share
+    : null;
+  const topTenAuthorCount = typeof concentration?.top_10pct_author_count === "number"
+    ? concentration.top_10pct_author_count
+    : null;
+  const totalCommentingAuthors = typeof concentration?.total_commenting_authors === "number"
+    ? concentration.total_commenting_authors
+    : null;
+  const singleCommentAuthorRatio = typeof concentration?.single_comment_author_ratio === "number"
+    ? concentration.single_comment_author_ratio
+    : null;
+
+  const topPairs = (data.top_interaction_pairs ?? [])
+    .filter((item): item is [[string, string], number] => {
+      if (!Array.isArray(item) || item.length !== 2) {
+        return false;
+      }
+
+      const pair = item[0];
+      const count = item[1];
+
+      return Array.isArray(pair)
+        && pair.length === 2
+        && typeof pair[0] === "string"
+        && typeof pair[1] === "string"
+        && typeof count === "number";
+    })
+    .slice(0, 20);
+
+  const topPairChartData = topPairs.slice(0, 8).map(([[source, target], value], index) => ({
+    pair: `${source} -> ${target}`,
+    replies: value,
+    rank: index + 1,
+  }));
+
+  const topTenSharePercent = topTenCommentShare === null
+    ? null
+    : topTenCommentShare * 100;
+  const nonTopTenSharePercent = topTenSharePercent === null
+    ? null
+    : Math.max(0, 100 - topTenSharePercent);
+
+  let concentrationPieData: { name: string; value: number }[] = [];
+  if (topTenSharePercent !== null && nonTopTenSharePercent !== null) {
+    concentrationPieData = [
+      { name: "Top 10% authors", value: topTenSharePercent },
+      { name: "Other authors", value: nonTopTenSharePercent },
+    ];
+  }
+
+  const PIE_COLORS = ["#2b6777", "#c8d8e4"];
+
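+  /*
+    Shape assumption behind the metrics above: interaction_graph maps each
+    author to the users they replied to, with reply counts as values
+    (Record<string, Record<string, number>>). A small worked example:
+
+    const g = { alice: { bob: 3, cara: 1 }, bob: { alice: 2 } };
+    const weights = Object.values(g).flatMap((t) => Object.values(t));
+    // weights -> [3, 1, 2]: userCount 2, edgeCount 3, interactionVolume 6
+  */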
+  return (
+    <div style={styles.page}>
+      <div style={styles.grid}>
+        <Card>
+          <div style={styles.cardTitle}>Interaction Visuals</div>
+          <div style={styles.cardSubtitle}>
+            Quick charts for interaction direction and conversation concentration.
+          </div>
+          <div style={styles.cardSubtitle}>
+            {userCount.toLocaleString()} users, {edgeCount.toLocaleString()} reply
+            edges, {interactionVolume.toLocaleString()} replies
+            {totalCommentingAuthors !== null &&
+              ` • ${totalCommentingAuthors.toLocaleString()} commenting authors`}
+            {topTenAuthorCount !== null &&
+              ` (top 10% = ${topTenAuthorCount.toLocaleString()})`}
+            {singleCommentAuthorRatio !== null &&
+              ` • ${(singleCommentAuthorRatio * 100).toFixed(1)}% single-comment authors`}
+          </div>
+
+          <div>
+            <div>
+              <div style={styles.cardTitle}>Top Interaction Pairs</div>
+              <div>
+                <ResponsiveContainer width="100%" height={260}>
+                  <BarChart data={topPairChartData} layout="vertical">
+                    <CartesianGrid strokeDasharray="3 3" />
+                    <XAxis type="number" />
+                    <YAxis
+                      type="category"
+                      dataKey="rank"
+                      tickFormatter={(value) => `#${value}`}
+                      width={36}
+                    />
+                    <Tooltip />
+                    <Bar dataKey="replies" fill="#2b6777" />
+                  </BarChart>
+                </ResponsiveContainer>
+              </div>
+            </div>
+
+            <div>
+              <div style={styles.cardTitle}>Top 10% vs Other Comment Share</div>
+              <div>
+                <ResponsiveContainer width="100%" height={260}>
+                  <PieChart>
+                    <Pie data={concentrationPieData} dataKey="value" nameKey="name" label>
+                      {concentrationPieData.map((entry, index) => (
+                        <Cell key={entry.name} fill={PIE_COLORS[index % PIE_COLORS.length]} />
+                      ))}
+                    </Pie>
+                    <Tooltip />
+                    <Legend />
+                  </PieChart>
+                </ResponsiveContainer>
+              </div>
+            </div>
+          </div>
+        </Card>
+
+        <Card>
+          <div style={styles.cardTitle}>Top Interaction Pairs</div>
+          <div style={styles.cardSubtitle}>
+            Most frequent directed reply paths between users.
+          </div>
+          {!topPairs.length ? (
+            <div>No interaction pair data available.</div>
+          ) : (
+            <div>
+              {topPairs.map(([[source, target], value], index) => (
+                <div key={`${source}->${target}-${index}`} style={styles.topUserItem}>
+                  <div>{source} -> {target}</div>
+                  <div>{value.toLocaleString()} replies</div>
+                </div>
+              ))}
+            </div>
+          )}
+        </Card>
+      </div>
+    </div>
+  );
+};
+
+export default InteractionalStats;

diff --git a/frontend/src/components/LinguisticStats.tsx b/frontend/src/components/LinguisticStats.tsx
new file mode 100644
index 0000000..3569511
--- /dev/null
+++ b/frontend/src/components/LinguisticStats.tsx
@@ -0,0 +1,86 @@
+import Card from "./Card";
+import StatsStyling from "../styles/stats_styling";
+import type { LinguisticAnalysisResponse } from "../types/ApiTypes";
+
+const styles = StatsStyling;
+
+type LinguisticStatsProps = {
+  data: LinguisticAnalysisResponse;
+};
+
+const LinguisticStats = ({ data }: LinguisticStatsProps) => {
+  const lexical = data.lexical_diversity;
+  const words = data.word_frequencies ?? [];
+  const bigrams = data.common_two_phrases ?? [];
+  const trigrams = data.common_three_phrases ?? [];
+
+  const topWords = words.slice(0, 20);
+  const topBigrams = bigrams.slice(0, 10);
+  const topTrigrams = trigrams.slice(0, 10);
+
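+  /*
+    The slice(0, N) calls above assume the backend returns these lists
+    already sorted by descending count. If that guarantee ever changes, a
+    defensive variant (sketch) would sort client-side before slicing:
+
+    const topWords = [...words].sort((a, b) => b.count - a.count).slice(0, 20);
+  */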
+  return (
+    <div style={styles.page}>
+      <div style={styles.grid}>
+        <Card>
+          <div style={styles.cardTitle}>Top Words</div>
+          <div style={styles.cardSubtitle}>Most frequent filtered terms.</div>
+          <div>
+            {topWords.map((item) => (
+              <div key={item.word} style={styles.topUserItem}>
+                <div>{item.word}</div>
+                <div>{item.count.toLocaleString()} uses</div>
+              </div>
+            ))}
+          </div>
+        </Card>
+
+        <Card>
+          <div style={styles.cardTitle}>Top Bigrams</div>
+          <div style={styles.cardSubtitle}>Most frequent 2-word phrases.</div>
+          <div>
+            {topBigrams.map((item) => (
+              <div key={item.ngram} style={styles.topUserItem}>
+                <div>{item.ngram}</div>
+                <div>{item.count.toLocaleString()} uses</div>
+              </div>
+            ))}
+          </div>
+        </Card>
+
+        <Card>
+          <div style={styles.cardTitle}>Top Trigrams</div>
+          <div style={styles.cardSubtitle}>Most frequent 3-word phrases.</div>
+          <div>
+            {topTrigrams.map((item) => (
+              <div key={item.ngram} style={styles.topUserItem}>
+                <div>{item.ngram}</div>
+                <div>{item.count.toLocaleString()} uses</div>
+              </div>
+            ))}
+          </div>
+        </Card>
+      </div>
+    </div>
+  );
+};
+
+export default LinguisticStats;

diff --git a/frontend/src/pages/Stats.tsx b/frontend/src/pages/Stats.tsx
index 683584f..910b0a0 100644
--- a/frontend/src/pages/Stats.tsx
+++ b/frontend/src/pages/Stats.tsx
@@ -5,12 +5,20 @@ import StatsStyling from "../styles/stats_styling";
 import SummaryStats from "../components/SummaryStats";
 import EmotionalStats from "../components/EmotionalStats";
 import UserStats from "../components/UserStats";
+import LinguisticStats from "../components/LinguisticStats";
+import InteractionalStats from "../components/InteractionalStats";
+import CulturalStats from "../components/CulturalStats";
 
 import {
   type SummaryResponse,
   type UserAnalysisResponse,
   type TimeAnalysisResponse,
-  type ContentAnalysisResponse
+  type ContentAnalysisResponse,
+  type UserEndpointResponse,
+  type LinguisticAnalysisResponse,
+  type EmotionalAnalysisResponse,
+  type InteractionAnalysisResponse,
+  type CulturalAnalysisResponse
 } from '../types/ApiTypes'
 
 const API_BASE_URL = import.meta.env.VITE_BACKEND_URL
@@ -20,11 +28,14 @@ const StatPage = () => {
   const { datasetId: routeDatasetId } = useParams<{ datasetId: string }>();
   const [error, setError] = useState('');
   const [loading, setLoading] = useState(false);
-  const [activeView, setActiveView] = useState<"summary" | "emotional" | "user">("summary");
+  const [activeView, setActiveView] = useState<"summary" | "emotional" | "user" | "linguistic" | "interactional" | "cultural">("summary");
 
   const [userData, setUserData] = useState<UserAnalysisResponse | null>(null);
   const [timeData, setTimeData] = useState<TimeAnalysisResponse | null>(null);
   const [contentData, setContentData] = useState<ContentAnalysisResponse | null>(null);
+  const [linguisticData, setLinguisticData] = useState<LinguisticAnalysisResponse | null>(null);
+  const [interactionData, setInteractionData] = useState<InteractionAnalysisResponse | null>(null);
+  const [culturalData, setCulturalData] = useState<CulturalAnalysisResponse | null>(null);
 
   const [summary, setSummary] = useState<SummaryResponse | null>(null);
@@ -83,15 +94,23 @@ const StatPage = () => {
     setLoading(true);
 
     Promise.all([
-      axios.get<TimeAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/time`, {
+      axios.get<TimeAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/temporal`, {
         params,
         headers: authHeaders,
       }),
-      axios.get<UserAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/user`, {
+      axios.get<UserEndpointResponse>(`${API_BASE_URL}/dataset/${datasetId}/user`, {
         params,
         headers: authHeaders,
       }),
-      axios.get<ContentAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/content`, {
+      axios.get<LinguisticAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/linguistic`, {
+        params,
+        headers: authHeaders,
+      }),
+      axios.get<EmotionalAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/emotional`, {
+        params,
+        headers: authHeaders,
+      }),
+      axios.get<InteractionAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/interactional`, {
         params,
         headers: authHeaders,
       }),
       axios.get<SummaryResponse>(`${API_BASE_URL}/dataset/${datasetId}/summary`, {
         params,
         headers: authHeaders,
       }),
+      axios.get<CulturalAnalysisResponse>(`${API_BASE_URL}/dataset/${datasetId}/cultural`, {
+        params,
+        headers: authHeaders,
+      }),
     ])
-      .then(([timeRes, userRes, contentRes, summaryRes]) => {
-        setUserData(userRes.data || null);
+      .then(([timeRes, userRes, linguisticRes, emotionalRes, interactionRes, summaryRes, culturalRes]) => {
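+        /*
+          Note: the names in this destructuring are purely positional; they
+          must stay aligned with the order of the axios.get calls in the
+          Promise.all array above. A hypothetical safer variant would fetch
+          into named fields instead:
+
+          const responses = {
+            temporal: await axios.get<TimeAnalysisResponse>(temporalUrl),
+            user: await axios.get<UserEndpointResponse>(userUrl),
+          };
+        */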
+        const combinedUserData: UserAnalysisResponse = {
+          ...userRes.data,
+          interaction_graph: interactionRes.data?.interaction_graph ?? {},
+        };
+
+        const combinedContentData: ContentAnalysisResponse = {
+          ...linguisticRes.data,
+          ...emotionalRes.data,
+        };
+
+        setUserData(combinedUserData);
         setTimeData(timeRes.data || null);
-        setContentData(contentRes.data || null);
+        setContentData(combinedContentData);
+        setLinguisticData(linguisticRes.data || null);
+        setInteractionData(interactionRes.data || null);
+        setCulturalData(culturalRes.data || null);
         setSummary(summaryRes.data || null);
       })
       .catch((e) => setError("Failed to load statistics: " + String(e)))
       .finally(() => setLoading(false));
@@ -218,6 +254,24 @@ return (
         >
           Users
         </button>
+        <button
+          style={activeView === "linguistic" ? styles.activeTab : styles.tab}
+          onClick={() => setActiveView("linguistic")}
+        >
+          Linguistic
+        </button>
+        <button
+          style={activeView === "interactional" ? styles.activeTab : styles.tab}
+          onClick={() => setActiveView("interactional")}
+        >
+          Interactional
+        </button>
+        <button
+          style={activeView === "cultural" ? styles.activeTab : styles.tab}
+          onClick={() => setActiveView("cultural")}
+        >
+          Cultural
+        </button>
 
       {activeView === "summary" && (
@@ -243,6 +297,36 @@ return (
       )}
 
+      {activeView === "linguistic" && linguisticData && (
+        <LinguisticStats data={linguisticData} />
+      )}
+
+      {activeView === "linguistic" && !linguisticData && (
+        <div>
+          No linguistic data available.
+        </div>
+      )}
+
+      {activeView === "interactional" && interactionData && (
+        <InteractionalStats data={interactionData} />
+      )}
+
+      {activeView === "interactional" && !interactionData && (
+        <div>
+          No interactional data available.
+        </div>
+      )}
+
+      {activeView === "cultural" && culturalData && (
+        <CulturalStats data={culturalData} />
+      )}
+
+      {activeView === "cultural" && !culturalData && (
+        <div>
+          No cultural data available.
+        </div>
+      )}
+
     </div>
   );
 }

From c215024ef2ccc25a0261e0933ef1d49ab4f48a1 Mon Sep 17 00:00:00 2001
From: Dylan De Faoite
Date: Wed, 18 Mar 2026 18:50:51 +0000
Subject: [PATCH 17/24] feat(frontend): add deleted user filter

Reddit data often contains "[Deleted]" where a user has been banned or has
removed their post or comment. Keeping the backend faithful to the original
dataset is important, so the filtering is applied on the frontend instead.

---
 frontend/src/pages/Stats.tsx | 69 ++++++++++++++++++++++++++++++++++--
 1 file changed, 66 insertions(+), 3 deletions(-)

diff --git a/frontend/src/pages/Stats.tsx b/frontend/src/pages/Stats.tsx
index 910b0a0..f3f483f 100644
--- a/frontend/src/pages/Stats.tsx
+++ b/frontend/src/pages/Stats.tsx
@@ -23,6 +23,11 @@ import {
 const API_BASE_URL = import.meta.env.VITE_BACKEND_URL
 const styles = StatsStyling;
 
+const DELETED_USERS = ["[deleted]"];
+
+const isDeletedUser = (value: string | null | undefined) => (
+  DELETED_USERS.includes((value ?? "").trim().toLowerCase())
+);
 
 const StatPage = () => {
@@ -129,9 +134,56 @@ const StatPage = () => {
       .then(([timeRes, userRes, linguisticRes, emotionalRes, interactionRes, summaryRes, culturalRes]) => {
+        const usersList = userRes.data.users ?? [];
+        const topUsersList = userRes.data.top_users ?? [];
+        const interactionGraphRaw = interactionRes.data?.interaction_graph ?? {};
+        const topPairsRaw = interactionRes.data?.top_interaction_pairs ?? [];
+
+        const filteredUsers: typeof usersList = [];
+        for (const user of usersList) {
+          if (isDeletedUser(user.author)) continue;
+          filteredUsers.push(user);
+        }
+
+        const filteredTopUsers: typeof topUsersList = [];
+        for (const user of topUsersList) {
+          if (isDeletedUser(user.author)) continue;
+          filteredTopUsers.push(user);
+        }
+
+        const filteredInteractionGraph: Record<string, Record<string, number>> = {};
+        for (const [source, targets] of Object.entries(interactionGraphRaw)) {
+          if (isDeletedUser(source)) {
+            continue;
+          }
+
+          const nextTargets: Record<string, number> = {};
+          for (const [target, count] of Object.entries(targets)) {
+            if (isDeletedUser(target)) {
+              continue;
+            }
+            nextTargets[target] = count;
+          }
+
+          filteredInteractionGraph[source] = nextTargets;
+        }
+
+        const filteredTopInteractionPairs: typeof topPairsRaw = [];
+        for (const pairEntry of topPairsRaw) {
+          const pair = pairEntry[0];
+          const source = pair[0];
+          const target = pair[1];
+          if (isDeletedUser(source) || isDeletedUser(target)) {
+            continue;
+          }
+          filteredTopInteractionPairs.push(pairEntry);
+        }
+
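+        /*
+          The four filter loops above share one pattern; a reusable sketch
+          (hypothetical helper, not part of this patch):
+
+          const dropDeleted = <T,>(items: T[], key: (item: T) => string | null | undefined) =>
+            items.filter((item) => !isDeletedUser(key(item)));
+
+          const filteredUsers = dropDeleted(usersList, (u) => u.author);
+        */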
         const combinedUserData: UserAnalysisResponse = {
           ...userRes.data,
-          interaction_graph: interactionRes.data?.interaction_graph ?? {},
+          users: filteredUsers,
+          top_users: filteredTopUsers,
+          interaction_graph: filteredInteractionGraph,
         };
 
         const combinedContentData: ContentAnalysisResponse = {
           ...linguisticRes.data,
           ...emotionalRes.data,
         };
 
+        const filteredInteractionData: InteractionAnalysisResponse = {
+          ...interactionRes.data,
+          interaction_graph: filteredInteractionGraph,
+          top_interaction_pairs: filteredTopInteractionPairs,
+        };
+
+        const filteredSummary: SummaryResponse = {
+          ...summaryRes.data,
+          unique_users: filteredUsers.length,
+        };
+
         setUserData(combinedUserData);
         setTimeData(timeRes.data || null);
         setContentData(combinedContentData);
         setLinguisticData(linguisticRes.data || null);
-        setInteractionData(interactionRes.data || null);
+        setInteractionData(filteredInteractionData);
         setCulturalData(culturalRes.data || null);
-        setSummary(summaryRes.data || null);
+        setSummary(filteredSummary);
       })
       .catch((e) => setError("Failed to load statistics: " + String(e)))
       .finally(() => setLoading(false));

From 1446dd176d702c82de11293ba5c3bdea8f7d1775 Mon Sep 17 00:00:00 2001
From: Dylan De Faoite
Date: Wed, 18 Mar 2026 18:53:14 +0000
Subject: [PATCH 18/24] feat(frontend): center page selection

---
 frontend/src/pages/Stats.tsx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/frontend/src/pages/Stats.tsx b/frontend/src/pages/Stats.tsx
index f3f483f..408cfa2 100644
--- a/frontend/src/pages/Stats.tsx
+++ b/frontend/src/pages/Stats.tsx
@@ -297,7 +297,7 @@ return (
       <div>Dataset #{datasetId ?? "-"}</div>
 
-      <div style={styles.tabRow}>
+      <div style={{ ...styles.tabRow, justifyContent: "center" }}>
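+        {/*
+          Centering sketch: this change assumes styles.tabRow (name
+          hypothetical; the stripped diff hides the real key) already sets
+          display: "flex", so spreading it and overriding justifyContent is
+          equivalent to a standalone style object:
+
+          const centeredTabRow: React.CSSProperties = {
+            ...styles.tabRow,
+            justifyContent: "center", // centers the view-selection buttons
+          };
+        */}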