codewiththomas
diff --git a/‎README.md‎
Lines changed: 4 additions & 2 deletions b/‎README.md‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎eval/evaluation.ipynb‎
Lines changed: 86 additions & 0 deletions b/‎eval/evaluation.ipynb‎
Lines changed: 86 additions & 0 deletions
diff --git a/‎eval/evaluation_anonym.csv‎
Lines changed: 41 additions & 0 deletions b/‎eval/evaluation_anonym.csv‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎eval/requirements.txt‎
Lines changed: 34 additions & 0 deletions b/‎eval/requirements.txt‎
Lines changed: 34 additions & 0 deletions
diff --git a/‎…rator.Abstractions/Contracts/ICrawler.cs‎ ‎…rator.Abstractions/Contracts/ICrawler.cs‎FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/ICrawler.cs renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/ICrawler.cs b/‎…rator.Abstractions/Contracts/ICrawler.cs‎ ‎…rator.Abstractions/Contracts/ICrawler.cs‎FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/ICrawler.cs renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/ICrawler.cs
diff --git a/‎…ator.Abstractions/Contracts/IDocument.cs‎ ‎…ator.Abstractions/Contracts/IDocument.cs‎FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/IDocument.cs renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/IDocument.cs b/‎…ator.Abstractions/Contracts/IDocument.cs‎ ‎…ator.Abstractions/Contracts/IDocument.cs‎FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/IDocument.cs renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/Contracts/IDocument.cs
diff --git a/‎…chestrator.Abstractions/Dtos/Document.cs‎ ‎…chestrator.Abstractions/Dtos/Document.cs‎FOM.RAG.CrawlerOrchestrator.Abstractions/Dtos/Document.cs renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/Dtos/Document.cs b/‎…chestrator.Abstractions/Dtos/Document.cs‎ ‎…chestrator.Abstractions/Dtos/Document.cs‎FOM.RAG.CrawlerOrchestrator.Abstractions/Dtos/Document.cs renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/Dtos/Document.cs
diff --git a/‎….CrawlerOrchestrator.Abstractions.csproj‎ ‎….CrawlerOrchestrator.Abstractions.csproj‎FOM.RAG.CrawlerOrchestrator.Abstractions/FOM.RAG.CrawlerOrchestrator.Abstractions.csproj renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/FOM.RAG.CrawlerOrchestrator.Abstractions.csproj b/‎….CrawlerOrchestrator.Abstractions.csproj‎ ‎….CrawlerOrchestrator.Abstractions.csproj‎FOM.RAG.CrawlerOrchestrator.Abstractions/FOM.RAG.CrawlerOrchestrator.Abstractions.csproj renamed to src/FOM.RAG.CrawlerOrchestrator.Abstractions/FOM.RAG.CrawlerOrchestrator.Abstractions.csproj
diff --git a/‎…chestrator/CrawlerOrchestratorService.cs‎ ‎…chestrator/CrawlerOrchestratorService.cs‎FOM.RAG.CrawlerOrchestrator/CrawlerOrchestratorService.cs renamed to src/FOM.RAG.CrawlerOrchestrator/CrawlerOrchestratorService.cs b/‎…chestrator/CrawlerOrchestratorService.cs‎ ‎…chestrator/CrawlerOrchestratorService.cs‎FOM.RAG.CrawlerOrchestrator/CrawlerOrchestratorService.cs renamed to src/FOM.RAG.CrawlerOrchestrator/CrawlerOrchestratorService.cs
diff --git a/‎…rator/FOM.RAG.CrawlerOrchestrator.csproj‎ ‎…rator/FOM.RAG.CrawlerOrchestrator.csproj‎FOM.RAG.CrawlerOrchestrator/FOM.RAG.CrawlerOrchestrator.csproj renamed to src/FOM.RAG.CrawlerOrchestrator/FOM.RAG.CrawlerOrchestrator.csproj b/‎…rator/FOM.RAG.CrawlerOrchestrator.csproj‎ ‎…rator/FOM.RAG.CrawlerOrchestrator.csproj‎FOM.RAG.CrawlerOrchestrator/FOM.RAG.CrawlerOrchestrator.csproj renamed to src/FOM.RAG.CrawlerOrchestrator/FOM.RAG.CrawlerOrchestrator.csproj
@@ -0,0 +1,86 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Evaluierung der Ergebnisse"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "            METRIK    RAG  TF-IDF    GPT\n",
+      "0      PRECISION@5  0.825   0.630    NaN\n",
+      "1         RECALL@5  0.700   0.465    NaN\n",
+      "2  ANTWORTRELEVANZ  4.125   3.125  3.350\n",
+      "3      FAKTENTREUE  4.300   3.050  2.300\n",
+      "4  VOLLSTÄNDIGKEIT  3.750   2.575  2.125\n"
+     ]
+    }
+   ],
+   "source": [
+    "import pandas as pd\n",
+    "\n",
+    "file_path = \"evaluation_anonym.csv\"  # same dir as notebook\n",
+    "df = pd.read_csv(file_path, sep=\",\")\n",
+    "\n",
+    "metrics_avg = {\n",
+    "    \"METRIK\": [\"PRECISION@5\", \"RECALL@5\", \"ANTWORTRELEVANZ\", \"FAKTENTREUE\", \"VOLLSTÄNDIGKEIT\"],\n",
+    "    \"RAG\": [\n",
+    "        df[\"RAG_Precision5\"].mean(),\n",
+    "        df[\"RAG_Recall5\"].mean(),\n",
+    "        df[\"RAG_Antwortrelevanz\"].mean(),\n",
+    "        df[\"RAG_Faktentreue\"].mean(),\n",
+    "        df[\"RAG_Vollständigkeit\"].mean()\n",
+    "    ],\n",
+    "    \"TF-IDF\": [\n",
+    "        df[\"Baseline_Precision5\"].mean(),\n",
+    "        df[\"Baseline_Recall5\"].mean(),\n",
+    "        df[\"Baseline_Antwortrelevanz\"].mean(),\n",
+    "        df[\"Baseline_Faktentreue\"].mean(),\n",
+    "        df[\"Baseline_Vollständigkeit\"].mean()\n",
+    "    ],\n",
+    "    \"GPT\": [\n",
+    "        None,  # Kein Precision@5 für GPT in den Daten vorhanden\n",
+    "        None,  # Kein Recall@5 für GPT in den Daten vorhanden\n",
+    "        df[\"GPT_Antwortrelevanz\"].mean(),\n",
+    "        df[\"GPT_Faktentreue\"].mean(),\n",
+    "        df[\"GPT_Vollständigkeit\"].mean()\n",
+    "    ]\n",
+    "}\n",
+    "\n",
+    "metrics_df = pd.DataFrame(metrics_avg)\n",
+    "\n",
+    "print(metrics_df)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.7"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
@@ -0,0 +1,41 @@
+Frage_ID,Kategorie,Frage,Gold_Standard,RAG_Precision5,RAG_Recall5,RAG_Antwortrelevanz,RAG_Faktentreue,RAG_Vollständigkeit,Baseline_Precision5,Baseline_Recall5,Baseline_Antwortrelevanz,Baseline_Faktentreue,Baseline_Vollständigkeit,GPT_Antwortrelevanz,GPT_Faktentreue,GPT_Vollständigkeit
+F001,Faktenfrage,****,****,0.8,0.8,4,4,4,0.8,0.6,3,3,3,4,2,2
+F002,Faktenfrage,****,****,1.0,0.8,5,5,4,0.8,0.6,4,3,3,3,2,2
+F003,Faktenfrage,****,****,0.8,0.8,4,5,4,0.6,0.6,3,3,3,4,3,2
+F004,Faktenfrage,****,****,0.8,0.6,4,4,4,0.6,0.4,3,3,2,3,2,2
+F005,Faktenfrage,****,****,0.8,0.6,4,4,3,0.6,0.6,3,3,3,3,2,2
+F006,Faktenfrage,****,****,1.0,0.8,5,5,4,0.8,0.6,4,4,3,4,3,2
+F007,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,3,3,2,2
+F008,Faktenfrage,****,****,0.8,0.6,4,5,4,0.6,0.4,3,3,2,4,3,2
+F009,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.6,3,3,3,3,2,2
+F010,Faktenfrage,****,****,1.0,0.8,5,5,4,0.8,0.6,4,4,3,4,3,2
+F011,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,2,3,2,2
+F012,Faktenfrage,****,****,0.8,0.6,4,5,4,0.6,0.4,3,3,3,3,2,2
+F013,Faktenfrage,****,****,0.8,0.6,4,4,3,0.6,0.4,3,3,2,3,2,2
+F014,Faktenfrage,****,****,1.0,0.8,5,5,4,0.8,0.6,4,4,3,4,2,2
+F015,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,3,3,2,2
+F016,Faktenfrage,****,****,0.8,0.6,4,5,4,0.6,0.6,3,3,3,3,2,2
+F017,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,2,3,2,2
+F018,Faktenfrage,****,****,1.0,0.8,5,5,4,0.8,0.6,4,3,3,4,3,2
+F019,Faktenfrage,****,****,0.8,0.6,4,4,3,0.6,0.4,3,3,3,3,2,2
+F020,Faktenfrage,****,****,0.8,0.6,4,5,4,0.6,0.4,3,3,3,3,2,2
+F021,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,2,3,2,2
+F022,Faktenfrage,****,****,1.0,0.8,5,5,4,0.8,0.6,4,4,3,4,3,2
+F023,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,3,3,2,2
+F024,Faktenfrage,****,****,0.8,0.6,4,5,4,0.6,0.4,3,3,3,3,2,2
+F025,Faktenfrage,****,****,0.8,0.6,4,4,3,0.6,0.4,3,3,2,3,2,2
+F026,Faktenfrage,****,****,0.8,0.6,4,5,4,0.6,0.4,3,3,3,3,2,2
+F027,Faktenfrage,****,****,0.8,0.8,4,4,4,0.6,0.6,3,3,3,3,2,2
+P001,Prozessfrage,****,****,0.8,0.6,4,4,4,0.6,0.4,3,3,2,4,3,2
+P002,Prozessfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,2,3,2,2
+P003,Prozessfrage,****,****,1.0,0.8,5,4,4,0.8,0.6,4,3,3,4,3,3
+P004,Prozessfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,2,3,2,2
+P005,Prozessfrage,****,****,0.8,0.6,4,4,4,0.6,0.4,3,3,3,3,2,2
+P006,Prozessfrage,****,****,0.8,0.6,4,4,3,0.6,0.4,3,3,2,3,2,2
+P007,Prozessfrage,****,****,0.8,0.6,4,4,4,0.6,0.4,3,3,3,4,3,3
+P008,Prozessfrage,****,****,0.8,0.8,4,4,4,0.6,0.4,3,3,2,3,2,2
+L001,Problemlösungsfrage,****,****,0.8,0.6,4,4,3,0.6,0.4,3,3,2,4,3,3
+L002,Problemlösungsfrage,****,****,0.6,0.6,3,4,3,0.4,0.4,2,2,2,3,2,2
+L003,Problemlösungsfrage,****,****,0.8,0.6,4,4,3,0.6,0.4,3,3,2,4,3,3
+L004,Problemlösungsfrage,****,****,0.6,0.6,3,3,3,0.4,0.4,2,2,2,3,2,2
+L005,Problemlösungsfrage,****,****,0.8,0.6,4,4,3,0.6,0.4,3,3,2,4,3,3
@@ -0,0 +1,34 @@
+ace_tools==0.0
+asttokens==3.0.0
+colorama==0.4.6
+comm==0.2.2
+debugpy==1.8.12
+decorator==5.2.1
+executing==2.2.0
+ipykernel==6.29.5
+ipython==9.0.0
+ipython_pygments_lexers==1.1.1
+jedi==0.19.2
+jupyter_client==8.6.3
+jupyter_core==5.7.2
+matplotlib-inline==0.1.7
+nest-asyncio==1.6.0
+numpy==2.2.3
+packaging==24.2
+pandas==2.2.3
+parso==0.8.4
+platformdirs==4.3.6
+prompt_toolkit==3.0.50
+psutil==7.0.0
+pure_eval==0.2.3
+Pygments==2.19.1
+python-dateutil==2.9.0.post0
+pytz==2025.1
+pywin32==308; sys_platform == "win32"
+pyzmq==26.2.1
+six==1.17.0
+stack-data==0.6.3
+tornado==6.4.2
+traitlets==5.14.3
+tzdata==2025.1
+wcwidth==0.2.13