Spaces:
Runtime error
Runtime error
Commit
·
b81234c
1
Parent(s):
9856745
Updated pathing for Wizards And Sorcery revised, migrated to poetry
Browse files
- README.md +1 -1
- app.py +2 -2
- poetry.lock +0 -0
- pyproject.toml +21 -0
README.md
CHANGED
|
@@ -9,7 +9,7 @@ app_file: app.py
|
|
| 9 |
pinned: false
|
| 10 |
---
|
| 11 |
|
| 12 |
-
# Retrieval Augmented Generation for
|
| 13 |
|
| 14 |
## Project Overview
|
| 15 |
|
|
|
|
| 9 |
pinned: false
|
| 10 |
---
|
| 11 |
|
| 12 |
+
# Retrieval Augmented Generation for Wizards & Wizardry Rule Sets
|
| 13 |
|
| 14 |
## Project Overview
|
| 15 |
|
app.py
CHANGED
|
@@ -19,7 +19,7 @@ def load_enhanced_json(file_path):
|
|
| 19 |
with open(file_path, 'r') as file:
|
| 20 |
return json.load(file)
|
| 21 |
|
| 22 |
-
enhanced_json_file = "
|
| 23 |
enhanced_data = load_enhanced_json(enhanced_json_file)
|
| 24 |
|
| 25 |
# Extract document summary and page summaries
|
|
@@ -27,7 +27,7 @@ document_summary = enhanced_data.get('document_summary', 'No document summary av
|
|
| 27 |
page_summaries = {int(page): data['summary'] for page, data in enhanced_data.get('pages', {}).items()}
|
| 28 |
|
| 29 |
# Import saved file and view
|
| 30 |
-
embeddings_df_save_path = "
|
| 31 |
print("Loading embeddings.csv")
|
| 32 |
text_chunks_and_embedding_df_load = pd.read_csv(embeddings_df_save_path)
|
| 33 |
print("Embedding file loaded")
|
|
|
|
| 19 |
with open(file_path, 'r') as file:
|
| 20 |
return json.load(file)
|
| 21 |
|
| 22 |
+
enhanced_json_file = "./output/SWCompleteRevisedPDF_enhanced_output.json"
|
| 23 |
enhanced_data = load_enhanced_json(enhanced_json_file)
|
| 24 |
|
| 25 |
# Extract document summary and page summaries
|
|
|
|
| 27 |
page_summaries = {int(page): data['summary'] for page, data in enhanced_data.get('pages', {}).items()}
|
| 28 |
|
| 29 |
# Import saved file and view
|
| 30 |
+
embeddings_df_save_path = "./output/SWCompleteRevisedPDF_output_embeddings.csv"
|
| 31 |
print("Loading embeddings.csv")
|
| 32 |
text_chunks_and_embedding_df_load = pd.read_csv(embeddings_df_save_path)
|
| 33 |
print("Embedding file loaded")
|
poetry.lock
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
pyproject.toml
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[tool.poetry]
|
| 2 |
+
name = "ruleslawyer"
|
| 3 |
+
version = "0.1.0"
|
| 4 |
+
description = "Ingest PDFs, process into a json, generate embeddings, and load into a chat interface for RAG."
|
| 5 |
+
authors = ["Alan Meigs <alan.meigs@gmail.com>"]
|
| 6 |
+
readme = "README.md"
|
| 7 |
+
|
| 8 |
+
[tool.poetry.dependencies]
|
| 9 |
+
python = "^3.10"
|
| 10 |
+
pandas = "^2.2.3"
|
| 11 |
+
numpy = "^2.1.2"
|
| 12 |
+
openai = "^1.53.0"
|
| 13 |
+
gradio = "^5.4.0"
|
| 14 |
+
sentence-transformers = "^3.2.1"
|
| 15 |
+
torch = "^2.5.1"
|
| 16 |
+
docling-core = "^2.3.1" # This may need to be updated to the correct version.
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
[build-system]
|
| 20 |
+
requires = ["poetry-core"]
|
| 21 |
+
build-backend = "poetry.core.masonry.api"
|