Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
42 commits
Select commit Hold shift + click to select a range
44f0134
add module to parse pdf to markdown
du-phan Jan 22, 2025
be2e189
add cli command for the pdf parsing
du-phan Jan 22, 2025
0465148
update dependencies
du-phan Jan 22, 2025
e6f3f92
add parsed documents
du-phan Jan 22, 2025
b18a956
add extractor using mistral
du-phan Jan 23, 2025
3a9f98c
update github action
du-phan Jan 23, 2025
7453bd4
add cli for extractor
du-phan Jan 23, 2025
65e07d8
add tool to populate supabase
du-phan Jan 24, 2025
0297b05
add functions to evaluate feedstock sustainability
du-phan Jan 25, 2025
857aba1
cleaner logging
du-phan Jan 25, 2025
f8efebf
check if file exists first before doing anything
du-phan Jan 25, 2025
4e8a474
add cli command to populate supabase with feedstock evaluation
du-phan Jan 26, 2025
1c320c9
updated data
du-phan Jan 26, 2025
7702e58
add function to parse the whole folder at once
du-phan Feb 3, 2025
a2470e4
add sequestrae due diligence criteria
du-phan Feb 3, 2025
69a9ba5
add cli command for due diligence analyzer
du-phan Feb 4, 2025
b3d8884
move from llama to gemini
du-phan Feb 7, 2025
9c96df4
Removed project_data directory from repository tracking
du-phan Feb 7, 2025
cdbd2d1
add hallucination detection prompt
du-phan Feb 10, 2025
c96ba5a
add function to validate and fix the json array
du-phan Feb 10, 2025
9014f9b
fix an error in the fix_hallucination_recursive function that leads t…
du-phan Feb 10, 2025
a97343b
update .gitignore
du-phan Feb 10, 2025
77795c1
fix minor error with the value to return in fix_hallucination_recursive
du-phan Feb 10, 2025
f18c6cc
add retry on error decorator
du-phan Feb 11, 2025
b6fcf24
add function to summarize subtopic insight
du-phan Feb 20, 2025
ada510c
misc update
du-phan Feb 20, 2025
2658b96
tell the llm to avoid redundancy
du-phan Feb 20, 2025
bb01c31
add a prompt to refine the subtopic summaries
du-phan Feb 21, 2025
d9cb550
add a prompt to refine the subtopic summaries
du-phan Feb 21, 2025
b6cf59e
add a prompt to resume topic
du-phan Feb 23, 2025
2aa81d3
add functions to populate the db
du-phan Feb 28, 2025
813cd7b
fix a small error in the field name
du-phan Mar 3, 2025
e462e4f
add new prompt to extract project overview data
du-phan Mar 11, 2025
21c4d6a
add new prompt to extract main insights
du-phan Mar 11, 2025
b30f8b7
add project_url
du-phan Mar 13, 2025
ca2f3ff
new function with the whole pipeline
du-phan Mar 21, 2025
4b53179
create folder if not exist
du-phan Mar 21, 2025
8934e7e
clean up a bit
du-phan Mar 21, 2025
b3fecf1
add checkpoint
du-phan Mar 21, 2025
fa8bc59
add retry_on_error
du-phan Mar 21, 2025
3c48197
add cli to run pipeline on root dir
du-phan Mar 21, 2025
48117ad
fix minor error with process count
du-phan Mar 21, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion .github/workflows/ci.yml
Original file line number Diff line number Diff line change
Expand Up @@ -52,7 +52,7 @@ jobs:

# Step 7: Upload Coverage Report as an Artifact (optional)
- name: Upload Coverage Report
uses: actions/upload-artifact@v3
uses: actions/upload-artifact@v4
with:
name: coverage-report
path: htmlcov/
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
project_data/
.python-version
.vscode/
.DS_Store
Expand Down
3,319 changes: 2,741 additions & 578 deletions poetry.lock

Large diffs are not rendered by default.

17 changes: 15 additions & 2 deletions pyproject.toml
Original file line number Diff line number Diff line change
@@ -1,21 +1,34 @@
[tool.poetry.scripts]
sequestrae = "sequestrae_engine.cli.main:main"

[tool.poetry]
name = "sequestrae-engine"
version = "0.1.0"
- description = "A Biochar Carbon Removal Assessment Engine for evaluating carbon sequestration potential."
+ description = "A Biochar Carbon Removal Assessment Engine for evaluating project risk."
authors = ["Du Phan <du-phan@users.noreply.github.com>"]
license = "MIT"
readme = "README.md"
homepage = "https://github.com/du-phan/sequestrae-engine"
repository = "https://github.com/du-phan/sequestrae-engine"
keywords = ["biochar", "carbon removal", "assessment", "engine", "sequestration"]
packages = [
{ include = "sequestrae_engine" }
]

[tool.poetry.dependencies]
python = ">=3.10,<4.0"
numpy = ">=1.24,<2.0"
pandas = "^2.0"
- pydantic = "^1.10.2"
+ pydantic = "^2.5.2"
jsonschema = "^4.16.0"
jupyterlab = "^4.0.5"
llama-index = "^0.12.16"
llama-parse = "^0.6"
python-dotenv = "^1.0.0"
openai = "^1.0.0"
mistralai = "^1.3"
google-genai = "^1.0.0"
supabase = "^2.10.0"

[tool.poetry.dev-dependencies]
black = "24.10.0"
Expand Down
Empty file.
Loading
Loading