update with ChatGPT (Code Interpreter)
This commit is contained in:
parent
31530815ed
commit
15faed98a8
49
README.md
49
README.md
@ -1,6 +1,7 @@
|
|||||||
|
|
||||||
# Personal Finance Database
|
# Personal Finance Database
|
||||||
|
|
||||||
This project aims to manage personal finance data using a Google Sheets based database. It provides tools to import data from PDF statements, perform basic personal financial analysis, and visualize the data.
|
This project aims to manage personal finance data using a Google Sheets-based database. It provides tools to import data from PDF statements, perform basic personal financial analysis, and visualize the data.
|
||||||
|
|
||||||
## Features
|
## Features
|
||||||
|
|
||||||
@ -9,6 +10,44 @@ This project aims to manage personal finance data using a Google Sheets based da
|
|||||||
- **Data Analysis:** Conduct basic personal financial analysis.
|
- **Data Analysis:** Conduct basic personal financial analysis.
|
||||||
- **Data Visualization:** Create simple and understandable visualizations of financial data.
|
- **Data Visualization:** Create simple and understandable visualizations of financial data.
|
||||||
|
|
||||||
|
## Project Structure
|
||||||
|
|
||||||
|
```
|
||||||
|
personal-finance-database/
|
||||||
|
├── .git
|
||||||
|
├── data/
|
||||||
|
│ ├── raw/
|
||||||
|
│ │ ├── your_file.pdf
|
||||||
|
│ ├── processed/
|
||||||
|
│ └── external/
|
||||||
|
├── src/
|
||||||
|
│ ├── __init__.py
|
||||||
|
│ ├── data_ingestion/
|
||||||
|
│ │ ├── __init__.py
|
||||||
|
│ │ ├── google_sheets_api.py
|
||||||
|
│ │ └── pdf_parser.py
|
||||||
|
│ ├── data_processing/
|
||||||
|
│ │ ├── __init__.py
|
||||||
|
│ │ └── data_cleaner.py
|
||||||
|
│ └── analysis_visualization/
|
||||||
|
│ ├── __init__.py
|
||||||
|
│ ├── financial_analysis.py
|
||||||
|
│ └── data_visualization.py
|
||||||
|
├── tests/
|
||||||
|
│ ├── __init__.py
|
||||||
|
│ ├── test_data_ingestion.py
|
||||||
|
│ ├── test_data_processing.py
|
||||||
|
│ └── test_analysis_visualization.py
|
||||||
|
├── notebooks/
|
||||||
|
│ ├── notebook1.ipynb
|
||||||
|
│ ├── notebook2.ipynb
|
||||||
|
│ └── ...
|
||||||
|
├── docs/
|
||||||
|
├── .gitignore
|
||||||
|
├── README.md
|
||||||
|
└── requirements.txt
|
||||||
|
```
|
||||||
|
|
||||||
## Installation
|
## Installation
|
||||||
|
|
||||||
Clone this repository to your local machine.
|
Clone this repository to your local machine.
|
||||||
@ -27,15 +66,19 @@ Install the necessary packages.
|
|||||||
pip install -r requirements.txt
|
pip install -r requirements.txt
|
||||||
```
|
```
|
||||||
## Usage
|
## Usage
|
||||||
[Provide instructions on how to use the project. This should include code examples and explanations of the different components.]
|
|
||||||
|
Details on how to use the project will be updated as the project progresses.
|
||||||
|
|
||||||
## Contributing
|
## Contributing
|
||||||
|
|
||||||
Pull requests are welcome. For major changes, please open an issue first to discuss what you would like to change.
|
Pull requests are welcome. For major changes, please open an issue first to discuss what you would like to change.
|
||||||
|
|
||||||
## License
|
## License
|
||||||
|
|
||||||
[Choose an open source license and mention it here.]
|
[Choose an open source license and mention it here.]
|
||||||
|
|
||||||
## Contact
|
## Contact
|
||||||
|
|
||||||
[Your Name] - [Your Email] - [Your LinkedIn/GitHub/Twitter etc.]
|
[Your Name] - [Your Email] - [Your LinkedIn/GitHub/Twitter etc.]
|
||||||
|
|
||||||
Remember to replace the placeholders with your actual details. You should also include a more detailed explanation in the "Usage" section once you have more functionality built out.
|
Remember to replace the placeholders with your actual details.
|
||||||
|
1522
notebooks/pdf_data_extraction_test.ipynb
Normal file
1522
notebooks/pdf_data_extraction_test.ipynb
Normal file
File diff suppressed because it is too large
Load Diff
@ -1,14 +1,35 @@
|
|||||||
from pdfminer.high_level import extract_text
|
from pdfminer.high_level import extract_text
|
||||||
import tabula
|
import tabula
|
||||||
|
|
||||||
class PdfParser:
|
class StatementParser:
|
||||||
def __init__(self, file_path):
|
def __init__(self, file_path: str):
|
||||||
self.file_path = file_path
|
self.file_path = file_path
|
||||||
|
|
||||||
def extract_text(self):
|
def extract_text(self):
|
||||||
text = extract_text(self.file_path)
|
# Code to extract text from PDF
|
||||||
return text
|
pass
|
||||||
|
|
||||||
def extract_table(self):
|
def extract_transactions(self):
|
||||||
tables = tabula.read_pdf(self.file_path, pages='all')
|
# This method should be implemented by each subclass
|
||||||
return tables
|
raise NotImplementedError
|
||||||
|
|
||||||
|
|
||||||
|
class DBSCreditCardStatementParser(StatementParser):
|
||||||
|
def extract_transactions(self):
|
||||||
|
# Code specific to DBS Credit Card statements
|
||||||
|
pass
|
||||||
|
|
||||||
|
|
||||||
|
class BankSavingAccountStatementParser(StatementParser):
|
||||||
|
def extract_transactions(self):
|
||||||
|
# Code specific to Bank Saving Account statements
|
||||||
|
pass
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
class FundAccountStatementParser(StatementParser):
|
||||||
|
def extract_transactions(self):
|
||||||
|
# Code specific to Fund Account statements
|
||||||
|
pass
|
||||||
|
Loading…
Reference in New Issue
Block a user