Spaces:
Sleeping
Sleeping
# MIT License | |
# | |
# Copyright (c) 2024 dataforgood | |
# | |
# Permission is hereby granted, free of charge, to any person obtaining a copy | |
# of this software and associated documentation files (the "Software"), to deal | |
# in the Software without restriction, including without limitation the rights | |
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | |
# copies of the Software, and to permit persons to whom the Software is | |
# furnished to do so, subject to the following conditions: | |
# | |
# The above copyright notice and this permission notice shall be included in all | |
# copies or substantial portions of the Software. | |
# | |
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | |
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | |
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | |
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | |
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | |
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE | |
# SOFTWARE. | |
# Standard imports
import logging
import pickle
import sys
from pathlib import Path
from typing import Any

# Third-party imports
import yaml
from dotenv import load_dotenv

# Local imports
from country_by_country import processor
# Expected length of sys.argv when run as a script: the program name plus the
# two positional arguments shown in the usage message (config file, PDF report).
NUM_CLI_ARGS = 3
def process_report(config: dict, pdf_filepath: str) -> Any:
    """Process a single PDF report with a processor built from ``config``.

    Environment variables are first loaded from a ``.env`` file, then a
    ``processor.ReportProcessor`` is instantiated with ``config`` and its
    ``process`` method is applied to ``pdf_filepath``.

    Args:
        config: Configuration passed unchanged to ``processor.ReportProcessor``.
        pdf_filepath: Path of the PDF report, passed unchanged to
            ``ReportProcessor.process``.

    Returns:
        Whatever ``ReportProcessor.process`` returns. The script entry point
        of this module pickles that value as the "assets" of the report.
    """
    # Loading API keys from .env file
    load_dotenv()
    proc = processor.ReportProcessor(config)
    return proc.process(pdf_filepath)
if __name__ == "__main__":
    # Script entry point: load a YAML configuration, process one PDF report
    # and pickle the result to "assets.pkl" in the current working directory.
    logging.basicConfig(stream=sys.stdout, level=logging.INFO, format="%(message)s")

    # sys.argv must hold the program name plus exactly two arguments.
    if len(sys.argv) != NUM_CLI_ARGS:
        logging.error("Usage : python -m country_by_country config.yaml report.pdf")
        sys.exit(-1)

    config_path, pdf_path = sys.argv[1], sys.argv[2]

    # Lazy %-style arguments: the message is only formatted if it is emitted.
    logging.info("\nLoading %s", config_path)

    # Decode the config as UTF-8 explicitly; the platform default encoding
    # would mis-read non-ASCII characters on some systems.
    with Path(config_path).open(encoding="utf-8") as fh:
        config = yaml.safe_load(fh)

    assets = process_report(config, pdf_path)

    # Save all the assets to disk
    with Path("assets.pkl").open("wb") as fh:
        pickle.dump(assets, fh)
    logging.info(
        "Assets dumped in assets.pkl. You can read them using : \n"
        "pickle.load(open('assets.pkl', 'rb'))",
    )