Import CSV files via HTTP importer
Since I ultimately want to run `xactfetch` in Kubernetes, running the
importer in a container as a child process doesn't make much sense.
While running `podman` in a Kubernetes container is possible, getting it
to work is non-trivial. Rather than go through all that effort, I think
it makes more sense to just use HTTP to communicate with the importer I
already have running.
I had originally chosen not to use the web importer because of how I
have it configured to use Authelia for authentication. The importer
itself does not have any authentication beyond the "secret" parameter
(which is not secret at all, given that it is passed in the query string
and thus visible to anyone and stored in access logs), so I was hesitant
to add an access control rule to bypass authentication for the
`/autoupload` path. Fortunately, I discovered that Authelia will use
the value of the `Proxy-Authorization` header to authenticate the
request without redirecting to the login screen. With just a couple of
lines in the Ingress configuration, I got it to work using the regular
`Authorization` header as well:
```yaml
kind: Ingress
metadata:
  annotations:
    nginx.ingress.kubernetes.io/auth-snippet: |
      proxy_set_header Proxy-Authorization $http_authorization;
      proxy_set_header X-Forwarded-Method $request_method;
    nginx.ingress.kubernetes.io/configuration-snippet: |
      proxy_set_header Authorization "";
```
This commit is contained in:
129
xactfetch.py
129
xactfetch.py
@@ -1,14 +1,12 @@
|
||||
import base64
|
||||
import copy
|
||||
import datetime
|
||||
import getpass
|
||||
import json
|
||||
import logging
|
||||
import os
|
||||
import random
|
||||
import shlex
|
||||
import shutil
|
||||
import subprocess
|
||||
import tempfile
|
||||
import urllib.parse
|
||||
from pathlib import Path
|
||||
from types import TracebackType
|
||||
@@ -25,6 +23,7 @@ log = logging.getLogger('xactfetch')
|
||||
NTFY_URL = 'https://ntfy.pyrocufflink.net'
|
||||
NTFY_TOPIC = 'dustin'
|
||||
FIREFLY_III_URL = 'https://firefly.pyrocufflink.blue'
|
||||
FIREFLY_III_IMPORTER_URL = 'https://dustin.import.firefly.pyrocufflink.blue'
|
||||
ACCOUNTS = {
|
||||
'commerce': {
|
||||
'8357': 1,
|
||||
@@ -34,6 +33,42 @@ ACCOUNTS = {
|
||||
}
|
||||
|
||||
|
||||
class FireflyImporter:
    """Client for uploading CSV files to a Firefly III importer over HTTP.

    Each upload is a POST to the ``/autoupload`` path beneath the
    configured base URL.
    """

    def __init__(
        self,
        url: str,
        secret: str,
        auth: Optional[tuple[str, str]],
    ) -> None:
        """Remember the connection settings used by :meth:`import_csv`.

        :param url: Base URL of the importer; a trailing slash is tolerated.
        :param secret: Value sent as the ``secret`` query parameter.
        :param auth: Value handed to ``requests`` as its ``auth`` argument,
            or ``None`` to send no credentials.
        """
        self.url = url
        self.secret = secret
        self.auth = auth

    def import_csv(
        self,
        csv: Path,
        config: dict[str, Any],
    ) -> None:
        """Upload one CSV file together with its import configuration.

        :param csv: Path of the CSV file to upload.
        :param config: Import configuration; serialized to JSON and sent
            as the ``json`` form file.
        :raises requests.HTTPError: If the importer answers with an HTTP
            error status.
        """
        log.debug('Importing transactions from %s to Firefly III', csv)
        endpoint = self.url.rstrip('/') + '/autoupload'
        request_headers = {'Accept': 'application/json'}
        query = {'secret': self.secret}
        with csv.open('rb') as stream:
            # The CSV is streamed from disk; the config is sent inline.
            parts = {
                'importable': ('import.csv', stream),
                'json': ('import.json', json.dumps(config)),
            }
            response = requests.post(
                endpoint,
                auth=self.auth,
                headers=request_headers,
                params=query,
                files=parts,
            )
            response.raise_for_status()
|
||||
|
||||
|
||||
def ntfy(
|
||||
message: Optional[str] = None,
|
||||
topic: str = NTFY_TOPIC,
|
||||
@@ -132,48 +167,11 @@ def rfc2047_base64encode(
|
||||
return f"=?UTF-8?B?{encoded}?="
|
||||
|
||||
|
||||
def firefly_import(csv: Path, config: dict[str, Any], token: str) -> None:
    """Import a CSV file into Firefly III by running the importer container.

    The CSV and its JSON configuration are copied into a temporary
    directory, which is mounted read-only at ``/import`` inside a
    ``docker.io/fireflyiii/data-importer`` container started with
    ``podman``.  The outcome is only logged; no exception is raised when
    the container exits with a non-zero status.

    :param csv: Path of the CSV file to import.
    :param config: Import configuration, written next to the CSV as
        ``import.json``.
    :param token: Firefly III access token, passed to the container via
        the ``FIREFLY_III_ACCESS_TOKEN`` environment variable.
    """
    log.debug('Importing transactions from %s to Firefly III', csv)
    # Minimal environment for the child process; ``--env-host`` below
    # forwards it into the container.
    env = {
        'PATH': os.environ['PATH'],
        'FIREFLY_III_ACCESS_TOKEN': token,
        'IMPORT_DIR_ALLOWLIST': '/import',
        'FIREFLY_III_URL': FIREFLY_III_URL,
        'WEB_SERVER': 'false',
    }
    with tempfile.TemporaryDirectory() as tmpdir:
        dest = Path(tmpdir) / 'import.csv'
        log.debug('Copying %s to %s', csv, dest)
        shutil.copyfile(csv, dest)
        configfile = dest.with_suffix('.json')
        log.debug('Saving config as %s', configfile)
        with configfile.open('w', encoding='utf-8') as f:
            json.dump(config, f)
        cmd = [
            'podman',
            'run',
            '--rm',
            '-it',
            '-v',
            f'{tmpdir}:/import:ro,z',
            '--env-host',
            'docker.io/fireflyiii/data-importer',
        ]
        if log.isEnabledFor(logging.DEBUG):
            log.debug(
                'Running command: %s',
                ' '.join(shlex.quote(str(a)) for a in cmd),
            )
        if os.environ.get('DEBUG_SKIP_IMPORT'):
            # Debug aid: run a no-op command instead of the real import.
            cmd = ['true']
        # Must run while the temporary directory still exists, since the
        # container mounts it.
        p = subprocess.run(cmd, env=env, check=False)
        if p.returncode == 0:
            log.info(
                'Successfully imported transactions from %s to Firefly III',
                csv,
            )
        else:
            # Pass the path so the message does not contain a literal '%s'.
            log.error('Failed to import transactions from %s', csv)
|
||||
def secret_from_file(env: str, default: str) -> str:
    """Read a secret value from a file and strip trailing whitespace.

    :param env: Name of the environment variable holding the file path.
    :param default: Path to use when that variable is not set.
    :returns: The file's contents, decoded as UTF-8, with trailing
        whitespace removed.
    """
    path = os.environ.get(env, default)
    log.debug('Loading secret value from %s', path)
    with open(path, 'r', encoding='utf-8') as handle:
        contents = handle.read()
    return contents.rstrip()
|
||||
|
||||
|
||||
def get_last_transaction_date(key: int, token: str) -> datetime.date:
|
||||
@@ -204,7 +202,9 @@ def get_last_transaction_date(key: int, token: str) -> datetime.date:
|
||||
return last_date.date() + datetime.timedelta(days=1)
|
||||
|
||||
|
||||
def download_chase(page: Page, end_date: datetime.date, token: str) -> bool:
|
||||
def download_chase(
|
||||
page: Page, end_date: datetime.date, token: str, importer: FireflyImporter
|
||||
) -> bool:
|
||||
with Chase(page) as c, ntfyerror('Chase', page) as r:
|
||||
c.login()
|
||||
key = ACCOUNTS['chase']
|
||||
@@ -224,11 +224,16 @@ def download_chase(page: Page, end_date: datetime.date, token: str) -> bool:
|
||||
return True
|
||||
csv = c.download_transactions(start_date, end_date)
|
||||
log.info('Importing transactions from Chase into Firefly III')
|
||||
c.firefly_import(csv, key, token)
|
||||
c.firefly_import(csv, key, importer)
|
||||
return r.success
|
||||
|
||||
|
||||
def download_commerce(page: Page, end_date: datetime.date, token: str) -> bool:
|
||||
def download_commerce(
|
||||
page: Page,
|
||||
end_date: datetime.date,
|
||||
token: str,
|
||||
importer: FireflyImporter,
|
||||
) -> bool:
|
||||
log.info('Downloading transaction lists from Commerce Bank')
|
||||
csvs = []
|
||||
with CommerceBank(page) as c, ntfyerror('Commerce Bank', page) as r:
|
||||
@@ -259,7 +264,7 @@ def download_commerce(page: Page, end_date: datetime.date, token: str) -> bool:
|
||||
csvs.append((key, c.download_transactions(start_date, end_date)))
|
||||
log.info('Importing transactions from Commerce Bank into Firefly III')
|
||||
for key, csv in csvs:
|
||||
c.firefly_import(csv, key, token)
|
||||
c.firefly_import(csv, key, importer)
|
||||
return r.success
|
||||
|
||||
|
||||
@@ -451,10 +456,12 @@ class CommerceBank:
|
||||
modal.get_by_label('Close').click()
|
||||
return path
|
||||
|
||||
def firefly_import(self, csv: Path, account: int, token: str) -> None:
|
||||
def firefly_import(
|
||||
self, csv: Path, account: int, importer: FireflyImporter
|
||||
) -> None:
|
||||
config = copy.deepcopy(self.IMPORT_CONFIG)
|
||||
config['default_account'] = account
|
||||
firefly_import(csv, config, token)
|
||||
importer.import_csv(csv, config)
|
||||
|
||||
|
||||
class Chase:
|
||||
@@ -635,7 +642,9 @@ class Chase:
|
||||
self.page.get_by_role('button', name='Sign out').click()
|
||||
log.info('Logged out of Chase')
|
||||
|
||||
def firefly_import(self, csv: Path, account: int, token: str) -> None:
|
||||
def firefly_import(
|
||||
self, csv: Path, account: int, importer: FireflyImporter
|
||||
) -> None:
|
||||
config = copy.deepcopy(self.IMPORT_CONFIG)
|
||||
config['default_account'] = account
|
||||
with csv.open('r', encoding='utf-8') as f:
|
||||
@@ -648,7 +657,7 @@ class Chase:
|
||||
config['do_mapping'].pop(0)
|
||||
else:
|
||||
raise ValueError(f'Unexpected CSV schema: {headers}')
|
||||
firefly_import(csv, config, token)
|
||||
importer.import_csv(csv, config)
|
||||
|
||||
|
||||
def main() -> None:
|
||||
@@ -660,15 +669,25 @@ def main() -> None:
|
||||
)
|
||||
log.debug('Getting Firefly III access token from rbw vault')
|
||||
token = rbw_get('xactfetch')
|
||||
import_secret = secret_from_file(
|
||||
'FIREFLY_IMPORT_SECRET_FILE', 'import.secret'
|
||||
)
|
||||
import_auth = (
|
||||
os.environ.get('FIREFLY_IMPORT_USER', getpass.getuser()),
|
||||
secret_from_file('FIREFLY_IMPORT_PASSWORD_FILE', 'import.password'),
|
||||
)
|
||||
importer = FireflyImporter(
|
||||
FIREFLY_III_IMPORTER_URL, import_secret, import_auth
|
||||
)
|
||||
end_date = datetime.date.today() - datetime.timedelta(days=1)
|
||||
with sync_playwright() as pw:
|
||||
headless = os.environ.get('DEBUG_HEADLESS_BROWSER', '1') == '1'
|
||||
browser = pw.firefox.launch(headless=headless)
|
||||
page = browser.new_page()
|
||||
failed = False
|
||||
if not download_commerce(page, end_date, token):
|
||||
if not download_commerce(page, end_date, token, importer):
|
||||
failed = True
|
||||
if not download_chase(page, end_date, token):
|
||||
if not download_chase(page, end_date, token, importer):
|
||||
failed = True
|
||||
raise SystemExit(1 if failed else 0)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user