=================================================================== RCS file: /cvs/pta/pta_import.pl,v retrieving revision 1.2 retrieving revision 1.11 diff -u -p -r1.2 -r1.11 --- pta/pta_import.pl 2020/11/01 20:12:08 1.2 +++ pta/pta_import.pl 2020/11/17 14:13:31 1.11 @@ -16,81 +16,183 @@ use warnings; use strict; -use autodie; -# Please change the account numbers below to match the -# desired accounts in your accounts.txt. +use Getopt::Std qw(getopts); -my %accounts = ( - CHASE_CREDIT_CARD => '1234', - CHASE_PAYMENT_ACCOUNT => '5678', - AUTO => '1111', - BILLS => '2222', - FEES => '3333', - FOOD => '4444', - GAS => '5555', - GIFTS => '6666', - GROCERIES => '7777', - HEALTH => '8888', - HOME => '9999', - PERSONAL => '9998', - PRO => '9997', - SHOP => '9996' -); +our ($opt_I); -# This is the end of the user-configurable section. - # === SUBROUTINES ===================================================== -sub import_chase_credit_card() { - my %categories = ( - 'Automotive' => 'AUTO', - 'Bills & Utilities' => 'BILLS', - 'Fees & Adjustments' => 'FEES', - 'Food & Drink' => 'FOOD', - 'Gas' => 'GAS', - 'Gifts & Donations' => 'GIFTS', - 'Groceries' => 'GROCERIES', - 'Health & Wellness' => 'HEALTH', - 'Home' => 'HOME', - 'Personal' => 'PERSONAL', - 'Professional Services' => 'PRO', - 'Shopping' => 'SHOP' - ); +sub import_account ($$$$$) { + my ($account_name, $accounts_ref, $bookings_ref, + $compiled_ref, $csv_account) = @_; + my ($account, $amount, $booking, $credit, $date, $debit, + $description); + chomp(my $header = <>); while (<>) { + next if (/^$/); chomp; - my ($trans_date, $post_date, $description, $category, - $type, $amount) = split /,/; - - $trans_date =~ s#(\d+)/(\d+)/(\d+)#$3$1$2#; - $post_date =~ s#(\d+)/(\d+)/(\d+)#$3$1$2#; - $description =~ s/#//g; - my $booking = $categories{$category} || - 'CHASE_PAYMENT_ACCOUNT'; - my $contra = $accounts{$booking}; - my ($debit, $credit); - if ($amount <= 0) { - $amount = substr $amount, 1; - $credit = $accounts{CHASE_CREDIT_CARD}; - $debit = $contra; + my $line = $_; + foreach my $regex (@$compiled_ref) { + if ($line =~ /$regex/) { + $account = %$accounts_ref{$regex}; + $booking = %$bookings_ref{$regex}; + last; + } + } + if ($account_name eq "chase_credit") { + ($date, $amount, $debit, $credit, + $description) = + import_chase_credit($account, + $csv_account, $line); + } elsif ($account_name eq "capital_one_credit") { + ($date, $amount, $debit, $credit, + $description) = + import_capital_one_credit($account, + $csv_account, $line); + } elsif ($account_name eq "optum_hsa") { + ($date, $amount, $debit, $credit, + $description) = + import_optum_hsa($account, + $csv_account, $line); + } elsif ($account_name eq "sparkasse_camt") { + ($date, $amount, $debit, $credit, + $description) = + import_sparkasse_camt($account, + $csv_account, $line); } else { - $debit = $accounts{CHASE_CREDIT_CARD}; - $credit = $contra; + die "undefined format: $account_name"; } - print "$post_date $booking $debit $credit $amount " . + unless ($date && $booking && $debit && $credit && + $amount && $description) { + die "import parse error: $line"; + } + $description =~ s/#//g; + print "$date $booking $debit $credit $amount " . "$description\n"; } } -# === MAIN PROGRAM ===================================================== +sub import_chase_credit ($$$) { + my ($account, $csv_account, $line) = @_; + my ($trans_date, $post_date, $description, $category, + $type, $amount) = split /,/, $line; + my ($debit, $credit); + $post_date =~ s#(\d+)/(\d+)/(\d+)#$3$1$2#; + ($amount, $debit, $credit) = + get_accounts_by_amount_sign($amount, $account, + $csv_account); + return ($post_date, $amount, $debit, $credit, $description); +} -my $chase_credit_card_header = "Transaction Date,Post Date," . - "Description,Category,Type,Amount"; -my $firstLine; +sub import_capital_one_credit ($$$) { + my ($account, $csv_account, $line) = @_; + my ($trans_date, $post_date, $card_num, + $description, $category, $csv_debit, + $csv_credit) = split /,/, $line; + $post_date =~ s/(\d+)-(\d+)-(\d+)/$1$2$3/; + my ($amount, $debit, $credit) = + get_accounts_by_csv_col($account, $csv_account, + $csv_debit, $csv_credit); + return ($post_date, $amount, $debit, $credit, $description); +} -chomp($firstLine = <>); -if ($firstLine eq $chase_credit_card_header) { - import_chase_credit_card; +sub import_optum_hsa ($$$) { + my ($account, $csv_account, $line) = @_; + my ($date, $description, $amount, + $type) = split /,/, $line; + my ($debit, $credit); + $date =~ s/(\d+)-(\d+)-(\d+)/$1$2$3/; + $amount =~ s/\$//; + ($amount, $debit, $credit) = + get_accounts_by_amount_sign($amount, $account, + $csv_account); + return ($date, $amount, $debit, $credit, $description); +} + +sub import_sparkasse_camt ($$$) { + my ($account, $csv_account, $line) = @_; + my @fields; + $_ = $line; + push @fields, $1 while s/"([^"]*)";?//; + $_ eq "" or die "CAMT parse error before $_ in $line"; + @fields == 17 or die "not 17 but @fields fields: $line"; + $fields[1] =~ s/^(\d\d)\.(\d\d)\.(\d\d)$/20$3$2$1/ + or die "date parse error: $line"; + $fields[14] =~ s/,/./; + return $fields[1], + get_accounts_by_amount_sign($fields[14], $account, $csv_account), + (join ' ', $fields[11], $fields[4]); +} + +sub get_accounts_by_amount_sign ($$$) { + my ($amount, $account, $csv_account) = @_; + my ($debit, $credit); + if ($amount <= 0) { + $amount = substr $amount, 1; + $credit = $csv_account; + $debit = $account; + } else { + $debit = $csv_account; + $credit = $account; + } + return ($amount, $debit, $credit); +} + +sub get_accounts_by_csv_col ($$$$) { + my ($account, $csv_account, $csv_debit, $csv_credit) = @_; + my ($amount, $debit, $credit); + if ($csv_debit eq "") { + $amount = $csv_credit; + $credit = $account; + $debit = $csv_account; + } else { + $amount = $csv_debit; + $credit = $csv_account; + $debit = $account; + } + return ($amount, $debit, $credit); +} + +sub usage () { + printf STDERR "usage: %s -I accountname csvfilename\n", $0; + exit 1; +} + +# === MAIN PROGRAM ===================================================== + +my ($csv_account, $fn, $in, $account_name, %accounts, %bookings, @compiled); +getopts 'I:' or usage; +if ($opt_I) { + $account_name = $opt_I; + $fn = "import_" . $account_name . ".txt"; + open $in, $fn or die "$fn: $!"; } else { - print "Undefined bank header\n"; + usage; } +while (<$in>) { + chomp; + next if /^(?:#|$)/; + my $line = $_; + if (/^ACCOUNT\s+(\d+)$/) { + $csv_account and die "duplicate ACCOUNT line: $1"; + $csv_account = $1; + next; + } + /^(.*)[,;]\s+(\d+)\s+(\S+)$/ or + die "$fn import parse error: $line"; + my ($reg, $account, $booking) = ($1, $2, $3); + if ($account_name eq 'sparkasse_camt') { + $reg =~ s/(?:^|(?<=;))(?:$|(?=;))/"[^"]*"/g; + } else { + $reg =~ s/(?:^|(?<=,))(?:$|(?=,))/[^,]*/g; + } + $reg = qr/$reg/; + push @compiled, $reg; + $bookings{$reg} = $booking; + $accounts{$reg} = $account; +} +close $in; +$csv_account or die "no ACCOUNT line in $fn"; +import_account($account_name, \%accounts, \%bookings, + \@compiled, $csv_account);