File size: 3,752 Bytes
5e692ef
 
f57bf28
5e692ef
f57bf28
20905da
f57bf28
 
5e692ef
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
ed7fe7c
f57bf28
 
 
 
 
 
 
 
 
 
 
 
 
5e692ef
f57bf28
 
c9b35f3
f57bf28
 
5e692ef
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
from sepa import parser
import re
import pandas as pd
import gradio as gr
import numpy as np

def full_function(xml_file):
    """Flatten the entries of a bank-to-customer statement XML into a table.

    The file is parsed with ``sepa.parser`` and every entry of every
    statement becomes one row holding the account details, amount, dates,
    bank transaction codes and the debtor/reference data of the first
    transaction detail of that entry.

    Args:
        xml_file: Path to the XML file, or a file-like object exposing the
            path as ``.name`` (such as an uploaded temp-file wrapper).

    Returns:
        A ``pandas.DataFrame`` with one row per statement entry. The frames
        of the individual statements are concatenated as-is, so row labels
        restart at 0 for each statement. When no statement contains any
        entries, an empty frame with the same columns is returned.
    """

    # Output columns, in the order they appear in the returned frame.
    columns = [
        'reference', 'credit_debit_indicator', 'status',
        'account_servicer_reference', 'iban', 'name', 'currency', 'amount',
        'value_date', 'booking_date', 'proprietary_code',
        'proprietary_issuer', 'domain_code', 'family_code',
        'sub_family_code', 'debtor_name', 'debtor_iban', 'end_to_end_id',
    ]

    def strip_namespace(xml):
        """Drop the first default ``xmlns="..."`` declaration from the XML."""
        return re.sub(r' xmlns="[^"]+"', '', xml, count=1)

    def column(frame, name):
        """Return ``frame[name]``, or an all-None column if it is absent.

        ``DataFrame.from_records`` only creates columns for keys that occur
        in at least one record, so a key missing from every entry would
        otherwise raise ``KeyError``.
        """
        if name in frame.columns:
            return frame[name]
        return pd.Series([None] * len(frame), index=frame.index, dtype=object)

    def nested(series, *path):
        """Walk ``path`` (dict keys / list positions) through each element."""
        for key in path:
            # ``.str[key]`` does an element-wise lookup on dicts and lists
            # and yields a missing value where the key or position is absent.
            series = series.str[key]
        return series

    def iso_date(series):
        """Format date-like values as ``YYYY-MM-DD`` strings."""
        return pd.to_datetime(series).dt.strftime('%Y-%m-%d')

    # Accept either a plain path or an object that carries the path in
    # ``.name``; path-like objects are passed to ``open`` unchanged.
    path = xml_file
    if not isinstance(path, str) and not hasattr(path, '__fspath__'):
        path = getattr(path, 'name', path)

    # Read explicitly as UTF-8: the text is re-encoded as UTF-8 below, so
    # decoding with a platform-dependent default could corrupt characters.
    with open(path, 'r', encoding='utf-8') as f:
        input_data = f.read()

    # Parse the bank statement XML to dictionary
    camt_dict = parser.parse_string(
        parser.bank_to_customer_statement,
        bytes(strip_namespace(input_data), 'utf8'),
    )

    all_entries = []
    for statement in camt_dict['statements']:
        # Skip statements that carry no entries at all.
        if 'entries' not in statement or not statement['entries']:
            continue

        dd = pd.DataFrame.from_records(statement['entries'])

        amount = column(dd, 'amount')
        code = column(dd, 'bank_transaction_code')
        # Only the first transaction detail of the first entry-detail group
        # is used for the debtor and reference columns.
        tx = nested(column(dd, 'entry_details'), 0, 'transaction_details', 0)

        df = pd.DataFrame(
            {
                'reference': column(dd, 'reference'),
                'credit_debit_indicator': column(dd, 'credit_debit_indicator'),
                'status': column(dd, 'status'),
                # Taken from the transaction refs (the value that ends up
                # in this column); kept in its established position.
                'account_servicer_reference': nested(
                    tx, 'refs', 'account_servicer_reference'),
                'iban': statement['account']['id']['iban'],
                'name': statement['account']['name'],
                'currency': nested(amount, 'currency'),
                'amount': nested(amount, '_value'),
                'value_date': iso_date(
                    nested(column(dd, 'value_date'), 'date')),
                'booking_date': iso_date(
                    nested(column(dd, 'booking_date'), 'date')),
                # bank transaction code
                'proprietary_code': nested(code, 'proprietary', 'code'),
                'proprietary_issuer': nested(code, 'proprietary', 'issuer'),
                'domain_code': nested(code, 'domain', 'code'),
                'family_code': nested(code, 'domain', 'family', 'code'),
                'sub_family_code': nested(
                    code, 'domain', 'family', 'sub_family_code'),
                # transaction details
                'debtor_name': nested(
                    tx, 'related_parties', 'debtor', 'name'),
                'debtor_iban': nested(
                    tx, 'related_parties', 'debtor_account', 'id', 'iban'),
                'end_to_end_id': nested(tx, 'refs', 'end_to_end_id'),
            },
            index=dd.index,
            columns=columns,
        )
        all_entries.append(df)

    # ``pd.concat`` raises ValueError on an empty list, so hand back an
    # empty table with the expected columns instead.
    if not all_entries:
        return pd.DataFrame(columns=columns)

    return pd.concat(all_entries)





# Text passed as the `title` of the Gradio interface created at the bottom.
# NOTE(review): the text mentions converting to a .csv file, but nothing in
# this script writes a CSV -- the result is only returned as a DataFrame.
desc = "Upload XML file, convert to .csv file, and analyze transactions"

# The UI components are instantiated inside a `gr.Blocks` context bound to
# `demo`. NOTE(review): `demo` itself is never launched in this file; only
# the `gr.Interface` below is. Confirm whether the Blocks wrapper is needed.
with gr.Blocks() as demo: 

    # Upload widget; used as the input of the interface below.
    xml_file = gr.File(label = "Upload XML file here")
     
    # Commented-out inputs that are not used by this script.
    # input_employees = gr.CheckboxGroup(["Transfer Solutions", "Ordina", "PwC", "Quistor", "Full Orbit", "Accenture", "Atos", "AMIS"], label="Oracle Partners", info="Who to judge?")
    # input_question = gr.Text(label="What activity is the Oracle Partner performing?")
    # additional_info = gr.Text(label="Additional information (optional)")
    # NOTE(review): `output_text` is not referenced anywhere else in this file.
    output_text = gr.Text(label="R")
    # Table component; used as the output of the interface below.
    df_entries = gr.DataFrame(label="Output table")


    # NOTE(review): no click handler is attached to this button in this file.
    submit_btn = gr.Button("Run analysis on XML file")


# Wire `full_function` to the upload input and the table output, then start
# the app. This runs at import time (there is no `__main__` guard), and
# `share=True` is passed to `launch()` (per the Gradio docs this requests a
# public share link).
gr.Interface(fn=full_function, inputs=xml_file, outputs=df_entries, title=desc).launch(share=True)