In [2]:
!pip install numpy
!pip install pandas
In [2]:
import json
import numpy as np
import pandas
import datetime
from utils import pprint
from record import RecordEntry, MetaData, DataRecord
In [3]:
# Example: Record entry
# Build four sample RecordEntry objects and print each one right after it is created.
# NOTE(review): `name` passes `ocr_pos=` while the other three entries pass
# `position=` -- confirm which keyword RecordEntry actually expects.
name = RecordEntry(
    value="Max Mustermann",
    ocr="Max Mosterman",
    ocr_pos=(54, 23, 10, 100),
    txt_pos=(250, 260),
    probability=0.95,
)
pprint(name)

name2 = RecordEntry(
    value="Mandy Mustermann",
    ocr="Mandy Mustermann",
    position=(54, 23, 20, 100),
    probability=0.93,
)
pprint(name2)

street = RecordEntry(
    value="Musterstraße 84",
    ocr="Musterstr. b4",
    position=(67, 138, 11, 90),
    txt_pos=(1000, 1020),
    probability=0.9,
)
pprint(street)

city = RecordEntry(
    value="Musterhausen",
    ocr="Musterhaus",
    position=(288, 417, 9, 110),
    probability=0.99,
)
pprint(city)
In [4]:
# Example: DataRecord
# Meta data attached to the document record (document, user, release).
doc_meta = MetaData(
    document="my_invoice.png",
    user="MKrause",
    release="1.2.3",
)

# Nested records: every field is passed as a list of entries / records.
address = DataRecord(
    street=[street],
    city=[city],
)
sender = DataRecord(
    name=[name, name2],
    address=[address],
)

# A single document record combining the meta data with the sender record.
single_record = DataRecord(
    meta=doc_meta,
    sender=[sender],
)
In [5]:
# Print the assembled document record with the pprint helper imported from utils.
pprint(single_record)
In [6]:
# Serialize the record to a JSON string with the default encoder settings;
# as the last expression of the cell, the string is shown as the cell output.
json.dumps(single_record)
Out[6]: