"""
IMPORTANT:
THE EXAMPLE IN THIS FILE IS CURRENTLY NOT FUNCTIONAL
BECAUSE THE `download_from_public_repository` FUNCTION
NO LONGER EXISTS. WE HAD TO MAKE A QUICK RELEASE TO
REMEDIATE AN ISSUE IN OUR PREVIOUS STORAGE SOLUTION.
THIS WILL BE FIXED IN A FUTURE RELEASE.
IN THE MEANTIME, IF YOU NEED ANY CLARIFICATION
REGARDING THE PACKAGE, PLEASE FEEL FREE TO OPEN AN ISSUE.
"""
import pandas as pd
from deepparse import download_from_public_repository
from deepparse.dataset_container import PickleDatasetContainer
from deepparse.parser import AddressParser
# Example: parse a batch of addresses and collect the results in a DataFrame.

# Settings describing which dataset file to fetch and where to keep it.
saving_dir = "./data"
file_extension = "p"
test_dataset_name = "predict"

# Download the dataset described by the settings above.
# NOTE(review): presumably the file is written to
# "<saving_dir>/<test_dataset_name>.<file_extension>" -- confirm against the
# download helper, since that is the path loaded just below.
download_from_public_repository(test_dataset_name, saving_dir, file_extension=file_extension)

# Derive the dataset path from the same three settings instead of repeating
# them in a literal, so the download and the load cannot drift apart.
# With the values above this is exactly "./data/predict.p".
dataset_path = f"{saving_dir}/{test_dataset_name}.{file_extension}"
addresses_to_parse = PickleDatasetContainer(dataset_path, is_training_container=False)

# Peek at the first two entries of the container.
print(addresses_to_parse[:2])

# Build a parser using the "bpemb" model type.
# NOTE(review): device=0 presumably selects the first GPU -- confirm the
# behaviour on machines without one.
address_parser = AddressParser(model_type="bpemb", device=0)

# Parse the first 300 addresses and show the first result.
parsed_addresses = address_parser(addresses_to_parse[0:300])
print(parsed_addresses[0])

# NOTE(review): the results of these two calls are discarded. They look like
# a demonstration of empty and whitespace-only input -- confirm whether the
# parser raises on such input, because an exception here would stop the
# script before the DataFrame below is built.
address_parser("")
address_parser(" ")

# Collect the parsed addresses in a DataFrame, one row per address, keeping
# only the listed fields (also used as the column order).
fields = ["StreetNumber", "StreetName", "Municipality", "Province", "PostalCode"]
parsed_address_data_frame = pd.DataFrame(
    [parsed_address.to_dict(fields=fields) for parsed_address in parsed_addresses],
    columns=fields,
)