## Entity Annotation

In [1]:
import pandas as pd

df = pd.read_csv("pii_dataset.csv")
df

Unnamed: 0,gender,title,first_name,last_name,email,name_partner,gender_partner,postcode,city,street,full_address
0,Male,Mr,Imanol,Kirlin,imanol_kirlin@faulkner.com,Mila Weissnat,Female,AB10 1AB,Aberdeen,Broad Street,"Broad Street, AB10 1AB Aberdeen"
1,Female,Ms,Claudie,Rodriguez,claudierodriguez91@haas.com,Jorja Schuster,Female,IM1 1AG,Isle of Man,Circular Road,"Circular Road, IM1 1AG Isle of Man"
2,Male,Mr,Ismael,Zemlak,ismael-zemlak45@jackson-campbell.info,Jalon Glover,Male,TN34 2EZ,Hastings,Baldslow Road,"Baldslow Road, TN34 2EZ Hastings"
3,Non-Binary,Mx,Jesus,Rutherford,jesus-rutherford61@nunez.com,Martin Kihn,Male,LA22 9HA,Ambleside,Kirkfield,"Kirkfield, LA22 9HA Ambleside"
4,Female,Mrs,Leslee,Brown,leslee_brown42@mendez.org,Derrell Keebler,Male,W9 2BT,London,Shirland Road,"Shirland Road, W9 2BT London"
...,...,...,...,...,...,...,...,...,...,...,...
6068,Female,Ms,Louetta,O'Conner,louetta_o'conner@gallagher.com,Obed Terry,Male,HG4 2QN,Ripon,Bishopton Lane,"Bishopton Lane, HG4 2QN Ripon"
6069,Non-Binary,Mx,Fleet,Thompson,fleet_thompson@thompson.com,Leeann Stoltenberg,Non-Binary,EH10 4AN,Edinburgh,Falcon Avenue,"Falcon Avenue, EH10 4AN Edinburgh"
6070,Male,Mr,Pleasant,Kshlerin,pleasant.kshlerin69@leonard.org,Evelyne Bernier,Female,CM8 1SX,Witham,Holst Avenue,"Holst Avenue, CM8 1SX Witham"
6071,Non-Binary,Mx,Tilden,Dickens,tilden.dickens@alvarez.org,Savion Johns,Male,HA1 2RZ,Harrow,Rosslyn Crescent,"Rosslyn Crescent, HA1 2RZ Harrow"


In [2]:
from synthesized.config import PersonLabels
from synthesized.metadata.value import Person

person_annot = Person(name="person", labels=PersonLabels(firstname="first_name", lastname="last_name", title="title", email="email"))
person_partner_annot = Person(name="person_partner", labels=PersonLabels(fullname="name_partner", gender="gender_partner"))

In [3]:
from synthesized.config import AddressLabels
from synthesized.metadata.value import Address

address_annot = Address(
    name="address",
    labels=AddressLabels(
        postcode="postcode",
        street="street",
        city="city",
        full_address="full_address"
        ),
    locales="en_GB",
    )

In [4]:
from synthesized import MetaExtractor

df_meta = MetaExtractor.extract(
    df=df,
    annotations=
        [
            person_annot,
            person_partner_annot,
            address_annot
        ]
    )

In [5]:
from synthesized.config import HighDimConfig
from synthesized import HighDimSynthesizer

config = HighDimConfig(
    learn_postcodes=True,
    postcode_level=1,
)

synth = HighDimSynthesizer(df_meta, config=config)

In [6]:
synth.learn(df)

[38;5;98mYou're currently on the free version of the Synthesized SDK. For full access to all of our features contact the Synthesized team.[39m
Training [38;5;47m╠████████████████████╣[39m Done.


In [7]:
df_synth = synth.synthesize(10)
df_synth

[38;5;98mYou're currently on the free version of the Synthesized SDK. For full access to all of our features contact the Synthesized team.[39m


Unnamed: 0,gender,title,first_name,last_name,email,name_partner,gender_partner,postcode,city,street,full_address
0,Female,Mr,Connor,Smart,connorsmart42@watson-morgan.com,Edward Patel,Male,CA35XW,Carlisle,Thomas bridge,"Flat 22 97 Thomas bridge, CA35XW Carlisle West..."
1,Female,Ms,Sara,Archer,sara.archer35@bennett.com,Adam Grant,Male,SK100GU,Macclesfield,Jones crossing,"Flat 01 8 Jones crossing, SK100GU Macclesfield..."
2,Female,Mrs,Alice,Foster,alice.foster@ferguson.com,Joanne Harris,Female,BH236ZR,Christchurch,Malcolm light,"Flat 13F 35 Malcolm light, BH236ZR Christchurc..."
3,Non-Binary,Mr,Roger,Miah,rogermiah68@perkins-henderson.net,Lorraine Connolly,Female,SN156XB,Chippenham,Stephanie divide,"Studio 92Q 839 Stephanie divide, SN156XB Chipp..."
4,Male,Mr,Thomas,White,thomas-white@carter.com,Paige Price,Female,S425UZ,Chesterfield,Thompson streets,"Flat 21 10 Thompson streets, S425UZ Chesterfie..."
5,Male,Mr,Derek,Rice,derek-rice@hart-mason.com,Beth Boyle,Female,CB239JX,Cambridge,Alexander pine,"Flat 5 180 Alexander pine, CB239JX Cambridge E..."
6,Female,Mrs,Josephine,Miles,josephine_miles@shaw.com,Toby Nolan,Male,WF136JW,Dewsbury,Stanley forks,"Flat 92 132 Stanley forks, WF136JW Dewsbury Ci..."
7,Non-Binary,Mr,Frederick,Potts,frederick-potts75@perry-brennan.com,Jane Williams,Female,TR135SG,Helston,Pamela courts,"Studio 9 1 Pamela courts, TR135SG Helston Dorset"
8,Non-Binary,Mr,Craig,Mitchell,craig-mitchell@warner-jordan.com,Aaron Begum,Non-Binary,LE44SJ,Leicester,Craig glens,"Flat 5 9 Craig glens, LE44SJ Leicester Angus"
9,Female,Mr,Hugh,Walsh,hugh.walsh48@clarke.com,Graeme Nicholls,Male,DD100RQ,Montrose,Jones trafficway,"Flat 95 721 Jones trafficway, DD100RQ Montrose..."
