Files
mobile-pii-discovery-agent/model_PII_results/GPT-3.5-turbo/PII_I2_AddressBook_20260208T004210Z.jsonl
2026-02-11 22:13:22 -05:00

6 lines
15 KiB
JSON

{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["B2@2D02\\\u0002NP*.Z\u0001\f\u0002\t\u0001Ü\u000b\u0002Ü\b"]], "Total_raw_rows": 1, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain email addresses:\n- ABPerson (Columns: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, FirstSort, LastSort, DisplayName, ImageURI, WallpaperURI)\n- ABMultiValueEntry (Column: value)\n- ABStore (Column: ProviderIdentifier)\n\nTo search for email addresses in these tables, you can use the following SQL query:\n\n```sql\nSELECT First FROM ABPerson WHERE First REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Last FROM ABPerson WHERE Last REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Middle FROM ABPerson WHERE Middle REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT FirstPhonetic FROM ABPerson WHERE FirstPhonetic REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT MiddlePhonetic FROM ABPerson WHERE MiddlePhonetic REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT LastPhonetic FROM ABPerson WHERE LastPhonetic REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Organization FROM ABPerson WHERE Organization REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Department FROM ABPerson WHERE Department REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Note FROM ABPerson WHERE Note REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT JobTitle FROM ABPerson WHERE JobTitle REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Nickname FROM ABPerson WHERE Nickname REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Prefix FROM ABPerson WHERE Prefix REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Suffix FROM ABPerson WHERE Suffix REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT FirstSort FROM ABPerson WHERE FirstSort REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT LastSort FROM ABPerson WHERE LastSort REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT DisplayName FROM ABPerson WHERE DisplayName REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ImageURI FROM ABPerson WHERE ImageURI REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT WallpaperURI FROM ABPerson WHERE WallpaperURI REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT value FROM ABMultiValueEntry WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ProviderIdentifier FROM ABStore WHERE ProviderIdentifier REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["16133 NE 44th Ct. "], ["98052"]], "Total_raw_rows": 2, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US phone numbers:\n\n1. Table: ABPerson\n - Columns: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, FirstSort, LastSort, DisplayName, ImageURI, guid\n\n2. Table: ABMultiValueEntry\n - Column: value\n\n3. Table: ABPhoneLastFour\n - Column: value\n\nTo search for US phone numbers in these tables and columns, you can use the following SQL queries:\n\n```sql\nSELECT First FROM ABPerson WHERE First REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Last FROM ABPerson WHERE Last REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Middle FROM ABPerson WHERE Middle REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT FirstPhonetic FROM ABPerson WHERE FirstPhonetic REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT MiddlePhonetic FROM ABPerson WHERE MiddlePhonetic REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT LastPhonetic FROM ABPerson WHERE LastPhonetic REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Organization FROM ABPerson WHERE Organization REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Department FROM ABPerson WHERE Department REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Note FROM ABPerson WHERE Note REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT FirstSort FROM ABPerson WHERE FirstSort REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT LastSort FROM ABPerson WHERE LastSort REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT DisplayName FROM ABPerson WHERE DisplayName REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ImageURI FROM ABPerson WHERE ImageURI REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT value FROM ABMultiValueEntry WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT value FROM ABPhoneLastFour WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the columns that may contain usernames are as follows:\n- ABAccount: AccountIdentifier\n- ABGroup: Name\n- ABGroupMembers: No potential username column found\n- ABMultiValue: value\n- ABMultiValueEntry: value\n- ABPerson: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, DisplayName\n- ABPersonSearchKey: SearchKey\n- ABPhoneLastFour: value\n- ClientCursor: No potential username column found\n- ClientSequence: No potential username column found\n\nTo search for possible usernames, you can use the following SQL query:\n```sql\nSELECT AccountIdentifier AS username FROM ABAccount WHERE AccountIdentifier REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Name AS username FROM ABGroup WHERE Name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value AS username FROM ABMultiValue WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value AS username FROM ABMultiValueEntry WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT First AS username FROM ABPerson WHERE First REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Last AS username FROM ABPerson WHERE Last REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Middle AS username FROM ABPerson WHERE Middle REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT FirstPhonetic AS username FROM ABPerson WHERE FirstPhonetic REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT MiddlePhonetic AS username FROM ABPerson WHERE MiddlePhonetic REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT LastPhonetic AS username FROM ABPerson WHERE LastPhonetic REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Organization AS username FROM ABPerson WHERE Organization REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Department AS username FROM ABPerson WHERE Department REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Note AS username FROM ABPerson WHERE Note REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT JobTitle AS username FROM ABPerson WHERE JobTitle REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Nickname AS username FROM ABPerson WHERE Nickname REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Prefix AS username FROM ABPerson WHERE Prefix REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Suffix AS username FROM ABPerson WHERE Suffix REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT DisplayName AS username FROM ABPerson WHERE DisplayName REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SearchKey AS username FROM ABPersonSearchKey WHERE SearchKey REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value AS username FROM ABPhoneLastFour WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\n```\nThis query will search for potential usernames in the specified columns of the respective tables.", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["16133 NE 44th Ct. "], ["us"], ["Redmond"], ["WA"], ["United States"], ["_$!<Mobile>!$_"], ["_$!<Home>!$_"], ["_$!<Other>!$_"], ["NA OG"], ["GenericGPT"]], "Total_raw_rows": 10, "Exploration_sql": "The following columns in the database tables may contain person names:\n- ABPerson: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, DisplayName, PreviousFamilyName\n- ABMultiValueEntry: value\n- ABMultiValueLabel: value\n- ABGroupMembers: member_id\n- ABGroup: Name\n\nYou can use the following SQL query to search for person names in these columns:\n```sql\nSELECT First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, DisplayName, PreviousFamilyName FROM ABPerson WHERE First REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Last REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Middle REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR FirstPhonetic REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR MiddlePhonetic REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR LastPhonetic REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Organization REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Department REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Note REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR JobTitle REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Nickname REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Prefix REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Suffix REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR DisplayName REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR PreviousFamilyName REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT value FROM ABMultiValueEntry WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT value FROM ABMultiValueLabel WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT member_id FROM ABGroupMembers WHERE member_id REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT Name FROM ABGroup WHERE Name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US postal addresses:\n\n1. Table: ABPerson\n - Columns: First, Last, Middle, Organization, Department, Note, FirstSort, LastSort, CompositeNameFallback, Address\n\n2. Table: ABMultiValueEntry\n - Columns: value\n\n3. Table: ABMultiValueLabel\n - Columns: value\n\nTo search for US postal addresses in these tables, you can use the following SQL queries:\n\n```sql\nSELECT First, Last, Middle, Organization, Department, Note, FirstSort, LastSort, CompositeNameFallback, Address\nFROM ABPerson\nWHERE Address REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT value\nFROM ABMultiValueEntry\nWHERE value REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT value\nFROM ABMultiValueLabel\nWHERE value REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n```\n\nThese queries will search for US postal addresses in the specified columns of the respective tables.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}