mirror of
https://github.com/frankwxu/mobile-pii-discovery-agent.git
synced 2026-02-20 13:40:41 +00:00
add other model results
This commit is contained in:
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The only table in the database is \"android_metadata\" with a column \"locale\". Let's search for possible email addresses in this column.\n```sql\nSELECT locale FROM android_metadata WHERE locale REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The only table in the database is \"android_metadata\" with a column \"locale\". Let's search for US phone numbers in this column.\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The only table in the database is \"android_metadata\" with a column \"locale\". Let's query the \"locale\" column to find possible usernames.\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the table \"android_metadata\", there is only one column named \"locale\" of type TEXT. Let's search this column for possible person names.\nSELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The only table in the database is \"android_metadata\" with a column \"locale\". Let's search for US postal addresses in this column.\nSELECT locale FROM android_metadata WHERE locale REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_msgstore.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following columns have the potential to contain email addresses:\n- Table: message_text, Column: text_data\n- Table: message_vcard, Column: vcard\n- Table: message_system, Column: user\n- Table: message_system_business_state, Column: business_name\n- Table: message_system_chat_participant, Column: display_name\n- Table: message_system_group, Column: business_name\n- Table: message_system_initial_privacy_provider, Column: verified_biz_name\n- Table: message_system_number_change, Column: old_data\n- Table: message_system_photo_change, Column: old_data\n- Table: message_system_value_change, Column: old_data\n- Table: message_template, Column: description\n- Table: message_template_button, Column: extra_data\n- Table: message_template_button, Column: extra_consent_data\n- Table: message_template_button, Column: otp_matched_package_name\n- Table: message_template_button, Column: tag\n\nYou can use the following SQL query to search for email addresses in these columns:\n```sql\nSELECT text_data AS email FROM message_text WHERE text_data REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT vcard AS email FROM message_vcard WHERE vcard REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT user AS email FROM message_system WHERE user REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT business_name AS email FROM message_system_business_state WHERE business_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT display_name AS email FROM message_system_chat_participant WHERE display_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT business_name AS email FROM message_system_group WHERE business_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT verified_biz_name AS email FROM message_system_initial_privacy_provider WHERE verified_biz_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT old_data AS email FROM message_system_number_change WHERE old_data REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT old_data AS email FROM message_system_photo_change WHERE old_data REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT old_data AS email FROM message_system_value_change WHERE old_data REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT description AS email FROM message_template WHERE description REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT extra_data AS email FROM message_template_button WHERE extra_data REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT extra_consent_data AS email FROM message_template_button WHERE extra_consent_data REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT otp_matched_package_name AS email FROM message_template_button WHERE otp_matched_package_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT tag AS email FROM message_template_button WHERE tag REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_msgstore.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, the following tables and columns may contain US phone numbers:\n- Table: message\n - Columns: text_data\n\nTo search for US phone numbers in these tables, you can use the following SQL query:\n```sql\nSELECT text_data FROM message WHERE text_data REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_msgstore.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following columns have the potential to contain usernames:\n- Table: message_text, Column: text_data\n- Table: message_vcard, Column: vcard\n- Table: message_template_button, Column: extra_data\n- Table: message_template_button, Column: otp_matched_package_name\n- Table: message_template_button, Column: extra_consent_data\n- Table: message_template_button, Column: description\n- Table: message_template_button, Column: page_title\n- Table: message_template_button, Column: url\n- Table: message_template_button, Column: counter_abuse_token\n\nTo search for possible usernames in these columns, you can use the following SQL query:\n```sql\nSELECT text_data AS username FROM message_text WHERE text_data REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT vcard AS username FROM message_vcard WHERE vcard REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT extra_data AS username FROM message_template_button WHERE extra_data REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT otp_matched_package_name AS username FROM message_template_button WHERE otp_matched_package_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT extra_consent_data AS username FROM message_template_button WHERE extra_consent_data REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT description AS username FROM message_template_button WHERE description REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT page_title AS username FROM message_template_button WHERE page_title REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT url AS username FROM message_template_button WHERE url REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT counter_abuse_token AS username FROM message_template_button WHERE counter_abuse_token REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_msgstore.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following columns have text-like fields where person names could potentially be found:\n- Table: message_text, Column: text_data\n- Table: message_vcard, Column: vcard\n- Table: message_system, Column: user\n- Table: message_system_business_state, Column: business_name\n- Table: message_system_chat_participant, Column: display_name\n- Table: message_system_group, Column: business_name\n- Table: message_system_initial_privacy_provider, Column: verified_biz_name\n- Table: message_system_number_change, Column: old_data\n- Table: message_system_photo_change, Column: old_data\n- Table: message_system_value_change, Column: old_data\n- Table: message_template, Column: content_text_data\n- Table: message_template_button, Column: extra_consent_data\n- Table: message_text, Column: text_data\n- Table: message_vcard, Column: vcard\n\nYou can search for person names in these columns using the appropriate REGEXP pattern matching.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_msgstore.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US postal addresses:\n\n1. Table: message_location\n - Columns: latitude, longitude, place_name, place_address\n\n2. Table: message_text\n - Column: text_data\n\n3. Table: message_vcard\n - Column: vcard\n\nTo search for US postal addresses in these tables, you can use the following SQL queries:\n\n```sql\nSELECT place_address\nFROM message_location\nWHERE place_address REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT text_data\nFROM message_text\nWHERE text_data REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT vcard\nFROM message_vcard\nWHERE vcard REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n```\n\nThese queries will search for US postal addresses in the specified columns of the respective tables.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The following tables and columns have been identified as potential sources for email addresses:\n1. Table: quick_promotion_payload\n - Columns: trigger_id, trigger_context\n\n2. Table: wa_address_book\n - Columns: jid, email\n\n3. Table: wa_biz_profiles\n - Columns: jid, email\n\n4. Table: wa_bot_profiles\n - Columns: jid\n\n5. Table: wa_contacts\n - Columns: jid, number, display_name, given_name, family_name, nickname, company, title\n\n6. Table: wa_trusted_contacts\n - Columns: jid\n\n7. Table: wa_trusted_contacts_send\n - Columns: jid\n\nYou can use the following SQL query to search for email addresses in these tables:\n```sql\nSELECT trigger_id AS email FROM quick_promotion_payload WHERE trigger_id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT trigger_context AS email FROM quick_promotion_payload WHERE trigger_context REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT email FROM wa_address_book WHERE email REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT email FROM wa_biz_profiles WHERE email REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT jid AS email FROM wa_biz_profiles WHERE jid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT jid AS email FROM wa_bot_profiles WHERE jid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT jid AS email FROM wa_contacts WHERE jid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT number AS email FROM wa_contacts WHERE number REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT display_name AS email FROM wa_contacts WHERE display_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT given_name AS email FROM wa_contacts WHERE given_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT family_name AS email FROM wa_contacts WHERE family_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT nickname AS email FROM wa_contacts WHERE nickname REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT company AS email FROM wa_contacts WHERE company REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT title AS email FROM wa_contacts WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT jid AS email FROM wa_trusted_contacts WHERE jid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT jid AS email FROM wa_trusted_contacts_send WHERE jid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\n```\nThis query will search for email addresses in the specified columns of the identified tables.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["5713298742"], ["5713349815"], ["8085096467"], ["8624338328"], ["7034241981"], ["2028177932"], ["5715917168"], ["2025692832"], ["+16106046786"], ["+16263678865"]], "Total_raw_rows": 10, "Exploration_sql": "The columns in the relevant tables are as follows:\n- Table 'wa_address_book':\n - number TEXT\n\n- Table 'wa_contacts':\n - number TEXT\n\n- Table 'wa_newsletter_props':\n - prop_name TEXT\n - prop_value TEXT\n\n- Table 'wa_props':\n - prop_name TEXT\n - prop_value TEXT\n\n- Table 'wa_trusted_contacts':\n - jid TEXT\n - incoming_tc_token BLOB\n - incoming_tc_token_timestamp LONG\n\n- Table 'wa_trusted_contacts_send':\n - jid TEXT\n - sent_tc_token_timestamp LONG\n - real_issue_timestamp LONG\n\nNow, I will search these columns for US phone numbers.\nSELECT number FROM wa_address_book WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT number FROM wa_contacts WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The following tables and columns may contain usernames:\n1. Table: quick_promotion_payload\n - Columns: trigger_id, trigger_context\n\n2. Table: wa_address_book\n - Columns: jid, display_name, family_name, given_name, nickname\n\n3. Table: wa_biz_profiles\n - Columns: jid, email, tag, name, description, creator_name\n\n4. Table: wa_bot_profiles\n - Columns: jid, tag, name, description, category, creator_name\n\n5. Table: wa_contacts\n - Columns: jid, display_name, family_name, given_name, nickname, wa_name\n\n6. Table: wa_trusted_contacts\n - Columns: jid, incoming_tc_token\n\n7. Table: wa_trusted_contacts_send\n - Columns: jid\n\nYou can use the following SQL query to search for possible usernames in these columns:\n```sql\nSELECT trigger_id AS username FROM quick_promotion_payload WHERE trigger_id REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT trigger_context AS username FROM quick_promotion_payload WHERE trigger_context REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT jid AS username FROM wa_address_book WHERE jid REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT display_name AS username FROM wa_address_book WHERE display_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT family_name AS username FROM wa_address_book WHERE family_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT given_name AS username FROM wa_address_book WHERE given_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT nickname AS username FROM wa_address_book WHERE nickname REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT jid AS username FROM wa_biz_profiles WHERE jid REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT email AS username FROM wa_biz_profiles WHERE email REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT tag AS username FROM wa_biz_profiles WHERE tag REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT name AS username FROM wa_biz_profiles WHERE name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT description AS username FROM wa_biz_profiles WHERE description REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT creator_name AS username FROM wa_biz_profiles WHERE creator_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT jid AS username FROM wa_bot_profiles WHERE jid REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT tag AS username FROM wa_bot_profiles WHERE tag REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT name AS username FROM wa_bot_profiles WHERE name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT description AS username FROM wa_bot_profiles WHERE description REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT category AS username FROM wa_bot_profiles WHERE category REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT creator_name AS username FROM wa_bot_profiles WHERE creator_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT jid AS username FROM wa_contacts WHERE jid REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT display_name AS username FROM wa_contacts WHERE display_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT family_name AS username FROM wa_contacts WHERE family_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT given_name AS username FROM wa_contacts WHERE given_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT nickname AS username FROM wa_contacts WHERE nickname REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT wa_name AS username FROM wa_contacts WHERE wa_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT jid AS username FROM wa_trusted_contacts WHERE jid REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT incoming_tc_token AS username FROM wa_trusted_contacts WHERE incoming_tc_token REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT jid AS username FROM wa_trusted_contacts_send WHERE jid REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "PERSON_NAME", "PII": ["Svetlana", "Don", "Karen", "Hank", "Brian", "Goldie", "Vladamir", "Joey", "Mary", "Abe", "Russ", "Otto", "Toks", "Bo", "Chernoff", "Whalen", "Wayne", "Tate", "Reynolds", "Kahn", "Stravinsky", "Garcia", "Rudder", "Philby"], "Num_of_PII": 24, "source_columns": ["wa_contacts.given_name", "wa_contacts.family_name"], "Raw_rows_first_100": [["Svetlana"], ["Don"], ["Karen"], ["Hank"], ["Brian"], ["Goldie"], ["Vladamir"], ["Joey"], ["Mary"], ["Abe"], ["Russ"], ["Voice Mail"], ["Otto"], ["Toks"], ["Bo"], ["Chernoff"], ["Whalen"], ["Wayne"], ["Tate"], ["Reynolds"], ["Kahn"], ["Stravinsky"], ["Garcia"], ["Rudder"], ["Philby"]], "Total_raw_rows": 25, "Exploration_sql": "Based on the schema of the relevant tables, here is the SQL query to find possible person names in the database:\n\n```sql\nSELECT display_name FROM wa_address_book WHERE display_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT given_name FROM wa_contacts WHERE given_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT family_name FROM wa_contacts WHERE family_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT description FROM wa_group_descriptions WHERE description REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n```\n\nThis query will search for loosely structured human name-like strings in the 'display_name' column of 'wa_address_book', 'given_name' and 'family_name' columns of 'wa_contacts', and 'description' column of 'wa_group_descriptions' tables.", "Extraction_sql": "Based on the schema of the relevant tables, here is the SQL query to find possible person names in the database:\n```sql\nSELECT display_name FROM wa_address_book WHERE display_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT given_name FROM wa_contacts WHERE given_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT family_name FROM wa_contacts WHERE family_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT description FROM wa_group_descriptions WHERE description REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n```\nThis query will search for loosely structured human name-like strings in the 'display_name' column of 'wa_address_book', 'given_name' and 'family_name' columns of 'wa_contacts', and 'description' column of 'wa_group_descriptions' tables.", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, the following tables and columns have the potential to contain US postal addresses:\n\n1. Table: `wa_address_book`\n - Column: `address`\n\n2. Table: `wa_biz_profiles`\n - Columns: `address`, `address_postal_code`, `address_city_id`, `address_city_name`\n\n3. Table: `wa_biz_profiles_websites`\n - Column: `websites`\n\nTo search for US postal addresses in these tables, you can use the following SQL queries:\n\n```sql\nSELECT address FROM wa_address_book WHERE address REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b';\n\nUNION ALL\n\nSELECT address, address_postal_code, address_city_id, address_city_name FROM wa_biz_profiles WHERE address REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b';\n\nUNION ALL\n\nSELECT websites FROM wa_biz_profiles_websites WHERE websites REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b';\n``` \n\nThese queries will search for US postal addresses in the specified columns of the respective tables.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A2_core.db", "PII_type": "EMAIL", "PII": ["sharononeil368@gmail.com"], "Num_of_PII": 1, "source_columns": ["Preferences.stringValue", "SnapUserStore.textVal", "SnapchatUserProperties.textVal"], "Raw_rows_first_100": [["sharononeil368@gmail.com"]], "Total_raw_rows": 1, "Exploration_sql": "Based on the schema of the tables in the database, there are no columns that directly indicate the presence of email addresses. To search for email addresses, we can focus on text fields such as 'stringValue', 'textVal', or 'blobVal' in the tables. Let's search these columns in the tables for possible email addresses using the REGEXP pattern matching.\nSELECT etag FROM ConfigEtag WHERE etag REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT stringValue FROM Preferences WHERE stringValue REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT textVal FROM SnapUserStore WHERE textVal REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT textVal FROM SnapchatUserProperties WHERE textVal REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "Based on the schema of the tables in the database, there are no columns that directly indicate the presence of email addresses. To search for email addresses, we can focus on text fields such as 'stringValue', 'textVal', or 'blobVal' in the tables. Let's search these columns in the tables for possible email addresses using the REGEXP pattern matching.\nSELECT etag FROM ConfigEtag WHERE etag REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT stringValue FROM Preferences WHERE stringValue REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT textVal FROM SnapUserStore WHERE textVal REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT textVal FROM SnapchatUserProperties WHERE textVal REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A2_core.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US phone numbers:\n- Table: Preferences\n - Columns: key, stringValue\n\nTo search for US phone numbers in these tables, you can use the following SQL query:\n```sql\nSELECT key, stringValue FROM Preferences WHERE stringValue REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A2_core.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following columns have the potential to contain usernames:\n- ConfigEtag: etag\n- ConfigRule: rule_id, config_id\n- DeltaForceSync: client_key, group_key\n- Preferences: key, stringValue\n- SnapUserStore: groupKey, itemKey, textVal\n- SnapchatUserProperties: textVal\n\nTo search for possible usernames in these columns, you can use the following SQL query:\n\n```sql\nSELECT etag AS username FROM ConfigEtag WHERE etag REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT rule_id AS username FROM ConfigRule WHERE rule_id REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT config_id AS username FROM ConfigRule WHERE config_id REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT client_key AS username FROM DeltaForceSync WHERE client_key REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT group_key AS username FROM DeltaForceSync WHERE group_key REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT key AS username FROM Preferences WHERE key REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT stringValue AS username FROM Preferences WHERE stringValue REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT groupKey AS username FROM SnapUserStore WHERE groupKey REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT itemKey AS username FROM SnapUserStore WHERE itemKey REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT textVal AS username FROM SnapUserStore WHERE textVal REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT textVal AS username FROM SnapchatUserProperties WHERE textVal REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\n```\n\nThis query will search for usernames in the specified columns of the tables.", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A2_core.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns will be checked for possible person names:\n- Table: ConfigEtag\n - Column: etag\n\n- Table: ConfigRule\n - Columns: rule_id, config_id\n\n- Table: DeltaForceSync\n - Columns: client_key, group_key\n\n- Table: Preferences\n - Columns: key, stringValue\n\n- Table: SnapUserStore\n - Columns: groupKey, itemKey, textVal\n\n- Table: SnapchatUserProperties\n - Column: textVal\n\n- Table: android_metadata\n - Column: locale\n\nWe will search these columns for possible person names using REGEXP.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A2_core.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, there are no columns that directly indicate messages, chats, or other text fields where a US postal address might be stored. If you have specific tables or columns in mind where you suspect the US postal address might be present, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of email addresses. To search for email addresses, we need to explore text fields such as messages, chats, or other textual data. Let's search for email addresses in the text fields of the tables.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["9F3F465DC00D96696DDDFE0A946AAB99.khand_medium"], ["C730963C61386A34712C819CA25436C9.media"], ["70177660B739FDDF75DE848B97DC6A6E.edits"], ["03FD66A15523689AD035E1E2B1AD6DAE.chat_wallpaper_media"], ["D41F76126B39D1F7E7EC3D8FA4079D0F.discover_story_streaming_snap"], ["F05AD4876AFE7190FBF88E879238978A.discover_story_streaming_snap_ff"], ["67B685FF2948DC22416716E822D4F5A1.discover_story_streaming_snap_ff"], ["4EDFB389483E360F0CBA63F7A928FD39.discover_story_streaming_snap_ff"], ["629156B858FDF391C0639F2DE6933EEB.discover_story_streaming_snap_ff"], ["5A4F0362F54488AC2542C174F69C9A24.discover_story_streaming_snap_ff"]], "Total_raw_rows": 10, "Exploration_sql": "The databases contain the following tables and columns:\n1. Table: android_metadata\n - Column: locale (TEXT)\n\n2. Table: journal\n - Columns: _id (INTEGER), path (TEXT), size (INTEGER), locked_size (INTEGER)\n\n3. Table: journal_entry\n - Columns: _id (INTEGER), journal_id (INTEGER), key (TEXT), sequence_number (INTEGER), value_count (INTEGER), status (INTEGER), last_update_time (INTEGER), last_read_time (INTEGER), lock_count (INTEGER), total_size (INTEGER), value_sizes (BLOB), expiration (INTEGER), last_consumed_time (INTEGER), metadata (BLOB)\n\nTo find US phone numbers in the database, we need to search through text columns that may contain phone numbers. Let's proceed with searching for US phone numbers in the relevant text columns.\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT path FROM journal WHERE path REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT key FROM journal_entry WHERE key REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following columns may contain usernames:\n- android_metadata: No relevant columns for usernames.\n- journal: key (TEXT)\n- journal_entry: No relevant columns for usernames.\n\nYou can use the following SQL query to search for possible usernames in the 'key' column of the 'journal' table:\n```sql\nSELECT key FROM journal WHERE key REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [[{"__bytes_b64__": "AAAAAAAAd0M="}], [{"__bytes_b64__": "AAAAAAAARXg="}], [{"__bytes_b64__": "AAAAAAAAc3Y="}], [{"__bytes_b64__": "AAAAAAAAV3o="}], [{"__bytes_b64__": "AAAAAAAASC0="}], [{"__bytes_b64__": "AAAAAAAAQWg="}], [{"__bytes_b64__": "AAAAAAABa2o="}], [{"__bytes_b64__": "AAAAAAAARnU="}], [{"__bytes_b64__": "AAAAAAAAdk4="}], [{"__bytes_b64__": "AAAAAAAjWXU="}]], "Total_raw_rows": 10, "Exploration_sql": "Based on the database schema, the tables and columns that could potentially contain person names are:\n1. Table: journal_entry\n - Columns: key, value_sizes\n\nTo search for person names in these columns, you can use the following SQL query:\n```sql\nSELECT key FROM journal_entry WHERE key REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT value_sizes FROM journal_entry WHERE value_sizes REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of US postal addresses. To further explore the possibility of finding US postal addresses, additional information or specific tables/columns related to messages, chats, or other text fields may be required.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate the presence of email addresses. To further explore the database for email addresses, additional tables and columns need to be examined. Let's proceed with checking other tables and columns.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate messages, chats, or text fields where US phone numbers might be stored. To further explore the possibility of finding US phone numbers in the database, additional tables and columns related to messages or chats need to be examined. Let's proceed with checking other tables.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate usernames. To further explore the possibility of finding usernames, we may need to consider other text fields or messages within these tables. Let's construct a query to search for possible usernames in text fields or messages.\nSELECT title FROM dialog_filter WHERE title REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b' UNION ALL SELECT pbytes FROM params WHERE pbytes REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The tables \"dialog_filter\" and \"params\" do not contain columns that are likely to have person names. Let's explore other tables in the database to find possible person names.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, there are no columns that directly indicate messages, chats, or other text fields where a US postal address might be stored. If you have specific tables or columns in mind where you suspect the US postal address might be present, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate the presence of email addresses. To further explore the database for email addresses, additional tables and columns need to be examined. Let's proceed with checking other tables and columns.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "No additional tables related to messages or chats were found in the database. Given the current tables available, it seems challenging to directly identify US phone numbers. If you have any specific tables or columns in mind where US phone numbers might be stored, please provide that information for further investigation.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate usernames. To further explore the possibility of finding usernames, additional tables and columns need to be examined. Let's continue by checking other tables and columns for potential usernames.", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate person names. To further explore the possibility of finding person names, we can search for text fields that may contain human names. Let's search for potential person names in the text fields of these tables. \n\n```sql\nSELECT title FROM dialog_filter WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT pbytes FROM params WHERE pbytes REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, there are no columns that directly indicate messages, chats, or other text fields where a US postal address might be stored. If you have specific tables or columns in mind where you suspect the addresses might be stored, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate the presence of email addresses. To further explore the database for email addresses, additional tables and columns need to be examined. Let's proceed with checking other tables and columns.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate messages, chats, or text fields where US phone numbers might be stored. To further explore the possibility of finding US phone numbers in the database, additional tables and columns related to messages or chats may need to be examined. Let's proceed with querying other tables and columns.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate usernames. To further explore the possibility of finding usernames, additional tables and columns need to be examined. Let's continue exploring other tables and columns for potential usernames.", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables \"dialog_filter\" and \"params\", there are no columns that directly indicate person names. To search for person names, we can focus on text fields such as messages, chats, or other textual data. Let's search for person names in these text fields.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, there are no columns that directly indicate messages, chats, or other text fields where a US postal address might be stored. If you have specific tables or columns in mind where you suspect the addresses might be located, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of email addresses. To search for email addresses, we can focus on text fields such as messages, chats, or other textual data. Let's search for possible email addresses in the text fields of these tables.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the available tables and their schemas, there are no columns that directly indicate messages, chats, or other text fields where US phone numbers might be stored. To proceed with searching for US phone numbers, we may need to explore additional tables or columns that contain text data. Let's continue the exploration.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the columns that might contain usernames are not explicitly identified. To search for possible usernames, we can look into text fields such as 'key_string' in the 'sync_corpus' table and 'sync_item' in the 'sync_item' table. Let's search for usernames in these text fields. \n\nHere is the SQL query to find possible usernames in the 'key_string' column of the 'sync_corpus' table and the 'sync_item' column of the 'sync_item' table:\n\n```sql\nSELECT key_string AS username FROM sync_corpus WHERE key_string REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT sync_item AS username FROM sync_item WHERE sync_item REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [[{"__bytes_b64__": "EgMwOjAy5wEKBAgAEAASLUJlcnd5biBQYXJrIFJkLCBUcmVkeWZmcmluIFRvd25zaGlwLCBQQSAxOTMxMhokMHg4OWM2OTMxMzU3NDAyZDM1OjB4OGRjN2Q2MGM0NTM3Yzc5IhAIg6CNExDisoLc//////8BKOzrotSCMTJxaHR0cDovL21hcHMuZ29vZ2xlLmNvbS8/cT1CZXJ3eW4rUGFyaytSZCwrVHJlZHlmZnJpbitUb3duc2hpcCwrUEErMTkzMTImZnRpZD0weDg5YzY5MzEzNTc0MDJkMzU6MHg4ZGM3ZDYwYzQ1MzdjNzk="}]], "Total_raw_rows": 1, "Exploration_sql": "Based on the schema of the tables in the database, the columns are as follows:\n- android_metadata: locale\n- sync_corpus: corpus, last_sync_time\n- sync_item: corpus, key_string, timestamp, merge_key, feature_fprint, latitude, longitude, is_local, sync_item\n\nTo find person names in the database, we will search through text fields such as messages, chats, or other communication-related columns. Let's search for person names in the relevant columns.\nSELECT key_string FROM sync_item WHERE key_string REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL \nSELECT sync_item FROM sync_item WHERE sync_item REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of US postal addresses. To further explore the data for US postal addresses, additional tables or columns related to messages, chats, or other text fields may need to be examined.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "EMAIL", "PII": ["heather@cellebrite.com", "hmahalik@gmail.com"], "Num_of_PII": 2, "source_columns": ["Tokens_content.c1value", "Tokens_stat.value"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["hmahalik@gmail.com"]], "Total_raw_rows": 2, "Exploration_sql": "Based on the schema of the tables, the following columns may contain email addresses:\n- Contacts table: value\n- Tokens_content table: c1value\n- Tokens_stat table: value\n\nYou can use the following SQL query to search for email addresses in these columns:\n```sql\nSELECT value FROM Contacts WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT value FROM Tokens_stat WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "Based on the schema of the tables, the following columns may contain email addresses:\n- Contacts table: value\n- Tokens_content table: c1value\n- Tokens_stat table: value\nYou can use the following SQL query to search for email addresses in these columns:\n```sql\nSELECT value FROM Contacts WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT value FROM Tokens_stat WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["17423794330"], ["7423794330"], ["3794330"]], "Total_raw_rows": 3, "Exploration_sql": "Based on the schema of the available tables, the following columns may contain US phone numbers:\n- Contacts table: value\n- Tokens_content table: c1value\n\nTo search for US phone numbers in these columns, you can use the following SQL query:\n\n```sql\nSELECT value FROM Contacts WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the following columns may contain usernames:\n- Contacts table: value\n- Tokens table: type\n- Tokens_content table: value\n- Tokens_docsize table: c1value\n- Tokens_segdir table: value\n- Tokens_stat table: value\n- android_metadata table: locale\n- room_master_table table: identity_hash\n\nYou can use the following SQL query to search for possible usernames in these columns:\n```sql\nSELECT value FROM Contacts WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT type FROM Tokens WHERE type REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value FROM Tokens_content WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT c1value FROM Tokens_docsize WHERE c1value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value FROM Tokens_segdir WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value FROM Tokens_stat WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT identity_hash FROM room_master_table WHERE identity_hash REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PERSON_NAME", "PII": ["Heather", "Heather Mahalik", "H. Mahalik", "Bo"], "Num_of_PII": 4, "source_columns": ["Tokens_content.c0contact_id", "Tokens_content.c1value", "Tokens_docsize.docid", "Tokens_segdir.level", "Tokens_segdir.idx", "android_metadata.locale"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["Bo"], ["en_US"]], "Total_raw_rows": 6, "Exploration_sql": "Based on the schema of the tables, the following columns may contain person names:\n1. Contacts table: contact_id, value\n2. Tokens_content table: c0contact_id, c1value\n3. Tokens_docsize table: docid\n4. Tokens_segdir table: level, idx\n5. android_metadata table: locale\n\nI will now search for person names in these columns.\nSELECT contact_id FROM Contacts WHERE contact_id REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT value FROM Contacts WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT c0contact_id FROM Tokens_content WHERE c0contact_id REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT docid FROM Tokens_docsize WHERE docid REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT level FROM Tokens_segdir WHERE level REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT idx FROM Tokens_segdir WHERE idx REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": "Based on the schema of the tables, the following columns may contain person names:\n1. Contacts table: contact_id, value\n2. Tokens_content table: c0contact_id, c1value\n3. Tokens_docsize table: docid\n4. Tokens_segdir table: level, idx\n5. android_metadata table: locale\nI will now search for person names in these columns.\nSELECT contact_id FROM Contacts WHERE contact_id REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT value FROM Contacts WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT c0contact_id FROM Tokens_content WHERE c0contact_id REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT docid FROM Tokens_docsize WHERE docid REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT level FROM Tokens_segdir WHERE level REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT idx FROM Tokens_segdir WHERE idx REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the database schema, the following tables and columns may contain US postal addresses:\n- Table: Contacts\n - Columns: contact_id, value, affinity, field_type\n\nTo search for US postal addresses in these tables, we can use the REGEXP function with a pattern matching the address components. Let's proceed with the SQL query.\n```sql\nSELECT contact_id, value, affinity, field_type\nFROM Contacts\nWHERE value REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the columns in the BOOKMARKS table that might contain email addresses are: URL, SURL, TAGS, ACCOUNT_NAME, and ACCOUNT_TYPE.\n\nTo search for possible email addresses in these columns, you can use the following SQL query:\n\n```sql\nSELECT URL FROM BOOKMARKS WHERE URL REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT SURL FROM BOOKMARKS WHERE SURL REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ACCOUNT_TYPE FROM BOOKMARKS WHERE ACCOUNT_TYPE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n```\n\nThis query will search for email addresses in the specified columns of the BOOKMARKS table.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The 'BOOKMARKS' table in the database contains columns such as URL, TITLE, TAGS, ACCOUNT_NAME, and DESCRIPTION. To search for US phone numbers in these columns, we can use the following SQL query:\n\n```sql\nSELECT URL FROM BOOKMARKS WHERE URL REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT DESCRIPTION FROM BOOKMARKS WHERE DESCRIPTION REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\n```\n\nThis query will search for US phone numbers in the URL, TITLE, TAGS, ACCOUNT_NAME, and DESCRIPTION columns of the 'BOOKMARKS' table.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The 'BOOKMARKS' table in the database contains several columns. To find possible usernames, we can search the following columns for short textual identifiers that do not include whitespace and are intended for human recognition:\n- ACCOUNT_NAME\n- ACCOUNT_TYPE\n- TAGS\n- SYNC1\n- SYNC2\n- SYNC3\n- SYNC4\n- SYNC5\n- keyword\n- description\n- guid\n\nWe will search these columns for potential usernames using the REGEXP pattern matching.\n```sql\nSELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ACCOUNT_TYPE FROM BOOKMARKS WHERE ACCOUNT_TYPE REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SYNC1 FROM BOOKMARKS WHERE SYNC1 REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SYNC2 FROM BOOKMARKS WHERE SYNC2 REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SYNC3 FROM BOOKMARKS WHERE SYNC3 REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SYNC4 FROM BOOKMARKS WHERE SYNC4 REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SYNC5 FROM BOOKMARKS WHERE SYNC5 REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT keyword FROM BOOKMARKS WHERE keyword REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT description FROM BOOKMARKS WHERE description REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT guid FROM BOOKMARKS WHERE guid REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the columns that may contain person names are not present in the BOOKMARKS and android_metadata tables. If you have additional tables or specific columns in mind where you suspect person names might be stored, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [[{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAx0od46RvJj3ZMpmE/r++aNuxFfDaTafncAW0XddYSB0WkI7vryB4lplJKYOFVJvriCJ54MlN56/+r6ZnwIIKx3TF4rvHTUNRIc9LKLCfh5hqUwF5ebYY+wMqebfiqMSY="}]], "Total_raw_rows": 1, "Exploration_sql": "The table \"BOOKMARKS\" in the database contains columns that might potentially have US postal addresses. To search for US postal addresses in the database, we can query specific columns in the \"BOOKMARKS\" table. Let's proceed with searching for US postal addresses in relevant columns of the \"BOOKMARKS\" table.\n```sql\nSELECT URL FROM BOOKMARKS WHERE URL REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "EMAIL", "PII": ["sharononeil368@gmail.com"], "Num_of_PII": 1, "source_columns": ["BOOKMARKS.ACCOUNT_TYPE", "INTERNET_SYNC.SYNC_KEY", "SYNC_STATE.account_name", "TABS.ACCOUNT_NAME"], "Raw_rows_first_100": [["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"]], "Total_raw_rows": 5, "Exploration_sql": "The following columns may contain email addresses:\n- BOOKMARKS: ACCOUNT_NAME, ACCOUNT_TYPE\n- INTERNET_SYNC: SYNC_KEY\n- SYNC_STATE: account_name\n- TABS: ACCOUNT_NAME\n\nYou can use the following SQL query to search for email addresses in these columns:\n```sql\nSELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ACCOUNT_TYPE FROM BOOKMARKS WHERE ACCOUNT_TYPE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ACCOUNT_NAME FROM TABS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "The following columns may contain email addresses:\n- BOOKMARKS: ACCOUNT_NAME, ACCOUNT_TYPE\n- INTERNET_SYNC: SYNC_KEY\n- SYNC_STATE: account_name\n- TABS: ACCOUNT_NAME\nYou can use the following SQL query to search for email addresses in these columns:\n```sql\nSELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ACCOUNT_TYPE FROM BOOKMARKS WHERE ACCOUNT_TYPE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ACCOUNT_NAME FROM TABS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://www.pinterest.com/pin/410812797236816112/"]], "Total_raw_rows": 1, "Exploration_sql": "Based on the schema of the available tables, the following columns may contain US phone numbers:\n- In the BOOKMARKS table: URL, TITLE, TAGS\n- In the INTERNET_SYNC table: SYNC_KEY\n- In the SYNC_STATE table: SYNC_VALUE\n- In the TABS table: TAB_URL, TAB_TITLE\n- In the android_metadata table: No relevant columns\n\nNow, I will construct SQL queries to search for US phone numbers in these columns.\n```sql\nSELECT URL FROM BOOKMARKS WHERE URL REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT SYNC_VALUE FROM SYNC_STATE WHERE SYNC_VALUE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT TAB_URL FROM TABS WHERE TAB_URL REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT TAB_TITLE FROM TABS WHERE TAB_TITLE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the following columns may contain usernames:\n- BOOKMARKS: ACCOUNT_NAME\n- INTERNET_SYNC: SYNC_KEY\n- SYNC_STATE: account_name\n- TABS: ACCOUNT_NAME\n- android_metadata: No relevant columns for usernames\n\nTo search for possible usernames, you can use the following SQL query:\n```sql\nSELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ACCOUNT_NAME FROM TABS WHERE ACCOUNT_NAME REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["sync_internet_data"], ["sync_bookmarks"], ["sync_open_pages"], ["sync_saved_pages"], ["SBROWSER_TAB1724467631361__BROWSER1724467632107__SBROWSER_SAVEDPAGES1724467635256__QUICKACCESS_SYNC_V21724467633471__SBROWSER_HISTORY1724467634746__"], ["Pin on Simon, God of Hairdos"], ["puck from.glee - Google Search"], ["Midjourney AI - Free Image Generator"], ["billie eilish birds of a feather lyrics - Google Search"]], "Total_raw_rows": 9, "Exploration_sql": "Based on the schema of the tables, the following columns may contain person names:\n- BOOKMARKS: TITLE, TAGS\n- INTERNET_SYNC: SYNC_KEY\n- SYNC_STATE: data\n- TABS: TAB_TITLE\n\nTo search for person names in these columns, you can use the following SQL query:\n\n```sql\nSELECT TITLE AS person_name FROM BOOKMARKS WHERE TITLE REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT TAGS AS person_name FROM BOOKMARKS WHERE TAGS REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT SYNC_KEY AS person_name FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT data AS person_name FROM SYNC_STATE WHERE data REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT TAB_TITLE AS person_name FROM TABS WHERE TAB_TITLE REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there is no specific column that directly indicates the presence of a US postal address. However, we can search through text fields in these tables to find possible US postal addresses. Let's search through the text fields in these tables for US postal addresses.\nSELECT URL FROM BOOKMARKS WHERE URL REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b' UNION ALL \nSELECT SYNC_VALUE FROM INTERNET_SYNC WHERE SYNC_VALUE REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b' UNION ALL \nSELECT data FROM SYNC_STATE WHERE data REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b' UNION ALL \nSELECT TAB_URL FROM TABS WHERE TAB_URL REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b' UNION ALL \nSELECT locale FROM android_metadata WHERE locale REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of email addresses. It seems that the tables 'android_metadata' and 'searchengine' do not contain email addresses. If you have any other tables in mind that may contain email addresses, please provide the table names for further investigation.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate messages, chats, or other text fields where US phone numbers might be stored. Therefore, it is not possible to search for US phone numbers in the current databases.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, we will search for possible usernames in the following columns using REGEXP pattern matching:\n- android_metadata: locale\n- searchengine: title, url, image_url\n\nHere is the SQL query:\n```sql\nSELECT locale AS possible_username FROM android_metadata WHERE locale REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT title AS possible_username FROM searchengine WHERE title REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT url AS possible_username FROM searchengine WHERE url REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT image_url AS possible_username FROM searchengine WHERE image_url REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://duckduckgo.com/favicon.ico"], ["https://home.imgsmail.ru/resplash/123689/i/meta/favicon.ico"], ["https://m.toutiao.com/favicon.ico"], ["https://p0.ssl.qhimg.com/d/inn/128c749e/icon.png"], ["https://search.daum.net/favicon.ico"], ["https://search.naver.com/favicon.ico"], ["https://search.seznam.cz/re/media/favicon.192a42730e.ico"], ["https://search.yahoo.com/favicon.ico"], ["https://sm01.alicdn.com/L1/272/1990/favicon/favicon.ico"], ["https://www.baidu.com/favicon.ico"]], "Total_raw_rows": 10, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate person names. To further explore the database for person names, we can focus on text fields such as 'title', 'url', 'extra1', 'extra2', and 'extra3' in the 'searchengine' table. Let's search these columns for possible person names. \n\n```sql\nSELECT title FROM searchengine WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT url FROM searchengine WHERE url REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT extra1 FROM searchengine WHERE extra1 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT extra2 FROM searchengine WHERE extra2 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT extra3 FROM searchengine WHERE extra3 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of US postal addresses. If you have any specific tables or columns in mind where you suspect the addresses might be stored, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the following columns may contain email addresses:\n- ZLINKTOKEN in ZWAAGGREGATECALLEVENT table\n- ZGROUPCALLCREATORUSERJIDSTRING in ZWACDCALLEVENT table\n- ZJIDSTRING in ZWACDCALLEVENTPARTICIPANT table\n\nTo search for email addresses in these columns, you can use the following SQL query:\n```sql\nSELECT ZLINKTOKEN AS email FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS email FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZJIDSTRING AS email FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there is no clear indication of columns that may contain text fields such as messages or chats where US phone numbers could be stored. To proceed with searching for US phone numbers, we may need to explore additional tables or columns that are not listed in the current schema. Let's continue the exploration.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The columns in the relevant tables are as follows:\n- ZWAAGGREGATECALLEVENT: ZINCOMING, ZMISSED, ZMISSEDREASON, ZVIDEO, ZFIRSTDATE, ZLINKTOKEN\n- ZWACDCALLEVENT: ZBYTESRECEIVED, ZBYTESSENT, ZISLIGHTWEIGHT, ZOUTCOME, Z1CALLEVENTS, Z_FOK_1CALLEVENTS, ZDATE, ZDURATION, ZCALLIDSTRING, ZGROUPCALLCREATORUSERJIDSTRING, ZGROUPJIDSTRING, ZSCHEDULEDID\n- ZWACDCALLEVENTPARTICIPANT: ZOUTCOME, Z1PARTICIPANTS, Z_FOK_1PARTICIPANTS, ZJIDSTRING\n\nTo find possible usernames, we will search these columns for short textual identifiers that do not contain whitespace and are intended for human recognition. Let's construct the SQL query.\nSELECT ZLINKTOKEN AS username FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZCALLIDSTRING AS username FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS username FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZGROUPJIDSTRING AS username FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZJIDSTRING AS username FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["3C399CDDAF11A41F7AFF2892E0A4B10C"], ["3C37CBFE11C261E6CD80C2DE7834D770"], ["372FA57E129467051E04B3E4DD5A26D5"], ["3A6DF670F7121CD6D08B"], ["3A9CEF8B4996D645358B"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 14, "Exploration_sql": "Based on the schema of the tables, the following columns may contain person names:\n- ZWAAGGREGATECALLEVENT: ZLINKTOKEN\n- ZWACDCALLEVENT: ZCALLIDSTRING, ZGROUPCALLCREATORUSERJIDSTRING\n- ZWACDCALLEVENTPARTICIPANT: ZJIDSTRING\n\nTo search for person names in these columns, you can use the following SQL query:\n\n```sql\nSELECT ZLINKTOKEN AS PersonName FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZCALLIDSTRING AS PersonName FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS PersonName FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZJIDSTRING AS PersonName FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the potential columns where US postal addresses might be found are as follows:\n- ZWAAGGREGATECALLEVENT: ZLINKTOKEN\n- ZWACDCALLEVENT: ZCALLIDSTRING\n- ZWACDCALLEVENTPARTICIPANT: ZJIDSTRING\n\nI will now construct SQL queries to search for US postal addresses in these columns.\n```sql\nSELECT ZLINKTOKEN AS US_POSTAL_ADDRESS FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT ZCALLIDSTRING AS US_POSTAL_ADDRESS FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT ZJIDSTRING AS US_POSTAL_ADDRESS FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I1_ChatStorage.sqlite", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["0@s.whatsapp.net"], ["120363021860168333@g.us"], ["120363166957275373@g.us"], ["120363171979772631@g.us"], ["120363297701499017@g.us"], ["120363304649477491@g.us"], ["120363313118297318@g.us"], ["120363320717891109@g.us"], ["12068996918-1583025771@g.us"], ["12608942032@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["15162879924@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["60183723602@s.whatsapp.net"], ["5359042582@s.whatsapp.net"], ["6285791909576@s.whatsapp.net"], ["16052709346@s.whatsapp.net"], ["16052709346@s.whatsapp.net"], ["17852533080@s.whatsapp.net"], ["5359042582@s.whatsapp.net"], ["5359042582@s.whatsapp.net"], ["6288219778388@s.whatsapp.net"], ["447774218634@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["15162879924@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["60183723602@s.whatsapp.net"], ["5359042582@s.whatsapp.net"], ["628983529854@s.whatsapp.net"], ["16052709346@s.whatsapp.net"], ["16052709346@s.whatsapp.net"], ["12018466978@s.whatsapp.net"], ["12022588062@s.whatsapp.net"], ["12026511035@s.whatsapp.net"], ["12027132090@s.whatsapp.net"], ["12027444937@s.whatsapp.net"], ["12034004949@s.whatsapp.net"], ["12035031470@s.whatsapp.net"], ["12035031470@s.whatsapp.net"], ["12037040819@s.whatsapp.net"], ["12037069838@s.whatsapp.net"]], "Total_raw_rows": 43, "Exploration_sql": "Based on the schema of the tables, the following columns may contain email addresses:\n- ZJID in ZWACHATPUSHCONFIG\n- ZCREATORJID, ZOWNERJID, ZCONTACTJID in ZWACHATSESSION\n- ZCREATORJID, ZOWNERJID, ZSOURCEJID, ZSUBJECTOWNERJID in ZWAGROUPINFO\n- ZMEMBERJID in ZWAGROUPMEMBER\n\nYou can use the following SQL query to search for email addresses in these columns:\n```sql\nSELECT ZJID AS email FROM ZWACHATPUSHCONFIG WHERE ZJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZCREATORJID AS email FROM ZWACHATSESSION WHERE ZCREATORJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZOWNERJID AS email FROM ZWACHATSESSION WHERE ZOWNERJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZCONTACTJID AS email FROM ZWACHATSESSION WHERE ZCONTACTJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZCREATORJID AS email FROM ZWAGROUPINFO WHERE ZCREATORJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZOWNERJID AS email FROM ZWAGROUPINFO WHERE ZOWNERJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZSOURCEJID AS email FROM ZWAGROUPINFO WHERE ZSOURCEJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZSUBJECTOWNERJID AS email FROM ZWAGROUPINFO WHERE ZSUBJECTOWNERJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZMEMBERJID AS email FROM ZWAGROUPMEMBER WHERE ZMEMBERJID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I1_ChatStorage.sqlite", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["120363021860168333@g.us"], ["120363150265582047@newsletter"], ["120363166957275373@g.us"], ["120363169975121665@newsletter"], ["120363171979772631@g.us"], ["120363297701499017@g.us"], ["120363304649477491@g.us"], ["120363313118297318@g.us"], ["120363320717891109@g.us"], ["12068996918-1583025771@g.us"], ["+1 (971) 678-6701"], ["100021315842277@lid"], ["100188802781436@lid"], ["100618467295310@lid"], ["100639707246710@lid"], ["100811522703520@lid"], ["101060681162912@lid"], ["101090964033567@lid"], ["101189580492820@lid"], ["101266856378468@lid"], ["101310208712878@lid"], ["19735203731-1612395525@g.us"], ["15162879924-1612888425@g.us"], ["19735203731-1611101165@g.us"], ["12068996918-1583025771@g.us"], ["15162879924-1612888425@g.us"], ["12068996918-1583025771@g.us"], ["19735203731-1612395525@g.us"], ["19735203731-1611101165@g.us"], ["12068996918-1583025771@g.us"], ["15162879924-1612888425@g.us"], ["Need a package picked up at 12503 E Via De Palmas, Chandler, AZ on Tuesday and taken to 8500 Peña Blvd, Denver, CO ask the bartender at Mesa Verde Bar “where are the goats around here?” He’ll tell where to drop the package, COD at the drop off spot"], ["17852533080@s.whatsapp.net"], ["https://x.com/emergencystream/status/1800602193025769961?s=46"], ["{\"auto_add_disabled\":true,\"author\":\"5359042582@s.whatsapp.net\",\"show_membership_string\":false,\"is_initially_empty\":false,\"context_group\":null,\"parent_group_jid\":\"120363294790600721@g.us\",\"should_use_identity_header\":false,\"reason\":4,\"parent_group_name\":\"Citi tudy group209\",\"is_parent_group_general_chat\":false,\"is_open_group\":false,\"subject\":null}"], ["{\"is_open_group\":false,\"parent_group_jid\":\"120363294790600721@g.us\",\"reason\":0,\"auto_add_disabled\":true,\"should_use_identity_header\":false,\"author\":\"5359042582@s.whatsapp.net\",\"is_initially_empty\":false,\"is_parent_group_general_chat\":false,\"parent_group_name\":\"Citi tudy group209\",\"subject\":null,\"context_group\":null,\"show_membership_string\":false}"], ["13412133458@s.whatsapp.net"], ["13412133458@s.whatsapp.net"], ["13213147461@s.whatsapp.net"], ["13412133458@s.whatsapp.net"], ["17625243488@s.whatsapp.net"]], "Total_raw_rows": 41, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US phone numbers:\n\n1. Table: ZWACHATSESSION\n - Columns: ZCONTACTIDENTIFIER, ZCONTACTJID, ZLASTMESSAGETEXT, ZPARTNERNAME\n\n2. Table: ZWAGROUPMEMBER\n - Columns: ZCONTACTIDENTIFIER, ZMEMBERJID\n\n3. Table: ZWAMESSAGE\n - Columns: ZFROMJID, ZTEXT, ZTOJID\n\nTo search for US phone numbers in these tables, you can use the following SQL query:\n\n```sql\nSELECT ZCONTACTIDENTIFIER FROM ZWACHATSESSION WHERE ZCONTACTIDENTIFIER REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZCONTACTJID FROM ZWACHATSESSION WHERE ZCONTACTJID REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZLASTMESSAGETEXT FROM ZWACHATSESSION WHERE ZLASTMESSAGETEXT REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZPARTNERNAME FROM ZWACHATSESSION WHERE ZPARTNERNAME REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZCONTACTIDENTIFIER FROM ZWAGROUPMEMBER WHERE ZCONTACTIDENTIFIER REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZMEMBERJID FROM ZWAGROUPMEMBER WHERE ZMEMBERJID REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZFROMJID FROM ZWAMESSAGE WHERE ZFROMJID REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZTEXT FROM ZWAMESSAGE WHERE ZTEXT REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZTOJID FROM ZWAMESSAGE WHERE ZTOJID REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\n```\n\nThis query will search for US phone numbers in the specified columns of the mentioned tables.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I1_ChatStorage.sqlite", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the following columns may contain usernames:\n- ZJID in ZWACHATPUSHCONFIG\n- ZCONTACTIDENTIFIER in ZWACHATSESSION\n- ZCREATORJID and ZOWNERJID in ZWAGROUPINFO\n- ZCONTACTIDENTIFIER and ZMEMBERJID in ZWAGROUPMEMBER\n- ZMEMBERJIDS in ZWAGROUPMEMBERSCHANGE\n- ZAUTHORNAME in ZWAMEDIAITEM\n- ZFROMJID and ZTOJID in ZWAMESSAGE\n- ZJID in ZWAPROFILEPUSHNAME\n\nYou can search for possible usernames in these columns using the following SQL query:\n```sql\nSELECT ZJID AS username FROM ZWACHATPUSHCONFIG WHERE ZJID REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZCONTACTIDENTIFIER AS username FROM ZWACHATSESSION WHERE ZCONTACTIDENTIFIER REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZCREATORJID AS username FROM ZWAGROUPINFO WHERE ZCREATORJID REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZOWNERJID AS username FROM ZWAGROUPINFO WHERE ZOWNERJID REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZCONTACTIDENTIFIER AS username FROM ZWAGROUPMEMBER WHERE ZCONTACTIDENTIFIER REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZMEMBERJID AS username FROM ZWAGROUPMEMBER WHERE ZMEMBERJID REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZMEMBERJIDS AS username FROM ZWAGROUPMEMBERSCHANGE WHERE ZMEMBERJIDS REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZAUTHORNAME AS username FROM ZWAMEDIAITEM WHERE ZAUTHORNAME REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZFROMJID AS username FROM ZWAMESSAGE WHERE ZFROMJID REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZTOJID AS username FROM ZWAMESSAGE WHERE ZTOJID REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT ZJID AS username FROM ZWAPROFILEPUSHNAME WHERE ZJID REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I1_ChatStorage.sqlite", "PII_type": "PERSON_NAME", "PII": ["Finn", "Ronen Engler", "John Reynolds", "Colin DaCopps", "Russell Philby", "Lisena Gocaj", "Andy Sieg", "Howell", "Yaliweisi", "Abner", "Andy Schweichert", "Brian Arseneau", "Virginia", "Christian Justiniano", "Jim Wilson", "Virginia Benton", "Abe Rudder", "Jason", "Sharon Oneil", "Job Vizcarra", "Robert Elliott", "Sultan", "Emerick", "Nia Yuniar", "David Wilson", "Robechucks Raul", "Ella Bella", "Dick Oscar", "Charlie", "Steven", "Ameya Joshi", "Amiel Williamson", "Ashwin Menon", "Ajax Edmiston", "Eleazar Lewden", "Polly Lucas", "Lemuel Glasgow", "Bazel McConnel", "William Stevenson", "Denice R Allen", "Leif Fox", "William Hopkins", "Jonas Bradley", "Amit Sharma"], "Num_of_PII": 44, "source_columns": ["ZWAGROUPMEMBER.ZCONTACTNAME", "ZWAGROUPMEMBER.ZFIRSTNAME", "ZWAMEDIAITEM.ZAUTHORNAME", "ZWAPROFILEPUSHNAME.ZPUSHNAME"], "Raw_rows_first_100": [["Finn"], ["Ronen Engler"], ["John Reynolds"], ["Colin DaCopps"], ["Russell Philby"], ["WMzaMoVZnL"], ["Lisena Gocaj"], ["Lisena Gocaj"], ["Lisena Gocaj"], ["Andy Sieg"], ["Howell"], ["Yaliweisi"], ["Andy Sieg"], ["Abner"], ["Andy Schweichert"], ["Lisena Gocaj"], ["Andy Sieg"], ["Brian Arseneau"], ["Virginia"], ["Christian Justiniano"], ["Lisena Gocaj"], ["Jim Wilson"], ["Lisena Gocaj"], ["Virginia Benton"], ["Howell"], ["Lisena"], ["Yaliweisi"], ["Abner"], ["Abe Rudder"], ["Virginia"], ["Jason"], ["Sharon Oneil"], ["Job Vizcarra"], ["Robert Elliott"], ["Sultan"], ["Emerick"], ["Nia Yuniar"], ["skol"], ["David Wilson"], ["Robechucks Raul"], ["Ella Bella"], ["Dick Oscar"], ["Charlie"], ["Steven"], ["Ameya Joshi"], ["Robechucks Raul"], ["Robechucks Raul"], ["Amiel Williamson"], ["Ashwin Menon"], ["Ajax Edmiston"], ["Eleazar Lewden"], ["Polly Lucas"], ["Eleazar Lewden"], ["Robechucks Raul"], ["Lemuel Glasgow"], ["Bazel McConnel"], ["William Stevenson"], ["Robechucks Raul"], ["Denice R Allen"], ["Leif Fox"], ["William Hopkins"], ["Robechucks Raul"], ["Jonas Bradley"], ["Robechucks Raul"], ["Amit Sharma"]], "Total_raw_rows": 65, "Exploration_sql": "Based on the schema of the tables in the database, the following columns have the potential to contain person names:\n- ZPARTNERNAME in ZWACHATSESSION table\n- ZCONTACTNAME and ZFIRSTNAME in ZWAGROUPMEMBER table\n- ZAUTHORNAME in ZWAMEDIAITEM table\n- ZPUSHNAME in ZWAPROFILEPUSHNAME table\n\nTo search for person names in these columns, you can use the following SQL query:\n```sql\nSELECT ZPARTNERNAME AS person_name FROM ZWACHATSESSION WHERE ZPARTNERNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZCONTACTNAME AS person_name FROM ZWAGROUPMEMBER WHERE ZCONTACTNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZFIRSTNAME AS person_name FROM ZWAGROUPMEMBER WHERE ZFIRSTNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZAUTHORNAME AS person_name FROM ZWAMEDIAITEM WHERE ZAUTHORNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZPUSHNAME AS person_name FROM ZWAPROFILEPUSHNAME WHERE ZPUSHNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": "Based on the schema of the tables in the database, the following columns have the potential to contain person names:\n- ZPARTNERNAME in ZWACHATSESSION table\n- ZCONTACTNAME and ZFIRSTNAME in ZWAGROUPMEMBER table\n- ZAUTHORNAME in ZWAMEDIAITEM table\n- ZPUSHNAME in ZWAPROFILEPUSHNAME table\nTo search for person names in these columns, you can use the following SQL query:\n```sql\nSELECT ZPARTNERNAME AS person_name FROM ZWACHATSESSION WHERE ZPARTNERNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZCONTACTNAME AS person_name FROM ZWAGROUPMEMBER WHERE ZCONTACTNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZFIRSTNAME AS person_name FROM ZWAGROUPMEMBER WHERE ZFIRSTNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZAUTHORNAME AS person_name FROM ZWAMEDIAITEM WHERE ZAUTHORNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZPUSHNAME AS person_name FROM ZWAPROFILEPUSHNAME WHERE ZPUSHNAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I1_ChatStorage.sqlite", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US postal addresses:\n- Table: ZWACHATSESSION\n - Columns: ZLASTMESSAGETEXT, ZPARTNERNAME\n\n- Table: ZWAMESSAGE\n - Columns: ZTEXT\n\nTo search for US postal addresses in these tables, we can use the following SQL queries:\n```sql\nSELECT ZLASTMESSAGETEXT, ZPARTNERNAME FROM ZWACHATSESSION WHERE ZLASTMESSAGETEXT REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT ZTEXT FROM ZWAMESSAGE WHERE ZTEXT REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the database schema, there are no columns that directly indicate the presence of email addresses. To further explore the possibility of finding email addresses, additional tables or columns need to be examined. Let's proceed with checking other tables for email addresses.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate messages, chats, or other text fields where US phone numbers might be stored. Therefore, it seems that the tables provided may not contain the information needed to find US phone numbers. If you have any other tables or specific columns in mind where US phone numbers might be stored, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The columns in the databases are as follows:\n- ABFullSizeImage: record_id, crop_x, crop_y, crop_width, data\n- ABThumbnailImage: record_id, format, derived_from_format, data\n- _SqliteDatabaseProperties: key, value\n\nI will now search for possible usernames in these columns.\nSELECT record_id FROM ABFullSizeImage WHERE record_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT record_id FROM ABThumbnailImage WHERE record_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT value FROM _SqliteDatabaseProperties WHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of person names. To further explore the database for person names, additional tables related to messages, chats, or contacts may need to be examined. Let's proceed with checking other tables for person names.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate text fields or messages where a US postal address might be stored. If you have any specific tables or columns in mind where you suspect the US postal address might be present, please provide that information for further investigation.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["B2@2D02\\\u0002NP*.Z\u0001\f\u0002\t\u0001Ü\u000b\u0002Ü\b"]], "Total_raw_rows": 1, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain email addresses:\n- ABPerson (Columns: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, FirstSort, LastSort, DisplayName, ImageURI, WallpaperURI)\n- ABMultiValueEntry (Column: value)\n- ABStore (Column: ProviderIdentifier)\n\nTo search for email addresses in these tables, you can use the following SQL query:\n\n```sql\nSELECT First FROM ABPerson WHERE First REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Last FROM ABPerson WHERE Last REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Middle FROM ABPerson WHERE Middle REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT FirstPhonetic FROM ABPerson WHERE FirstPhonetic REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT MiddlePhonetic FROM ABPerson WHERE MiddlePhonetic REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT LastPhonetic FROM ABPerson WHERE LastPhonetic REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Organization FROM ABPerson WHERE Organization REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Department FROM ABPerson WHERE Department REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Note FROM ABPerson WHERE Note REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT JobTitle FROM ABPerson WHERE JobTitle REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Nickname FROM ABPerson WHERE Nickname REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Prefix FROM ABPerson WHERE Prefix REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Suffix FROM ABPerson WHERE Suffix REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT FirstSort FROM ABPerson WHERE FirstSort REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT LastSort FROM ABPerson WHERE LastSort REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT DisplayName FROM ABPerson WHERE DisplayName REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ImageURI FROM ABPerson WHERE ImageURI REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT WallpaperURI FROM ABPerson WHERE WallpaperURI REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT value FROM ABMultiValueEntry WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ProviderIdentifier FROM ABStore WHERE ProviderIdentifier REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["16133 NE 44th Ct. "], ["98052"]], "Total_raw_rows": 2, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US phone numbers:\n\n1. Table: ABPerson\n - Columns: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, FirstSort, LastSort, DisplayName, ImageURI, guid\n\n2. Table: ABMultiValueEntry\n - Column: value\n\n3. Table: ABPhoneLastFour\n - Column: value\n\nTo search for US phone numbers in these tables and columns, you can use the following SQL queries:\n\n```sql\nSELECT First FROM ABPerson WHERE First REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Last FROM ABPerson WHERE Last REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Middle FROM ABPerson WHERE Middle REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT FirstPhonetic FROM ABPerson WHERE FirstPhonetic REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT MiddlePhonetic FROM ABPerson WHERE MiddlePhonetic REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT LastPhonetic FROM ABPerson WHERE LastPhonetic REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Organization FROM ABPerson WHERE Organization REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Department FROM ABPerson WHERE Department REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Note FROM ABPerson WHERE Note REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT FirstSort FROM ABPerson WHERE FirstSort REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT LastSort FROM ABPerson WHERE LastSort REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT DisplayName FROM ABPerson WHERE DisplayName REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ImageURI FROM ABPerson WHERE ImageURI REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT value FROM ABMultiValueEntry WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT value FROM ABPhoneLastFour WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the columns that may contain usernames are as follows:\n- ABAccount: AccountIdentifier\n- ABGroup: Name\n- ABGroupMembers: No potential username column found\n- ABMultiValue: value\n- ABMultiValueEntry: value\n- ABPerson: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, DisplayName\n- ABPersonSearchKey: SearchKey\n- ABPhoneLastFour: value\n- ClientCursor: No potential username column found\n- ClientSequence: No potential username column found\n\nTo search for possible usernames, you can use the following SQL query:\n```sql\nSELECT AccountIdentifier AS username FROM ABAccount WHERE AccountIdentifier REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Name AS username FROM ABGroup WHERE Name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value AS username FROM ABMultiValue WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value AS username FROM ABMultiValueEntry WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT First AS username FROM ABPerson WHERE First REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Last AS username FROM ABPerson WHERE Last REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Middle AS username FROM ABPerson WHERE Middle REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT FirstPhonetic AS username FROM ABPerson WHERE FirstPhonetic REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT MiddlePhonetic AS username FROM ABPerson WHERE MiddlePhonetic REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT LastPhonetic AS username FROM ABPerson WHERE LastPhonetic REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Organization AS username FROM ABPerson WHERE Organization REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Department AS username FROM ABPerson WHERE Department REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Note AS username FROM ABPerson WHERE Note REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT JobTitle AS username FROM ABPerson WHERE JobTitle REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Nickname AS username FROM ABPerson WHERE Nickname REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Prefix AS username FROM ABPerson WHERE Prefix REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT Suffix AS username FROM ABPerson WHERE Suffix REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT DisplayName AS username FROM ABPerson WHERE DisplayName REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT SearchKey AS username FROM ABPersonSearchKey WHERE SearchKey REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value AS username FROM ABPhoneLastFour WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\n```\nThis query will search for potential usernames in the specified columns of the respective tables.", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["16133 NE 44th Ct. "], ["us"], ["Redmond"], ["WA"], ["United States"], ["_$!<Mobile>!$_"], ["_$!<Home>!$_"], ["_$!<Other>!$_"], ["NA OG"], ["GenericGPT"]], "Total_raw_rows": 10, "Exploration_sql": "The following columns in the database tables may contain person names:\n- ABPerson: First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, DisplayName, PreviousFamilyName\n- ABMultiValueEntry: value\n- ABMultiValueLabel: value\n- ABGroupMembers: member_id\n- ABGroup: Name\n\nYou can use the following SQL query to search for person names in these columns:\n```sql\nSELECT First, Last, Middle, FirstPhonetic, MiddlePhonetic, LastPhonetic, Organization, Department, Note, JobTitle, Nickname, Prefix, Suffix, DisplayName, PreviousFamilyName FROM ABPerson WHERE First REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Last REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Middle REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR FirstPhonetic REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR MiddlePhonetic REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR LastPhonetic REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Organization REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Department REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Note REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR JobTitle REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Nickname REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Prefix REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR Suffix REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR DisplayName REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' OR PreviousFamilyName REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT value FROM ABMultiValueEntry WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT value FROM ABMultiValueLabel WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT member_id FROM ABGroupMembers WHERE member_id REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT Name FROM ABGroup WHERE Name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBook.sqlitedb", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following tables and columns have the potential to contain US postal addresses:\n\n1. Table: ABPerson\n - Columns: First, Last, Middle, Organization, Department, Note, FirstSort, LastSort, CompositeNameFallback, Address\n\n2. Table: ABMultiValueEntry\n - Columns: value\n\n3. Table: ABMultiValueLabel\n - Columns: value\n\nTo search for US postal addresses in these tables, you can use the following SQL queries:\n\n```sql\nSELECT First, Last, Middle, Organization, Department, Note, FirstSort, LastSort, CompositeNameFallback, Address\nFROM ABPerson\nWHERE Address REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT value\nFROM ABMultiValueEntry\nWHERE value REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n\nUNION ALL\n\nSELECT value\nFROM ABMultiValueLabel\nWHERE value REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\n```\n\nThese queries will search for US postal addresses in the specified columns of the respective tables.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The tables and columns in the database are as follows:\n- Table: cloud_tab_devices\n - Columns: device_uuid (TEXT), system_fields (BLOB), device_name (TEXT), has_duplicate_device_name (BOOLEAN), is_ephemeral_device (BOOLEAN), last_modified (REAL)\n \n- Table: cloud_tabs\n - Columns: tab_uuid (TEXT), system_fields (BLOB), device_uuid (TEXT), position (BLOB), title (TEXT), url (TEXT), is_showing_reader (BOOLEAN), is_pinned (BOOLEAN), reader_scroll_position_page_index (INTEGER), scene_id (TEXT)\n \n- Table: metadata\n - Columns: key (TEXT), value (TEXT)\n\nTo find possible email addresses in the database, we will search through the columns in these tables. Let's proceed with the SQL query to search for email addresses.\nSELECT device_uuid FROM cloud_tab_devices WHERE device_uuid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT title FROM cloud_tabs WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT value FROM metadata WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "There are no additional tables available in the database that could potentially contain text data where US phone numbers might be stored. Without specific text fields to search for US phone numbers, it is not possible to directly query for them. If you have any specific tables or columns in mind where US phone numbers might be stored, please provide that information for further exploration.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["falafel hardboiled egg israel - Google Search"], ["Dickens Cider is now Dickins Cider Company | Hard Cider Drinks | Dickens Cider"], ["Blue Bite | Connecting Possibility"], ["Home page - Mapat"], ["snack with dairy kids - Google Search"], ["figs growing green not ripe - Google Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["How to Change a Light Bulb"], ["Tolls"], ["ravensmanorexperience.com"]], "Total_raw_rows": 10, "Exploration_sql": "The columns in the databases are as follows:\n- Table: cloud_tab_devices\n - device_uuid (TEXT)\n - system_fields (BLOB)\n - device_name (TEXT)\n - has_duplicate_device_name (BOOLEAN)\n - is_ephemeral_device (BOOLEAN)\n - last_modified (REAL)\n\n- Table: cloud_tabs\n - tab_uuid (TEXT)\n - system_fields (BLOB)\n - device_uuid (TEXT)\n - position (BLOB)\n - title (TEXT)\n - url (TEXT)\n - is_showing_reader (BOOLEAN)\n - is_pinned (BOOLEAN)\n - reader_scroll_position_page_index (INTEGER)\n - scene_id (TEXT)\n\n- Table: metadata\n - key (TEXT)\n - value (TEXT)\n\nTo find possible usernames, we will search for patterns in the text columns of these tables. Let's proceed with the SQL query.\nSELECT device_name FROM cloud_tab_devices WHERE device_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT title FROM cloud_tabs WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the database schema, the tables and columns that may contain person names are not directly related to messages, chats, or other text fields where names are commonly found. Therefore, it is recommended to explore other tables or databases that are more likely to contain person names. Let's focus on other databases or tables for this search.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The following tables and columns are available in the database:\n- Table: cloud_tab_devices\n - Columns: device_uuid TEXT, system_fields BLOB, device_name TEXT, has_duplicate_device_name BOOLEAN, is_ephemeral_device BOOLEAN, last_modified REAL\n\n- Table: cloud_tabs\n - Columns: tab_uuid TEXT, system_fields BLOB, device_uuid TEXT, position BLOB, title TEXT, url TEXT, is_showing_reader BOOLEAN, is_pinned BOOLEAN, reader_scroll_position_page_index INTEGER, scene_id TEXT\n\n- Table: metadata\n - Columns: key TEXT, value\n\nTo find US postal addresses in the database, we can search through text columns such as 'device_name', 'title', 'url', 'key', and 'value' in the tables 'cloud_tab_devices', 'cloud_tabs', and 'metadata'. Let's proceed with searching for US postal addresses in these columns.\n```sql\nSELECT device_name FROM cloud_tab_devices WHERE device_name REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\nUNION ALL\nSELECT title FROM cloud_tabs WHERE title REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\nUNION ALL\nSELECT url FROM cloud_tabs WHERE url REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\nUNION ALL\nSELECT value FROM metadata WHERE value REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the following columns may contain email addresses:\n- history_event_listeners: listener_name\n- history_items: url\n- history_items_to_tags: No relevant column\n- history_tags: No relevant column\n- history_visits: No relevant column\n- metadata: No relevant column\n\nTo search for email addresses in the mentioned columns, you can use the following SQL query:\n\n```sql\nSELECT listener_name AS email_address FROM history_event_listeners WHERE listener_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT url AS email_address FROM history_items WHERE url REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\n```\n\nThis query will search for potential email addresses in the 'listener_name' column of 'history_event_listeners' table and the 'url' column of the 'history_items' table.", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there is a possibility of finding US phone numbers in the following columns:\n- history_event_listeners: listener_name\n- history_items: url\n- history_items_to_tags: No relevant columns\n- history_tags: No relevant columns\n- history_visits: No relevant columns\n- metadata: No relevant columns\n\nI will now construct SQL queries to search for US phone numbers in the identified columns.\n```sql\nSELECT listener_name FROM history_event_listeners WHERE listener_name REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT url FROM history_items WHERE url REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\n```\nThis SQL query will search for US phone numbers in the 'listener_name' column of 'history_event_listeners' table and the 'url' column of 'history_items' table.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables, the following columns may contain usernames:\n- history_event_listeners: listener_name\n- history_items: url\n- history_items_to_tags: No potential username column\n- history_tags: identifier\n- history_visits: title\n- metadata: value\n\nTo search for possible usernames, you can use the following SQL query:\n```sql\nSELECT listener_name AS username FROM history_event_listeners WHERE listener_name REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT url AS username FROM history_items WHERE url REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT identifier AS username FROM history_tags WHERE identifier REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT title AS username FROM history_visits WHERE title REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'\nUNION ALL\nSELECT value AS username FROM metadata WHERE value REGEXP '\\\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://tickets.hersheypa.com/storefront/shop/ViewItems.aspx?CG=HPTKTS&C=HPTKTS&_gl=1*1sguq9m*_gcl_aw*R0NMLjE3MjM0OTA5NTQuQ2owS0NRanc1ZWExQmhDNkFSSXNBRU9HNXB5NE1nbEZtZHhiU0RhbEs0Z00tc3FUd0VGcEh1Z2NEWlZ5Z3N1d05aS0g2ekM0SzYtYmxURWFBaE44RUFMd193Y0I.*_gcl_dc*R0NMLjE3MjM0OTA5NTQuQ2owS0NRanc1ZWExQmhDNkFSSXNBRU9HNXB5NE1nbEZtZHhiU0RhbEs0Z00tc3FUd0VGcEh1Z2NEWlZ5Z3N1d05aS0g2ekM0SzYtYmxURWFBaE44RUFMd193Y0I.*_gcl_au*MTk5NzQyOTczOS4xNzIzNDgxMDgy*_ga*MTI1Mjg3ODg0Ni4xNzIzNDgxMDgy*_ga_LXCGZ9WB35*MTcyMzQ5MDk0Ny4yLjEuMTcyMzQ5MDk1OS40OC4wLjEyOTE0MTY0MTI.#3408579"], ["https://www.google.com/search?q=17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari"], ["https://www.google.com/search?q=17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari&dlnr=1&sei=GuOzZuy0NbWi5NoPtbmK0QU"], ["https://www.google.com/search?q=17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari&dlnr=1&sei=GuOzZuy0NbWi5NoPtbmK0QU#sbfbu=1&pi=17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K"], ["https://www.google.com/search?q=a%26e+nails&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari"], ["https://www.google.com/search?q=a%26e+nails&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari&dlnr=1&sei=OUW6ZqKwH6er5NoPrdaEkA0"], ["https://www.google.com/search?q=hersheypark+hours&client=safari&sca_esv=1926c2955f272b3e&hl=en-us&sxsrf=ADLYWIL5Cqe0vl7oGRIbN3u5ZfPrUMTiPw%3A1723065118580&ei=HuOzZvyFI9qr5NoProGloQ8&oq=hersheypark+hours&gs_lp=EhNtb2JpbGUtZ3dzLXdpei1zZXJwGgIYAiIRaGVyc2hleXBhcmsgaG91cnMyCxAAGIAEGLEDGIMBMgUQABiABDILEC4YgAQYxwEYrwEyCxAAGIAEGLEDGIMBMgUQABiABDIFEAAYgAQyBRAAGIAEMgUQABiABEjWnwJQzsQBWOT8AXACeACQAQKYAcAOoAGcL6oBCDAuMTcuOC0yuAEDyAEA-AEBmAIToAKEE6gCD8ICExAjGKYDGCcY-AUYqAMY6gIYiwPCAgcQIxgnGOoCwgITEAAYAxjlAhjqAhiLAxiMAxiPAcICGRAuGAMYpAMY5QIYqAMY6gIYiwMYjAMYjwHCAgQQIxgnwgILEAAYgAQYkQIYigXCAhEQLhiABBixAxjRAxiDARjHAcICERAuGIAEGLEDGIMBGNQCGIoFwgIOEC4YgAQYxwEYjgUYrwHCAgsQLhiABBiRAhiKBcICFBAuGIAEGLEDGIMBGMcBGI4FGK8BwgILEC4YgAQYsQMYgwHCAg4QLhiABBixAxiDARjUAsICBRAuGIAEwgIOEAAYgAQYsQMYgwEYigXCAggQLhiABBixA8ICGhAuGIAEGLEDGIMBGMcBGJgFGJoFGI4FGK8BwgIOEC4YgAQYkQIYsQMYigXCAhQQLhiABBiRAhixAxjRAxjHARiKBcICERAuGIAEGLEDGMcBGI4FGK8BwgIMELkBGIAEGLEDGMYFwgIJELkBGIAEGMYFmAMSiAYBkgcEMi4xN6AHqMcB&sclient=mobile-gws-wiz-serp"], ["https://www.google.com/search?q=hersheypark+hours&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari"], ["https://www.google.com/search?q=hersheypark+tickets&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari"], ["https://www.googleadservices.com/pagead/aclk?sa=L&ai=DChcSEwiooMWOmPCHAxW0SEcBHX8DLEYYABAAGgJxdQ&co=1&gclid=Cj0KCQjw5ea1BhC6ARIsAEOG5py4MglFmdxbSDalK4gM-sqTwEFpHugcDZVygsuwNZKH6zC4K6-blTEaAhN8EALw_wcB&ohost=www.google.com&cid=CAESVuD2nPO6L3xFHsnCSlyzb0WGk6sxE6lAJJtMOWSgXHnAsSdqwEKI-QiIF9rpNfORKO0yeiJN7sbWqT7gHAaodPwwdV6L7g38vgilrWmsYD7T3h5j55I5&sig=AOD64_3CR0w2bL3nyr_vwglCyST3stR7RQ&q&adurl&ved=2ahUKEwjqiL6OmPCHAxXmFFkFHeKuC-UQ0Qx6BAgXEAE&nis=2"], ["Gefilte fish"], ["Email marketing"], ["Firmware"], ["Sushi"], ["National Weather Service"], ["Atmospheric pressure"], ["Water vapor"], ["Vacation rental"], ["San Diego County, California"], ["Hotel"]], "Total_raw_rows": 20, "Exploration_sql": "Based on the schema of the tables in the database, the following columns may contain person names:\n- history_event_listeners: listener_name\n- history_items: url\n- history_items_to_tags: No relevant column for person names\n- history_tags: title\n- history_visits: title\n- metadata: No relevant column for person names\n\nTo search for person names in the identified columns, you can use the following SQL query:\n```sql\nSELECT listener_name AS person_name FROM history_event_listeners WHERE listener_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT url AS person_name FROM history_items WHERE url REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT title AS person_name FROM history_tags WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT title AS person_name FROM history_visits WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n```\n\nThis query will search for loosely structured human name-like strings in the specified columns of the respective tables.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, the following columns may contain US postal addresses:\n- history_event_listeners: listener_name\n- history_items: url, domain_expansion\n- history_items_to_tags: No relevant columns\n- history_tags: No relevant columns\n- history_visits: title\n- metadata: value\n\nI will now construct SQL queries to search for US postal addresses in these columns.\n```sql\nSELECT listener_name FROM history_event_listeners WHERE listener_name REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|ter\\\\.?|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b';\n\nUNION ALL\n\nSELECT url FROM history_items WHERE url REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b'\nUNION ALL\nSELECT domain_expansion FROM history_items WHERE domain_expansion REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b';\n\nUNION ALL\n\nSELECT title FROM history_visits WHERE title REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b';\n\nUNION ALL\n\nSELECT value FROM metadata WHERE value REGEXP '(?i)\\\\b(?:p\\\\.?\\\\s*o\\\\.?\\\\s*box|post\\\\s+office\\\\s+box|ave\\\\.?|avenue|st\\\\.?|street|rd\\\\.?|road|blvd\\\\.?|boulevard|dr\\\\.?|drive|ln\\\\.?|lane|ct\\\\.?|court|pl\\\\.?|place|way|pkwy\\\\.?|parkway|cir\\\\.?|circle|terrace|hwy\\\\.?|highway|trl\\\\.?|trail|sq\\\\.?|square|pike|loop|run|walk|path|byp\\\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\\\b)\\\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the available tables, there are no columns that directly indicate the presence of email addresses. To further explore the database for email addresses, we may need to look into other tables or columns that contain text fields such as messages, chats, or user information. Let's proceed with searching for email addresses in potential text fields.\nSELECT ZVALUE FROM ZSETTING WHERE ZVALUE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT Z_PLIST FROM Z_METADATA WHERE Z_PLIST REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT Z_CONTENT FROM Z_MODELCACHE WHERE Z_CONTENT REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT Z_NAME FROM Z_MODELCACHE WHERE Z_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["748022768.494298"]], "Total_raw_rows": 1, "Exploration_sql": "Based on the schema of the tables, the following columns may contain text fields where US phone numbers could be found:\n- ZSETTING: ZKEY, ZVALUE\n- Z_METADATA: Z_UUID\n- Z_MODELCACHE: Z_CONTENT\n- Z_PRIMARYKEY: Z_NAME\n\nI will now search these columns for US phone numbers.\n```sql\nSELECT ZKEY AS US_PHONE_NUMBER FROM ZSETTING WHERE ZKEY REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT ZVALUE AS US_PHONE_NUMBER FROM ZSETTING WHERE ZVALUE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Z_UUID AS US_PHONE_NUMBER FROM Z_METADATA WHERE Z_UUID REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Z_CONTENT AS US_PHONE_NUMBER FROM Z_MODELCACHE WHERE Z_CONTENT REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT Z_NAME AS US_PHONE_NUMBER FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "It seems that the tables related to messages, chats, or user profiles are not available in the current database. Without access to these specific tables, it is challenging to identify usernames directly. If you have access to additional tables or specific data sources where usernames may be stored, please provide that information for further analysis.", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "The table \"Z_CONTENT\" does not contain any columns that are likely to store person names. Let's continue exploring other tables.\nSince the tables explored so far do not contain columns that are likely to store person names, we may need to look into other tables related to messages, chats, or text fields to find possible person names. Let's continue exploring the remaining tables.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "Based on the schema of the tables in the database, none of the columns in the tables ZSETTING, Z_METADATA, Z_MODELCACHE, Z_PRIMARYKEY seem to contain data that could potentially include US postal addresses.\n\nIf you have additional tables or specific columns in mind where you suspect US postal addresses might be stored, please provide that information for further investigation.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "-- No query possible: The only existing table is 'android_metadata', which does not contain user data or likely phone number fields. No relevant tables or columns exist for US phone number search.", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "No user tables containing possible address data exist in the database (only \"android_metadata\" is present, which does not contain user data). No SQL can be generated for address search.", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT key FROM journal_entry WHERE key REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT metadata FROM journal_entry WHERE metadata REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["BD8E9D7526970329EBAA1947E3555FF6.discover_story_streaming_snap_ff"], ["2DB0D566CE0BFC10322344128086AD99.discover_story_streaming_snap"], ["2E6AD61E5AC1518921549291B17B78C4.discover_story_streaming_snap"], ["4E45C3749501999D41DA43D3E94FB163.discover_story_streaming_snap_ff"], ["A87458944357595BEF05BD6DA3B1FD99.discover_story_streaming_snap_ff"], ["9A57DEBAD4A3345055253FDE194BF37E.discover_story_streaming_snap_ff"], ["C63944D5009403772B9407E370E9876F.discover_story_streaming_snap_ff"], ["30918F1765D509CF5073178240329C28.snap_loading_frame"], ["07D59D2A708B4088F4954525453296F9.snap_loading_frame"], ["358501AF78004E4013FF8802869271D9.discover_story_streaming_snap"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' UNION ALL\nSELECT key FROM journal_entry WHERE key REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' UNION ALL\nSELECT value_count FROM journal_entry WHERE CAST(value_count AS TEXT) REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' UNION ALL\nSELECT status FROM journal_entry WHERE CAST(status AS TEXT) REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' UNION ALL\nSELECT metadata FROM journal_entry WHERE metadata REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["/data/data/com.snapchat.android/files/file_manager/BLOOPS_STICKER"], ["/data/data/com.snapchat.android/files/file_manager/Bitmoji_Preview"], ["/data/data/com.snapchat.android/files/file_manager/LENS_ASSET_CONTENT_TYPE_NAME"], ["/data/data/com.snapchat.android/files/file_manager/Live_Mirror_Model"], ["/data/data/com.snapchat.android/files/file_manager/Login_Kit_Privacy"], ["/data/data/com.snapchat.android/files/file_manager/MUSIC_GENERIC_ASSET_TYPE"], ["/data/data/com.snapchat.android/files/file_manager/Maps_Kashmir"], ["/data/data/com.snapchat.android/files/file_manager/Maps_WorldEffects"], ["/data/data/com.snapchat.android/files/file_manager/Perception"], ["/data/data/com.snapchat.android/files/file_manager/PerceptionMl"], ["12DB3FD3B46FC8F9DD60F79CB359FBFE.khand_medium"], ["9F3F465DC00D96696DDDFE0A946AAB99.khand_medium"], ["2FC6ABAAFF969A947FAB4E52FE0971FC.thumbnail"], ["C730963C61386A34712C819CA25436C9.media"], ["70177660B739FDDF75DE848B97DC6A6E.edits"], ["03FD66A15523689AD035E1E2B1AD6DAE.chat_wallpaper_media"], ["D41F76126B39D1F7E7EC3D8FA4079D0F.discover_story_streaming_snap"], ["5BBE52CE6D0010CB50CA3221C4741E7D.discover_story_streaming_snap_ff"], ["F05AD4876AFE7190FBF88E879238978A.discover_story_streaming_snap_ff"], ["67B685FF2948DC22416716E822D4F5A1.discover_story_streaming_snap_ff"]], "Total_raw_rows": 20, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT key FROM journal_entry WHERE key REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"], ["/data/data/com.snapchat.android/files/file_manager/BLOOPS_STICKER"], ["/data/data/com.snapchat.android/files/file_manager/Bitmoji_Preview"], ["/data/data/com.snapchat.android/files/file_manager/LENS_ASSET_CONTENT_TYPE_NAME"], ["/data/data/com.snapchat.android/files/file_manager/Live_Mirror_Model"], ["/data/data/com.snapchat.android/files/file_manager/Login_Kit_Privacy"], ["/data/data/com.snapchat.android/files/file_manager/MUSIC_GENERIC_ASSET_TYPE"], ["/data/data/com.snapchat.android/files/file_manager/Maps_Kashmir"], ["/data/data/com.snapchat.android/files/file_manager/Maps_WorldEffects"], ["/data/data/com.snapchat.android/files/file_manager/Perception"], ["/data/data/com.snapchat.android/files/file_manager/PerceptionMl"], ["12DB3FD3B46FC8F9DD60F79CB359FBFE.khand_medium"], ["9F3F465DC00D96696DDDFE0A946AAB99.khand_medium"], ["2FC6ABAAFF969A947FAB4E52FE0971FC.thumbnail"], ["C730963C61386A34712C819CA25436C9.media"], ["70177660B739FDDF75DE848B97DC6A6E.edits"], ["03FD66A15523689AD035E1E2B1AD6DAE.chat_wallpaper_media"], ["D41F76126B39D1F7E7EC3D8FA4079D0F.discover_story_streaming_snap"], ["5BBE52CE6D0010CB50CA3221C4741E7D.discover_story_streaming_snap_ff"], ["F05AD4876AFE7190FBF88E879238978A.discover_story_streaming_snap_ff"], ["67B685FF2948DC22416716E822D4F5A1.discover_story_streaming_snap_ff"]], "Total_raw_rows": 21, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' UNION ALL\nSELECT path FROM journal WHERE path REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' UNION ALL\nSELECT key FROM journal_entry WHERE key REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["/data/data/com.snapchat.android/files/file_manager/map-place-icons"], ["/data/data/com.snapchat.android/files/file_manager/place-profile-annotation"], ["/data/data/com.snapchat.android/files/file_manager/place-profile-info"]], "Total_raw_rows": 3, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL\nSELECT key FROM journal_entry WHERE key REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": ["dialog_filter.title"], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}';", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": ["dialog_filter.title"], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}';", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": ["dialog_filter.title"], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT key_string FROM sync_item WHERE key_string REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' UNION ALL\nSELECT key_string FROM sync_item WHERE key_string REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "EMAIL", "PII": ["heather@cellebrite.com", "hmahalik@gmail.com"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["hmahalik@gmail.com"], ["heather@cellebrite.com"], ["hmahalik@gmail.com"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "SELECT value FROM Tokens WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PHONE", "PII": ["7423794330", "7423794330"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value"], "Raw_rows_first_100": [["17423794330"], ["7423794330"], ["17423794330"], ["7423794330"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": "SELECT value FROM Tokens WHERE value REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "USERNAME", "PII": ["heather", "hmahalik"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"]], "Total_raw_rows": 8, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": "SELECT value FROM Tokens WHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PERSON_NAME", "PII": ["Heather", "Bo"], "Num_of_PII": 2, "source_columns": ["Tokens_content.c1value"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["Bo"]], "Total_raw_rows": 5, "Exploration_sql": "SELECT value FROM Contacts WHERE value REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": "SELECT value FROM Contacts WHERE value REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "EMAIL", "PII": ["19735203731@s.whatsapp.net", "923402582955@s.whatsapp.net", "14847353029@s.whatsapp.net", "19199037779@s.whatsapp.net"], "Num_of_PII": 4, "source_columns": ["ZWAAGGREGATECALLEVENT.ZLINKTOKEN", "ZWACDCALLEVENT.ZCALLIDSTRING", "ZWACDCALLEVENT.ZGROUPCALLCREATORUSERJIDSTRING", "ZWACDCALLEVENT.ZGROUPJIDSTRING", "ZWACDCALLEVENT.ZSCHEDULEDID", "ZWACDCALLEVENTPARTICIPANT.ZJIDSTRING", "Z_METADATA.Z_UUID", "Z_PRIMARYKEY.Z_NAME"], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 9, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PHONE", "PII": ["9735203731", "4847353029", "9199037779"], "Num_of_PII": 3, "source_columns": ["ZWAAGGREGATECALLEVENT.ZLINKTOKEN", "ZWACDCALLEVENT.ZCALLIDSTRING", "ZWACDCALLEVENT.ZGROUPCALLCREATORUSERJIDSTRING", "ZWACDCALLEVENT.ZGROUPJIDSTRING", "ZWACDCALLEVENT.ZSCHEDULEDID", "ZWACDCALLEVENTPARTICIPANT.ZJIDSTRING"], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 9, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "USERNAME", "PII": ["WAAggregateCallEvent", "WACDCallEvent", "WACDCallEventParticipant", "WAJoinableCallEvent", "WAJoinableCallEventParticipant", "WAUpcomingCallEvent"], "Num_of_PII": 6, "source_columns": ["ZWAAGGREGATECALLEVENT.ZLINKTOKEN", "ZWACDCALLEVENT.ZCALLIDSTRING", "ZWACDCALLEVENT.ZGROUPCALLCREATORUSERJIDSTRING", "ZWACDCALLEVENT.ZGROUPJIDSTRING", "ZWACDCALLEVENT.ZSCHEDULEDID", "ZWACDCALLEVENTPARTICIPANT.ZJIDSTRING", "Z_METADATA.Z_UUID", "Z_PRIMARYKEY.Z_NAME"], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["397466DD-9F9E-4385-BB61-81454ECF0FA4"], ["WAAggregateCallEvent"], ["WACDCallEvent"], ["WACDCallEventParticipant"], ["WAJoinableCallEvent"], ["WAJoinableCallEventParticipant"], ["WAUpcomingCallEvent"]], "Total_raw_rows": 16, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["3C399CDDAF11A41F7AFF2892E0A4B10C"], ["3C37CBFE11C261E6CD80C2DE7834D770"], ["372FA57E129467051E04B3E4DD5A26D5"], ["3A6DF670F7121CD6D08B"], ["3A9CEF8B4996D645358B"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 14, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 9, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT ZSCHEDULEDID FROM ZWACDCALLEVENT WHERE ZSCHEDULEDID REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key FROM _SqliteDatabaseProperties WHERE key REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT value FROM _SqliteDatabaseProperties WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key FROM _SqliteDatabaseProperties WHERE key REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT value FROM _SqliteDatabaseProperties WHERE value REGEXP '(\\+1[- .]?|1[- .]?|)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key FROM _SqliteDatabaseProperties WHERE key REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT value FROM _SqliteDatabaseProperties WHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["_ClientVersion"], ["_UniqueIdentifier"], ["__CPRecordSequenceNumber"], ["1BB6D11F-7D93-4A3D-80B7-9B37DFB90EED"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT key FROM _SqliteDatabaseProperties WHERE key REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' UNION ALL SELECT value FROM _SqliteDatabaseProperties WHERE value REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value FROM _SqliteDatabaseProperties WHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT listener_name FROM history_event_listeners WHERE listener_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT url FROM history_items WHERE url REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT domain_expansion FROM history_items WHERE domain_expansion REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT identifier FROM history_tags WHERE identifier REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT title FROM history_tags WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT title FROM history_visits WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT key FROM metadata WHERE key REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT value FROM metadata WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://www.google.com/search?q=hersheypark+hours&client=safari&sca_esv=1926c2955f272b3e&hl=en-us&sxsrf=ADLYWIL5Cqe0vl7oGRIbN3u5ZfPrUMTiPw%3A1723065118580&ei=HuOzZvyFI9qr5NoProGloQ8&oq=hersheypark+hours&gs_lp=EhNtb2JpbGUtZ3dzLXdpei1zZXJwGgIYAiIRaGVyc2hleXBhcmsgaG91cnMyCxAAGIAEGLEDGIMBMgUQABiABDILEC4YgAQYxwEYrwEyCxAAGIAEGLEDGIMBMgUQABiABDIFEAAYgAQyBRAAGIAEMgUQABiABEjWnwJQzsQBWOT8AXACeACQAQKYAcAOoAGcL6oBCDAuMTcuOC0yuAEDyAEA-AEBmAIToAKEE6gCD8ICExAjGKYDGCcY-AUYqAMY6gIYiwPCAgcQIxgnGOoCwgITEAAYAxjlAhjqAhiLAxiMAxiPAcICGRAuGAMYpAMY5QIYqAMY6gIYiwMYjAMYjwHCAgQQIxgnwgILEAAYgAQYkQIYigXCAhEQLhiABBixAxjRAxiDARjHAcICERAuGIAEGLEDGIMBGNQCGIoFwgIOEC4YgAQYxwEYjgUYrwHCAgsQLhiABBiRAhiKBcICFBAuGIAEGLEDGIMBGMcBGI4FGK8BwgILEC4YgAQYsQMYgwHCAg4QLhiABBixAxiDARjUAsICBRAuGIAEwgIOEAAYgAQYsQMYgwEYigXCAggQLhiABBixA8ICGhAuGIAEGLEDGIMBGMcBGJgFGJoFGI4FGK8BwgIOEC4YgAQYkQIYsQMYigXCAhQQLhiABBiRAhixAxjRAxjHARiKBcICERAuGIAEGLEDGMcBGI4FGK8BwgIMELkBGIAEGLEDGMYFwgIJELkBGIAEGMYFmAMSiAYBkgcEMi4xN6AHqMcB&sclient=mobile-gws-wiz-serp"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT listener_name FROM history_event_listeners WHERE listener_name REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}' \nUNION ALL \nSELECT url FROM history_items WHERE url REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}' \nUNION ALL \nSELECT domain_expansion FROM history_items WHERE domain_expansion REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}' \nUNION ALL \nSELECT identifier FROM history_tags WHERE identifier REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}' \nUNION ALL \nSELECT title FROM history_tags WHERE title REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}' \nUNION ALL \nSELECT title FROM history_visits WHERE title REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}' \nUNION ALL \nSELECT key FROM metadata WHERE key REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}' \nUNION ALL \nSELECT value FROM metadata WHERE value REGEXP '(\\+1[- .]?|1[- .]?)?(\\([2-9][0-9]{2}\\)|[2-9][0-9]{2})[- .]?[0-9]{3}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["Safari"], ["Q1146771"], ["Q1155133"], ["Q104851"], ["Q46383"], ["Q1066823"], ["Q81809"], ["Q190120"], ["Q336532"], ["Q108143"], ["Q27686"], ["Gefilte fish"], ["Email marketing"], ["Firmware"], ["Sushi"], ["National Weather Service"], ["Atmospheric pressure"], ["Water vapor"], ["Vacation rental"], ["San Diego County, California"], ["Hotel"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["hersheypark hours - Google Search"], ["hersheypark hours - Google Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["cached_sync_circle_size"], ["current_generation"], ["fetch_throttler_data"], ["last_maintenance_date"], ["last_synced_generation"], ["profile_server_map"], ["push_notifications_initialized"], ["push_throttler_data"], ["server_change_token"], ["sync_circle_size_retrieval_throttler_data"], [{"__bytes_b64__": "YnBsaXN0MDChATNBxVIgtAaGnAgKAAAAAAAAAQEAAAAAAAAAAgAAAAAAAAAAAAAAAAAAABM="}], [{"__bytes_b64__": "YnBsaXN0MDDUAQIDBAUGBwpYJHZlcnNpb25ZJGFyY2hpdmVyVCR0b3BYJG9iamVjdHMSAAGGoF8QD05TS2V5ZWRBcmNoaXZlctEICVRyb290gAGkCwwRElUkbnVsbNINDg8QViRjbGFzc18QD0NoYW5nZVRva2VuRGF0YYADgAJPEC4fChASDAAAML8tAkOxAAEAAhgBGAAiFQi3irGY46zg5EkQj+fmr5H/1u2KASgA0hMUFRZaJGNsYXNzbmFtZVgkY2xhc3Nlc18QE0NLU2VydmVyQ2hhbmdlVG9rZW6iFxhfEBNDS1NlcnZlckNoYW5nZVRva2VuWE5TT2JqZWN0AAgAEQAaACQAKQAyADcASQBMAFEAUwBYAF4AYwBqAHwAfgCAALEAtgDBAMoA4ADjAPkAAAAAAAACAQAAAAAAAAAZAAAAAAAAAAAAAAAAAAABAg=="}], [{"__bytes_b64__": "YnBsaXN0MDDQCAAAAAAAAAEBAAAAAAAAAAEAAAAAAAAAAAAAAAAAAAAJ"}], [{"__bytes_b64__": "YnBsaXN0MDChATNBxjVNMDx/ZwgKAAAAAAAAAQEAAAAAAAAAAgAAAAAAAAAAAAAAAAAAABM="}], [{"__bytes_b64__": "YnBsaXN0MDChATNBxjVNMEzwnggKAAAAAAAAAQEAAAAAAAAAAgAAAAAAAAAAAAAAAAAAABM="}]], "Total_raw_rows": 46, "Exploration_sql": "SELECT listener_name FROM history_event_listeners WHERE listener_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT identifier FROM history_tags WHERE identifier REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT title FROM history_tags WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT title FROM history_visits WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT key FROM metadata WHERE key REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT value FROM metadata WHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["Safari"], ["Gefilte fish"], ["Email marketing"], ["Firmware"], ["Sushi"], ["National Weather Service"], ["Atmospheric pressure"], ["Water vapor"], ["Vacation rental"], ["San Diego County, California"], ["Hotel"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["17eBu7RgHUeusRyLZr6u3cCjwmmQprK28K - Google Search"], ["hersheypark hours - Google Search"], ["hersheypark hours - Google Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"]], "Total_raw_rows": 21, "Exploration_sql": "SELECT listener_name FROM history_event_listeners WHERE listener_name REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT identifier FROM history_tags WHERE identifier REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT title FROM history_tags WHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT title FROM history_visits WHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I4_History.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["a&e nails - Google Search"], ["a&e nails - Google Search"], ["a&e nails - Google Search"], ["a&e nails - Google Search"], ["Toll road"], [{"__bytes_b64__": "YnBsaXN0MDDUAQIDBAUGBwpYJHZlcnNpb25ZJGFyY2hpdmVyVCR0b3BYJG9iamVjdHMSAAGGoF8QD05TS2V5ZWRBcmNoaXZlctEICVRyb290gAGkCwwRElUkbnVsbNINDg8QViRjbGFzc18QD0NoYW5nZVRva2VuRGF0YYADgAJPEC4fChASDAAAML8tAkOxAAEAAhgBGAAiFQi3irGY46zg5EkQj+fmr5H/1u2KASgA0hMUFRZaJGNsYXNzbmFtZVgkY2xhc3Nlc18QE0NLU2VydmVyQ2hhbmdlVG9rZW6iFxhfEBNDS1NlcnZlckNoYW5nZVRva2VuWE5TT2JqZWN0AAgAEQAaACQAKQAyADcASQBMAFEAUwBYAF4AYwBqAHwAfgCAALEAtgDBAMoA4ADjAPkAAAAAAAACAQAAAAAAAAAZAAAAAAAAAAAAAAAAAAABAg=="}]], "Total_raw_rows": 6, "Exploration_sql": "SELECT url FROM history_items WHERE url REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL\nSELECT domain_expansion FROM history_items WHERE domain_expansion REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL\nSELECT title FROM history_visits WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL\nSELECT identifier FROM history_tags WHERE identifier REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL\nSELECT title FROM history_tags WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL\nSELECT value FROM metadata WHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ZKEY FROM ZSETTING WHERE ZKEY REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZVALUE FROM ZSETTING WHERE ZVALUE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ZKEY FROM ZSETTING WHERE ZKEY REGEXP '(\\+1[- .]?|1[- .]?)?\\\\(?[2-9][0-9]{2}\\\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT ZVALUE FROM ZSETTING WHERE ZVALUE REGEXP '(\\+1[- .]?|1[- .]?)?\\\\(?[2-9][0-9]{2}\\\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '(\\+1[- .]?|1[- .]?)?\\\\(?[2-9][0-9]{2}\\\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}' \nUNION ALL \nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '(\\+1[- .]?|1[- .]?)?\\\\(?[2-9][0-9]{2}\\\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["CacheEndDate"], ["LastDBSequence"], ["AE9BAC24-6E29-4FA2-9FA4-699FD2BE7479"], ["Alarm"], ["Setting"]], "Total_raw_rows": 5, "Exploration_sql": "SELECT ZKEY FROM ZSETTING WHERE ZKEY REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZVALUE FROM ZSETTING WHERE ZVALUE REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["CacheEndDate"], ["LastDBSequence"], ["AE9BAC24-6E29-4FA2-9FA4-699FD2BE7479"], ["Alarm"], ["Setting"]], "Total_raw_rows": 5, "Exploration_sql": "SELECT ZKEY FROM ZSETTING WHERE ZKEY REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT ZVALUE FROM ZSETTING WHERE ZVALUE REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ZKEY FROM ZSETTING WHERE ZKEY REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT ZVALUE FROM ZSETTING WHERE ZVALUE REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT Z_UUID FROM Z_METADATA WHERE Z_UUID REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "No user tables are available in the database to query for person names.", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["12014946184@s.whatsapp.net"], ["12025692832@s.whatsapp.net"], ["12028177932@s.whatsapp.net"], ["12028275725@s.whatsapp.net"], ["120363098389106519@g.us"], ["12037188989@s.whatsapp.net"], ["12065937224@s.whatsapp.net"], ["12088549831@s.whatsapp.net"], ["12089234440@s.whatsapp.net"], ["12092759604@s.whatsapp.net"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT email FROM wa_biz_profiles WHERE email REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT jid FROM wa_contacts WHERE jid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT account_id FROM wa_biz_profiles_linked_accounts_table WHERE account_id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT websites FROM wa_biz_profiles_websites WHERE websites REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "PHONE", "PII": ["19199037779", "8085096467", "5713349815", "16263678865", "16106046786", "7034241981", "5715917168", "2065937224", "5713298742", "8624338328", "18056377243", "2028177932", "2025692832", "19735203731", "81367430271", "17423794330", "5713298742", "5713349815", "8085096467", "8624338328", "7034241981", "2028177932", "5715917168", "2025692832", "16106046786", "16263678865", "2065937224", "19199037779", "18056377243", "19735203731", "81367430271", "17423794330"], "Num_of_PII": 32, "source_columns": ["wa_address_book.number", "wa_contacts.number"], "Raw_rows_first_100": [["+19199037779"], ["8085096467"], ["5713349815"], ["+16263678865"], ["+16106046786"], ["7034241981"], ["5715917168"], ["+12065937224"], ["5713298742"], ["8624338328"], ["+18056377243"], ["2028177932"], ["2025692832"], ["+19735203731"], ["+81367430271"], ["+17423794330"], ["5713298742"], ["5713349815"], ["8085096467"], ["8624338328"], ["7034241981"], ["2028177932"], ["5715917168"], ["2025692832"], ["+16106046786"], ["+16263678865"], ["+12065937224"], ["+19199037779"], ["+18056377243"], ["+19735203731"], ["+81367430271"], ["+17423794330"]], "Total_raw_rows": 32, "Exploration_sql": "SELECT number FROM wa_address_book WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT number FROM wa_biz_profiles WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT number FROM wa_contacts WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}';", "Extraction_sql": "SELECT number FROM wa_address_book WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT number FROM wa_biz_profiles WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT number FROM wa_contacts WHERE number REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}';", "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["Russ Philby"], ["Capt Don Wayne"], ["LTC Whalen"], ["Mary Garcia"], ["Joey"], ["Hank"], ["Goldie Kahn"], ["Abe Rudder"], ["Svetlana Chernoff"], ["Karen Tate"], ["Svetlana Chernoff"], ["LTC Whalen"], ["Capt Don Wayne"], ["Karen Tate"], ["Hank"], ["Brian Reynolds"], ["Goldie Kahn"], ["Vladamir Stravinsky"], ["6️⃣ Wealth Builders Club"], ["Joey"]], "Total_raw_rows": 20, "Exploration_sql": "SELECT display_name FROM wa_address_book WHERE display_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT nickname FROM wa_address_book WHERE nickname REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT display_name FROM wa_contacts WHERE display_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT nickname FROM wa_contacts WHERE nickname REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT custom_url FROM wa_biz_profiles WHERE custom_url REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT verified_name FROM wa_biz_profiles WHERE verified_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "PERSON_NAME", "PII": ["Svetlana Chernoff", "LTC Whalen", "Capt Don Wayne", "Karen Tate", "Hank", "Brian Reynolds", "Goldie Kahn", "Vladamir Stravinsky", "Joey", "Mary Garcia", "Abe Rudder", "Russ Philby", "Otto", "Toks", "Bo"], "Num_of_PII": 15, "source_columns": ["wa_contacts.display_name", "wa_contacts.given_name", "wa_contacts.family_name", "wa_contacts.nickname", "wa_address_book.display_name", "wa_address_book.given_name", "wa_address_book.family_name", "wa_address_book.nickname"], "Raw_rows_first_100": [["Svetlana Chernoff"], ["LTC Whalen"], ["Capt Don Wayne"], ["Karen Tate"], ["Hank"], ["Brian Reynolds"], ["Goldie Kahn"], ["Vladamir Stravinsky"], ["6️⃣ Wealth Builders Club"], ["Joey"], ["Mary Garcia"], ["Abe Rudder"], ["Russ Philby"], ["Voice Mail"], ["Otto"], ["Toks"], ["Bo"], ["Svetlana"], ["Don"], ["Karen"], ["Hank"], ["Brian"], ["Goldie"], ["Vladamir"], ["Joey"], ["Mary"], ["Abe"], ["Russ"], ["Voice Mail"], ["Otto"], ["Toks"], ["Bo"], ["Chernoff"], ["Whalen"], ["Wayne"], ["Tate"], ["Reynolds"], ["Kahn"], ["Stravinsky"], ["Garcia"], ["Rudder"], ["Philby"], ["Russ Philby"], ["Capt Don Wayne"], ["LTC Whalen"], ["Mary Garcia"], ["Joey"], ["Hank"], ["Goldie Kahn"], ["Abe Rudder"], ["Svetlana Chernoff"], ["Karen Tate"], ["Voice Mail"], ["Brian Reynolds"], ["Vladamir Stravinsky"], ["Otto"], ["Toks"], ["Bo"], ["Russ"], ["Don"], ["Mary"], ["Joey"], ["Hank"], ["Goldie"], ["Abe"], ["Svetlana"], ["Karen"], ["Voice Mail"], ["Brian"], ["Vladamir"], ["Otto"], ["Toks"], ["Bo"], ["Philby"], ["Wayne"], ["Whalen"], ["Garcia"], ["Kahn"], ["Rudder"], ["Chernoff"], ["Tate"], ["Reynolds"], ["Stravinsky"]], "Total_raw_rows": 83, "Exploration_sql": "SELECT display_name FROM wa_contacts WHERE display_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT given_name FROM wa_contacts WHERE given_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT family_name FROM wa_contacts WHERE family_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT nickname FROM wa_contacts WHERE nickname REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT display_name FROM wa_address_book WHERE display_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT given_name FROM wa_address_book WHERE given_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT family_name FROM wa_address_book WHERE family_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT nickname FROM wa_address_book WHERE nickname REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "Extraction_sql": "SELECT display_name FROM wa_contacts WHERE display_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT given_name FROM wa_contacts WHERE given_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT family_name FROM wa_contacts WHERE family_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT nickname FROM wa_contacts WHERE nickname REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT display_name FROM wa_address_book WHERE display_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT given_name FROM wa_address_book WHERE given_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT family_name FROM wa_address_book WHERE family_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT nickname FROM wa_address_book WHERE nickname REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_wa.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT display_name FROM wa_contacts WHERE display_name REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT company FROM wa_contacts WHERE company REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT display_name FROM wa_address_book WHERE display_name REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT company FROM wa_address_book WHERE company REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT key FROM journal_entry WHERE key REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT value_count FROM journal_entry WHERE value_count REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT status FROM journal_entry WHERE status REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT last_update_time FROM journal_entry WHERE last_update_time REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT last_read_time FROM journal_entry WHERE last_read_time REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT lock_count FROM journal_entry WHERE lock_count REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT total_size FROM journal_entry WHERE total_size REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT expiration FROM journal_entry WHERE expiration REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT last_consumed_time FROM journal_entry WHERE last_consumed_time REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT metadata FROM journal_entry WHERE metadata REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["9F3F465DC00D96696DDDFE0A946AAB99.khand_medium"], ["C730963C61386A34712C819CA25436C9.media"], ["70177660B739FDDF75DE848B97DC6A6E.edits"], ["03FD66A15523689AD035E1E2B1AD6DAE.chat_wallpaper_media"], ["D41F76126B39D1F7E7EC3D8FA4079D0F.discover_story_streaming_snap"], ["F05AD4876AFE7190FBF88E879238978A.discover_story_streaming_snap_ff"], ["67B685FF2948DC22416716E822D4F5A1.discover_story_streaming_snap_ff"], ["4EDFB389483E360F0CBA63F7A928FD39.discover_story_streaming_snap_ff"], ["629156B858FDF391C0639F2DE6933EEB.discover_story_streaming_snap_ff"], ["5A4F0362F54488AC2542C174F69C9A24.discover_story_streaming_snap_ff"]], "Total_raw_rows": 10, "Exploration_sql": "The existing tables and their columns are as follows:\n\n1. **journal**\n - _id INTEGER\n - path TEXT\n - size INTEGER\n - locked_size INTEGER\n\n2. **journal_entry**\n - _id INTEGER\n - journal_id INTEGER\n - key TEXT\n - sequence_number INTEGER\n - value_count INTEGER\n - status INTEGER\n - last_update_time INTEGER\n - last_read_time INTEGER\n - lock_count INTEGER\n - total_size INTEGER\n - value_sizes BLOB\n - expiration INTEGER\n - last_consumed_time INTEGER\n - metadata BLOB\n\nBased on the available columns, the most relevant columns for searching US phone numbers would be `path` from the `journal` table and `key`, `value_sizes`, and `metadata` from the `journal_entry` table. However, `value_sizes` and `metadata` are BLOB types, which are not suitable for direct text searches.\n\nHere is the SQL query to find possible US phone numbers:\n\n```sql\nSELECT path FROM journal WHERE path REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT key FROM journal_entry WHERE key REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}';", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["/data/data/com.snapchat.android/files/file_manager/BLOOPS_STICKER"], ["/data/data/com.snapchat.android/files/file_manager/Bitmoji_Preview"], ["/data/data/com.snapchat.android/files/file_manager/LENS_ASSET_CONTENT_TYPE_NAME"], ["/data/data/com.snapchat.android/files/file_manager/Live_Mirror_Model"], ["/data/data/com.snapchat.android/files/file_manager/Login_Kit_Privacy"], ["/data/data/com.snapchat.android/files/file_manager/MUSIC_GENERIC_ASSET_TYPE"], ["/data/data/com.snapchat.android/files/file_manager/Maps_Kashmir"], ["/data/data/com.snapchat.android/files/file_manager/Maps_WorldEffects"], ["/data/data/com.snapchat.android/files/file_manager/Perception"], ["/data/data/com.snapchat.android/files/file_manager/PerceptionMl"], ["12DB3FD3B46FC8F9DD60F79CB359FBFE.khand_medium"], ["9F3F465DC00D96696DDDFE0A946AAB99.khand_medium"], ["2FC6ABAAFF969A947FAB4E52FE0971FC.thumbnail"], ["C730963C61386A34712C819CA25436C9.media"], ["70177660B739FDDF75DE848B97DC6A6E.edits"], ["03FD66A15523689AD035E1E2B1AD6DAE.chat_wallpaper_media"], ["D41F76126B39D1F7E7EC3D8FA4079D0F.discover_story_streaming_snap"], ["5BBE52CE6D0010CB50CA3221C4741E7D.discover_story_streaming_snap_ff"], ["F05AD4876AFE7190FBF88E879238978A.discover_story_streaming_snap_ff"], ["67B685FF2948DC22416716E822D4F5A1.discover_story_streaming_snap_ff"]], "Total_raw_rows": 20, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT key FROM journal_entry WHERE key REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["/data/data/com.snapchat.android/files/file_manager/BLOOPS_STICKER"], ["/data/data/com.snapchat.android/files/file_manager/Bitmoji_Preview"], ["/data/data/com.snapchat.android/files/file_manager/LENS_ASSET_CONTENT_TYPE_NAME"], ["/data/data/com.snapchat.android/files/file_manager/Live_Mirror_Model"], ["/data/data/com.snapchat.android/files/file_manager/Login_Kit_Privacy"], ["/data/data/com.snapchat.android/files/file_manager/MUSIC_GENERIC_ASSET_TYPE"], ["/data/data/com.snapchat.android/files/file_manager/Maps_Kashmir"], ["/data/data/com.snapchat.android/files/file_manager/Maps_WorldEffects"], ["/data/data/com.snapchat.android/files/file_manager/Perception"], ["/data/data/com.snapchat.android/files/file_manager/PerceptionMl"], ["12DB3FD3B46FC8F9DD60F79CB359FBFE.khand_medium"], ["9F3F465DC00D96696DDDFE0A946AAB99.khand_medium"], ["2FC6ABAAFF969A947FAB4E52FE0971FC.thumbnail"], ["C730963C61386A34712C819CA25436C9.media"], ["70177660B739FDDF75DE848B97DC6A6E.edits"], ["03FD66A15523689AD035E1E2B1AD6DAE.chat_wallpaper_media"], ["D41F76126B39D1F7E7EC3D8FA4079D0F.discover_story_streaming_snap"], ["5BBE52CE6D0010CB50CA3221C4741E7D.discover_story_streaming_snap_ff"], ["F05AD4876AFE7190FBF88E879238978A.discover_story_streaming_snap_ff"], ["67B685FF2948DC22416716E822D4F5A1.discover_story_streaming_snap_ff"]], "Total_raw_rows": 20, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT key FROM journal_entry WHERE key REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT value_count FROM journal_entry WHERE value_count REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT status FROM journal_entry WHERE status REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT last_update_time FROM journal_entry WHERE last_update_time REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT last_read_time FROM journal_entry WHERE last_read_time REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT lock_count FROM journal_entry WHERE lock_count REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT total_size FROM journal_entry WHERE total_size REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT expiration FROM journal_entry WHERE expiration REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT last_consumed_time FROM journal_entry WHERE last_consumed_time REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT metadata FROM journal_entry WHERE metadata REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["/data/data/com.snapchat.android/files/file_manager/map-place-icons"], ["/data/data/com.snapchat.android/files/file_manager/place-profile-annotation"], ["/data/data/com.snapchat.android/files/file_manager/place-profile-info"]], "Total_raw_rows": 3, "Exploration_sql": "SELECT path FROM journal WHERE path REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT key FROM journal_entry WHERE key REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT id FROM params WHERE id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL SELECT pbytes FROM params WHERE pbytes REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT id FROM params WHERE id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT pbytes FROM params WHERE pbytes REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT pbytes FROM params WHERE pbytes REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT pbytes FROM params WHERE pbytes REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL SELECT pbytes FROM params WHERE pbytes REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT id FROM params WHERE id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT pbytes FROM params WHERE pbytes REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT pbytes FROM params WHERE pbytes REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT CAST(pts AS TEXT) FROM params WHERE CAST(pts AS TEXT) REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL SELECT pbytes FROM params WHERE pbytes REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT id FROM params WHERE id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT id FROM params WHERE id REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM dialog_filter WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT pbytes FROM params WHERE pbytes REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT corpus FROM sync_corpus WHERE corpus REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL SELECT corpus FROM sync_corpus WHERE corpus REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT corpus FROM sync_corpus WHERE corpus REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT corpus FROM sync_corpus WHERE corpus REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string FROM sync_item WHERE key_string REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL SELECT corpus FROM sync_corpus WHERE corpus REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "EMAIL", "PII": ["heather@cellebrite.com", "hmahalik@gmail.com"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value", "Tokens_stat.value", "CacheInfo.affinity_response_context"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["hmahalik@gmail.com"], ["heather@cellebrite.com"], ["hmahalik@gmail.com"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT value FROM Tokens_stat WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT affinity_response_context FROM CacheInfo WHERE affinity_response_context REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": "SELECT value FROM Tokens WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT value FROM Tokens_stat WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT affinity_response_context FROM CacheInfo WHERE affinity_response_context REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": ["Tokens.value", "Tokens_content.c1value", "Tokens_stat.value"], "Raw_rows_first_100": [["17423794330"], ["7423794330"], ["3794330"], ["17423794330"], ["7423794330"], ["3794330"]], "Total_raw_rows": 6, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT value FROM Tokens_stat WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}';", "Extraction_sql": "SELECT value FROM Tokens WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'\nUNION ALL\nSELECT value FROM Tokens_stat WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}';", "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "USERNAME", "PII": ["heather", "hmahalik"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"]], "Total_raw_rows": 8, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT identity_hash FROM android_metadata WHERE identity_hash REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": "SELECT value FROM Tokens WHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT identity_hash FROM android_metadata WHERE identity_hash REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PERSON_NAME", "PII": ["Heather", "Bo"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value", "Tokens_stat.value", "CacheInfo.affinity_response_context", "android_metadata.locale"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["Bo"], ["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["Bo"], ["en_US"]], "Total_raw_rows": 11, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT value FROM Tokens_stat WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT affinity_response_context FROM CacheInfo WHERE affinity_response_context REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "Extraction_sql": "SELECT value FROM Tokens WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT c1value FROM Tokens_content WHERE c1value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT value FROM Tokens_stat WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT affinity_response_context FROM CacheInfo WHERE affinity_response_context REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value FROM Tokens WHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT c1value FROM Tokens_docsize WHERE c1value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT affinity_response_context FROM CacheInfo WHERE affinity_response_context REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT URL FROM BOOKMARKS WHERE URL REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT description FROM BOOKMARKS WHERE description REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT URL FROM BOOKMARKS WHERE URL REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT description FROM BOOKMARKS WHERE description REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [[{"__bytes_b64__": "BAGBHAIGAQABLGwCAOx/Yz8pWMaZgKzK9gidY1JbWlHtbmZoPVRvHa8L1Qa5v77osj/b9cxf6AihGfAj9/oMzNgzwG4TEa1ocxhMgTw="}], [{"__bytes_b64__": "BAGBHAIGAQABLGwCADg08Y0rLftwtKLewxQylCXdY9YcWUe01qQU3juIWvYiZTepFwA/AGQEV8xammaotcT+LNCNEQBvYK49zZmdniQ="}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAx0od46RvJj3ZMpmE/r++aNuxFfDaTafncAW0XddYSB0WkI7vryB4lplJKYOFVJvriCJ54MlN56/+r6ZnwIIKx3TF4rvHTUNRIc9LKLCfh5hqUwF5ebYY+wMqebfiqMSY="}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAN/bPhb+tihkAfwO8uIxTzh9YWVp1U/kZ3oy/IzxRDnWH35ch+01jfwXwTtCmEj+LyGgSjHzzowXmue9uLyUvfpmVNbt3JCOqCl0EyBAo5+xpVCiij7EFhenIbvW/5cN0="}], [{"__bytes_b64__": "BAGBfgIHAQABLIFMAgAxMZf3KoVtVYHMTrajimnorfRebkfgH/qYhDfOJ2RRzWYOGMxn9xTFfrGxr/Cg60A6HnjLCVgpgftWYAW/bKRQc57iUOY3/35T/FmViNlLg/0T1xmtyNMJL85eTN6Ty8FnisaqUE3+iEK+drFSfnJt"}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgDferB3B+clQ8gWXYeFleQ01pIC6VzQ+FxtlyoVYuGZ/sO3K+0Bwv1BqzJe5oM8CyJQtis/qRu/Li9LMYVDQxRCkfClKVoXFf6qVbzv+0XrXKADvEyQD083AV/geGnfwx8="}], [{"__bytes_b64__": "BAGBHAIGAQABLGwCAFOkWm+YKKXqs73/JZomFYrCo4oPT5CxtHH55LlntGdkqmZtSDMNk5rK+qI5xXcabIuo1yoiz5gfcXbzKj6zoHU="}], [{"__bytes_b64__": "BAGBHAIGAQABLGwCAFgwiN0XYaRNwN6JFtBRdWfQw5YoTxjvsswMtBRYpQ4bzjZW6jjqVulUtvEdo3wPiKvtT0SzbxZ9i5yPZb27tpI="}], [{"__bytes_b64__": "BAGDHgIHAQABLIJsAgBmAh+1q8QXN1e6NFYn9aSifWs/qhVVZAaVAU+G+HEoDhHTH4chqxkrAUv8fV2cSb+ibuhENGUjrn5iwufMvgLEmlI6gRsKMO041/SgBVIQEn0w1gtf0qKXAH7MtFhw+KGp+LZGzJKln5mgGhgLtnaezb6gRiKJR22oNn7yGkLLsetkz8lv2fXxpdR//x8oTGlzKidUYqAgodUc3tekNCp8dBk2sf3Yhkx8wHBWgl16OdL2/8bX8HXkZj+YmSckPDI="}], [{"__bytes_b64__": "BAGEPgIHAQABLIQMAgABgxFFetbBD88wsavVtVjy+KN6LQaF52tl9Ztc+fzXT8MhsjknjCsDwrr+9tZQ1uZZNjvrZf13/vt7Nn58Xe1+sdDXmFRvJGfComqfeWyTQONx07TYcFCxWvZNWaecNUuUw+EC87PJColRgnZwE0JLLZ8Zcjsh8AjPicnUGgdkOfN8I1TaXKxMGebpzElMuqtVIhlph5EGeSm7pg0v/ELp/VeGLuxGeKbA6tXvUoiGaT51XBQebcsvu7qUegGuoIrZLf8Od7Q3JpKpH9miAs8O6o+o4zZXEI5LBv1suoFxmU6MRC7lTPGYgU6e+O1Wd9cSg4F2f7U2fAOBGDPYg3BrCZONls5ungK74IoKY48a5A=="}], [{"__bytes_b64__": "BAGDHgIHAQABLIJsAgCKKvrixPJ+dMqD7ppuoI0MyZaiuUvIgtJ4WHgnxrQGklMS6lrCMckJrtZnmVGBcHWPgbEIH/JKEmczg7KSJqaMfK+BKSyUC+v3ydvl2m/UC0JEA37crOZHBfy5z4B7KF1j7b1u7DDYe4DzyPE0+JyV0dfHonPF0zGA+yDZUAOoReeMJ9yHcuCKnASWELWEEvSukVLIZBmZ2OhTv4KNnbCyLBcA0Xz3SQ32AC3/+ef77BgKgSzNArHW3R5aUBmC7EE="}], [{"__bytes_b64__": "BAGBHAIGAQABLGwCAKl61i29x16wLpYmxrFNqnxRo2jwDmDqVicg3H5MHIkS8FpV5q51c8gBgjcNV2d81MfyilDXRcvXoZ0qUkze7rE="}], [{"__bytes_b64__": "BAGBHAIGAQABLGwCAN70T/VfPp/PiZVnhwV26fhis3esilpD+8o44vKDTZ780w6meoaKkG5GCzgz35949sNwnsKtaFGFdJ9fWtNKozQ="}], [{"__bytes_b64__": "BAGDHgIHAQABLIJsAgDa5rn5/h/uPxLOY8KfuGKu45sg2E1RRV79AuDrwZAO/CdOjK94CeByOdIR/dW/LnMwaCJ/Fzsktoej/DoH9XIfnD+9F+UZYDRgfpb9Ie0a/0TZyy2zL4HhatC455OfG5sGqlu7ZvodLztLBH1iqnEr3fC5hFGYgiAIbKmbwXITQdJ6efZ2J6a4Ne5dEK7nSq8Bky9lsF2g/R6Yug7kd5m+AHc1BEZoXFDer3Gm30trqQgKEgafKEJftuh+Cf8/Wic="}], [{"__bytes_b64__": "BAGEPgIHAQABLIQMAgBQ1ryPaiEATOXfVZTPg8FP3oJkx7RwFyn+2sKiKDDTGe/zN3pxBhO+t0++nKxLvCGlZ5/q8uMRVU0e9XsXOeH4uR4SDyxAajG0+/6OmOaOjtXwZGmhkY8d0UaJSyT1OukC02GESg3KjDFOeQsNQsfWEdvhNUWozvT4y7TUo1fiKMzWpKvIVK3NRaVFs8Dxgs0dNirE73Feyeps2GRq6CrF1hisNwoWNAp6H62mYO4OSgpbH8vIo7HKytAfYok6JzGpW2KUnXjsI/aLOg+OVz5a7WbtNPtX2EZ93WfLmRflqbD03VPN73Bgz6ENlzB79bNuPDr6EXSiBjUg4lRre7kwsO7iIo2Hv70JZFsyhJfQ2A=="}]], "Total_raw_rows": 15, "Exploration_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT URL FROM BOOKMARKS WHERE URL REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT SURL FROM BOOKMARKS WHERE SURL REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT SOURCEID FROM BOOKMARKS WHERE SOURCEID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [[{"__bytes_b64__": "BAGBHAIGAQABLGwCAOx/Yz8pWMaZgKzK9gidY1JbWlHtbmZoPVRvHa8L1Qa5v77osj/b9cxf6AihGfAj9/oMzNgzwG4TEa1ocxhMgTw="}], [{"__bytes_b64__": "BAGBHAIGAQABLGwCADg08Y0rLftwtKLewxQylCXdY9YcWUe01qQU3juIWvYiZTepFwA/AGQEV8xammaotcT+LNCNEQBvYK49zZmdniQ="}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAx0od46RvJj3ZMpmE/r++aNuxFfDaTafncAW0XddYSB0WkI7vryB4lplJKYOFVJvriCJ54MlN56/+r6ZnwIIKx3TF4rvHTUNRIc9LKLCfh5hqUwF5ebYY+wMqebfiqMSY="}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAN/bPhb+tihkAfwO8uIxTzh9YWVp1U/kZ3oy/IzxRDnWH35ch+01jfwXwTtCmEj+LyGgSjHzzowXmue9uLyUvfpmVNbt3JCOqCl0EyBAo5+xpVCiij7EFhenIbvW/5cN0="}], [{"__bytes_b64__": "BAGBfgIHAQABLIFMAgAxMZf3KoVtVYHMTrajimnorfRebkfgH/qYhDfOJ2RRzWYOGMxn9xTFfrGxr/Cg60A6HnjLCVgpgftWYAW/bKRQc57iUOY3/35T/FmViNlLg/0T1xmtyNMJL85eTN6Ty8FnisaqUE3+iEK+drFSfnJt"}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgDferB3B+clQ8gWXYeFleQ01pIC6VzQ+FxtlyoVYuGZ/sO3K+0Bwv1BqzJe5oM8CyJQtis/qRu/Li9LMYVDQxRCkfClKVoXFf6qVbzv+0XrXKADvEyQD083AV/geGnfwx8="}]], "Total_raw_rows": 6, "Exploration_sql": "SELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL \nSELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL \nSELECT ACCOUNT_TYPE FROM BOOKMARKS WHERE ACCOUNT_TYPE REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL \nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL \nSELECT description FROM BOOKMARKS WHERE description REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [[{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAx0od46RvJj3ZMpmE/r++aNuxFfDaTafncAW0XddYSB0WkI7vryB4lplJKYOFVJvriCJ54MlN56/+r6ZnwIIKx3TF4rvHTUNRIc9LKLCfh5hqUwF5ebYY+wMqebfiqMSY="}]], "Total_raw_rows": 1, "Exploration_sql": "SELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT TAGS FROM BOOKMARKS WHERE TAGS REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT description FROM BOOKMARKS WHERE description REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "EMAIL", "PII": ["sharononeil368@gmail.com"], "Num_of_PII": 1, "source_columns": ["BOOKMARKS.ACCOUNT_NAME", "INTERNET_SYNC.SYNC_KEY", "SYNC_STATE.account_name", "TABS.ACCOUNT_NAME"], "Raw_rows_first_100": [["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"]], "Total_raw_rows": 6, "Exploration_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL \nSELECT ACCOUNT_NAME FROM TABS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT ACCOUNT_NAME FROM TABS WHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://www.samsung.com/mobile/?cid=global_ow_app_s-internet_none_none_bookmark_bookmark_202008_none"], ["SBROWSER_TAB1724467631361__BROWSER1724467632107__SBROWSER_SAVEDPAGES1724467635256__QUICKACCESS_SYNC_V21724467633471__SBROWSER_HISTORY1724467634746__"], ["https://www.pinterest.com/pin/410812797236816112/"]], "Total_raw_rows": 3, "Exploration_sql": "SELECT URL FROM BOOKMARKS WHERE URL REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT data FROM SYNC_STATE WHERE data REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT TAB_URL FROM TABS WHERE TAB_URL REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT TAB_TITLE FROM TABS WHERE TAB_TITLE REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}';", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "USERNAME", "PII": ["sharononeil368", "sync_internet_data", "sync_bookmarks", "sync_open_pages", "sync_saved_pages"], "Num_of_PII": 5, "source_columns": ["BOOKMARKS.ACCOUNT_NAME", "TABS.ACCOUNT_NAME", "SYNC_STATE.account_name", "INTERNET_SYNC.SYNC_KEY"], "Raw_rows_first_100": [["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sharononeil368@gmail.com"], ["sync_internet_data"], ["sync_bookmarks"], ["sync_open_pages"], ["sync_saved_pages"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT ACCOUNT_NAME FROM TABS WHERE ACCOUNT_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ACCOUNT_NAME FROM TABS WHERE ACCOUNT_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": ["BOOKMARKS.ACCOUNT_NAME", "INTERNET_SYNC.SYNC_KEY", "SYNC_STATE.account_name", "TABS.TAB_TITLE", "android_metadata.locale"], "Raw_rows_first_100": [["sharononeil368@gmail.com"], ["sync_internet_data"], ["sync_bookmarks"], ["sync_open_pages"], ["sync_saved_pages"], ["sharononeil368@gmail.com"], ["Pin on Simon, God of Hairdos"], ["puck from.glee - Google Search"], ["Midjourney AI - Free Image Generator"], ["billie eilish birds of a feather lyrics - Google Search"], ["en_US"]], "Total_raw_rows": 11, "Exploration_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT TAB_TITLE FROM TABS WHERE TAB_TITLE REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "Extraction_sql": "SELECT ACCOUNT_NAME FROM BOOKMARKS WHERE ACCOUNT_NAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT SYNC_KEY FROM INTERNET_SYNC WHERE SYNC_KEY REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT account_name FROM SYNC_STATE WHERE account_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT TAB_TITLE FROM TABS WHERE TAB_TITLE REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT URL FROM BOOKMARKS WHERE URL REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT TITLE FROM BOOKMARKS WHERE TITLE REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT data FROM SYNC_STATE WHERE data REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT TAB_URL FROM TABS WHERE TAB_URL REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT TAB_TITLE FROM TABS WHERE TAB_TITLE REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title FROM searchengine WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT url FROM searchengine WHERE url REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT extra1 FROM searchengine WHERE extra1 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT extra2 FROM searchengine WHERE extra2 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL SELECT extra3 FROM searchengine WHERE extra3 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://home.imgsmail.ru/resplash/123689/i/meta/favicon.ico"], ["https://search.seznam.cz/re/media/favicon.192a42730e.ico"]], "Total_raw_rows": 2, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT title FROM searchengine WHERE title REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT url FROM searchengine WHERE url REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT extra1 FROM searchengine WHERE extra1 REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT extra2 FROM searchengine WHERE extra2 REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' \nUNION ALL \nSELECT extra3 FROM searchengine WHERE extra3 REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "USERNAME", "PII": ["google", "duckduckgo", "yahoo", "youtube", "bing", "so360", "qwant", "toutiao", "startpage", "shenma", "naver", "yandex", "mailru", "seznam", "yandexru", "daum", "baidu"], "Num_of_PII": 17, "source_columns": ["android_metadata.locale", "searchengine.title", "searchengine.url", "searchengine.image_url", "searchengine.extra1", "searchengine.extra2", "searchengine.extra3"], "Raw_rows_first_100": [["en_US"], ["google"], ["DuckDuckGo"], ["yahoo"], ["youtube"], ["bing"], ["so360"], ["qwant"], ["toutiao"], ["StartPage"], ["shenma"], ["naver"], ["yandex_com"], ["mail_ru"], ["seznam"], ["yandex_ru"], ["daum"], ["baidu"], ["youtube"], ["google"], ["https://duckduckgo.com/favicon.ico"], ["https://home.imgsmail.ru/resplash/123689/i/meta/favicon.ico"], ["https://m.toutiao.com/favicon.ico"], ["https://p0.ssl.qhimg.com/d/inn/128c749e/icon.png"], ["https://search.daum.net/favicon.ico"], ["https://search.naver.com/favicon.ico"], ["https://search.seznam.cz/re/media/favicon.192a42730e.ico"], ["https://search.yahoo.com/favicon.ico"], ["https://sm01.alicdn.com/L1/272/1990/favicon/favicon.ico"], ["https://www.baidu.com/favicon.ico"], ["https://www.bing.com/sa/simg/bing_p_rr_teal_min.ico"], ["https://www.google.com/favicon.ico"], ["https://www.google.com/images/branding/product/ico/googleg_alldp.ico"], ["https://www.qwant.com/favicon-64.png"], ["https://www.startpage.com/favicon.ico"], ["https://www.youtube.com/img/favicon_32.png"], ["https://www.youtube.com/s/desktop/fadc8afc/img/favicon_48x48.png"], ["https://yandex.com/favicon.ico"], ["https://yandex.ru/favicon.ico"]], "Total_raw_rows": 39, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT title FROM searchengine WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT url FROM searchengine WHERE url REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT image_url FROM searchengine WHERE image_url REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT extra1 FROM searchengine WHERE extra1 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT extra2 FROM searchengine WHERE extra2 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT extra3 FROM searchengine WHERE extra3 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT title FROM searchengine WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT url FROM searchengine WHERE url REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT image_url FROM searchengine WHERE image_url REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT extra1 FROM searchengine WHERE extra1 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT extra2 FROM searchengine WHERE extra2 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' UNION ALL SELECT extra3 FROM searchengine WHERE extra3 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"], ["google"], ["DuckDuckGo"], ["yahoo"], ["youtube"], ["bing"], ["so360"], ["qwant"], ["toutiao"], ["StartPage"], ["shenma"], ["https://duckduckgo.com/favicon.ico"], ["https://home.imgsmail.ru/resplash/123689/i/meta/favicon.ico"], ["https://m.toutiao.com/favicon.ico"], ["https://p0.ssl.qhimg.com/d/inn/128c749e/icon.png"], ["https://search.daum.net/favicon.ico"], ["https://search.naver.com/favicon.ico"], ["https://search.seznam.cz/re/media/favicon.192a42730e.ico"], ["https://search.yahoo.com/favicon.ico"], ["https://sm01.alicdn.com/L1/272/1990/favicon/favicon.ico"], ["https://www.baidu.com/favicon.ico"]], "Total_raw_rows": 21, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT title FROM searchengine WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT url FROM searchengine WHERE url REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT extra1 FROM searchengine WHERE extra1 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT extra2 FROM searchengine WHERE extra2 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' UNION ALL SELECT extra3 FROM searchengine WHERE extra3 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://www.youtube.com/s/desktop/fadc8afc/img/favicon_48x48.png"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title FROM searchengine WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT url FROM searchengine WHERE url REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT extra1 FROM searchengine WHERE extra1 REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT extra2 FROM searchengine WHERE extra2 REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT extra3 FROM searchengine WHERE extra3 REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "EMAIL", "PII": ["19735203731@s.whatsapp.net", "923402582955@s.whatsapp.net", "14847353029@s.whatsapp.net", "19199037779@s.whatsapp.net"], "Num_of_PII": 4, "source_columns": ["ZWAAGGREGATECALLEVENT.ZLINKTOKEN", "ZWACDCALLEVENT.ZCALLIDSTRING", "ZWACDCALLEVENT.ZGROUPCALLCREATORUSERJIDSTRING", "ZWACDCALLEVENT.ZGROUPJIDSTRING", "ZWACDCALLEVENTPARTICIPANT.ZJIDSTRING"], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 9, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": ["ZWACDCALLEVENT.ZCALLIDSTRING", "ZWACDCALLEVENTPARTICIPANT.ZJIDSTRING", "ZWAAGGREGATECALLEVENT.ZLINKTOKEN"], "Raw_rows_first_100": [["372FA57E129467051E04B3E4DD5A26D5"], ["3A9CEF8B4996D645358B"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 6, "Exploration_sql": "SELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "Extraction_sql": "SELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL\nSELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}'", "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "USERNAME", "PII": ["19735203731", "923402582955", "14847353029", "19199037779", "WAAggregateCallEvent", "WACDCallEvent", "WACDCallEventParticipant", "WAJoinableCallEvent", "WAJoinableCallEventParticipant", "WAUpcomingCallEvent"], "Num_of_PII": 10, "source_columns": ["ZWAAGGREGATECALLEVENT.ZLINKTOKEN", "ZWACDCALLEVENT.ZCALLIDSTRING", "ZWACDCALLEVENT.ZGROUPCALLCREATORUSERJIDSTRING", "ZWACDCALLEVENT.ZGROUPJIDSTRING", "ZWACDCALLEVENTPARTICIPANT.ZJIDSTRING", "Z_PRIMARYKEY.Z_NAME"], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["WAAggregateCallEvent"], ["WACDCallEvent"], ["WACDCallEventParticipant"], ["WAJoinableCallEvent"], ["WAJoinableCallEventParticipant"], ["WAUpcomingCallEvent"]], "Total_raw_rows": 15, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZGROUPJIDSTRING FROM ZWACDCALLEVENT WHERE ZGROUPJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["3C399CDDAF11A41F7AFF2892E0A4B10C"], ["3C37CBFE11C261E6CD80C2DE7834D770"], ["372FA57E129467051E04B3E4DD5A26D5"], ["3A6DF670F7121CD6D08B"], ["3A9CEF8B4996D645358B"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["WAAggregateCallEvent"], ["WACDCallEvent"], ["WACDCallEventParticipant"], ["WAJoinableCallEvent"], ["WAJoinableCallEventParticipant"], ["WAUpcomingCallEvent"]], "Total_raw_rows": 15, "Exploration_sql": "SELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT Z_NAME FROM Z_PRIMARYKEY WHERE Z_NAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT ZLINKTOKEN FROM ZWAAGGREGATECALLEVENT WHERE ZLINKTOKEN REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT ZCALLIDSTRING FROM ZWACDCALLEVENT WHERE ZCALLIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT ZJIDSTRING FROM ZWACDCALLEVENTPARTICIPANT WHERE ZJIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT device_uuid FROM cloud_tab_devices WHERE device_uuid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT title FROM cloud_tabs WHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT url FROM cloud_tabs WHERE url REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT key FROM metadata WHERE key REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' \nUNION ALL \nSELECT value FROM metadata WHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["3075F5C2-E558-4E12-B421-6118960D1D2E"], ["ambarrestaurant.com/wp-content/uploads/2024/07/ambar-ch-dinner-07012024.pdf"], ["https://www.bluebite.com/?utm_source=https://www.themtag.com/n10053654&utm_medium=301"], ["https://www.google.com/search?q=snack+with+dairy+kids&client=safari&sca_esv=6eac42e19cef7bdf&hl=en-us&sxsrf=ADLYWIJQfVNS-z6971OqeDnskNzgmBnxVA%3A1723546457188&ei=WTu7Zu6YC9vl5NoPsZT5uAM&oq=snack+with+dairy+kids&gs_lp=EhNtb2JpbGUtZ3dzLXdpei1zZXJwIhVzbmFjayB3aXRoIGRhaXJ5IGtpZHNIkXVQmR9Yym5wEXgBkAEAmAGkAaABthWqAQQzMi4yuAEDyAEA-AEBmAIVoALyC6gCD8ICChAAGLADGNYEGEfCAg0QABiABBiwAxhDGIoFwgIHECMYJxjqAsICChAuGIAEGEMYigXCAgoQABiABBhDGIoFwgIQEC4YgAQY0QMYQxjHARiKBcICDhAuGIAEGLEDGNEDGMcBwgILEC4YgAQY0QMYxwHCAgUQABiABMICDhAAGIAEGLEDGIMBGIoFwgILEC4YgAQYkQIYigXCAgsQABiABBiRAhiKBcICDRAAGIAEGEMY5QQYigXCAggQABiABBixA8ICDRAAGIAEGLEDGEMYigXCAhYQLhiABBixAxjRAxhDGIMBGMcBGIoFwgILEAAYgAQYsQMYgwHCAggQLhiABBixA8ICExAuGIAEGLEDGNEDGIMBGMcBGArCAgoQABiABBgUGIcCwgIHEAAYgAQYCsICCBAAGIAEGMkDwgILEC4YgAQYsQMYgwHCAgYQABgWGB6YAwiIBgGQBhGSBwQxOC4zoAfzbQ&sclient=mobile-gws-wiz-serp"], ["https://www.ravensmanorexperience.com/uploads/b/10bcaef0-743a-11ea-b3f4-31522c100dea/Summer%20PDF_NTkzNT.pdf"], ["https://ambarrestaurant.com/wp-content/uploads/2024/07/ambar-ch-dinner-07012024.pdf"], ["https://support.apple.com/en-us/104959"], ["https://www.bing.com/search?q=figs+tre+wont+ripen+green&form=QBLH&sp=-1&ghc=1&lq=0&pq=figs+tre+wont+ripen+green&sc=10-25&qs=n&sk=&cvid=E8428067064D4726B92401B41C5C64A5&ghsh=0&ghacc=0&ghpl="], ["https://found.apple.com/airtag?pid=5500&b=00&pt=004c&fv=00200240&dg=00&z=00&pi=fb28165432edfeebc48867d872c4acc82721e710cd8a4eede50401ec"]], "Total_raw_rows": 9, "Exploration_sql": "SELECT device_uuid FROM cloud_tab_devices WHERE device_uuid REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT title FROM cloud_tabs WHERE title REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT url FROM cloud_tabs WHERE url REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT key FROM metadata WHERE key REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}' UNION ALL \nSELECT value FROM metadata WHERE value REGEXP '\\+?[0-9]{1,4}[- .]?\\(?[0-9]{1,3}?\\)?[- .]?[0-9]{1,4}[- .]?[0-9]{1,4}[- .]?[0-9]{1,9}';", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "USERNAME", "PII": ["Cellebrite", "falafelhardboiledeggisrael", "DickensCider", "BlueBite", "Mapat", "snackwithdairykids", "figsgrowinggreennotripen", "Hersheypark", "HowtoChangeaLightBulb", "Tolls", "ravensmanorexperience", "cooldryplacestorage", "HaifaAirport", "whats thesalestaxinnyconclothing", "canyoucopyamiibowithflipperzero", "jackalope", "ambarrestaurant", "RavensManor", "UseCrashDetectiononiPhoneorAppleWatch", "figstre won'tripengreen", "Hersheypark", "AirTag", "CatFishCops", "myfilesdownload", "serverchangetoken", "usemanateecontainer"], "Num_of_PII": 26, "source_columns": ["cloud_tab_devices.device_name", "cloud_tabs.title", "metadata.key"], "Raw_rows_first_100": [["Cellebrite"], ["falafel hardboiled egg israel - Google Search"], ["Dickens Cider is now Dickins Cider Company | Hard Cider Drinks | Dickens Cider"], ["Blue Bite | Connecting Possibility"], ["Home page - Mapat"], ["snack with dairy kids - Google Search"], ["figs growing green not ripe - Google Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["How to Change a Light Bulb"], ["Tolls"], ["ravensmanorexperience.com"], ["cool dry place storage - Google Search"], ["Haifa Airport - Wikipedia"], ["whats the sales tax in nyc on clothing - Google Search"], ["can you copy amiibo with flipper zero - Google Search"], ["jackalope - Google Search"], ["ambarrestaurant.com/wp-content/uploads/2024/07/ambar-ch-dinner-07012024.pdf"], ["Menu | Raven's Manor"], ["Use Crash Detection on iPhone or Apple Watch to call for help in an accident - Apple Support"], ["figs tre wont ripen green - Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["AirTag"], ["CatFish Cops"], ["my files download - Google Search"], ["server_change_token"], ["use_manatee_container"]], "Total_raw_rows": 26, "Exploration_sql": "SELECT device_name FROM cloud_tab_devices WHERE device_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT title FROM cloud_tabs WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' \nUNION ALL \nSELECT key FROM metadata WHERE key REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": "SELECT device_name FROM cloud_tab_devices WHERE device_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT title FROM cloud_tabs WHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT key FROM metadata WHERE key REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["Cellebrite"], ["falafel hardboiled egg israel - Google Search"], ["Dickens Cider is now Dickins Cider Company | Hard Cider Drinks | Dickens Cider"], ["Blue Bite | Connecting Possibility"], ["Home page - Mapat"], ["snack with dairy kids - Google Search"], ["figs growing green not ripe - Google Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["How to Change a Light Bulb"], ["Tolls"], ["ravensmanorexperience.com"], [{"__bytes_b64__": "YnBsaXN0MDDUAQIDBAUGBwpYJHZlcnNpb25ZJGFyY2hpdmVyVCR0b3BYJG9iamVjdHMSAAGGoF8QD05TS2V5ZWRBcmNoaXZlctEICVRyb290gAGkCwwRElUkbnVsbNINDg8QViRjbGFzc18QD0NoYW5nZVRva2VuRGF0YYADgAJPEC8fChASDAAATBJW9UHWAAAAABgBGAAiFgj5m+me89ruvc4BEM2Hk5/Ph+jnpgEoANITFBUWWiRjbGFzc25hbWVYJGNsYXNzZXNfEBNDS1NlcnZlckNoYW5nZVRva2VuohUXWE5TT2JqZWN0CBEaJCkyN0lMUVNYXmNqfH6AsrfCy+HkAAAAAAAAAQEAAAAAAAAAGAAAAAAAAAAAAAAAAAAAAO0="}]], "Total_raw_rows": 12, "Exploration_sql": "SELECT device_name FROM cloud_tab_devices WHERE device_name REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT title FROM cloud_tabs WHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}' \nUNION ALL \nSELECT value FROM metadata WHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["cool dry place storage - Google Search"], ["Menu | Raven's Manor"]], "Total_raw_rows": 2, "Exploration_sql": "SELECT title FROM cloud_tabs WHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' \nUNION ALL \nSELECT value FROM metadata WHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale\nFROM android_metadata\nWHERE locale REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}';", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale\nFROM android_metadata\nWHERE locale REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}';", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale AS possible_username\nFROM android_metadata\nWHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale\nFROM android_metadata\nWHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT NULL\nFROM android_metadata\nWHERE 0;", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT path AS possible_email\nFROM journal\nWHERE path REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}' UNION ALL\nSELECT key AS possible_email\nFROM journal_entry\nWHERE key REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["BD8E9D7526970329EBAA1947E3555FF6.discover_story_streaming_snap_ff"], ["2DB0D566CE0BFC10322344128086AD99.discover_story_streaming_snap"], ["2E6AD61E5AC1518921549291B17B78C4.discover_story_streaming_snap"], ["4E45C3749501999D41DA43D3E94FB163.discover_story_streaming_snap_ff"], ["A87458944357595BEF05BD6DA3B1FD99.discover_story_streaming_snap_ff"], ["9A57DEBAD4A3345055253FDE194BF37E.discover_story_streaming_snap_ff"], ["C63944D5009403772B9407E370E9876F.discover_story_streaming_snap_ff"], ["30918F1765D509CF5073178240329C28.snap_loading_frame"], ["07D59D2A708B4088F4954525453296F9.snap_loading_frame"], ["358501AF78004E4013FF8802869271D9.discover_story_streaming_snap"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT path AS possible_phone\nFROM journal\nWHERE path REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT key AS possible_phone\nFROM journal_entry\nWHERE key REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["C730963C61386A34712C819CA25436C9.media"], ["EF47D267E8FBBD7CC1051BF6D3EB77FB.edits"], ["E2176FA713B2A1B1870E6AB99D6B9CFA.edits"], ["D38DF61214F1AC5578A4E3D70D68D5A2.snap_loading_frame"], ["A1B63A789086B7516FCD1E5EE9035C5C.snap_loading_frame"], ["ED86EFA3B1D855000DC39B8F715E3C32.snap_loading_frame"], ["A35E532E17C781BD95B551760AA087D9.snap_loading_frame"], ["B06FF61E48D8A31FB3F9CC8D2765CBDE.snap_loading_frame"], ["AF24FE5D839F47BF49E132FC50B2D8FC.snap_loading_frame"], ["B3CBFB1E6E75F3E892BA6E91AED16E83.snap_loading_frame"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT key AS possible_username\nFROM journal_entry\nWHERE key REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"], ["/data/data/com.snapchat.android/files/file_manager/BLOOPS_STICKER"], ["/data/data/com.snapchat.android/files/file_manager/Bitmoji_Preview"], ["/data/data/com.snapchat.android/files/file_manager/LENS_ASSET_CONTENT_TYPE_NAME"], ["/data/data/com.snapchat.android/files/file_manager/Live_Mirror_Model"], ["/data/data/com.snapchat.android/files/file_manager/Login_Kit_Privacy"], ["/data/data/com.snapchat.android/files/file_manager/MUSIC_GENERIC_ASSET_TYPE"], ["/data/data/com.snapchat.android/files/file_manager/Maps_Kashmir"], ["/data/data/com.snapchat.android/files/file_manager/Maps_WorldEffects"], ["/data/data/com.snapchat.android/files/file_manager/Perception"], ["/data/data/com.snapchat.android/files/file_manager/PerceptionMl"], ["12DB3FD3B46FC8F9DD60F79CB359FBFE.khand_medium"], ["9F3F465DC00D96696DDDFE0A946AAB99.khand_medium"], ["2FC6ABAAFF969A947FAB4E52FE0971FC.thumbnail"], ["C730963C61386A34712C819CA25436C9.media"], ["70177660B739FDDF75DE848B97DC6A6E.edits"], ["03FD66A15523689AD035E1E2B1AD6DAE.chat_wallpaper_media"], ["D41F76126B39D1F7E7EC3D8FA4079D0F.discover_story_streaming_snap"], ["5BBE52CE6D0010CB50CA3221C4741E7D.discover_story_streaming_snap_ff"], ["F05AD4876AFE7190FBF88E879238978A.discover_story_streaming_snap_ff"], ["67B685FF2948DC22416716E822D4F5A1.discover_story_streaming_snap_ff"]], "Total_raw_rows": 21, "Exploration_sql": "SELECT locale AS possible_name\nFROM android_metadata\nWHERE locale REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' UNION ALL\nSELECT path AS possible_name\nFROM journal\nWHERE path REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' UNION ALL\nSELECT key AS possible_name\nFROM journal_entry\nWHERE key REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A2_journal.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["/data/data/com.snapchat.android/files/file_manager/map-place-icons"], ["/data/data/com.snapchat.android/files/file_manager/place-profile-annotation"], ["/data/data/com.snapchat.android/files/file_manager/place-profile-info"]], "Total_raw_rows": 3, "Exploration_sql": "SELECT path AS possible_address\nFROM journal\nWHERE path REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b' UNION ALL\nSELECT key AS possible_address\nFROM journal_entry\nWHERE key REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_email\nFROM dialog_filter\nWHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_phone\nFROM dialog_filter\nWHERE title REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title AS possible_username\nFROM dialog_filter\nWHERE title REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title AS possible_person_name\nFROM dialog_filter\nWHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}';", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account1cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_address\nFROM dialog_filter\nWHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_email\nFROM dialog_filter\nWHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_phone\nFROM dialog_filter\nWHERE title REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}';", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title AS possible_username\nFROM dialog_filter\nWHERE title REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title AS possible_person_name\nFROM dialog_filter\nWHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account2cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_address\nFROM dialog_filter\nWHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_email\nFROM dialog_filter\nWHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_phone\nFROM dialog_filter\nWHERE title REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title AS possible_username\nFROM dialog_filter\nWHERE title REGEXP '^[A-Za-z][A-Za-z0-9._-]{2,51}$';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["ALL_CHATS"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT title AS possible_person_name\nFROM dialog_filter\nWHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}';", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A3_account3cache4.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT title AS possible_address\nFROM dialog_filter\nWHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string AS possible_email\nFROM sync_item\nWHERE key_string REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string AS possible_phone\nFROM sync_item\nWHERE key_string REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string AS possible_username\nFROM sync_item\nWHERE key_string REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string AS possible_person_name\nFROM sync_item\nWHERE key_string REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_myplaces.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT key_string\nFROM sync_item\nWHERE key_string REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_gmm_storage.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale AS potential_email\nFROM android_metadata\nWHERE locale REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT _key_pri AS potential_email\nFROM gmm_storage_table\nWHERE _key_pri REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT _key_sec AS potential_email\nFROM gmm_storage_table\nWHERE _key_sec REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_storage.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale AS possible_phone\nFROM android_metadata\nWHERE locale REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT _key_pri AS possible_phone\nFROM gmm_storage_table\nWHERE _key_pri REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT _key_sec AS possible_phone\nFROM gmm_storage_table\nWHERE _key_sec REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_storage.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["CompletedNavigation"], ["GeofenceData"], ["WaypointsHaveChangedInNav"], ["bundled"], ["STORED_GEOFENCE_INDEX_STORAGE_ID"]], "Total_raw_rows": 5, "Exploration_sql": "SELECT\n _key_pri AS possible_username\nFROM\n gmm_storage_table\nWHERE\n _key_pri REGEXP '^[A-Za-z][A-Za-z0-9._-]{2,51}$'\nUNION ALL\nSELECT\n _key_sec AS possible_username\nFROM\n gmm_storage_table\nWHERE\n _key_sec REGEXP '^[A-Za-z][A-Za-z0-9._-]{2,51}$'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_storage.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"], ["CompletedNavigation"], ["GeofenceData"], ["WaypointsHaveChangedInNav"], ["bundled"], ["STORED_GEOFENCE_INDEX_STORAGE_ID"]], "Total_raw_rows": 6, "Exploration_sql": "SELECT locale AS possible_person_name\nFROM android_metadata\nWHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n\nUNION ALL\n\nSELECT _key_pri AS possible_person_name\nFROM gmm_storage_table\nWHERE _key_pri REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n\nUNION ALL\n\nSELECT _key_sec AS possible_person_name\nFROM gmm_storage_table\nWHERE _key_sec REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_gmm_storage.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT\n _key_pri,\n _key_sec,\n CAST(_data AS TEXT) AS possible_address\nFROM gmm_storage_table\nWHERE\n _key_pri REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\n OR\n _key_sec REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\n OR\n CAST(_data AS TEXT) REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "EMAIL", "PII": ["heather@cellebrite.com", "hmahalik@gmail.com"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["hmahalik@gmail.com"], ["heather@cellebrite.com"], ["hmahalik@gmail.com"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT value\nFROM Tokens\nWHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT c1value\nFROM Tokens_content\nWHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "SELECT value\nFROM Tokens\nWHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT c1value\nFROM Tokens_content\nWHERE c1value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PHONE", "PII": ["7423794330"], "Num_of_PII": 1, "source_columns": ["Tokens_content.c1value"], "Raw_rows_first_100": [["17423794330"], ["7423794330"]], "Total_raw_rows": 2, "Exploration_sql": "SELECT value AS possible_phone\nFROM Contacts\nWHERE value REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT c1value AS possible_phone\nFROM Tokens_content\nWHERE c1value REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}';", "Extraction_sql": "SELECT value AS possible_phone\nFROM Contacts\nWHERE value REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT c1value AS possible_phone\nFROM Tokens_content\nWHERE c1value REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}';", "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "USERNAME", "PII": ["heather", "hmahalik"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value"], "Raw_rows_first_100": [["heather"], ["hmahalik"], ["heather"], ["hmahalik"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT value AS possible_username\nFROM Tokens\nWHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n AND value NOT LIKE '%@%'\n\nUNION ALL\n\nSELECT c1value AS possible_username\nFROM Tokens_content\nWHERE c1value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n AND c1value NOT LIKE '%@%'", "Extraction_sql": "SELECT value AS possible_username\nFROM Tokens\nWHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' AND value NOT LIKE '%@%'\nUNION ALL\nSELECT c1value AS possible_username\nFROM Tokens_content\nWHERE c1value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b' AND c1value NOT LIKE '%@%'", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "PERSON_NAME", "PII": ["Heather", "Bo"], "Num_of_PII": 2, "source_columns": ["Tokens.value", "Tokens_content.c1value"], "Raw_rows_first_100": [["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["Bo"], ["heather@cellebrite.com"], ["heather"], ["hmahalik@gmail.com"], ["hmahalik"], ["Bo"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT value AS possible_person_name\nFROM Tokens\nWHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT c1value AS possible_person_name\nFROM Tokens_content\nWHERE c1value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": "SELECT value AS possible_person_name\nFROM Tokens\nWHERE value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT c1value AS possible_person_name\nFROM Tokens_content\nWHERE c1value REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A4_peopleCache_sharononeil368@gmail.com_com.google_14.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value AS possible_address\nFROM Tokens\nWHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT c1value AS possible_address\nFROM Tokens_content\nWHERE c1value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT\n URL AS possible_email_source\nFROM BOOKMARKS\nWHERE URL REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n SURL AS possible_email_source\nFROM BOOKMARKS\nWHERE SURL REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n TITLE AS possible_email_source\nFROM BOOKMARKS\nWHERE TITLE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n TAGS AS possible_email_source\nFROM BOOKMARKS\nWHERE TAGS REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n SOURCEID AS possible_email_source\nFROM BOOKMARKS\nWHERE SOURCEID REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n ACCOUNT_NAME AS possible_email_source\nFROM BOOKMARKS\nWHERE ACCOUNT_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n ACCOUNT_TYPE AS possible_email_source\nFROM BOOKMARKS\nWHERE ACCOUNT_TYPE REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n DEVICE_NAME AS possible_email_source\nFROM BOOKMARKS\nWHERE DEVICE_NAME REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n SYNC1 AS possible_email_source\nFROM BOOKMARKS\nWHERE SYNC1 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n SYNC2 AS possible_email_source\nFROM BOOKMARKS\nWHERE SYNC2 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n SYNC3 AS possible_email_source\nFROM BOOKMARKS\nWHERE SYNC3 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n SYNC4 AS possible_email_source\nFROM BOOKMARKS\nWHERE SYNC4 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n SYNC5 AS possible_email_source\nFROM BOOKMARKS\nWHERE SYNC5 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n keyword AS possible_email_source\nFROM BOOKMARKS\nWHERE keyword REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT\n description AS possible_email_source\nFROM BOOKMARKS\nWHERE description REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT URL AS possible_phone\nFROM BOOKMARKS\nWHERE URL REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT SURL AS possible_phone\nFROM BOOKMARKS\nWHERE SURL REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT TITLE AS possible_phone\nFROM BOOKMARKS\nWHERE TITLE REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT TAGS AS possible_phone\nFROM BOOKMARKS\nWHERE TAGS REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["Sharon's S21"], ["Sharon's S21"], ["Sharon's S21"], ["Sharon's S21"]], "Total_raw_rows": 4, "Exploration_sql": "SELECT ACCOUNT_NAME AS possible_username\nFROM BOOKMARKS\nWHERE ACCOUNT_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT DEVICE_NAME AS possible_username\nFROM BOOKMARKS\nWHERE DEVICE_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT SOURCEID AS possible_username\nFROM BOOKMARKS\nWHERE SOURCEID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT TAGS AS possible_username\nFROM BOOKMARKS\nWHERE TAGS REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT keyword AS possible_username\nFROM BOOKMARKS\nWHERE keyword REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT description AS possible_username\nFROM BOOKMARKS\nWHERE description REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT guid AS possible_username\nFROM BOOKMARKS\nWHERE guid REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "PERSON_NAME", "PII": ["Sharon"], "Num_of_PII": 1, "source_columns": ["BOOKMARKS.TITLE", "BOOKMARKS.TAGS", "BOOKMARKS.ACCOUNT_NAME", "BOOKMARKS.DEVICE_NAME", "BOOKMARKS.keyword", "BOOKMARKS.description"], "Raw_rows_first_100": [[{"__bytes_b64__": "BAGBHAIGAQABLGwCAOx/Yz8pWMaZgKzK9gidY1JbWlHtbmZoPVRvHa8L1Qa5v77osj/b9cxf6AihGfAj9/oMzNgzwG4TEa1ocxhMgTw="}], [{"__bytes_b64__": "BAGBHAIGAQABLGwCADg08Y0rLftwtKLewxQylCXdY9YcWUe01qQU3juIWvYiZTepFwA/AGQEV8xammaotcT+LNCNEQBvYK49zZmdniQ="}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAx0od46RvJj3ZMpmE/r++aNuxFfDaTafncAW0XddYSB0WkI7vryB4lplJKYOFVJvriCJ54MlN56/+r6ZnwIIKx3TF4rvHTUNRIc9LKLCfh5hqUwF5ebYY+wMqebfiqMSY="}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAN/bPhb+tihkAfwO8uIxTzh9YWVp1U/kZ3oy/IzxRDnWH35ch+01jfwXwTtCmEj+LyGgSjHzzowXmue9uLyUvfpmVNbt3JCOqCl0EyBAo5+xpVCiij7EFhenIbvW/5cN0="}], [{"__bytes_b64__": "BAGBfgIHAQABLIFMAgAxMZf3KoVtVYHMTrajimnorfRebkfgH/qYhDfOJ2RRzWYOGMxn9xTFfrGxr/Cg60A6HnjLCVgpgftWYAW/bKRQc57iUOY3/35T/FmViNlLg/0T1xmtyNMJL85eTN6Ty8FnisaqUE3+iEK+drFSfnJt"}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgDferB3B+clQ8gWXYeFleQ01pIC6VzQ+FxtlyoVYuGZ/sO3K+0Bwv1BqzJe5oM8CyJQtis/qRu/Li9LMYVDQxRCkfClKVoXFf6qVbzv+0XrXKADvEyQD083AV/geGnfwx8="}], ["Sharon's S21"], ["Sharon's S21"], ["Sharon's S21"], ["Sharon's S21"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT TITLE AS possible_person_name\nFROM BOOKMARKS\nWHERE TITLE REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\n\nUNION ALL\n\nSELECT TAGS AS possible_person_name\nFROM BOOKMARKS\nWHERE TAGS REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\n\nUNION ALL\n\nSELECT ACCOUNT_NAME AS possible_person_name\nFROM BOOKMARKS\nWHERE ACCOUNT_NAME REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\n\nUNION ALL\n\nSELECT DEVICE_NAME AS possible_person_name\nFROM BOOKMARKS\nWHERE DEVICE_NAME REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\n\nUNION ALL\n\nSELECT keyword AS possible_person_name\nFROM BOOKMARKS\nWHERE keyword REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\n\nUNION ALL\n\nSELECT description AS possible_person_name\nFROM BOOKMARKS\nWHERE description REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": "SELECT TITLE AS possible_person_name\nFROM BOOKMARKS\nWHERE TITLE REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT TAGS AS possible_person_name\nFROM BOOKMARKS\nWHERE TAGS REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT ACCOUNT_NAME AS possible_person_name\nFROM BOOKMARKS\nWHERE ACCOUNT_NAME REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT DEVICE_NAME AS possible_person_name\nFROM BOOKMARKS\nWHERE DEVICE_NAME REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT keyword AS possible_person_name\nFROM BOOKMARKS\nWHERE keyword REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\nUNION ALL\nSELECT description AS possible_person_name\nFROM BOOKMARKS\nWHERE description REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_SBrowser2.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [[{"__bytes_b64__": "BAGBHAIGAQABLGwCAFgwiN0XYaRNwN6JFtBRdWfQw5YoTxjvsswMtBRYpQ4bzjZW6jjqVulUtvEdo3wPiKvtT0SzbxZ9i5yPZb27tpI="}], [{"__bytes_b64__": "BAGEPgIHAQABLIQMAgABgxFFetbBD88wsavVtVjy+KN6LQaF52tl9Ztc+fzXT8MhsjknjCsDwrr+9tZQ1uZZNjvrZf13/vt7Nn58Xe1+sdDXmFRvJGfComqfeWyTQONx07TYcFCxWvZNWaecNUuUw+EC87PJColRgnZwE0JLLZ8Zcjsh8AjPicnUGgdkOfN8I1TaXKxMGebpzElMuqtVIhlph5EGeSm7pg0v/ELp/VeGLuxGeKbA6tXvUoiGaT51XBQebcsvu7qUegGuoIrZLf8Od7Q3JpKpH9miAs8O6o+o4zZXEI5LBv1suoFxmU6MRC7lTPGYgU6e+O1Wd9cSg4F2f7U2fAOBGDPYg3BrCZONls5ungK74IoKY48a5A=="}], [{"__bytes_b64__": "BAGBPgIHAQABLIEMAgD443e4SeU/jxbaN7+6lk4CFvovH1ui72l0PE6Mr20DtdnV/jQxlqAi9jhvXfYxTbDjh9dKl6yNgZm/19GPdqzMV0aYY9i3A05cPRL/VKYMpw=="}], [{"__bytes_b64__": "BAGDHgIHAQABLIJsAgCKKvrixPJ+dMqD7ppuoI0MyZaiuUvIgtJ4WHgnxrQGklMS6lrCMckJrtZnmVGBcHWPgbEIH/JKEmczg7KSJqaMfK+BKSyUC+v3ydvl2m/UC0JEA37crOZHBfy5z4B7KF1j7b1u7DDYe4DzyPE0+JyV0dfHonPF0zGA+yDZUAOoReeMJ9yHcuCKnASWELWEEvSukVLIZBmZ2OhTv4KNnbCyLBcA0Xz3SQ32AC3/+ef77BgKgSzNArHW3R5aUBmC7EE="}], [{"__bytes_b64__": "BAGDHgIHAQABLIJsAgDa5rn5/h/uPxLOY8KfuGKu45sg2E1RRV79AuDrwZAO/CdOjK94CeByOdIR/dW/LnMwaCJ/Fzsktoej/DoH9XIfnD+9F+UZYDRgfpb9Ie0a/0TZyy2zL4HhatC455OfG5sGqlu7ZvodLztLBH1iqnEr3fC5hFGYgiAIbKmbwXITQdJ6efZ2J6a4Ne5dEK7nSq8Bky9lsF2g/R6Yug7kd5m+AHc1BEZoXFDer3Gm30trqQgKEgafKEJftuh+Cf8/Wic="}], [{"__bytes_b64__": "BAGEPgIHAQABLIQMAgBQ1ryPaiEATOXfVZTPg8FP3oJkx7RwFyn+2sKiKDDTGe/zN3pxBhO+t0++nKxLvCGlZ5/q8uMRVU0e9XsXOeH4uR4SDyxAajG0+/6OmOaOjtXwZGmhkY8d0UaJSyT1OukC02GESg3KjDFOeQsNQsfWEdvhNUWozvT4y7TUo1fiKMzWpKvIVK3NRaVFs8Dxgs0dNirE73Feyeps2GRq6CrF1hisNwoWNAp6H62mYO4OSgpbH8vIo7HKytAfYok6JzGpW2KUnXjsI/aLOg+OVz5a7WbtNPtX2EZ93WfLmRflqbD03VPN73Bgz6ENlzB79bNuPDr6EXSiBjUg4lRre7kwsO7iIo2Hv70JZFsyhJfQ2A=="}], [{"__bytes_b64__": "BAGBPgIHAQABLIEMAgB/6+uZMDK39vfkGeXZ94x8HT2s4mGPQAcYJhlvjrZsx/FALnRkp5fEspNZKtEkku2zkIZzFtG4mDnV4b0hLpq/HEyEikPekmGfVSgDniYNpg=="}], [{"__bytes_b64__": "BAGDHgIHAQABLIJsAgBwvy2V6oP1GFaG5qu3Y+17nx7mxsU35WfB3ALBxs71iPNCuztsZV3ef7wmH7hMfFHfLo6gAnxafQkx7W+yh3d7gqtqsxxDhl8oRIGXZ8O8mIJQN87jXx/OzIV7jpVX4vIW2kP773vllT1cTagB4rpWx2sk8kEWCBKPRadIjgJjBNAh3e3alczuqrxeraLCXzC3wsmaCq3EHAkGC8KXuMdBJkH/s1cLUHAa6Ke0jYIhjwXKuEOIBu3bICdrPZR1UAE="}], [{"__bytes_b64__": "BAGBXgIHAQABLIEsAgAx0od46RvJj3ZMpmE/r++aNuxFfDaTafncAW0XddYSB0WkI7vryB4lplJKYOFVJvriCJ54MlN56/+r6ZnwIIKx3TF4rvHTUNRIc9LKLCfh5hqUwF5ebYY+wMqebfiqMSY="}]], "Total_raw_rows": 9, "Exploration_sql": "SELECT URL AS possible_address\nFROM BOOKMARKS\nWHERE URL REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT SURL AS possible_address\nFROM BOOKMARKS\nWHERE SURL REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT TITLE AS possible_address\nFROM BOOKMARKS\nWHERE TITLE REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT TAGS AS possible_address\nFROM BOOKMARKS\nWHERE TAGS REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT description AS possible_address\nFROM BOOKMARKS\nWHERE description REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale AS possible_email\nFROM android_metadata\nWHERE locale REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT title AS possible_email\nFROM searchengine\nWHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT url AS possible_email\nFROM searchengine\nWHERE url REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT image_url AS possible_email\nFROM searchengine\nWHERE image_url REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT extra1 AS possible_email\nFROM searchengine\nWHERE extra1 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT extra2 AS possible_email\nFROM searchengine\nWHERE extra2 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT extra3 AS possible_email\nFROM searchengine\nWHERE extra3 REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT locale AS possible_phone\nFROM android_metadata\nWHERE locale REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT title AS possible_phone\nFROM searchengine\nWHERE title REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT url AS possible_phone\nFROM searchengine\nWHERE url REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT image_url AS possible_phone\nFROM searchengine\nWHERE image_url REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT extra1 AS possible_phone\nFROM searchengine\nWHERE extra1 REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT extra2 AS possible_phone\nFROM searchengine\nWHERE extra2 REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT extra3 AS possible_phone\nFROM searchengine\nWHERE extra3 REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"], ["google"], ["DuckDuckGo"], ["yahoo"], ["youtube"], ["bing"], ["so360"], ["qwant"], ["toutiao"], ["StartPage"], ["shenma"]], "Total_raw_rows": 11, "Exploration_sql": "SELECT locale AS possible_username\nFROM android_metadata\nWHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT title AS possible_username\nFROM searchengine\nWHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT extra1 AS possible_username\nFROM searchengine\nWHERE extra1 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT extra2 AS possible_username\nFROM searchengine\nWHERE extra2 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\n\nUNION ALL\n\nSELECT extra3 AS possible_username\nFROM searchengine\nWHERE extra3 REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["en_US"], ["google"], ["DuckDuckGo"], ["yahoo"], ["youtube"], ["bing"], ["so360"], ["qwant"], ["toutiao"], ["StartPage"], ["shenma"]], "Total_raw_rows": 11, "Exploration_sql": "SELECT locale AS possible_name\nFROM android_metadata\nWHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n\nUNION ALL\n\nSELECT title AS possible_name\nFROM searchengine\nWHERE title REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n\nUNION ALL\n\nSELECT extra1 AS possible_name\nFROM searchengine\nWHERE extra1 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n\nUNION ALL\n\nSELECT extra2 AS possible_name\nFROM searchengine\nWHERE extra2 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\n\nUNION ALL\n\nSELECT extra3 AS possible_name\nFROM searchengine\nWHERE extra3 REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A5_searchengine.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://www.youtube.com/s/desktop/fadc8afc/img/favicon_48x48.png"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT url AS possible_address\nFROM searchengine\nWHERE url REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT title AS possible_address\nFROM searchengine\nWHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT extra1 AS possible_address\nFROM searchengine\nWHERE extra1 REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT extra2 AS possible_address\nFROM searchengine\nWHERE extra2 REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT extra3 AS possible_address\nFROM searchengine\nWHERE extra3 REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ZLINKTOKEN AS possible_email\nFROM ZWAAGGREGATECALLEVENT\nWHERE ZLINKTOKEN REGEXP '[a-zA-Z0-9._%+-]+@(?!whatsapp\\\\.com)[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT ZCALLIDSTRING AS possible_email\nFROM ZWACDCALLEVENT\nWHERE ZCALLIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@(?!whatsapp\\\\.com)[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS possible_email\nFROM ZWACDCALLEVENT\nWHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@(?!whatsapp\\\\.com)[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT ZGROUPJIDSTRING AS possible_email\nFROM ZWACDCALLEVENT\nWHERE ZGROUPJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@(?!whatsapp\\\\.com)[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT ZSCHEDULEDID AS possible_email\nFROM ZWACDCALLEVENT\nWHERE ZSCHEDULEDID REGEXP '[a-zA-Z0-9._%+-]+@(?!whatsapp\\\\.com)[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'\n\nUNION ALL\n\nSELECT ZJIDSTRING AS possible_email\nFROM ZWACDCALLEVENTPARTICIPANT\nWHERE ZJIDSTRING REGEXP '[a-zA-Z0-9._%+-]+@(?!whatsapp\\\\.com)[a-zA-Z0-9.-]+\\\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "Do not include whatsaap domain link this in email. a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PHONE", "PII": ["9735203731", "4847353029", "9199037779"], "Num_of_PII": 3, "source_columns": ["ZWAAGGREGATECALLEVENT.ZLINKTOKEN", "ZWACDCALLEVENT.ZCALLIDSTRING", "ZWACDCALLEVENT.ZGROUPCALLCREATORUSERJIDSTRING", "ZWACDCALLEVENT.ZGROUPJIDSTRING", "ZWACDCALLEVENT.ZSCHEDULEDID", "ZWACDCALLEVENTPARTICIPANT.ZJIDSTRING"], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 9, "Exploration_sql": "SELECT ZLINKTOKEN AS possible_phone\nFROM ZWAAGGREGATECALLEVENT\nWHERE ZLINKTOKEN REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT ZCALLIDSTRING AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZCALLIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT ZGROUPJIDSTRING AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZGROUPJIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT ZSCHEDULEDID AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZSCHEDULEDID REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT ZJIDSTRING AS possible_phone\nFROM ZWACDCALLEVENTPARTICIPANT\nWHERE ZJIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": "SELECT ZLINKTOKEN AS possible_phone\nFROM ZWAAGGREGATECALLEVENT\nWHERE ZLINKTOKEN REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZCALLIDSTRING AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZCALLIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZGROUPJIDSTRING AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZGROUPJIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZSCHEDULEDID AS possible_phone\nFROM ZWACDCALLEVENT\nWHERE ZSCHEDULEDID REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\nUNION ALL\nSELECT ZJIDSTRING AS possible_phone\nFROM ZWACDCALLEVENTPARTICIPANT\nWHERE ZJIDSTRING REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ZLINKTOKEN AS possible_username\nFROM ZWAAGGREGATECALLEVENT\nWHERE ZLINKTOKEN REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$'\nUNION ALL\nSELECT ZCALLIDSTRING AS possible_username\nFROM ZWACDCALLEVENT\nWHERE ZCALLIDSTRING REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS possible_username\nFROM ZWACDCALLEVENT\nWHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$'\nUNION ALL\nSELECT ZGROUPJIDSTRING AS possible_username\nFROM ZWACDCALLEVENT\nWHERE ZGROUPJIDSTRING REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$'\nUNION ALL\nSELECT ZSCHEDULEDID AS possible_username\nFROM ZWACDCALLEVENT\nWHERE ZSCHEDULEDID REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$'\nUNION ALL\nSELECT ZJIDSTRING AS possible_username\nFROM ZWACDCALLEVENTPARTICIPANT\nWHERE ZJIDSTRING REGEXP '^[a-zA-Z][a-zA-Z0-9._-]{2,51}$'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["3C399CDDAF11A41F7AFF2892E0A4B10C"], ["3C37CBFE11C261E6CD80C2DE7834D770"], ["372FA57E129467051E04B3E4DD5A26D5"], ["3A6DF670F7121CD6D08B"], ["3A9CEF8B4996D645358B"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["WAAggregateCallEvent"], ["WACDCallEvent"], ["WACDCallEventParticipant"], ["WAJoinableCallEvent"], ["WAJoinableCallEventParticipant"], ["WAUpcomingCallEvent"]], "Total_raw_rows": 20, "Exploration_sql": "SELECT ZLINKTOKEN AS possible_name\nFROM ZWAAGGREGATECALLEVENT\nWHERE ZLINKTOKEN REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' COLLATE NOCASE\n\nUNION ALL\n\nSELECT ZCALLIDSTRING AS possible_name\nFROM ZWACDCALLEVENT\nWHERE ZCALLIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' COLLATE NOCASE\n\nUNION ALL\n\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS possible_name\nFROM ZWACDCALLEVENT\nWHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' COLLATE NOCASE\n\nUNION ALL\n\nSELECT ZGROUPJIDSTRING AS possible_name\nFROM ZWACDCALLEVENT\nWHERE ZGROUPJIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' COLLATE NOCASE\n\nUNION ALL\n\nSELECT ZSCHEDULEDID AS possible_name\nFROM ZWACDCALLEVENT\nWHERE ZSCHEDULEDID REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' COLLATE NOCASE\n\nUNION ALL\n\nSELECT ZJIDSTRING AS possible_name\nFROM ZWACDCALLEVENTPARTICIPANT\nWHERE ZJIDSTRING REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' COLLATE NOCASE\n\nUNION ALL\n\nSELECT Z_NAME AS possible_name\nFROM Z_PRIMARYKEY\nWHERE Z_NAME REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' COLLATE NOCASE;", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I1_CallHistory.sqlite", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["19735203731@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["923402582955@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["14847353029@s.whatsapp.net"], ["19199037779@s.whatsapp.net"], ["923402582955@s.whatsapp.net"]], "Total_raw_rows": 9, "Exploration_sql": "SELECT ZCALLIDSTRING AS possible_address\nFROM ZWACDCALLEVENT\nWHERE ZCALLIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT ZGROUPCALLCREATORUSERJIDSTRING AS possible_address\nFROM ZWACDCALLEVENT\nWHERE ZGROUPCALLCREATORUSERJIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT ZGROUPJIDSTRING AS possible_address\nFROM ZWACDCALLEVENT\nWHERE ZGROUPJIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT ZJIDSTRING AS possible_address\nFROM ZWACDCALLEVENTPARTICIPANT\nWHERE ZJIDSTRING REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value AS possible_email\nFROM _SqliteDatabaseProperties\nWHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value\nFROM _SqliteDatabaseProperties\nWHERE value REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value AS possible_username\nFROM _SqliteDatabaseProperties\nWHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["1BB6D11F-7D93-4A3D-80B7-9B37DFB90EED"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT value AS possible_person_name\nFROM _SqliteDatabaseProperties\nWHERE value REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I2_AddressBookImages.sqlitedb", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT value\nFROM _SqliteDatabaseProperties\nWHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT device_name AS possible_email\nFROM cloud_tab_devices\nWHERE device_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT title AS possible_email\nFROM cloud_tabs\nWHERE title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT url AS possible_email\nFROM cloud_tabs\nWHERE url REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT key AS possible_email\nFROM metadata\nWHERE key REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT value AS possible_email\nFROM metadata\nWHERE value REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["https://www.google.com/search?q=snack+with+dairy+kids&client=safari&sca_esv=6eac42e19cef7bdf&hl=en-us&sxsrf=ADLYWIJQfVNS-z6971OqeDnskNzgmBnxVA%3A1723546457188&ei=WTu7Zu6YC9vl5NoPsZT5uAM&oq=snack+with+dairy+kids&gs_lp=EhNtb2JpbGUtZ3dzLXdpei1zZXJwIhVzbmFjayB3aXRoIGRhaXJ5IGtpZHNIkXVQmR9Yym5wEXgBkAEAmAGkAaABthWqAQQzMi4yuAEDyAEA-AEBmAIVoALyC6gCD8ICChAAGLADGNYEGEfCAg0QABiABBiwAxhDGIoFwgIHECMYJxjqAsICChAuGIAEGEMYigXCAgoQABiABBhDGIoFwgIQEC4YgAQY0QMYQxjHARiKBcICDhAuGIAEGLEDGNEDGMcBwgILEC4YgAQY0QMYxwHCAgUQABiABMICDhAAGIAEGLEDGIMBGIoFwgILEC4YgAQYkQIYigXCAgsQABiABBiRAhiKBcICDRAAGIAEGEMY5QQYigXCAggQABiABBixA8ICDRAAGIAEGLEDGEMYigXCAhYQLhiABBixAxjRAxhDGIMBGMcBGIoFwgILEAAYgAQYsQMYgwHCAggQLhiABBixA8ICExAuGIAEGLEDGNEDGIMBGMcBGArCAgoQABiABBgUGIcCwgIHEAAYgAQYCsICCBAAGIAEGMkDwgILEC4YgAQYsQMYgwHCAgYQABgWGB6YAwiIBgGQBhGSBwQxOC4zoAfzbQ&sclient=mobile-gws-wiz-serp"], ["https://www.bing.com/search?q=figs+tre+wont+ripen+green&form=QBLH&sp=-1&ghc=1&lq=0&pq=figs+tre+wont+ripen+green&sc=10-25&qs=n&sk=&cvid=E8428067064D4726B92401B41C5C64A5&ghsh=0&ghacc=0&ghpl="]], "Total_raw_rows": 2, "Exploration_sql": "SELECT device_name AS possible_phone\nFROM cloud_tab_devices\nWHERE device_name REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT title AS possible_phone\nFROM cloud_tabs\nWHERE title REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT url AS possible_phone\nFROM cloud_tabs\nWHERE url REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT key AS possible_phone\nFROM metadata\nWHERE key REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'\n\nUNION ALL\n\nSELECT value AS possible_phone\nFROM metadata\nWHERE value REGEXP '\\+?1?[- .]?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["falafel hardboiled egg israel - Google Search"], ["Dickens Cider is now Dickins Cider Company | Hard Cider Drinks | Dickens Cider"], ["Blue Bite | Connecting Possibility"], ["Home page - Mapat"], ["snack with dairy kids - Google Search"], ["figs growing green not ripe - Google Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["How to Change a Light Bulb"], ["Tolls"], ["ravensmanorexperience.com"], ["https://www.google.com/search?q=falafel+hardboiled+egg+israel&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari#ip=1"], ["https://www.dickinscidercompany.com/"], ["https://www.bluebite.com/?utm_source=https://www.themtag.com/n10053654&utm_medium=301"], ["https://www.mapat.org.il/eng/main"], ["https://www.google.com/search?q=snack+with+dairy+kids&client=safari&sca_esv=6eac42e19cef7bdf&hl=en-us&sxsrf=ADLYWIJQfVNS-z6971OqeDnskNzgmBnxVA%3A1723546457188&ei=WTu7Zu6YC9vl5NoPsZT5uAM&oq=snack+with+dairy+kids&gs_lp=EhNtb2JpbGUtZ3dzLXdpei1zZXJwIhVzbmFjayB3aXRoIGRhaXJ5IGtpZHNIkXVQmR9Yym5wEXgBkAEAmAGkAaABthWqAQQzMi4yuAEDyAEA-AEBmAIVoALyC6gCD8ICChAAGLADGNYEGEfCAg0QABiABBiwAxhDGIoFwgIHECMYJxjqAsICChAuGIAEGEMYigXCAgoQABiABBhDGIoFwgIQEC4YgAQY0QMYQxjHARiKBcICDhAuGIAEGLEDGNEDGMcBwgILEC4YgAQY0QMYxwHCAgUQABiABMICDhAAGIAEGLEDGIMBGIoFwgILEC4YgAQYkQIYigXCAgsQABiABBiRAhiKBcICDRAAGIAEGEMY5QQYigXCAggQABiABBixA8ICDRAAGIAEGLEDGEMYigXCAhYQLhiABBixAxjRAxhDGIMBGMcBGIoFwgILEAAYgAQYsQMYgwHCAggQLhiABBixA8ICExAuGIAEGLEDGNEDGIMBGMcBGArCAgoQABiABBgUGIcCwgIHEAAYgAQYCsICCBAAGIAEGMkDwgILEC4YgAQYsQMYgwHCAgYQABgWGB6YAwiIBgGQBhGSBwQxOC4zoAfzbQ&sclient=mobile-gws-wiz-serp"], ["https://www.google.com/search?q=figs+growing+green+not+ripe&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari"], ["https://www.hersheypark.com/info/hours/"], ["https://www.angi.com/articles/how-change-lightbulb.htm"], ["https://www.panynj.gov/bridges-tunnels/en/tolls.html"], ["https://www.ravensmanorexperience.com/uploads/b/10bcaef0-743a-11ea-b3f4-31522c100dea/Summer%20PDF_NTkzNT.pdf"], ["Cellebrite"], ["server_change_token"], ["use_manatee_container"], [{"__bytes_b64__": "YnBsaXN0MDDUAQIDBAUGBwpYJHZlcnNpb25ZJGFyY2hpdmVyVCR0b3BYJG9iamVjdHMSAAGGoF8QD05TS2V5ZWRBcmNoaXZlctEICVRyb290gAGkCwwRElUkbnVsbNINDg8QViRjbGFzc18QD0NoYW5nZVRva2VuRGF0YYADgAJPEC8fChASDAAATBJW9UHWAAAAABgBGAAiFgj5m+me89ruvc4BEM2Hk5/Ph+jnpgEoANITFBUWWiRjbGFzc25hbWVYJGNsYXNzZXNfEBNDS1NlcnZlckNoYW5nZVRva2VuohUXWE5TT2JqZWN0CBEaJCkyN0lMUVNYXmNqfH6AsrfCy+HkAAAAAAAAAQEAAAAAAAAAGAAAAAAAAAAAAAAAAAAAAO0="}]], "Total_raw_rows": 24, "Exploration_sql": "SELECT title AS possible_username\nFROM cloud_tabs\nWHERE title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT url AS possible_username\nFROM cloud_tabs\nWHERE url REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT device_name AS possible_username\nFROM cloud_tab_devices\nWHERE device_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT key AS possible_username\nFROM metadata\nWHERE key REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT value AS possible_username\nFROM metadata\nWHERE value REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["Cellebrite"], ["falafel hardboiled egg israel - Google Search"], ["Dickens Cider is now Dickins Cider Company | Hard Cider Drinks | Dickens Cider"], ["Blue Bite | Connecting Possibility"], ["Home page - Mapat"], ["snack with dairy kids - Google Search"], ["figs growing green not ripe - Google Search"], ["Hours: Amusement Park & Hershey Attractions | Hersheypark"], ["How to Change a Light Bulb"], ["Tolls"], ["ravensmanorexperience.com"]], "Total_raw_rows": 11, "Exploration_sql": "SELECT device_name AS possible_name\nFROM cloud_tab_devices\nWHERE device_name REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'\n\nUNION ALL\n\nSELECT title AS possible_name\nFROM cloud_tabs\nWHERE title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I4_CloudTabs.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["cool dry place storage - Google Search"], ["Menu | Raven's Manor"], ["https://www.google.com/search?q=cool+dry+place+storage&ie=UTF-8&oe=UTF-8&hl=en-us&client=safari"], ["https://www.bing.com/search?q=figs+tre+wont+ripen+green&form=QBLH&sp=-1&ghc=1&lq=0&pq=figs+tre+wont+ripen+green&sc=10-25&qs=n&sk=&cvid=E8428067064D4726B92401B41C5C64A5&ghsh=0&ghacc=0&ghpl="]], "Total_raw_rows": 4, "Exploration_sql": "SELECT device_name AS possible_address\nFROM cloud_tab_devices\nWHERE device_name REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT title AS possible_address\nFROM cloud_tabs\nWHERE title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT url AS possible_address\nFROM cloud_tabs\nWHERE url REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT value AS possible_address\nFROM metadata\nWHERE value REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
File diff suppressed because one or more lines are too long
File diff suppressed because one or more lines are too long
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT\n NULL AS possible_email\nWHERE\n NULL IS NOT NULL;", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ZVALUE AS possible_phone\nFROM ZSETTING\nWHERE ZVALUE REGEXP '(^|[^0-9])(\\+?1[- .]?)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}([^0-9]|$)' UNION ALL\nSELECT ZKEY AS possible_phone\nFROM ZSETTING\nWHERE ZKEY REGEXP '(^|[^0-9])(\\+?1[- .]?)?\\(?[2-9][0-9]{2}\\)?[- .]?[2-9][0-9]{2}[- .]?[0-9]{4}([^0-9]|$)'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["CacheEndDate"], ["LastDBSequence"], ["AE9BAC24-6E29-4FA2-9FA4-699FD2BE7479"], ["Alarm"], ["Setting"]], "Total_raw_rows": 5, "Exploration_sql": "SELECT ZKEY AS possible_username\nFROM ZSETTING\nWHERE ZKEY REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT ZVALUE AS possible_username\nFROM ZSETTING\nWHERE ZVALUE REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_UUID AS possible_username\nFROM Z_METADATA\nWHERE Z_UUID REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT Z_NAME AS possible_username\nFROM Z_PRIMARYKEY\nWHERE Z_NAME REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b';", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["CacheEndDate"], ["LastDBSequence"], ["AE9BAC24-6E29-4FA2-9FA4-699FD2BE7479"], ["Alarm"], ["Setting"]], "Total_raw_rows": 5, "Exploration_sql": "SELECT ZKEY AS possible_name\nFROM ZSETTING\nWHERE ZKEY REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT ZVALUE AS possible_name\nFROM ZSETTING\nWHERE ZVALUE REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT Z_UUID AS possible_name\nFROM Z_METADATA\nWHERE Z_UUID REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'\nUNION ALL\nSELECT Z_NAME AS possible_name\nFROM Z_PRIMARYKEY\nWHERE Z_NAME REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}';", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\I5_Extras.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [], "Total_raw_rows": 0, "Exploration_sql": "SELECT ZKEY AS potential_address_field\nFROM ZSETTING\nWHERE ZKEY REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT ZVALUE AS potential_address_field\nFROM ZSETTING\nWHERE ZVALUE REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b';", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
@@ -0,0 +1,5 @@
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "EMAIL", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["android_metadata", "locale", "en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": null, "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["android_metadata", "locale", "en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\+?1?[-. ]?\\(?[0-9]{3}\\)?[-. ]?[0-9]{3}[-. ]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "USERNAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["android_metadata", "locale", "en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": null, "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["android_metadata", "locale", "en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '[A-Za-z][A-Za-z\\s\\.\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
|
||||
{"db_path": "selectedDBs\\A1_commerce.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["android_metadata", "locale", "en_US"]], "Total_raw_rows": 1, "Exploration_sql": "SELECT locale FROM android_metadata WHERE locale REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}
|
||||
Some files were not shown because too many files have changed in this diff Show More
Reference in New Issue
Block a user