Files
mobile-pii-discovery-agent/model_PII_results/GPT-4.1/PII_I3_sms_20260208T172505Z.jsonl
2026-02-11 22:13:22 -05:00

6 lines
30 KiB
JSON
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
{"db_path": "selectedDBs\\I3_sms.db", "PII_type": "EMAIL", "PII": ["aniulka616@hotmail.com", "josephphw3r5@outlook.com", "jreynoldscbdemo+this.is.secret@gmail.com", "jthskp131699@icloud.com", "sousiezorjrc@outlook.com", "sweeneyfrank594@gmail.com", "ottomatik1234@gmail.com"], "Num_of_PII": 7, "source_columns": ["attachment.filename", "attachment.transfer_name", "handle.id", "handle.uncanonicalized_id", "chat.account_id", "chat.chat_identifier", "chat.account_login", "chat.last_addressed_handle", "chat.display_name", "message.text", "message.subject", "message.service_center", "message.account", "message.account_guid", "message.cache_roomnames", "message.group_title"], "Raw_rows_first_100": [["aniulka616@hotmail.com"], ["josephphw3r5@outlook.com"], ["jreynoldscbdemo+this.is.secret@gmail.com"], ["jthskp131699@icloud.com"], ["sousiezorjrc@outlook.com"], ["sweeneyfrank594@gmail.com"], ["aniulka616@hotmail.com"], ["josephphw3r5@outlook.com"], ["jreynoldscbdemo+this.is.secret@gmail.com"], ["jthskp131699@icloud.com"], ["sousiezorjrc@outlook.com"], ["sweeneyfrank594@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"]], "Total_raw_rows": 24, "Exploration_sql": "SELECT filename FROM attachment WHERE filename REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT transfer_name FROM attachment WHERE transfer_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT id FROM handle WHERE id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT uncanonicalized_id FROM handle WHERE uncanonicalized_id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_id FROM chat WHERE account_id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT chat_identifier FROM chat WHERE chat_identifier REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_login FROM chat WHERE account_login REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT last_addressed_handle FROM chat WHERE last_addressed_handle REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT display_name FROM chat WHERE display_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT text FROM message WHERE text REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT subject FROM message WHERE subject REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT service_center FROM message WHERE service_center REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account FROM message WHERE account REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_guid FROM message WHERE account_guid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT cache_roomnames FROM message WHERE cache_roomnames REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT group_title FROM message WHERE group_title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "Extraction_sql": "SELECT filename FROM attachment WHERE filename REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT transfer_name FROM attachment WHERE transfer_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT id FROM handle WHERE id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT uncanonicalized_id FROM handle WHERE uncanonicalized_id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_id FROM chat WHERE account_id REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT chat_identifier FROM chat WHERE chat_identifier REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_login FROM chat WHERE account_login REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT last_addressed_handle FROM chat WHERE last_addressed_handle REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT display_name FROM chat WHERE display_name REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT text FROM message WHERE text REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT subject FROM message WHERE subject REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT service_center FROM message WHERE service_center REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account FROM message WHERE account REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT account_guid FROM message WHERE account_guid REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT cache_roomnames FROM message WHERE cache_roomnames REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'\nUNION ALL\nSELECT group_title FROM message WHERE group_title REGEXP '[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\\.[a-zA-Z]{2,}'", "PII_Prompt": "a unique identifier for a destination to which electronic mail (email) can be sent and received over the internet; examples include jane.doe@example.com, john.smith@provider.net, dev-team@startup.io, and user.name+label@domain.org"}
{"db_path": "selectedDBs\\I3_sms.db", "PII_type": "PHONE", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["~/Library/SMS/Attachments/0e/14/E90B9F3E-C971-4424-975D-BBB0909CBEB0/_com.apple.Pasteboard.IKFnjZ.png"], ["~/Library/SMS/Attachments/56/06/2121EE7C-1D2A-4322-9611-DD57A570BCC7/IMG_3525.jpeg"], ["~/Library/SMS/Attachments/5b/11/75161DC7-C94C-4108-9939-962316471903/IMG_0035.MOV"], ["~/Library/SMS/Attachments/75/05/AA871C9A-4535-43D7-AE8C-BFFB0D645331/20240603_195340.vcf"], ["~/Library/SMS/Attachments/1f/15/5EE4CBA9-5582-4739-9EB2-E62BBE5589E2/Resized_20240603_213954_1717465199266.jpeg"], ["~/Library/SMS/Attachments/99/09/8D629C9F-6B65-4DC2-80FF-2C3610483F28/IMG_0324.HEIC"], ["~/Library/SMS/Attachments/cd/13/8D48C8DC-F27D-4017-9D99-6339A625045A/56484227-F6D5-4FA5-8F32-B8FB0060FA32.pluginPayloadAttachment"], ["~/Library/SMS/Attachments/84/04/A58BE5BD-9431-42B8-BD9A-D0FEBA093C55/Resized_20240605_162458_1717619104441.jpeg"], ["~/Library/SMS/Attachments/35/05/1D10BF40-140A-4B12-B0F6-61C0F4B6764A/73931709728__F55DDDF6-EF3A-4C91-B159-A11B3BAEAA87.HEIC"], ["~/Library/SMS/Attachments/33/03/1D7B2838-CAB4-4C26-8E92-3FC2D072D260/Resized_20240605_193505_1717630512670.jpeg"], ["20240603_195340.vcf"], ["Resized_20240603_213954_1717465199266.jpeg"], ["56484227-F6D5-4FA5-8F32-B8FB0060FA32.pluginPayloadAttachment"], ["Resized_20240605_162458_1717619104441.jpeg"], ["73931709728__F55DDDF6-EF3A-4C91-B159-A11B3BAEAA87.HEIC"], ["Resized_20240605_193505_1717630512670.jpeg"], ["666649e5296925.82215293.png"], ["66671148bd6390.74289362.png"], ["Resized_20240620_071946_1718895471091.jpeg"], ["Resized_20240619_112503_1718895476715.jpeg"], ["+12065937224"], ["+12065937224"], ["+12185715037"], ["+12484345508"], ["+13017157263"], ["+14155346421"], ["+14197574625"], ["+14259796297"], ["+14325353346"], ["+14847353029"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+19735203731"], ["+12065937224"], ["+12065937224"], ["+12155817608"], ["+12185715037"], ["+12484345508"], ["+13017157263"], ["+14155346421"], ["+14197574625"], ["+14259796297"], ["+14325353346"], ["+14197574625"], ["5162879924"], ["+14325353346"], ["+18553965089"], ["9195796465"], ["+17852533080"], ["9195796456"], ["+14155346421"], ["1410100001"], ["+13017157263"], ["FRM:93557\nSUBJ:Verify Wells Fargo Activity\nMSG:Reach +1 (844) 407.4819 if you haven't made the acquisition for $666.02 @Rite Aid WellsID: ZST2T8TALSOWZ"], ["The temporary PIN you requested is 7233. Please use this PIN to complete set up. If you received this in error, call 800-331-0500 or 611 and say representative."], ["AT&T free Msg- your PIN was changed. Have questions? Please dial 1-800-331-0500 or 611 from your wireless phone."], ["Hi, my name is Anna and I am a recruiter at VM Agency. We need a team of part-time assistants. The online hours are flexible and you can work from home with no restrictions. Pay ranges from at least $200 to $1,280 per day. All you need is a smartphone or computer to get the job done. You will be paid immediately at the end of each workday. Work 7 days a week. If you are interested, please contact me on WhatsA-p-p +15044930650"], ["Hi, my name is Anna and I am a recruiter at VM Agency. We need a team of part-time assistants. The online hours are flexible and you can work from home with no restrictions. Pay ranges from at least $200 to $1,280 per day. All you need is a smartphone or computer to get the job done. You will be paid immediately at the end of each workday. Work 7 days a week. If you are interested, please contact me on WhatsA-p-p +12109299940 \n"], ["Welcome! We've noticed that your background and resume have been recommended by several online recruitment agencies, so we'd like to offer you a part-time job that you can do in your free time. Our job is simple: we simply rate your favorite restaurants. There are no time constraints and you can complete the assessment from home. Daily pay ranges from $300 to $600, you can easily earn $10K+ per month, and all wages are paid on the same day. If you would like to take part, please contact us via WhatsApp: +15797987022\n(Note: You must be at least 24 years old)\n"], ["Hi, it's AT&T. Welcome aboard! Please note this ship is not covered by your International Day Pass. Standard rates apply: $2.05/MB, $3.00/min, $0.50/text msg sent, $1.30/photo or video msg sent. AT&T Cruise packages are available, go to att.com/cruise (free view) for details. Or you may turn off Data Roaming in your device Settings. Questions? Call +1.214.547.2300 (free call)."], ["https://ambarrestaurant.com/wp-content/uploads/2024/07/ambar-ch-dinner-07012024.pdf"], ["chat70863266579689223"], ["chat70863266579689223"], ["chat818965589567390604"]], "Total_raw_rows": 71, "Exploration_sql": "SELECT filename FROM attachment WHERE filename REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT transfer_name FROM attachment WHERE transfer_name REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT chat_identifier FROM chat WHERE chat_identifier REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT last_addressed_handle FROM chat WHERE last_addressed_handle REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT display_name FROM chat WHERE display_name REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT id FROM handle WHERE id REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT uncanonicalized_id FROM handle WHERE uncanonicalized_id REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT text FROM message WHERE text REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT subject FROM message WHERE subject REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT service_center FROM message WHERE service_center REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT cache_roomnames FROM message WHERE cache_roomnames REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}' \nUNION ALL\nSELECT group_title FROM message WHERE group_title REGEXP '(\\+1[\\s\\-\\.]?)?(\\(?[2-9][0-9]{2}\\)?[\\s\\-\\.]?)?[2-9][0-9]{2}[\\s\\-\\.]?[0-9]{4}'", "Extraction_sql": null, "PII_Prompt": "a US phone number is a 10-digit NANP number (area code + exchange + line) that may be written as 2023133725, 202-313-3725, (202) 313-3725, 202.313.3725, +1 202 313 3725, or 1-202-313-3725"}
{"db_path": "selectedDBs\\I3_sms.db", "PII_type": "USERNAME", "PII": ["chat70863266579689223", "chat818965589567390604"], "Num_of_PII": 2, "source_columns": ["chat.account_id", "chat.chat_identifier", "chat.service_name", "chat.room_name", "chat.account_login", "chat.last_addressed_handle", "chat.display_name", "chat.group_id", "handle.id", "handle.uncanonicalized_id", "handle.person_centric_id", "message.account", "message.account_guid", "message.other_handle", "message.group_title"], "Raw_rows_first_100": [["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["CBE9797C-F36D-4678-960B-659CD3618AB2"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["CBE9797C-F36D-4678-960B-659CD3618AB2"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["CBE9797C-F36D-4678-960B-659CD3618AB2"], ["CBE9797C-F36D-4678-960B-659CD3618AB2"], ["CBE9797C-F36D-4678-960B-659CD3618AB2"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["CBE9797C-F36D-4678-960B-659CD3618AB2"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["CBE9797C-F36D-4678-960B-659CD3618AB2"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["B0690F46-EE5F-4019-ACFC-7782054C012B"], ["aniulka616@hotmail.com"], ["chat70863266579689223"], ["chat818965589567390604"], ["josephphw3r5@outlook.com"], ["jreynoldscbdemo+this.is.secret@gmail.com"], ["jthskp131699@icloud.com"], ["sousiezorjrc@outlook.com"], ["sweeneyfrank594@gmail.com"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["SMS"], ["iMessage"], ["iMessage"], ["iMessage"], ["iMessage"], ["iMessage"], ["iMessage"], ["iMessage"], ["iMessage"], ["SMS"], ["iMessage"], ["chat70863266579689223"], ["chat818965589567390604"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"], ["E:ottomatik1234@gmail.com"]], "Total_raw_rows": 355, "Exploration_sql": "SELECT account_id FROM chat WHERE account_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT chat_identifier FROM chat WHERE chat_identifier REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT service_name FROM chat WHERE service_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT room_name FROM chat WHERE room_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT account_login FROM chat WHERE account_login REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT last_addressed_handle FROM chat WHERE last_addressed_handle REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT display_name FROM chat WHERE display_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT group_id FROM chat WHERE group_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT id FROM handle WHERE id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT uncanonicalized_id FROM handle WHERE uncanonicalized_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT person_centric_id FROM handle WHERE person_centric_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT account FROM message WHERE account REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT account_guid FROM message WHERE account_guid REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT other_handle FROM message WHERE other_handle REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT group_title FROM message WHERE group_title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "Extraction_sql": "SELECT account_id FROM chat WHERE account_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT chat_identifier FROM chat WHERE chat_identifier REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT service_name FROM chat WHERE service_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT room_name FROM chat WHERE room_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT account_login FROM chat WHERE account_login REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT last_addressed_handle FROM chat WHERE last_addressed_handle REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT display_name FROM chat WHERE display_name REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT group_id FROM chat WHERE group_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT id FROM handle WHERE id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT uncanonicalized_id FROM handle WHERE uncanonicalized_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT person_centric_id FROM handle WHERE person_centric_id REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT account FROM message WHERE account REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT account_guid FROM message WHERE account_guid REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT other_handle FROM message WHERE other_handle REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'\nUNION ALL\nSELECT group_title FROM message WHERE group_title REGEXP '\\b[a-zA-Z][a-zA-Z0-9._-]{2,51}\\b'", "PII_Prompt": "a username is a short textual identifier chosen by a user to represent their account or public handle within an application or service it is stored as plain text contains no whitespace does not include a domain component and is intended for human recognition rather than internal system uniqueness"}
{"db_path": "selectedDBs\\I3_sms.db", "PII_type": "PERSON_NAME", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["~/Library/SMS/Attachments/0e/14/E90B9F3E-C971-4424-975D-BBB0909CBEB0/_com.apple.Pasteboard.IKFnjZ.png"], ["~/Library/SMS/Attachments/56/06/2121EE7C-1D2A-4322-9611-DD57A570BCC7/IMG_3525.jpeg"], ["~/Library/SMS/Attachments/5b/11/75161DC7-C94C-4108-9939-962316471903/IMG_0035.MOV"], ["~/Library/SMS/Attachments/75/05/AA871C9A-4535-43D7-AE8C-BFFB0D645331/20240603_195340.vcf"], ["~/Library/SMS/Attachments/1f/15/5EE4CBA9-5582-4739-9EB2-E62BBE5589E2/Resized_20240603_213954_1717465199266.jpeg"], ["~/Library/SMS/Attachments/99/09/8D629C9F-6B65-4DC2-80FF-2C3610483F28/IMG_0324.HEIC"], ["~/Library/SMS/Attachments/cd/13/8D48C8DC-F27D-4017-9D99-6339A625045A/56484227-F6D5-4FA5-8F32-B8FB0060FA32.pluginPayloadAttachment"], ["~/Library/SMS/Attachments/a8/08/5D5035C3-5B0C-4FEB-A53B-69C77BE70D39/5446FD3D-DA30-4278-9B87-62F9D5CBF6BA.pluginPayloadAttachment"], ["~/Library/SMS/Attachments/62/02/75F9C875-72BD-4487-ADBC-3FF7B8830F2E/E9518E52-E72C-4E9E-8F03-425EBC95DA68.pluginPayloadAttachment"], ["~/Library/SMS/Attachments/7a/10/E0DC5025-4832-452A-8D3B-212117C9CF63/86C56268-02EB-4D2C-89CE-8DAEF7E6D36A.pluginPayloadAttachment"], ["_com.apple.Pasteboard.IKFnjZ.png"], ["IMG_3525.jpeg"], ["IMG_0035.MOV"], ["20240603_195340.vcf"], ["Resized_20240603_213954_1717465199266.jpeg"], ["IMG_0324.HEIC"], ["56484227-F6D5-4FA5-8F32-B8FB0060FA32.pluginPayloadAttachment"], ["5446FD3D-DA30-4278-9B87-62F9D5CBF6BA.pluginPayloadAttachment"], ["E9518E52-E72C-4E9E-8F03-425EBC95DA68.pluginPayloadAttachment"], ["86C56268-02EB-4D2C-89CE-8DAEF7E6D36A.pluginPayloadAttachment"], ["chat70863266579689223"], ["chat818965589567390604"], ["aniulka616@hotmail.com"], ["chat70863266579689223"], ["chat818965589567390604"], ["josephphw3r5@outlook.com"], ["jreynoldscbdemo+this.is.secret@gmail.com"], ["jthskp131699@icloud.com"], ["sousiezorjrc@outlook.com"], ["sweeneyfrank594@gmail.com"], ["0701BE7B-9317-4708-9FE7-D23F7032B434"], ["0DF3D995-0151-4CC0-B73A-60479EC1313E"], ["1A295C7C-D6F5-4B5A-B3B9-8E5645185CFD"], ["1DC2793D-9BE1-4350-9884-85418F5D48B7"], ["2067D1DE-94FA-4072-B470-0E7796B67335"], ["2B080E23-62C2-4AC4-9FC8-AE8605199086"], ["2CD2D256-8506-4E78-A9F0-B0D0A5827A65"], ["2F3EA790-C0EB-47A7-AC9E-571B9D3A5F81"], ["31129875-34A3-4C83-B81A-071D6468DA87"], ["328E5B21-DABD-4C71-AAE9-3E95BF55D2F6"], ["aniulka616@hotmail.com"], ["josephphw3r5@outlook.com"], ["jreynoldscbdemo+this.is.secret@gmail.com"], ["jthskp131699@icloud.com"], ["sousiezorjrc@outlook.com"], ["sweeneyfrank594@gmail.com"], ["I'm Anya, director of Gmary jewelry, Hope you like that Rose Gold bracelet, if you have any comments, please contact me, Have a nice day"], ["Hola"], ["[TikTok] 810197 is your verification code, valid for 5 minutes. To keep your account safe, never forward this code."], ["[TikTok] 122628 is your verification code, valid for 5 minutes. To keep your account safe, never forward this code."], ["[TikTok] 172994 is your verification code, valid for 5 minutes. To keep your account safe, never forward this code."], ["Your Google verification code is 326338."], ["Wrong number "], ["Your SIGNAL verification code is: 902475"], ["If someone requests this code, it is a scam. Use code 914337 only in Google Voice app to sign up. g.co/voice/help"], ["Your Viber code is: 827215.\nClose this message and enter the code into Viber to activate your account."], ["chat70863266579689223"], ["chat70863266579689223"], ["chat818965589567390604"]], "Total_raw_rows": 59, "Exploration_sql": "SELECT filename FROM attachment WHERE filename REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT transfer_name FROM attachment WHERE transfer_name REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT display_name FROM chat WHERE display_name REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT room_name FROM chat WHERE room_name REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT chat_identifier FROM chat WHERE chat_identifier REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT last_addressed_handle FROM chat WHERE last_addressed_handle REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT group_id FROM chat WHERE group_id REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT id FROM handle WHERE id REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT uncanonicalized_id FROM handle WHERE uncanonicalized_id REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT person_centric_id FROM handle WHERE person_centric_id REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT text FROM message WHERE text REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT subject FROM message WHERE subject REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT cache_roomnames FROM message WHERE cache_roomnames REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}' \nUNION ALL \nSELECT group_title FROM message WHERE group_title REGEXP '[A-Za-z][A-Za-z\\\\s\\\\.\\\\-]{1,50}'", "Extraction_sql": null, "PII_Prompt": "a loosely structured human name-like strings that typically consist of a first name, a first name and a last name, and may also include middle names, initials, prefixes (e.g., Mr., Dr.), and suffixes (e.g., Jr., Sr.)"}
{"db_path": "selectedDBs\\I3_sms.db", "PII_type": "POSTAL_ADDRESS", "PII": [], "Num_of_PII": 0, "source_columns": [], "Raw_rows_first_100": [["Opps!, isn't this William's phone number?? I will check the phone number again"], ["My man....what's uo"], ["Yayza \nHow's your weekend so far?"], ["Lol, mine should be good. How's Eddie V? Haven't heard from him in awhile. "], ["He's just waking up. Just busy on his other phone so maybe he's behind "], ["Hi, it's AT&T. You're all set! Enjoy unlimited talk, text & data at no extra cost while traveling in 19 Latin America countries. Coverage/data speeds vary by country. Details at att.com/latamcountries (free view). "], ["🎁 Crypto Results 3731: Aspire to earn $5K to $15K daily? Text \"Yes\" to get strategic insights from C0INBASE'S elite crypto experts and a chance to win $500. Supercharge your portfolio now."], ["C0INBASE 3731: Race in the champions circuit of crypto trading! Reply \"Yes\" to train with Coinbases elite and sprint towards daily profits of $5K to $15K, with a pit stop for a $500 win."], ["1 of 5: How satisfied are you with Dimitra's ability to assist you with your call?\r\n1=Very DISSATISFIED\r\n2=Dissatisfied\r\n3=Neutral\r\n4=Satisfied\r\n5=Very SATISFIED"], ["It's Otto"]], "Total_raw_rows": 10, "Exploration_sql": "SELECT filename FROM attachment WHERE filename REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT transfer_name FROM attachment WHERE transfer_name REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT chat_identifier FROM chat WHERE chat_identifier REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT room_name FROM chat WHERE room_name REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT display_name FROM chat WHERE display_name REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT id FROM handle WHERE id REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT uncanonicalized_id FROM handle WHERE uncanonicalized_id REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT text FROM message WHERE text REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT subject FROM message WHERE subject REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT cache_roomnames FROM message WHERE cache_roomnames REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'\nUNION ALL\nSELECT group_title FROM message WHERE group_title REGEXP '(?i)\\b(?:p\\.?\\s*o\\.?\\s*box|post\\s+office\\s+box|ave\\.?|avenue|st\\.?|street|rd\\.?|road|blvd\\.?|boulevard|dr\\.?|drive|ln\\.?|lane|ct\\.?|court|pl\\.?|place|way|pkwy\\.?|parkway|cir\\.?|circle|ter\\.?|terrace|hwy\\.?|highway|trl\\.?|trail|sq\\.?|square|pike|loop|run|walk|path|byp\\.?|bypass|(?:n|s|e|w|ne|nw|se|sw)\\b)\\b'", "Extraction_sql": null, "PII_Prompt": "a US postal address is a street-level mailing location in the United States, commonly appearing as a street name and suffix (e.g., 'Market St') optionally with a street number (e.g., '1500 Market St'), unit, city/state, ZIP, or a PO Box (e.g., 'P.O. Box 123')"}