|
1 |
| -# import os |
2 |
| -# import sys |
| 1 | +import os |
| 2 | +import sys |
3 | 3 |
|
4 |
| -# import requests |
| 4 | +import requests |
5 | 5 |
|
6 |
| -# from datafog import PresidioEngine as presidio |
| 6 | +from datafog import PresidioEngine as presidio |
7 | 7 |
|
8 |
| -# sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), ".."))) |
| 8 | +sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), ".."))) |
9 | 9 |
|
10 | 10 |
|
def test_piiscan_json_detection():
    """Smoke-test PII scanning of the sample JSON input file.

    Reads ``tests/files/input_files/sample.json``, passes its text to
    ``presidio.scan`` and writes the ``entity_type`` of every returned
    entity, one per line, to ``tests/files/output_files/output.json``.

    No assertions are made on the detected entities; the test passes when
    scanning and writing complete without raising. Both paths are relative
    to the current working directory.
    """
    sample_file = "tests/files/input_files/sample.json"
    output_file = "tests/files/output_files/output.json"

    # Explicit encoding so the read does not depend on the platform's
    # default locale (assumes the fixture is UTF-8 -- TODO confirm).
    with open(sample_file, "r", encoding="utf-8") as f:
        original_value = f.read()

    pii_detected = presidio.scan(original_value)

    # The output directory may be absent in a fresh checkout; create it
    # rather than failing with FileNotFoundError on open().
    os.makedirs(os.path.dirname(output_file), exist_ok=True)

    # Despite the .json extension, the file holds newline-separated entity
    # type names rather than a JSON document.
    with open(output_file, "w", encoding="utf-8") as f:
        f.writelines(f"{entity.entity_type}\n" for entity in pii_detected)
29 | 29 |
|
30 | 30 |
|
def test_piiscan_csv_detection():
    """Smoke-test PII scanning of the sample CSV input file.

    Reads ``tests/files/input_files/sample.csv`` as raw text (no CSV
    parsing is performed), passes it to ``presidio.scan`` and writes the
    ``entity_type`` of every returned entity, one per line, to
    ``tests/files/output_files/output.csv``.

    No assertions are made on the detected entities; the test passes when
    scanning and writing complete without raising. Both paths are relative
    to the current working directory.
    """
    sample_file = "tests/files/input_files/sample.csv"
    output_file = "tests/files/output_files/output.csv"

    # Explicit encoding so the read does not depend on the platform's
    # default locale (assumes the fixture is UTF-8 -- TODO confirm).
    with open(sample_file, "r", encoding="utf-8") as f:
        original_value = f.read()

    pii_detected = presidio.scan(original_value)

    # The output directory may be absent in a fresh checkout; create it
    # rather than failing with FileNotFoundError on open().
    os.makedirs(os.path.dirname(output_file), exist_ok=True)

    # One entity type name per line.
    with open(output_file, "w", encoding="utf-8") as f:
        f.writelines(f"{entity.entity_type}\n" for entity in pii_detected)
49 | 49 |
|
50 | 50 |
|
def test_piiscan_txt_detection():
    """Smoke-test PII scanning of the sample plain-text input file.

    Reads ``tests/files/input_files/sample.txt``, passes its text to
    ``presidio.scan`` and writes the ``entity_type`` of every returned
    entity, one per line, to ``tests/files/output_files/output.txt``.

    No assertions are made on the detected entities; the test passes when
    scanning and writing complete without raising. Both paths are relative
    to the current working directory.
    """
    sample_file = "tests/files/input_files/sample.txt"
    output_file = "tests/files/output_files/output.txt"

    # Explicit encoding so the read does not depend on the platform's
    # default locale (assumes the fixture is UTF-8 -- TODO confirm).
    with open(sample_file, "r", encoding="utf-8") as f:
        original_value = f.read()

    pii_detected = presidio.scan(original_value)

    # The output directory may be absent in a fresh checkout; create it
    # rather than failing with FileNotFoundError on open().
    os.makedirs(os.path.dirname(output_file), exist_ok=True)

    # One entity type name per line.
    with open(output_file, "w", encoding="utf-8") as f:
        f.writelines(f"{entity.entity_type}\n" for entity in pii_detected)
68 | 68 |
|
69 | 69 |
|
def test_piiscan_url_detection():
    """Smoke-test PII scanning of text downloaded from a URL.

    Fetches a fixed gist URL over HTTP, passes the response text to
    ``presidio.scan`` and writes the ``entity_type`` of every returned
    entity, one per line, to ``tests/files/output_files/output.md``.

    No assertions are made on the detected entities; the test passes when
    the download, scan and write complete without raising. It requires
    network access, and the output path is relative to the current working
    directory.
    """
    sample_url = "https://gist.githubusercontent.com/sidmohan0/1aa3ec38b4e6594d3c34b113f2e0962d/raw/42e57146197be0f85a5901cd1dcdd9ad15b31bab/sotu_2023.txt"
    output_file = "tests/files/output_files/output.md"

    # requests never times out by default; bound the wait so a stalled
    # connection fails the test instead of hanging the whole run.
    response = requests.get(sample_url, timeout=30)
    # Fail loudly on 4xx/5xx rather than scanning an error page as if it
    # were the sample document.
    response.raise_for_status()
    original_value = response.text

    pii_detected = presidio.scan(original_value)

    # The output directory may be absent in a fresh checkout; create it
    # rather than failing with FileNotFoundError on open().
    os.makedirs(os.path.dirname(output_file), exist_ok=True)

    # One entity type name per line.
    with open(output_file, "w", encoding="utf-8") as f:
        f.writelines(f"{entity.entity_type}\n" for entity in pii_detected)
0 commit comments