Skip to content

Commit e931ed8

Browse files
authored
Create data_masking.py
1 parent 2076046 commit e931ed8

File tree

1 file changed

+28
-0
lines changed

1 file changed

+28
-0
lines changed

data_privacy/data_masking.py

Lines changed: 28 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,28 @@
1+
import pandas as pd
2+
3+
def mask_data(dataframe, columns_to_mask, mask_char='*'):
    """Return a copy of ``dataframe`` with the requested columns masked.

    Every value in a masked column is converted with ``str()`` and replaced
    by ``mask_char`` repeated once per character of that string, so the
    masked value has the same length as the original text.

    Args:
        dataframe: The pandas DataFrame to mask. It is never modified; the
            masking is applied to a copy.
        columns_to_mask: A column name, or an iterable of column names, to
            mask. Names that are not columns of ``dataframe`` are skipped
            without raising.
        mask_char: The string repeated to build each mask. Defaults to
            ``'*'``; intended to be a single character so that the mask
            length equals the value length.

    Returns:
        A new DataFrame in which the selected columns hold mask strings and
        all other columns are unchanged.

    Note:
        Because values are stringified first, non-string values (numbers,
        ``None``, NaN) are masked according to the length of their string
        form rather than being left as they are.
    """
    # A bare string is itself iterable: without this guard 'Phone' would be
    # walked one character at a time, no column would match, and the caller
    # would silently get unmasked data back.
    if isinstance(columns_to_mask, str):
        columns_to_mask = [columns_to_mask]

    masked_dataframe = dataframe.copy()
    for column in columns_to_mask:
        if column in masked_dataframe.columns:
            # Replace each value with a same-length run of the mask string.
            masked_dataframe[column] = masked_dataframe[column].apply(
                lambda value: mask_char * len(str(value))
            )
    return masked_dataframe
11+
12+
# Example Usage:
13+
if __name__ == "__main__":
    # Build a small demo frame to run the masker against.
    sample_frame = pd.DataFrame(
        {
            'Name': ['Alice', 'Bob', 'Charlie'],
            'Phone': ['123-456-7890', '987-654-3210', '555-555-5555'],
        }
    )

    # 'Email' is not a column of the demo frame; mask_data skips names it
    # cannot find, so only 'Phone' ends up masked here.
    sensitive_columns = ['Email', 'Phone']

    masked_frame = mask_data(sample_frame, sensitive_columns)

    # Show both frames: mask_data works on a copy, so the original is intact.
    print("Original DataFrame:\n", sample_frame)
    print("Masked DataFrame:\n", masked_frame)

0 commit comments

Comments
 (0)