Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
15 changes: 14 additions & 1 deletion data_cleaning/clean_wpdx_sample_data.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,4 +26,17 @@ def clean_col_country_name(input_data):


if __name__ == '__main__':
    # Script entry point: clean the sample CSV once and write the result to
    # a separate output file (the call was previously listed twice, which
    # only redid the same work and rewrote the same output).
    clean_columns('wpdx_sample_data.csv', 'cleaned_wpdx_sample_data.csv')


def clean_col_count(input_data):
    """
    Clean values in column: "count"

    Convert the raw value to an ``int``. Anything ``int()`` rejects --
    non-numeric text such as ``'hello'``, an empty string, or a missing
    value passed in as ``None`` -- is cleaned to ``None`` instead of
    raising.

    NOTE(review): the Trello link below is the "column-countryname" card;
    confirm whether the "count" column has its own card.
    Trello card: https://trello.com/c/HHzNs0hS/1-column-countryname

    :param input_data: raw value read from the "count" column
    :return: the value as an ``int``, or ``None`` if it cannot be converted
    """
    try:
        return int(input_data)
    except (TypeError, ValueError):
        # ValueError: text that is not an integer literal ('hello', '').
        # TypeError: a non-numeric, non-string value such as None.
        return None
9 changes: 9 additions & 0 deletions data_cleaning/test_clean_wpdx_sample_data.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,3 +7,12 @@ def test_clean_col_country_name():
Test the cleaning for column: "country_name"
"""
assert clean_wpdx_sample_data.clean_col_country_name('NA') == 'NA'


def test_clean_col_count():
    """
    Test the cleaning for column: "count"
    """
    # Text that is not an integer literal must be cleaned to None.
    assert clean_wpdx_sample_data.clean_col_count('hello') is None
    # A numeric string must come back as the corresponding int.
    assert clean_wpdx_sample_data.clean_col_count('12') == 12