diff --git a/csv_metadata_quality/app.py b/csv_metadata_quality/app.py index 5571526..3951528 100644 --- a/csv_metadata_quality/app.py +++ b/csv_metadata_quality/app.py @@ -6,7 +6,7 @@ def run(): # Read all fields as strings so dates don't get converted from 1998 to 1998.0 #df = pd.read_csv('/home/aorth/Downloads/2019-07-26-Bioversity-Migration.csv', dtype=str) #df = pd.read_csv('/tmp/quality.csv', dtype=str) - df = pd.read_csv('/tmp/omg.csv', dtype=str) + df = pd.read_csv('tests/test.csv', dtype=str) # Fix whitespace in all columns for column in df.columns.values.tolist(): @@ -21,4 +21,4 @@ def run(): df[column] = df[column].apply(check.isbn) # Write - df.to_csv('/tmp/omg.fixed.csv', index=False) + df.to_csv('/tmp/test.fixed.csv', index=False) diff --git a/tests/test.csv b/tests/test.csv new file mode 100644 index 0000000..b973c6f --- /dev/null +++ b/tests/test.csv @@ -0,0 +1,3 @@ +dc.contributor.author,birthdate,dc.identifier.issn,dc.identifier.isbn + Alan|| Alan||Alan Orth||Alan ||Alan Orth ||Alan ,1984,0378-5955,978-0-306-40615-6||99921-58-10-7 +Stella|| Stella ||Stella Orth||Stella ,1984-11-27,2321-2302,99921-58-10-7