From dfd961d720f4a9ba4e7ccc5bb4321b4abe6ffba8 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Fri, 26 Jul 2019 23:14:37 +0300 Subject: [PATCH] Bring test.csv into project --- csv_metadata_quality/app.py | 4 ++-- tests/test.csv | 3 +++ 2 files changed, 5 insertions(+), 2 deletions(-) create mode 100644 tests/test.csv diff --git a/csv_metadata_quality/app.py b/csv_metadata_quality/app.py index 5571526..3951528 100644 --- a/csv_metadata_quality/app.py +++ b/csv_metadata_quality/app.py @@ -6,7 +6,7 @@ def run(): # Read all fields as strings so dates don't get converted from 1998 to 1998.0 #df = pd.read_csv('/home/aorth/Downloads/2019-07-26-Bioversity-Migration.csv', dtype=str) #df = pd.read_csv('/tmp/quality.csv', dtype=str) - df = pd.read_csv('/tmp/omg.csv', dtype=str) + df = pd.read_csv('tests/test.csv', dtype=str) # Fix whitespace in all columns for column in df.columns.values.tolist(): @@ -21,4 +21,4 @@ def run(): df[column] = df[column].apply(check.isbn) # Write - df.to_csv('/tmp/omg.fixed.csv', index=False) + df.to_csv('/tmp/test.fixed.csv', index=False) diff --git a/tests/test.csv b/tests/test.csv new file mode 100644 index 0000000..b973c6f --- /dev/null +++ b/tests/test.csv @@ -0,0 +1,3 @@ +dc.contributor.author,birthdate,dc.identifier.issn,dc.identifier.isbn + Alan|| Alan||Alan Orth||Alan ||Alan Orth ||Alan ,1984,0378-5955,978-0-306-40615-6||99921-58-10-7 +Stella|| Stella ||Stella Orth||Stella ,1984-11-27,2321-2302,99921-58-10-7