import csv_metadata_quality.fix as fix def test_fix_leading_whitespace(): """Test fixing leading whitespace.""" value = " Alan" assert fix.whitespace(value) == "Alan" def test_fix_trailing_whitespace(): """Test fixing trailing whitespace.""" value = "Alan " assert fix.whitespace(value) == "Alan" def test_fix_excessive_whitespace(): """Test fixing excessive whitespace.""" value = "Alan Orth" assert fix.whitespace(value) == "Alan Orth" def test_fix_invalid_separators(): """Test fixing invalid multi-value separators.""" value = "Alan|Orth" assert fix.separators(value) == "Alan||Orth" def test_fix_unnecessary_unicode(): """Test fixing unnecessary Unicode.""" value = "Alan​ Orth" assert fix.unnecessary_unicode(value) == "Alan Orth" def test_fix_duplicates(): """Test fixing duplicate metadata values.""" value = "Kenya||Kenya" assert fix.duplicates(value) == "Kenya" def test_fix_newlines(): """Test fixing newlines.""" value = """Ken ya""" assert fix.newlines(value) == "Kenya" def test_fix_comma_space(): """Test adding space after comma.""" value = "Orth,Alan S." field_name = "dc.contributor.author" assert fix.comma_space(value, field_name) == "Orth, Alan S."