mirror of
https://github.com/ISEAL-Community/iseal-core.git
synced 2024-10-30 20:03:02 +01:00
cleaning code to generate rdf
This commit is contained in:
parent
4e34581797
commit
78e3dce29e
@ -4,23 +4,25 @@
|
|||||||
import json
|
import json
|
||||||
import os
|
import os
|
||||||
import re
|
import re
|
||||||
|
import argparse
|
||||||
|
import sys
|
||||||
|
|
||||||
|
|
||||||
import pandas as pd
|
import pandas as pd
|
||||||
from rdflib import BNode, Graph, Literal, URIRef
|
from rdflib import BNode, Graph, Literal, URIRef
|
||||||
from rdflib.namespace import DC, DCTERMS, OWL, RDF, RDFS, SKOS, XSD
|
from rdflib.namespace import DC, DCTERMS, OWL, RDF, RDFS, SKOS, XSD
|
||||||
|
|
||||||
|
|
||||||
def make_core():
|
def make_rdf(file, ns):
|
||||||
g = Graph()
|
g = Graph()
|
||||||
|
|
||||||
##namespace
|
##namespace
|
||||||
# NS = "http://iseal.org/terms/"
|
# NS = "https://iseal-community.github.io/iseal-core#"
|
||||||
NS = "https://alanorth.github.io/iseal-schema/#"
|
NS = ns
|
||||||
## create ontology
|
## create ontology
|
||||||
iseal = URIRef(NS)
|
iseal = URIRef(NS)
|
||||||
g.add((iseal, RDF.type, OWL.Ontology))
|
g.add((iseal, RDF.type, OWL.Ontology))
|
||||||
|
df = pd.read_csv(file)
|
||||||
df = pd.read_csv("../data/iseal-core.csv")
|
|
||||||
df.dropna(how="all", axis=1)
|
df.dropna(how="all", axis=1)
|
||||||
df.fillna("", inplace=True)
|
df.fillna("", inplace=True)
|
||||||
|
|
||||||
@ -31,9 +33,14 @@ def make_core():
|
|||||||
example = row["element link for more information"]
|
example = row["element link for more information"]
|
||||||
cardinality = row["element options"]
|
cardinality = row["element options"]
|
||||||
prop_type = row["element type"]
|
prop_type = row["element type"]
|
||||||
controlled_vocab = row["element controlled values or terms"]
|
# controlled_vocab = row["element controlled values or terms"]
|
||||||
module = row["idss element cluster"]
|
module = row["idss element cluster"]
|
||||||
module_cat = row["idss schema module"]
|
module_cat = ""
|
||||||
|
try: ## for extensions
|
||||||
|
module_cat = row["idss schema module"]
|
||||||
|
except:
|
||||||
|
module_cat_name = [col for col in df.columns if "module" in col][0]
|
||||||
|
module_cat = row[module_cat_name]
|
||||||
dc = row["element link for dublin core attributes"]
|
dc = row["element link for dublin core attributes"]
|
||||||
dspace = row["dspace field name"]
|
dspace = row["dspace field name"]
|
||||||
|
|
||||||
@ -43,99 +50,70 @@ def make_core():
|
|||||||
##create module as skos concept
|
##create module as skos concept
|
||||||
g.add((moduleUri, RDF.type, OWL.Class)) ## SKOS.Concept
|
g.add((moduleUri, RDF.type, OWL.Class)) ## SKOS.Concept
|
||||||
g.add((moduleUri, SKOS.prefLabel, Literal(module)))
|
g.add((moduleUri, SKOS.prefLabel, Literal(module)))
|
||||||
##element
|
|
||||||
# if '-' not in element_name:
|
|
||||||
if True: ## lazy reindenting
|
|
||||||
concept = module_cat # element_name.split(' - ')[0]
|
|
||||||
# element = element_name.strip()
|
|
||||||
## code from Alan
|
|
||||||
# Make sure element name is URL friendly because we need to use it in
|
|
||||||
# the file system and in the URL.
|
|
||||||
#
|
|
||||||
# Replace two or more whitespaces with one
|
|
||||||
element_name = re.sub(r"\s{2,}", " ", element_name)
|
|
||||||
# Replace unnecessary stuff in some element names (I should tell Peter
|
|
||||||
# that these belong in the description)
|
|
||||||
element_name = re.sub(r"\s?\(\w+\)", "", element_name)
|
|
||||||
# Remove commas and question marks
|
|
||||||
element_name = re.sub(r"[,?]", "", element_name)
|
|
||||||
# Replace ": " with a dash (as in "Evaluation: ")
|
|
||||||
element_name = element_name.replace(": ", "-")
|
|
||||||
# Replace " / " with a dash (as in "biome / zone")
|
|
||||||
element_name = element_name.replace(" / ", "-")
|
|
||||||
# Replace whitespace, colons, and slashes with dashes
|
|
||||||
element_name = re.sub(r"[\s/]", "-", element_name)
|
|
||||||
# Lower case it
|
|
||||||
element_name = element_name.lower()
|
|
||||||
# Strip just in case
|
|
||||||
element_name = element_name.strip()
|
|
||||||
|
|
||||||
# For example Certifying Body, FSC audit, Certificate, etc
|
conceptUri = URIRef(NS + module_cat.replace(" ", "_"))
|
||||||
cluster = row["idss element cluster"].capitalize()
|
if not (None, SKOS.prefLabel, Literal(module_cat)) in g:
|
||||||
|
##create concept as skos concept
|
||||||
|
g.add((conceptUri, RDF.type, OWL.Class)) ## SKOS.Concept
|
||||||
|
g.add((conceptUri, SKOS.prefLabel, Literal(module_cat)))
|
||||||
|
g.add((conceptUri, RDFS.subClassOf, moduleUri))
|
||||||
|
|
||||||
# For example Assurance, Certification, Core, Impact, etc
|
## create properties
|
||||||
module = row["idss schema module"].capitalize()
|
elementURI = URIRef(NS + dspace.replace(".", "-").lower())
|
||||||
|
if prop_type == "CONTROLLED VALUE": ## object property
|
||||||
# Generate a "safe" version of the element name for use in URLs and
|
g.add((elementURI, SKOS.prefLabel, Literal(element_name)))
|
||||||
# files by combining the cluster and the element name. This could
|
g.add((elementURI, RDF.type, OWL.ObjectProperty))
|
||||||
# change in the future.
|
g.add((elementURI, OWL.domain, conceptUri))
|
||||||
element_name_safe = cluster.replace(" ", "-").lower() + "-" + element_name
|
## add suproperty link
|
||||||
|
if dc:
|
||||||
element = element_name_safe
|
dct = dc.split(":")[1]
|
||||||
|
if "||" in dct:
|
||||||
conceptUri = URIRef(NS + concept.replace(" ", "_"))
|
dct = dc.split(":")[0]
|
||||||
if not (None, SKOS.prefLabel, Literal(concept)) in g:
|
if "wgs84" in dc:
|
||||||
##create concept as skos concept
|
g.add(
|
||||||
g.add((conceptUri, RDF.type, OWL.Class)) ## SKOS.Concept
|
(
|
||||||
g.add((conceptUri, SKOS.prefLabel, Literal(concept)))
|
elementURI,
|
||||||
g.add((conceptUri, RDFS.subClassOf, moduleUri))
|
RDFS.subPropertyOf,
|
||||||
|
URIRef("http://www.w3.org/2003/01/geo/wgs84_pos#" + dct),
|
||||||
## create properties
|
|
||||||
elementURI = URIRef(NS + element.replace(" ", "_"))
|
|
||||||
if prop_type == "CONTROLLED VALUE": ## object property
|
|
||||||
g.add((elementURI, SKOS.prefLabel, Literal(element)))
|
|
||||||
g.add((elementURI, RDF.type, OWL.ObjectProperty))
|
|
||||||
g.add((elementURI, OWL.domain, conceptUri))
|
|
||||||
## add suproperty link
|
|
||||||
if dc:
|
|
||||||
dct = dc.split(":")[1]
|
|
||||||
if "wgs84" in dc:
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef(
|
|
||||||
"http://www.w3.org/2003/01/geo/wgs84_pos#" + dct
|
|
||||||
),
|
|
||||||
)
|
|
||||||
)
|
)
|
||||||
else:
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef("http://purl.org/dc/terms/" + dct),
|
|
||||||
)
|
|
||||||
)
|
|
||||||
## add dspace alternative ID
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
URIRef("http://purl.org/dc/terms/alternative"),
|
|
||||||
Literal(dspace),
|
|
||||||
)
|
)
|
||||||
|
else:
|
||||||
|
g.add(
|
||||||
|
(
|
||||||
|
elementURI,
|
||||||
|
RDFS.subPropertyOf,
|
||||||
|
URIRef("http://purl.org/dc/terms/" + dct),
|
||||||
|
)
|
||||||
|
)
|
||||||
|
## add dspace alternative ID
|
||||||
|
g.add(
|
||||||
|
(
|
||||||
|
elementURI,
|
||||||
|
URIRef("http://purl.org/dc/terms/alternative"),
|
||||||
|
Literal(dspace),
|
||||||
)
|
)
|
||||||
## create controlled vocab
|
)
|
||||||
cvURI = URIRef(NS + "VOCAB_" + element.replace(" ", "_"))
|
## create controlled vocab
|
||||||
g.add(
|
cvURI = URIRef(NS + "VOCAB_" + element_name.replace(" ", "_"))
|
||||||
(cvURI, RDF.type, OWL.Class)
|
g.add((cvURI, RDF.type, OWL.Class)) ## SKOS.Concept ## SKOS.Collection??
|
||||||
) ## SKOS.Concept ## SKOS.Collection??
|
g.add((cvURI, SKOS.prefLabel, Literal("VOCAB " + element_name)))
|
||||||
g.add((cvURI, SKOS.prefLabel, Literal("VOCAB " + element)))
|
## open controlled vocab file
|
||||||
for term in controlled_vocab.split("||"):
|
## open controlled vocab file
|
||||||
termURI = URIRef(NS + term.replace(" ", "_").replace("|", ""))
|
try:
|
||||||
g.add((termURI, RDF.type, OWL.Class)) ## SKOS.Concept
|
with open(
|
||||||
g.add((termURI, SKOS.prefLabel, Literal(term)))
|
"data/controlled-vocabularies/"
|
||||||
g.add((termURI, RDFS.subClassOf, cvURI)) ## SKOS.member???
|
+ dspace.replace(".", "-").lower()
|
||||||
|
+ ".txt",
|
||||||
|
"r",
|
||||||
|
encoding="utf-8",
|
||||||
|
) as f:
|
||||||
|
lines = f.readlines()
|
||||||
|
for line in lines:
|
||||||
|
term = line.strip()
|
||||||
|
termURI = URIRef(NS + term.replace(" ", "_").replace("|", ""))
|
||||||
|
g.add((termURI, RDF.type, OWL.Class)) ## SKOS.Concept
|
||||||
|
g.add((termURI, SKOS.prefLabel, Literal(term)))
|
||||||
|
g.add((termURI, RDFS.subClassOf, cvURI)) ## SKOS.member???
|
||||||
g.add((elementURI, OWL.range, cvURI))
|
g.add((elementURI, OWL.range, cvURI))
|
||||||
|
|
||||||
## add the controlled vocab information on properties directly
|
## add the controlled vocab information on properties directly
|
||||||
@ -144,324 +122,119 @@ def make_core():
|
|||||||
elementURI,
|
elementURI,
|
||||||
URIRef("http://purl.org/dc/dcam/rangeIncludes"),
|
URIRef("http://purl.org/dc/dcam/rangeIncludes"),
|
||||||
Literal(
|
Literal(
|
||||||
"https://raw.githubusercontent.com/alanorth/iseal-schema/main/data/controlled-vocabularies/"
|
"data/controlled-vocabularies/"
|
||||||
+ element
|
+ dspace.replace(".", "-").lower()
|
||||||
+ ".txt"
|
+ ".txt"
|
||||||
),
|
),
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
except FileNotFoundError:
|
||||||
|
continue
|
||||||
|
|
||||||
## cardinality
|
## cardinality
|
||||||
if cardinality == "MULTI SELECT FROM CONTROL LIST":
|
if cardinality == "MULTI SELECT FROM CONTROL LIST":
|
||||||
br = BNode()
|
br = BNode()
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
g.add((br, RDF.type, OWL.Restriction))
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
g.add((br, OWL.onProperty, elementURI))
|
||||||
g.add((br, OWL.minQualifiedCardinality, Literal(1)))
|
g.add((br, OWL.minQualifiedCardinality, Literal(1)))
|
||||||
g.add((br, OWL.someValuesFrom, cvURI))
|
g.add((br, OWL.someValuesFrom, cvURI))
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
g.add((conceptUri, RDFS.subClassOf, br))
|
||||||
else:
|
else:
|
||||||
br = BNode()
|
br = BNode()
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
g.add((br, RDF.type, OWL.Restriction))
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
g.add((br, OWL.onProperty, elementURI))
|
||||||
g.add((br, OWL.maxQualifiedCardinality, Literal(1)))
|
g.add((br, OWL.maxQualifiedCardinality, Literal(1)))
|
||||||
g.add((br, OWL.onClass, cvURI))
|
g.add((br, OWL.onClass, cvURI))
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
g.add((conceptUri, RDFS.subClassOf, br))
|
||||||
|
|
||||||
# elif prop_type == 'URL': ## object property
|
else: ## datatype properties
|
||||||
# g.add((elementURI, RDF.type, OWL.ObjectProperty))
|
g.add((elementURI, SKOS.prefLabel, Literal(element_name)))
|
||||||
# g.add((elementURI, OWL.domain, conceptUri))
|
g.add((elementURI, RDF.type, OWL.DatatypeProperty))
|
||||||
# g.add((elementURI, OWL.range, URIRef("") ))
|
g.add((elementURI, OWL.domain, conceptUri))
|
||||||
# g.add((elementURI, SKOS.prefLabel, Literal(element)))
|
if dc:
|
||||||
else: ## datatype properties
|
dct = dc.split(":")[1]
|
||||||
g.add((elementURI, SKOS.prefLabel, Literal(element)))
|
if "||" in dct:
|
||||||
g.add((elementURI, RDF.type, OWL.DatatypeProperty))
|
dct = dc.split(":")[0]
|
||||||
g.add((elementURI, OWL.domain, conceptUri))
|
if "wgs84" in dc:
|
||||||
if dc:
|
g.add(
|
||||||
dct = dc.split(":")[1]
|
(
|
||||||
if "wgs84" in dc:
|
elementURI,
|
||||||
g.add(
|
RDFS.subPropertyOf,
|
||||||
(
|
URIRef("http://www.w3.org/2003/01/geo/wgs84_pos#" + dct),
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef(
|
|
||||||
"http://www.w3.org/2003/01/geo/wgs84_pos#" + dct
|
|
||||||
),
|
|
||||||
)
|
|
||||||
)
|
)
|
||||||
else:
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef("http://purl.org/dc/terms/" + dct),
|
|
||||||
)
|
|
||||||
)
|
|
||||||
## add dspace alternative ID
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
URIRef("http://purl.org/dc/terms/alternative"),
|
|
||||||
Literal(dspace),
|
|
||||||
)
|
)
|
||||||
|
else:
|
||||||
|
g.add(
|
||||||
|
(
|
||||||
|
elementURI,
|
||||||
|
RDFS.subPropertyOf,
|
||||||
|
URIRef("http://purl.org/dc/terms/" + dct),
|
||||||
|
)
|
||||||
|
)
|
||||||
|
## add dspace alternative ID
|
||||||
|
g.add(
|
||||||
|
(
|
||||||
|
elementURI,
|
||||||
|
URIRef("http://purl.org/dc/terms/alternative"),
|
||||||
|
Literal(dspace),
|
||||||
)
|
)
|
||||||
range = None
|
)
|
||||||
if prop_type == "DATE":
|
range = None
|
||||||
g.add((elementURI, OWL.range, XSD.date))
|
if prop_type == "DATE":
|
||||||
range = XSD.date
|
g.add((elementURI, OWL.range, XSD.date))
|
||||||
elif prop_type == "NUMERIC VALUE":
|
range = XSD.date
|
||||||
g.add((elementURI, OWL.range, XSD.float))
|
elif prop_type == "NUMERIC VALUE":
|
||||||
range = XSD.float
|
g.add((elementURI, OWL.range, XSD.float))
|
||||||
else:
|
range = XSD.float
|
||||||
g.add((elementURI, OWL.range, XSD.string))
|
else:
|
||||||
range = XSD.string
|
g.add((elementURI, OWL.range, XSD.string))
|
||||||
##cardinality
|
range = XSD.string
|
||||||
if cardinality == "REPEAT VALUES":
|
##cardinality
|
||||||
br = BNode()
|
if cardinality == "REPEAT VALUES":
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
br = BNode()
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
g.add((br, RDF.type, OWL.Restriction))
|
||||||
g.add((br, OWL.someValuesFrom, range))
|
g.add((br, OWL.onProperty, elementURI))
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
g.add((br, OWL.someValuesFrom, range))
|
||||||
else:
|
g.add((conceptUri, RDFS.subClassOf, br))
|
||||||
br = BNode()
|
else:
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
br = BNode()
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
g.add((br, RDF.type, OWL.Restriction))
|
||||||
g.add((br, OWL.maxQualifiedCardinality, Literal(1)))
|
g.add((br, OWL.onProperty, elementURI))
|
||||||
g.add((br, OWL.onDataRange, range))
|
g.add((br, OWL.maxQualifiedCardinality, Literal(1)))
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
g.add((br, OWL.onDataRange, range))
|
||||||
|
g.add((conceptUri, RDFS.subClassOf, br))
|
||||||
|
|
||||||
if comment:
|
if comment:
|
||||||
g.add((elementURI, SKOS.scopeNote, Literal(comment)))
|
g.add((elementURI, SKOS.scopeNote, Literal(comment)))
|
||||||
if example:
|
if example:
|
||||||
g.add((elementURI, RDFS.comment, Literal(example)))
|
g.add((elementURI, RDFS.comment, Literal(example)))
|
||||||
if element_description:
|
if element_description:
|
||||||
g.add((elementURI, SKOS.definition, Literal(element_description)))
|
g.add((elementURI, SKOS.definition, Literal(element_description)))
|
||||||
# else:
|
|
||||||
# print(element_name)
|
|
||||||
|
|
||||||
## save graph
|
## save graph
|
||||||
g.serialize(destination="idds_new3.ttl", format="turtle")
|
head, tail = os.path.split(file)
|
||||||
|
filename = tail.split(".")[0]
|
||||||
|
g.serialize(destination="data/rdf/" + filename + ".ttl", format="turtle")
|
||||||
|
|
||||||
|
|
||||||
def make_fsc():
|
parser = argparse.ArgumentParser(
|
||||||
g = Graph()
|
description="Parse an ISEAL schema CSV file to export it as RDF."
|
||||||
|
)
|
||||||
##namespace
|
parser.add_argument(
|
||||||
# NS = "http://iseal.org/terms/"
|
"-i",
|
||||||
NS = "https://alanorth.github.io/iseal-schema/FSC#"
|
"--input-file",
|
||||||
## create ontology
|
help="Path to schema fields file (ie, iseal-core.csv).",
|
||||||
iseal = URIRef(NS)
|
required=True,
|
||||||
g.add((iseal, RDF.type, OWL.Ontology))
|
type=argparse.FileType("r"),
|
||||||
|
)
|
||||||
df = pd.read_excel("./idss_schema_fields_new2.xlsx", "fsc extension")
|
parser.add_argument(
|
||||||
df.dropna(how="all", axis=1)
|
"-ns",
|
||||||
df.fillna("", inplace=True)
|
"--namespace",
|
||||||
|
help="Namespace of the schema. Used to create the URIs, should point to the website (ie. https://iseal-community.github.io/iseal-core#).",
|
||||||
for index, row in df.iterrows():
|
required=True,
|
||||||
element_name = row["element name"]
|
)
|
||||||
element_description = row["element description"]
|
args = parser.parse_args()
|
||||||
comment = row["element guidance"]
|
try:
|
||||||
example = row["element link for more information"]
|
make_rdf(args.input_file.name, args.namespace)
|
||||||
cardinality = row["element options"]
|
except FileNotFoundError:
|
||||||
prop_type = row["element type"]
|
sys.stderr.write(f" Could not open {args.input_file.name}\n")
|
||||||
controlled_vocab = row["element controlled values or terms"]
|
|
||||||
module = row["idss element cluster"]
|
|
||||||
module_cat = row["fsc extension module"]
|
|
||||||
dc = row["element link for dublin core attributes"]
|
|
||||||
dspace = row["dspace field name"]
|
|
||||||
|
|
||||||
##module
|
|
||||||
moduleUri = URIRef(NS + module)
|
|
||||||
if not (None, SKOS.prefLabel, Literal(module)) in g:
|
|
||||||
##create module as skos concept
|
|
||||||
g.add((moduleUri, RDF.type, OWL.Class)) ## SKOS.Concept
|
|
||||||
g.add((moduleUri, SKOS.prefLabel, Literal(module)))
|
|
||||||
##element
|
|
||||||
# if '-' not in element_name:
|
|
||||||
if True: ## lazy reindenting
|
|
||||||
concept = module_cat # element_name.split(' - ')[0]
|
|
||||||
# element = element_name.strip()
|
|
||||||
## code from Alan
|
|
||||||
# Make sure element name is URL friendly because we need to use it in
|
|
||||||
# the file system and in the URL.
|
|
||||||
#
|
|
||||||
# Replace two or more whitespaces with one
|
|
||||||
element_name = re.sub(r"\s{2,}", " ", element_name)
|
|
||||||
# Replace unnecessary stuff in some element names (I should tell Peter
|
|
||||||
# that these belong in the description)
|
|
||||||
element_name = re.sub(r"\s?\(\w+\)", "", element_name)
|
|
||||||
# Remove commas and question marks
|
|
||||||
element_name = re.sub(r"[,?]", "", element_name)
|
|
||||||
# Replace ": " with a dash (as in "Evaluation: ")
|
|
||||||
element_name = element_name.replace(": ", "-")
|
|
||||||
# Replace " / " with a dash (as in "biome / zone")
|
|
||||||
element_name = element_name.replace(" / ", "-")
|
|
||||||
# Replace whitespace, colons, and slashes with dashes
|
|
||||||
element_name = re.sub(r"[\s/]", "-", element_name)
|
|
||||||
# Lower case it
|
|
||||||
element_name = element_name.lower()
|
|
||||||
# Strip just in case
|
|
||||||
element_name = element_name.strip()
|
|
||||||
|
|
||||||
# For example Certifying Body, FSC audit, Certificate, etc
|
|
||||||
cluster = row["idss element cluster"].capitalize()
|
|
||||||
|
|
||||||
# For example Assurance, Certification, Core, Impact, etc
|
|
||||||
module = row["fsc extension module"].capitalize()
|
|
||||||
|
|
||||||
# Generate a "safe" version of the element name for use in URLs and
|
|
||||||
# files by combining the cluster and the element name. This could
|
|
||||||
# change in the future.
|
|
||||||
element_name_safe = cluster.replace(" ", "-").lower() + "-" + element_name
|
|
||||||
|
|
||||||
element = element_name_safe
|
|
||||||
# remove extra fsc in name
|
|
||||||
element = element.replace("fsc-fsc-", "fsc-")
|
|
||||||
|
|
||||||
conceptUri = URIRef(NS + concept.replace(" ", "_"))
|
|
||||||
if not (None, SKOS.prefLabel, Literal(concept)) in g:
|
|
||||||
##create concept as skos concept
|
|
||||||
g.add((conceptUri, RDF.type, OWL.Class)) ## SKOS.Concept
|
|
||||||
g.add((conceptUri, SKOS.prefLabel, Literal(concept)))
|
|
||||||
g.add((conceptUri, RDFS.subClassOf, moduleUri))
|
|
||||||
|
|
||||||
## create properties
|
|
||||||
elementURI = URIRef(NS + element.replace(" ", "_"))
|
|
||||||
if prop_type == "CONTROLLED VALUE": ## object property
|
|
||||||
g.add((elementURI, SKOS.prefLabel, Literal(element)))
|
|
||||||
g.add((elementURI, RDF.type, OWL.ObjectProperty))
|
|
||||||
g.add((elementURI, OWL.domain, conceptUri))
|
|
||||||
## add suproperty link
|
|
||||||
if dc:
|
|
||||||
dct = dc.split(":")[1]
|
|
||||||
if "wgs84" in dc:
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef(
|
|
||||||
"http://www.w3.org/2003/01/geo/wgs84_pos#" + dct
|
|
||||||
),
|
|
||||||
)
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef("http://purl.org/dc/terms/" + dct),
|
|
||||||
)
|
|
||||||
)
|
|
||||||
## add dspace alternative ID
|
|
||||||
# g.add((elementURI, URIRef("http://purl.org/dc/terms/alternative"), Literal(dspace)))
|
|
||||||
## create controlled vocab
|
|
||||||
cvURI = URIRef(NS + "VOCAB_" + element.replace(" ", "_"))
|
|
||||||
g.add(
|
|
||||||
(cvURI, RDF.type, OWL.Class)
|
|
||||||
) ## SKOS.Concept ## SKOS.Collection??
|
|
||||||
g.add((cvURI, SKOS.prefLabel, Literal("VOCAB " + element)))
|
|
||||||
for term in controlled_vocab.split("||"):
|
|
||||||
termURI = URIRef(NS + term.replace(" ", "_").replace("|", ""))
|
|
||||||
g.add((termURI, RDF.type, OWL.Class)) ## SKOS.Concept
|
|
||||||
g.add((termURI, SKOS.prefLabel, Literal(term)))
|
|
||||||
g.add((termURI, RDFS.subClassOf, cvURI)) ## SKOS.member???
|
|
||||||
g.add((elementURI, OWL.range, cvURI))
|
|
||||||
|
|
||||||
## add the controlled vocab information on properties directly
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
URIRef("http://purl.org/dc/dcam/rangeIncludes"),
|
|
||||||
Literal(
|
|
||||||
"https://raw.githubusercontent.com/alanorth/iseal-schema/main/data/controlled-vocabularies/"
|
|
||||||
+ element
|
|
||||||
+ ".txt"
|
|
||||||
),
|
|
||||||
)
|
|
||||||
)
|
|
||||||
|
|
||||||
## cardinality
|
|
||||||
if cardinality == "MULTI SELECT FROM CONTROL LIST":
|
|
||||||
br = BNode()
|
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
|
||||||
g.add((br, OWL.minQualifiedCardinality, Literal(1)))
|
|
||||||
g.add((br, OWL.someValuesFrom, cvURI))
|
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
|
||||||
else:
|
|
||||||
br = BNode()
|
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
|
||||||
g.add((br, OWL.maxQualifiedCardinality, Literal(1)))
|
|
||||||
g.add((br, OWL.onClass, cvURI))
|
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
|
||||||
|
|
||||||
# elif prop_type == 'URL': ## object property
|
|
||||||
# g.add((elementURI, RDF.type, OWL.ObjectProperty))
|
|
||||||
# g.add((elementURI, OWL.domain, conceptUri))
|
|
||||||
# g.add((elementURI, OWL.range, URIRef("") ))
|
|
||||||
# g.add((elementURI, SKOS.prefLabel, Literal(element)))
|
|
||||||
else: ## datatype properties
|
|
||||||
g.add((elementURI, SKOS.prefLabel, Literal(element)))
|
|
||||||
g.add((elementURI, RDF.type, OWL.DatatypeProperty))
|
|
||||||
g.add((elementURI, OWL.domain, conceptUri))
|
|
||||||
if dc:
|
|
||||||
dct = dc.split(":")[1]
|
|
||||||
if "wgs84" in dc:
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef(
|
|
||||||
"http://www.w3.org/2003/01/geo/wgs84_pos#" + dct
|
|
||||||
),
|
|
||||||
)
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
g.add(
|
|
||||||
(
|
|
||||||
elementURI,
|
|
||||||
RDFS.subPropertyOf,
|
|
||||||
URIRef("http://purl.org/dc/terms/" + dct),
|
|
||||||
)
|
|
||||||
)
|
|
||||||
## add dspace alternative ID
|
|
||||||
# g.add((elementURI, URIRef("http://purl.org/dc/terms/alternative"), Literal(dspace)))
|
|
||||||
range = None
|
|
||||||
if prop_type == "DATE":
|
|
||||||
g.add((elementURI, OWL.range, XSD.date))
|
|
||||||
range = XSD.date
|
|
||||||
elif prop_type == "NUMERIC VALUE":
|
|
||||||
g.add((elementURI, OWL.range, XSD.float))
|
|
||||||
range = XSD.float
|
|
||||||
else:
|
|
||||||
g.add((elementURI, OWL.range, XSD.string))
|
|
||||||
range = XSD.string
|
|
||||||
##cardinality
|
|
||||||
if cardinality == "REPEAT VALUES":
|
|
||||||
br = BNode()
|
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
|
||||||
g.add((br, OWL.someValuesFrom, range))
|
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
|
||||||
else:
|
|
||||||
br = BNode()
|
|
||||||
g.add((br, RDF.type, OWL.Restriction))
|
|
||||||
g.add((br, OWL.onProperty, elementURI))
|
|
||||||
g.add((br, OWL.maxQualifiedCardinality, Literal(1)))
|
|
||||||
g.add((br, OWL.onDataRange, range))
|
|
||||||
g.add((conceptUri, RDFS.subClassOf, br))
|
|
||||||
|
|
||||||
if comment:
|
|
||||||
g.add((elementURI, SKOS.scopeNote, Literal(comment)))
|
|
||||||
if example:
|
|
||||||
g.add((elementURI, RDFS.comment, Literal(example)))
|
|
||||||
if element_description:
|
|
||||||
g.add((elementURI, SKOS.definition, Literal(element_description)))
|
|
||||||
# else:
|
|
||||||
# print(element_name)
|
|
||||||
|
|
||||||
## save graph
|
|
||||||
g.serialize(destination="fsc.ttl", format="turtle")
|
|
||||||
|
|
||||||
|
|
||||||
make_core()
|
|
||||||
|
Loading…
Reference in New Issue
Block a user