diff --git a/Scripts/DataCleaning/dbpedia-uri.py b/Scripts/DataCleaning/dbpedia-uri.py index 4107e71..f0c5ede 100644 --- a/Scripts/DataCleaning/dbpedia-uri.py +++ b/Scripts/DataCleaning/dbpedia-uri.py @@ -44,7 +44,8 @@ def print_dbpedia(file: str, out: str): if len(sections) < 3: continue - URI = "/".join(sections[:3]) + URI = "/".join(sections[1:3]) + URI = "//".join([sections[0], URI]) if URI in already_parsed: continue