Extend the clean-dataset query with subject and object count joins.

Adds INNER JOINs on SubjectsCountInRDFs (USING SubjectID) and
ObjectsCountInRDFs (USING ObjectID) to the per-movie GROUP_CONCAT query, and
replaces the commented-out sample filter on Rel_Count / MovieID with a
commented-out `WHERE SubjectID = 134626`.

NOTE(review): the two blank context lines around `SELECT * FROM Abbreviations;`
are reconstructed from the hunk line counts; confirm against the target file.
NOTE(review): the post-image blob id on the `index` line was not recomputed
after dropping the duplicated comment line and keeping the trailing newline.

diff --git a/Scripts/DataBaseQueries/dataset.sql b/Scripts/DataBaseQueries/dataset.sql
index 7a9e4cb..18185e8 100644
--- a/Scripts/DataBaseQueries/dataset.sql
+++ b/Scripts/DataBaseQueries/dataset.sql
@@ -14,15 +14,16 @@ INNER JOIN WikipediaAbstracts USING (MovieID);
 
 SELECT * FROM Abbreviations;
 
 -- More complex to have clean dataset
 SELECT MovieID, GROUP_CONCAT('' || '' || SubjectURI || '' || RelationshipURI || '' || ObjectURI || '', '') as RDF_String, Abstract
 FROM RDFs
+INNER JOIN SubjectsCountInRDFs USING (SubjectID)
 INNER JOIN RelationshipsCountInRDFs USING(RelationshipID)
+INNER JOIN ObjectsCountInRDFs USING (ObjectID)
 INNER JOIN ParsedSubjects USING (SubjectID)
 INNER JOIN ParsedRelationships USING (RelationshipID)
 INNER JOIN ParsedObjects USING (ObjectID)
 INNER JOIN WikipediaAbstracts USING (MovieID)
 -- insert WHERE here
--- WHERE Rel_Count > 10
--- AND MovieID IN (10, 100, 1000)
+-- WHERE SubjectID = 134626
 GROUP BY MovieID;