-- File viewer metadata (as reported by the page this script was copied from): 29 lines, 884 B, SQL
-- To pass to Pandas
-- Returns every RDF row together with its matching Subjects, Relationships
-- and Objects rows. Each USING join matches on the equally named key column,
-- and that key column appears only once in the SELECT * output.
-- Inner joins: an RDF row with no match in any of the three tables is dropped.
-- SELECT * is intentional here: the full joined row is handed to the consumer.
SELECT *
FROM RDFs
INNER JOIN Subjects USING (SubjectID)
INNER JOIN Relationships USING (RelationshipID)
INNER JOIN Objects USING (ObjectID);

-- To pass to Pandas for abstracts
-- Returns every RDF row paired with the WikipediaAbstracts row(s) that share
-- its MovieID. Inner join: RDF rows without a matching abstract are dropped.
SELECT *
FROM RDFs
INNER JOIN WikipediaAbstracts USING (MovieID);

-- To pass to Pandas for abbreviations
-- Returns the whole Abbreviations table, all columns, unfiltered.
SELECT *
FROM Abbreviations;

-- More complex to have clean dataset
-- Produces one row per MovieID with:
--   RDF_String : all of the movie's triples concatenated with no separator,
--                each rendered as <SOT><SUB>subject<REL>relationship<OBJ>object<EOT>
--   Abstract   : the abstract joined in from WikipediaAbstracts
-- Notes:
--   * A triple whose SubjectURI, RelationshipURI or ObjectURI is NULL yields a
--     NULL string (|| propagates NULL) and is skipped by GROUP_CONCAT.
--   * No ORDER BY is given, so the order of triples inside RDF_String is
--     whatever order the engine visits the rows in.
--   * Abstract is a bare column (neither aggregated nor in GROUP BY). SQLite
--     accepts this and takes the value from one row of the group; this is only
--     well-defined if each MovieID has a single abstract -- TODO confirm.
--   * RelationshipsCountInRDFs is presumably joined to expose Rel_Count for
--     the optional filter shown below -- verify against its definition.
SELECT
    MovieID,
    GROUP_CONCAT(
        '<SOT>' || '<SUB>' || SubjectURI || '<REL>' || RelationshipURI || '<OBJ>' || ObjectURI || '<EOT>',
        ''
    ) AS RDF_String,
    Abstract
FROM RDFs
INNER JOIN RelationshipsCountInRDFs USING (RelationshipID)
INNER JOIN ParsedSubjects USING (SubjectID)
INNER JOIN ParsedRelationships USING (RelationshipID)
INNER JOIN ParsedObjects USING (ObjectID)
INNER JOIN WikipediaAbstracts USING (MovieID)
-- insert WHERE here
-- WHERE Rel_Count > 10
-- AND MovieID IN (10, 100, 1000)
GROUP BY MovieID;