From e2337fa6270ea541950cf121263879eb08f4f01e Mon Sep 17 00:00:00 2001 From: Enrico Daga Date: Sun, 13 Feb 2022 10:03:56 +0000 Subject: [PATCH 1/5] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 5c10217d..50f3c07f 100644 --- a/README.md +++ b/README.md @@ -1,4 +1,4 @@ -# Building a knowledge graph of artists and artoworks of the IMMA museum website +# Building a knowledge graph of artists and artworks of the IMMA museum website In what follows, `fx` refers to the following command ``` From cb591bd9c076c82ac3400056bd8db79fd429ccfc Mon Sep 17 00:00:00 2001 From: Enrico Daga Date: Sun, 13 Feb 2022 10:06:09 +0000 Subject: [PATCH 2/5] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 50f3c07f..37e82218 100644 --- a/README.md +++ b/README.md @@ -1,4 +1,4 @@ -# Building a knowledge graph of artists and artworks of the IMMA museum website +# Building a knowledge graph of artists and artworks scraping the IMMA museum website In what follows, `fx` refers to the following command ``` From 4baf6b3cb3921e6ea1b3ab349379c9f511b4960f Mon Sep 17 00:00:00 2001 From: Enrico Daga Date: Wed, 30 Mar 2022 11:39:22 +0100 Subject: [PATCH 3/5] Changes --- README.md | 15 ++++++++------- artworks/berry-dress.jsonld | 2 +- 2 files changed, 9 insertions(+), 8 deletions(-) diff --git a/README.md b/README.md index 5c10217d..34e7053c 100644 --- a/README.md +++ b/README.md @@ -2,26 +2,26 @@ In what follows, `fx` refers to the following command ``` -java -jar sparql-anything-0.3.2-SNAPSHOT.jar +java -jar sparql-anything-0.5.0-SNAPSHOT.jar ``` ## Process Extract the list of artists from the Web page and build an XML result set with ?artistNickname and ?artistUrl. ``` -fx -q imma-artists.sparql -o imma-artists.xml -f xml +fx -q queries/imma-artists.sparql -o imma-artists.xml -f xml ``` Extract data from the artists' Web page and build one JSON-LD file each (create folder 'artists' first). ``` -fx -q imma-artist.sparql -i imma-artists.xml -p "artists/?artistNickname.jsonld" -f json +fx -q queries/imma-artist.sparql -i imma-artists.xml -p "artists/?artistNickname.jsonld" -f json ``` Extract the list of artworks' Web pages from the JSON-LD files of the artists. ``` -fx -q imma-artworks.sparql -l artists/ -o imma-artworks.xml -f xml +fx -q queries/imma-artworks.sparql -l artists/ -o imma-artworks.xml -f xml ``` Extract data from the artworks' Web pages and build one JSON-LD file each (create folder 'artworks' first). ``` -fx -q imma-artwork.sparql -i imma-artworks.xml -p "artworks/?artworkNickname.jsonld" -f json +fx -q queries/imma-artwork.sparql -i imma-artworks.xml -p "artworks/?artworkNickname.jsonld" -f json ``` Load into your favourite triple store. @@ -29,9 +29,10 @@ Load into your favourite triple store. Extract data from a specific artist Web page: ``` -fx -q imma-artist.sparql -v artistNickname=lambert-gene -v artistUrl=https://imma.ie/artists/gene-lambert/ -p "artists/?artistNickname.jsonld" -f json +fx -q queries/imma-artist.sparql -v artistNickname=lambert-gene -v artistUrl=https://imma.ie/artists/gene-lambert/ -p "artists/?artistNickname.jsonld" -f json ``` Extract data from a specific artwork Web page: ``` -fx -q imma-artwork.sparql -v artworkNickname=naturaleza-desde-la-ventana -v artworkUrl=https://imma.ie/collection/naturaleza-desde-la-ventana/ -p "artworks/?artworkNickname.jsonld" -f json +fx -q queries/imma-artwork.sparql -v artworkNickname=naturaleza-desde-la-ventana -v artworkUrl=https://imma.ie/collection/naturaleza-desde-la-ventana/ -p "artworks/?artworkNickname.jsonld" -f json +fx -q queries/imma-artwork.sparql -v artworkNickname=berry-dress -v artworkUrl=https://imma.ie/collection/berry-dress/ -p "artworks/?artworkNickname.jsonld" -f json ``` diff --git a/artworks/berry-dress.jsonld b/artworks/berry-dress.jsonld index cb4fabf0..6a780f0c 100644 --- a/artworks/berry-dress.jsonld +++ b/artworks/berry-dress.jsonld @@ -16,7 +16,7 @@ "caption" : "Alice Maher, Berry Dress, 1994, Rosehips, cotton, paint, sewing pins, 25 x 32 x 24 cm, Collection Irish Museum of Modern Art, Purchase, assisted by funding from Maire and Maurice Foley, 1995 ", "copyrightNotice" : "For copyright information, please contact the IMMA Collections team.", "maintainer" : "https://w3id.org/spice/institute/imma", - "url" : "https://imma.ie/wp-content/uploads/2021/07/3.jpg" + "url" : "https://imma.ie/wp-content/uploads/2022/01/3.jpg" } ], "@context" : { "copyrightNotice" : { From 38a0645e3c0f85c666ac9c113c77932d289593ed Mon Sep 17 00:00:00 2001 From: Enrico Daga Date: Wed, 30 Mar 2022 11:41:25 +0100 Subject: [PATCH 4/5] Update artwork --- ...tutions-republicaines-iv-checkpoint.jsonld | 71 +++++++++++++++++++ ...r-les-institutions-republicaines-iv.jsonld | 4 +- 2 files changed, 73 insertions(+), 2 deletions(-) create mode 100644 artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld diff --git a/artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld b/artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld new file mode 100644 index 00000000..77f8f223 --- /dev/null +++ b/artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld @@ -0,0 +1,71 @@ +{ + "@graph" : [ { + "@id" : "spice:artefact/fragmens-sur-les-institutions-republicaines-iv", + "@type" : "schema:CreativeWork", + "description" : "Shane Cullen is an Irish artist whose largely text-based work deals with political issues, often specifically with official documents and symbols. ‘Fragmens Sur Les Institutions Republicaines IV’ was made over a period of four years and consists of 96 large styrofoam panels, each carrying transcriptions of the secret messages smuggled out of the H-Blocks in the Maze Prison in Northern Ireland during the period of the 1981 hunger strike by Republican prisoners. The subject matter is controversial and subversive but presented in a highly disciplined fashion that suggests historical, sculptural monuments. Each painted word is straight-jacketed into a typeface, which mimics official government documents. The piece has been widely shown – both as a work in progress, in various contexts, not least at the Irish exhibition at the Venice Biennale in 1995; and as a completed installation. More recently the artist was commissioned to create an artwork on the subject of the Good Friday Agreement, signed in Belfast in 1998.", + "source" : "https://imma.ie/collection/fragmens-sur-les-institutions-republicaines-iv/", + "creditText" : "IMMA Collection: Purchase, 2000", + "image" : "spice:documentation/fragmens-sur-les-institutions-republicaines-iv", + "maintainer" : "https://w3id.org/spice/institute/imma", + "material" : "Painted text; acyrlic on 96 styrofoam panels", + "size" : "12 blocks of 8 panels, each block 251 x 480 x 6 cm", + "hasInventory" : "IMMA.846" + }, { + "@id" : "spice:documentation/fragmens-sur-les-institutions-republicaines-iv", + "@type" : "schema:ImageObject", + "caption" : "Shane Cullen, Fragmens sur les Institutions Républicaines IV, 1993, Painted text; acyrlic on 96 styrofoam panels, 12 blocks of 8 panels, each block 251 x 480 x 6 cm, Collection Irish Museum of Modern Art, Purchase, 2000 ", + "copyrightNotice" : "For copyright information, please contact the IMMA Collections team.", + "maintainer" : "https://w3id.org/spice/institute/imma", + "url" : "https://imma.ie/wp-content/uploads/2021/08/1750.jpg" + } ], + "@context" : { + "copyrightNotice" : { + "@id" : "http://schema.org/copyrightNotice" + }, + "caption" : { + "@id" : "http://schema.org/caption" + }, + "maintainer" : { + "@id" : "http://schema.org/maintainer", + "@type" : "@id" + }, + "url" : { + "@id" : "http://schema.org/url" + }, + "hasInventory" : { + "@id" : "https://w3id.org/arco/ontology/context-description/hasInventory" + }, + "creditText" : { + "@id" : "http://schema.org/creditText" + }, + "size" : { + "@id" : "http://schema.org/size" + }, + "material" : { + "@id" : "http://schema.org/material" + }, + "description" : { + "@id" : "http://purl.org/dc/elements/1.1/description" + }, + "image" : { + "@id" : "http://schema.org/image", + "@type" : "@id" + }, + "source" : { + "@id" : "http://purl.org/dc/elements/1.1/source" + }, + "schema" : "http://schema.org/", + "arco-core" : "https://w3id.org/arco/ontology/core/", + "dom" : "https://html.spec.whatwg.org/#", + "owl" : "http://www.w3.org/2002/07/owl#", + "spice" : "https://w3id.org/spice/imma/", + "rdfs" : "http://www.w3.org/2000/01/rdf-schema#", + "xhtml" : "http://www.w3.org/1999/xhtml#", + "arco" : "https://w3id.org/arco/ontology/arco/", + "fx" : "http://sparql.xyz/facade-x/ns/", + "rdf" : "http://www.w3.org/1999/02/22-rdf-syntax-ns#", + "arco-cd" : "https://w3id.org/arco/ontology/context-description/", + "foaf" : "http://xmlns.com/foaf/0.1/", + "dc" : "http://purl.org/dc/elements/1.1/" + } +} diff --git a/artworks/fragmens-sur-les-institutions-republicaines-iv.jsonld b/artworks/fragmens-sur-les-institutions-republicaines-iv.jsonld index 77f8f223..e8efde30 100644 --- a/artworks/fragmens-sur-les-institutions-republicaines-iv.jsonld +++ b/artworks/fragmens-sur-les-institutions-republicaines-iv.jsonld @@ -16,7 +16,7 @@ "caption" : "Shane Cullen, Fragmens sur les Institutions Républicaines IV, 1993, Painted text; acyrlic on 96 styrofoam panels, 12 blocks of 8 panels, each block 251 x 480 x 6 cm, Collection Irish Museum of Modern Art, Purchase, 2000 ", "copyrightNotice" : "For copyright information, please contact the IMMA Collections team.", "maintainer" : "https://w3id.org/spice/institute/imma", - "url" : "https://imma.ie/wp-content/uploads/2021/08/1750.jpg" + "url" : "https://imma.ie/wp-content/uploads/2021/11/1750.jpg" } ], "@context" : { "copyrightNotice" : { @@ -54,8 +54,8 @@ "source" : { "@id" : "http://purl.org/dc/elements/1.1/source" }, - "schema" : "http://schema.org/", "arco-core" : "https://w3id.org/arco/ontology/core/", + "schema" : "http://schema.org/", "dom" : "https://html.spec.whatwg.org/#", "owl" : "http://www.w3.org/2002/07/owl#", "spice" : "https://w3id.org/spice/imma/", From e3f6690032ce7e434857a87021284c73f433261f Mon Sep 17 00:00:00 2001 From: Enrico Daga Date: Wed, 30 Mar 2022 11:45:15 +0100 Subject: [PATCH 5/5] Removed file --- ...tutions-republicaines-iv-checkpoint.jsonld | 71 ------------------- 1 file changed, 71 deletions(-) delete mode 100644 artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld diff --git a/artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld b/artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld deleted file mode 100644 index 77f8f223..00000000 --- a/artworks/.ipynb_checkpoints/fragmens-sur-les-institutions-republicaines-iv-checkpoint.jsonld +++ /dev/null @@ -1,71 +0,0 @@ -{ - "@graph" : [ { - "@id" : "spice:artefact/fragmens-sur-les-institutions-republicaines-iv", - "@type" : "schema:CreativeWork", - "description" : "Shane Cullen is an Irish artist whose largely text-based work deals with political issues, often specifically with official documents and symbols. ‘Fragmens Sur Les Institutions Republicaines IV’ was made over a period of four years and consists of 96 large styrofoam panels, each carrying transcriptions of the secret messages smuggled out of the H-Blocks in the Maze Prison in Northern Ireland during the period of the 1981 hunger strike by Republican prisoners. The subject matter is controversial and subversive but presented in a highly disciplined fashion that suggests historical, sculptural monuments. Each painted word is straight-jacketed into a typeface, which mimics official government documents. The piece has been widely shown – both as a work in progress, in various contexts, not least at the Irish exhibition at the Venice Biennale in 1995; and as a completed installation. More recently the artist was commissioned to create an artwork on the subject of the Good Friday Agreement, signed in Belfast in 1998.", - "source" : "https://imma.ie/collection/fragmens-sur-les-institutions-republicaines-iv/", - "creditText" : "IMMA Collection: Purchase, 2000", - "image" : "spice:documentation/fragmens-sur-les-institutions-republicaines-iv", - "maintainer" : "https://w3id.org/spice/institute/imma", - "material" : "Painted text; acyrlic on 96 styrofoam panels", - "size" : "12 blocks of 8 panels, each block 251 x 480 x 6 cm", - "hasInventory" : "IMMA.846" - }, { - "@id" : "spice:documentation/fragmens-sur-les-institutions-republicaines-iv", - "@type" : "schema:ImageObject", - "caption" : "Shane Cullen, Fragmens sur les Institutions Républicaines IV, 1993, Painted text; acyrlic on 96 styrofoam panels, 12 blocks of 8 panels, each block 251 x 480 x 6 cm, Collection Irish Museum of Modern Art, Purchase, 2000 ", - "copyrightNotice" : "For copyright information, please contact the IMMA Collections team.", - "maintainer" : "https://w3id.org/spice/institute/imma", - "url" : "https://imma.ie/wp-content/uploads/2021/08/1750.jpg" - } ], - "@context" : { - "copyrightNotice" : { - "@id" : "http://schema.org/copyrightNotice" - }, - "caption" : { - "@id" : "http://schema.org/caption" - }, - "maintainer" : { - "@id" : "http://schema.org/maintainer", - "@type" : "@id" - }, - "url" : { - "@id" : "http://schema.org/url" - }, - "hasInventory" : { - "@id" : "https://w3id.org/arco/ontology/context-description/hasInventory" - }, - "creditText" : { - "@id" : "http://schema.org/creditText" - }, - "size" : { - "@id" : "http://schema.org/size" - }, - "material" : { - "@id" : "http://schema.org/material" - }, - "description" : { - "@id" : "http://purl.org/dc/elements/1.1/description" - }, - "image" : { - "@id" : "http://schema.org/image", - "@type" : "@id" - }, - "source" : { - "@id" : "http://purl.org/dc/elements/1.1/source" - }, - "schema" : "http://schema.org/", - "arco-core" : "https://w3id.org/arco/ontology/core/", - "dom" : "https://html.spec.whatwg.org/#", - "owl" : "http://www.w3.org/2002/07/owl#", - "spice" : "https://w3id.org/spice/imma/", - "rdfs" : "http://www.w3.org/2000/01/rdf-schema#", - "xhtml" : "http://www.w3.org/1999/xhtml#", - "arco" : "https://w3id.org/arco/ontology/arco/", - "fx" : "http://sparql.xyz/facade-x/ns/", - "rdf" : "http://www.w3.org/1999/02/22-rdf-syntax-ns#", - "arco-cd" : "https://w3id.org/arco/ontology/context-description/", - "foaf" : "http://xmlns.com/foaf/0.1/", - "dc" : "http://purl.org/dc/elements/1.1/" - } -}