From 7e22ba7e38e2dd68612246d3c357936d6710224c Mon Sep 17 00:00:00 2001 From: giulia Date: Wed, 17 Jul 2024 13:08:30 +0200 Subject: [PATCH 1/9] Table Datasets --- src/pages/datasets-temp.astro | 344 +++++++++++++++++++++++++++++++--- 1 file changed, 322 insertions(+), 22 deletions(-) diff --git a/src/pages/datasets-temp.astro b/src/pages/datasets-temp.astro index 79c6f01..1c0b40b 100644 --- a/src/pages/datasets-temp.astro +++ b/src/pages/datasets-temp.astro @@ -32,6 +32,8 @@ import data from "@/assets/sti-survey.json";
+ + @@ -99,7 +101,7 @@ import data from "@/assets/sti-survey.json"; scope="row" colspan="2" class="p-3 min-w-40 font-medium whitespace-nowrap" - >WebTableStitching[112]WebTableStitching [112] @@ -285,7 +287,7 @@ import data from "@/assets/sti-survey.json"; scope="row" colspan="2" class="p-3 min-w-40 font-medium whitespace-nowrap" - >SOTAB[77]SOTAB [77] @@ -302,7 +304,7 @@ import data from "@/assets/sti-survey.json"; scope="row" colspan="2" class="p-3 min-w-40 font-medium whitespace-nowrap" - >Wikary[89]Wikary [89] @@ -319,7 +321,7 @@ import data from "@/assets/sti-survey.json"; scope="row" colspan="2" class="p-3 min-w-40 font-medium whitespace-nowrap" - >GitTables[55]GitTables [55] @@ -363,7 +365,7 @@ import data from "@/assets/sti-survey.json"; scope="row" colspan="2" class="p-3 min-w-40 font-medium whitespace-nowrap" - >TURL[37]TURL [37] @@ -407,7 +409,7 @@ import data from "@/assets/sti-survey.json"; scope="row" colspan="2" class="p-3 min-w-40 font-medium whitespace-nowrap" - >TSOTSACorpus[64]TSOTSACorpus [64] @@ -468,8 +470,6 @@ import data from "@/assets/sti-survey.json"; - - @@ -491,8 +491,6 @@ import data from "@/assets/sti-survey.json"; - - @@ -514,15 +512,14 @@ import data from "@/assets/sti-survey.json"; - - @@ -545,7 +542,19 @@ import data from "@/assets/sti-survey.json"; - + @@ -561,8 +570,6 @@ import data from "@/assets/sti-survey.json"; - - - - @@ -594,9 +599,304 @@ import data from "@/assets/sti-survey.json"; - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
50 @@ -214,7 +216,7 @@ import data from "@/assets/sti-survey.json"; scope="row" colspan="2" class="p-3 min-w-40 font-medium whitespace-nowrap" - >Taheriyan[129]Taheriyan [129] 29 MammoTab[87]MammoTab [87] 980K 5,6M 108K - 81,7K 22,5K 962K 11,5M 484K 2,8M 16K -14,8K 464K 6,7K
5,7K 407K 7,6K
1,7K 107K 2,7K
SemTab2020 985K 136K Wikidata[1, 11, ][1, + 11, + 13, + 23, + 27, + 30, + 59, + 69, + 71, + 99, + 118, + 134, + 143]
- 1,2M -DBpedia[37]
- 1,2M -DBpedia[37]
- 1,2M -DBpedia[37]
+ SemTab2021 + + R1 + 180
+ 802 + (1|8|4,46) +
+ 194K + (6|15,5K|1,08K) +
539667K56,5K +
+ Wikidata + DBpedia +
[2, 3, 9, + 12, + 58, + 100, + 121, + 142 + ]
+ R2 + 1,7K
+ 5,6K + (2|7|3,19) +
+ 29,3K + (5|58|17,73) +
2,1K47,4K3,8KWikidata
+ R3 + 7,2KK
+ 17,9K + (2|5|2,48) +
+ 58,9K + (5|21|9,18) +
7,2K58,9K10,7K
+ SemTab2022 + + R1 + 3,8K
+ 9,9K + (2|5|2,56) +
+ 22,4K + (4|8|5,69) +
2401,4K319Wikidata[4, + 24, + 13, + 29, + 57, + 84]
+ R2 HT + 5,1K
+ 13,3K + (2|5|2,56) +
+ 28,5K + (4|8|5,57) +
3981,9K348
+ R2 2T + 180802195K
+ 97 + 111 +
+ 81K + 177K +
-
+ Wikipedia + DBpedia +
+ R3 Biodiv + 501,2K12,9K431,5K-
+ R3 GitTables + 7,6K198K841K
+ 6,2K + 4,4K + 1K +
--
+ Wikidata + Schema.org + Schema.org +
+ SemTab2023 + + R1 + 10,4K
+ 26,1K + (2|4|2,51) +
+ 49,1K + (3|11|5,72) +
--- +
+ Wikidata + tfood + Schema.org +
-
+ R2 + ------ +
+ Schema.org + dbpedia +
-
From 330ccb5aac9e4ee479c57e62750869831d59d30c Mon Sep 17 00:00:00 2001 From: giulia Date: Wed, 17 Jul 2024 13:30:48 +0200 Subject: [PATCH 2/9] Link --- src/pages/datasets-temp.astro | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pages/datasets-temp.astro b/src/pages/datasets-temp.astro index 1c0b40b..f9779d0 100644 --- a/src/pages/datasets-temp.astro +++ b/src/pages/datasets-temp.astro @@ -518,7 +518,7 @@ import data from "@/assets/sti-survey.json"; SemTab2020 From 4f86b91c7667055d517e91af451ff9527fa2768e Mon Sep 17 00:00:00 2001 From: giulia Date: Wed, 17 Jul 2024 14:31:09 +0200 Subject: [PATCH 3/9] Datasets --- src/pages/datasets-temp.astro | 25 +++++++++++++------------ 1 file changed, 13 insertions(+), 12 deletions(-) diff --git a/src/pages/datasets-temp.astro b/src/pages/datasets-temp.astro index f9779d0..8dd4609 100644 --- a/src/pages/datasets-temp.astro +++ b/src/pages/datasets-temp.astro @@ -13,18 +13,6 @@ import data from "@/assets/sti-survey.json";
-
-

- Datasets infographic -

-
- -
-

@@ -901,6 +889,19 @@ import data from "@/assets/sti-survey.json";

+
+

+ Datasets infographic +

+
+ +
+
+ From 347b7b172a68592e87e2fc5009210b31298a4118 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Giulia=20Volont=C3=A9?= Date: Wed, 17 Jul 2024 14:57:48 +0200 Subject: [PATCH 4/9] table color fix --- src/pages/datasets-temp.astro | 911 ++++++++++++++++++++-------------- tailwind.config.mjs | 2 + 2 files changed, 541 insertions(+), 372 deletions(-) diff --git a/src/pages/datasets-temp.astro b/src/pages/datasets-temp.astro index 8dd4609..7902e5c 100644 --- a/src/pages/datasets-temp.astro +++ b/src/pages/datasets-temp.astro @@ -20,8 +20,6 @@ import data from "@/assets/sti-survey.json";
- - @@ -49,12 +47,15 @@ import data from "@/assets/sti-survey.json"; - + T2Dv2 [112]21, 22, 30, 37, 40, 43, 44 + , 48, 56, 69, 78, 84, 105, 113, + 144, 148] - + WebTableStitching [112] - + - + - + [21, 22, 30, 40, 44 + , 48, 69, 84, 149, 152] - + LimayeAll [149] @@ -148,12 +212,15 @@ import data from "@/assets/sti-survey.json"; - + Limaye200 [149] @@ -162,15 +229,23 @@ import data from "@/assets/sti-survey.json"; - + - + MusicBrainz [149] @@ -179,15 +254,23 @@ import data from "@/assets/sti-survey.json"; - + - + IMDB [149] @@ -196,15 +279,23 @@ import data from "@/assets/sti-survey.json"; - + - + Taheriyan [129] - + - + Tough Table (2T) [32] - + MammoTab [87] @@ -270,12 +370,14 @@ import data from "@/assets/sti-survey.json"; - + SOTAB [77] @@ -287,12 +389,15 @@ import data from "@/assets/sti-survey.json"; - + Wikary [89] @@ -304,12 +409,13 @@ import data from "@/assets/sti-survey.json"; - + GitTables [55] @@ -321,12 +427,15 @@ import data from "@/assets/sti-survey.json"; - + RedTab [119] - + TURL [37] @@ -362,15 +473,21 @@ import data from "@/assets/sti-survey.json"; - + - + BiodivTab [5] - + - + TSOTSACorpus [64] @@ -409,7 +530,7 @@ import data from "@/assets/sti-survey.json"; - + - - + + - + - + - - + + - + - - + + - + - - + + - + @@ -518,34 +666,43 @@ import data from "@/assets/sti-survey.json"; R1 - - + + - - + + - + - + - + - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
T2Dv2 [112] 234 @@ -74,22 +75,53 @@ import data from "@/assets/sti-survey.json"; 154 DBpedia - [21, 22, 30, 37, 40, 43, 44 - , 48, 56, 69, 78, 84, 105, 113, - 144, 148]
WebTableStitching [112] 50 @@ -108,10 +140,15 @@ import data from "@/assets/sti-survey.json"; 400 6 DBpedia [112] + [112] +
143K 90 Wikipedia, Yago [21, 22, 30, 40, 44 - , 48, 69, 84, 149, 152]
LimayeAll [149] 6,3K 28,5K-
Limaye200 [149] 200 903- 361 Freebase[149][149]
MusicBrainz [149] 1,4K 9,8K93,3K 7K Freebase[149][149]
IMDB [149] 7,4K 7,4K92,3K - Freebase[149][149]
Taheriyan [129] 29 - - Schema.org[129][129]
Tough Table (2T) [32] 180 -
MammoTab [87] 980K 5,6M-
SOTAB [77] 108K --
Wikary [89] 81,7K 22,5K-
GitTables [55] 962K 11,5M-
RedTab [119] 9K -
TURL [37] 484K 2,8M1,2M - DBpedia[37][37]
BiodivTab [5] 50 1,2K - Wikidata[5][5]
TSOTSACorpus [64] 16K --
64
- 320 - (3|14|5,05) -
- 9K - (7|586|143) -
+ 320 + (3|14|5,05) +
+ 9K + (7|586|143) +
120 8,4K 116 DBpedia[20, 28, 91, 97, 122, 133 ][20, 28, 91, 97, 122, 133 ]
11,9K
- 59,6K - (1|51|5,55) -
- 29,8K - (1|1,5K|27,06) -
+ 59,6K + (1|51|5,55) +
+ 29,8K + (1|1,5K|27,06) +
14,8K 464K 6,7K
2,1K
- 10,8K - (4|8|4,51) -
- 153K - (6|207|71,69) -
+ 10,8K + (4|8|4,51) +
+ 153K + (6|207|71,69) +
5,7K 407K 7,6K
817
- 3,3K - (4|8|4,36) -
- 51,4K - (6|198|63,73) -
+ 3,3K + (4|8|4,36) +
+ 51,4K + (6|198|63,73) +
1,7K 107K 2,7K
SemTab2020 34,3K
- 170K - (4|8|4,96) -
- 249K - (5|16|8,7) -
+ 170K + (4|8|4,96) +
+ 249K + (5|16|8,7) +
136K 985K 136KWikidata[1, - 11, - 13, - 23, - 27, - 30, - 59, - 69, - 71, - 99, - 118, - 134, - 143]Wikidata[1, + 11, + 13, + 23, + 27, + 30, + 59, + 69, + 71, + 99, + 118, + 134, + 143]
1,2M -
-
-
+ R2 + 1,7K
+ 5,6K + (2|7|3,19) +
+ 29,3K + (5|58|17,73) +
2,1K47,4K3,8KWikidata
+ R3 + 7,2KK
+ 17,9K + (2|5|2,48) +
+ 58,9K + (5|21|9,18) +
7,2K58,9K10,7K
+ SemTab2022 + + R1 + 3,8K
+ 9,9K + (2|5|2,56) +
+ 22,4K + (4|8|5,69) +
2401,4K319Wikidata[4, + 24, + 13, + 29, + 57, + 84]
+ R2 HT + 5,1K
+ 13,3K + (2|5|2,56) +
+ 28,5K + (4|8|5,57) +
3981,9K348
+ R2 2T + 180802195K
+ 97 + 111 +
+ 81K + 177K +
-
+ Wikipedia + DBpedia +
+ +
+ R3 Biodiv + 501,2K12,9K431,5K-
- R2 - 1,7K
- 5,6K - (2|7|3,19) -
- 29,3K - (5|58|17,73) -
2,1K47,4K3,8KWikidata
- R3 - 7,2KK
- 17,9K - (2|5|2,48) -
- 58,9K - (5|21|9,18) -
7,2K58,9K10,7K
- SemTab2022 - - R1 - 3,8K
- 9,9K - (2|5|2,56) -
- 22,4K - (4|8|5,69) -
2401,4K319Wikidata[4, - 24, - 13, - 29, - 57, - 84]
- R2 HT - 5,1K
- 13,3K - (2|5|2,56) -
- 28,5K - (4|8|5,57) -
3981,9K348
- R2 2T - 180802195K
- 97 - 111 -
- 81K - 177K -
-
- Wikipedia - DBpedia -
- R3 Biodiv - 501,2K12,9K431,5K-
- R3 GitTables - 7,6K198K841K
- 6,2K - 4,4K - 1K -
--
- Wikidata - Schema.org - Schema.org -
- SemTab2023 - - R1 - 10,4K
- 26,1K - (2|4|2,51) -
- 49,1K - (3|11|5,72) -
--- -
- Wikidata - tfood - Schema.org -
-
- R2 - ------ -
- Schema.org - dbpedia -
-
+ R3 GitTables + 7,6K198K841K
+ 6,2K + 4,4K + 1K +
--
+ Wikidata + Schema.org + Schema.org +
+ SemTab2023 + + R1 + 10,4K
+ 26,1K + (2|4|2,51) +
+ 49,1K + (3|11|5,72) +
--- +
+ Wikidata + tfood + Schema.org +
-
+ R2 + ------ +
+ Schema.org + dbpedia +
-
-
-
-

- Datasets infographic -

-
- +
+

+ Datasets infographic +

+
+ +
- diff --git a/tailwind.config.mjs b/tailwind.config.mjs index c80ff1c..9208f29 100644 --- a/tailwind.config.mjs +++ b/tailwind.config.mjs @@ -44,8 +44,10 @@ export default { }, cardBackground: "#0C0C2F", sectionBackground: "#0C0C2F", + tableTop: "#38384C", tableBottom: "#1E1A26", + tableDark: "#19121C", tableAlt: "#282332", tableText: "#A5A0B5", iconBackground: { From fb45bf820ac73e378a58c0913d261f59eda0f3aa Mon Sep 17 00:00:00 2001 From: giulia Date: Wed, 17 Jul 2024 15:30:53 +0200 Subject: [PATCH 5/9] tools layout --- src/components/Header.astro | 1 + src/pages/tools.astro | 81 +++++++++++++++++++++++++++++++++++++ 2 files changed, 82 insertions(+) create mode 100644 src/pages/tools.astro diff --git a/src/components/Header.astro b/src/components/Header.astro index 7f87572..73df540 100644 --- a/src/components/Header.astro +++ b/src/components/Header.astro @@ -40,6 +40,7 @@ import MenuItem from "@components/MenuItem.astro"; +
diff --git a/src/pages/tools.astro b/src/pages/tools.astro new file mode 100644 index 0000000..bbf97b3 --- /dev/null +++ b/src/pages/tools.astro @@ -0,0 +1,81 @@ +--- +import Layout from "@/layouts/Layout.astro"; +import Section from "@components/Section.astro"; +--- + + +
+
+

Tools

+

In this page you will find the tools

+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Functionalities Karma TableMminer+ Magic MTab MantisTable STAN OpenRefine Trifacta Odalic DataGraft Dagobah SemTUI
Semtab2019 R4 0.983 - 0.832
Semtab2020 R4 0.907 0.993 0.997
Semtab2020 2T 0.907 0.728 -
Semtab2021 R3 0.968 0.984 0.993
MammoTab 22 0.853 0.659 -
+
+
+
+ From 5553be986799e9fc95877881b0be88e70312c51f Mon Sep 17 00:00:00 2001 From: giulia Date: Wed, 17 Jul 2024 18:06:28 +0200 Subject: [PATCH 6/9] fixes tools and dataset --- src/assets/check.svg | 1 + src/assets/x.svg | 1 + src/pages/datasets-temp.astro | 378 ++++++------ src/pages/datasets.astro | 1073 ++++++++++++++++++++++++++++++++- src/pages/tools.astro | 428 +++++++++++-- 5 files changed, 1638 insertions(+), 243 deletions(-) create mode 100644 src/assets/check.svg create mode 100644 src/assets/x.svg diff --git a/src/assets/check.svg b/src/assets/check.svg new file mode 100644 index 0000000..f5d8fb1 --- /dev/null +++ b/src/assets/check.svg @@ -0,0 +1 @@ + \ No newline at end of file diff --git a/src/assets/x.svg b/src/assets/x.svg new file mode 100644 index 0000000..9a44d00 --- /dev/null +++ b/src/assets/x.svg @@ -0,0 +1 @@ + \ No newline at end of file diff --git a/src/pages/datasets-temp.astro b/src/pages/datasets-temp.astro index 7902e5c..5155541 100644 --- a/src/pages/datasets-temp.astro +++ b/src/pages/datasets-temp.astro @@ -24,8 +24,8 @@ import data from "@/assets/sti-survey.json"; GS - Tables - + Tables +
cols (min|max|x) @@ -37,9 +37,9 @@ import data from "@/assets/sti-survey.json"; (min|max|x)
- Classes - Entities - Pred. + Classes + Entities + Pred. KG Used for validation by @@ -57,7 +57,7 @@ import data from "@/assets/sti-survey.json"; >112] - 234 + 234
1,2K @@ -70,9 +70,9 @@ import data from "@/assets/sti-survey.json"; (1|5K|84,55)
- 39 - - - 154 + 39 + - + 154 DBpedia [112] - 50 + 50
300 @@ -136,9 +136,9 @@ import data from "@/assets/sti-survey.json"; (3|83|14,84)
- 9 - 400 - 6 + 9 + 400 + 6 DBpedia [Limaye [82] - 6,5K - - - - - 747 - 143K - 90 + 6,5K + - + - + 747 + 143K + 90 Wikipedia, Yago [149] - 6,3K - 28,5K - 136K - - - 227K - - + 6,3K + 28,5K + 136K + - + 227K + - Freebase - - + - @@ -222,12 +222,12 @@ import data from "@/assets/sti-survey.json"; >149] - 200 - 903 - 4,1K - 615 - - - 361 + 200 + 903 + 4,1K + 615 + - + 361 Freebase [149] - 1,4K - 9,8K - - - - - 93,3K - 7K - Freebase + 1,4K + 9,8K + - + - + 93,3K + 7K + Freebase [149] - 7,4K - 7,4K - - - - - 92,3K - - + 7,4K + 7,4K + - + - + 92,3K + - Freebase [129] - 29 + 29
2,5K @@ -310,9 +310,9 @@ import data from "@/assets/sti-survey.json"; (1|13,8K|937)
- - - - - - + - + - + - Schema.org [32] - 180 + 180
194K @@ -344,11 +344,11 @@ import data from "@/assets/sti-survey.json"; (6|15,5K|108K)
- 540 - 667K - 0 + 540 + 667K + 0 Wikidata, DBpedia - - + - @@ -360,14 +360,14 @@ import data from "@/assets/sti-survey.json"; >87] - 980K - 5,6M - 2,3M - 2M - 2,8M - - + 980K + 5,6M + 2,3M + 2M + 2,8M + - Wikidata - - + - @@ -379,14 +379,14 @@ import data from "@/assets/sti-survey.json"; >77] - 108K - - - - - 91 - - - 176 + 108K + - + - + 91 + - + 176 Schema.org - - + - @@ -399,14 +399,14 @@ import data from "@/assets/sti-survey.json"; >89] - 81,7K - 22,5K - 63,9K - - - 30,6K - 188 + 81,7K + 22,5K + 63,9K + - + 30,6K + 188 Wikidata - - + - @@ -417,14 +417,14 @@ import data from "@/assets/sti-survey.json"; >GitTables [55] - 962K - 11,5M - 13,6M - 2,4K - - - - + 962K + 11,5M + 13,6M + 2,4K + - + - Schema.org, DBpedia - - + - @@ -437,7 +437,7 @@ import data from "@/assets/sti-survey.json"; >119] - 9K + 9K
44,6K @@ -450,11 +450,11 @@ import data from "@/assets/sti-survey.json"; (1|353|17,09)
- 70 - - - 23 + 70 + - + 23 Music, Literature - - + - @@ -466,12 +466,12 @@ import data from "@/assets/sti-survey.json"; href="https://dl.acm.org/doi/10.1145/3542700.3542709">37] - 484K - 2,8M - 7,9M - - - 1,2M - - + 484K + 2,8M + 7,9M + - + 1,2M + - DBpedia [5] - 50 + 50
1,2K @@ -502,9 +502,9 @@ import data from "@/assets/sti-survey.json"; (26|4,9K|261)
- 84 - 1,2K - - + 84 + 1,2K + - Wikidata [5]64] - 16K - - - - - 200 - 60K - - + 16K + - + - + 200 + 60K + - Food Data - - + - @@ -544,7 +544,7 @@ import data from "@/assets/sti-survey.json"; > R1 - 64 + 64
320 @@ -557,9 +557,9 @@ import data from "@/assets/sti-survey.json"; (7|586|143)
- 120 - 8,4K - 116 + 120 + 8,4K + 116 DBpedia [ R2 - 11,9K + 11,9K
59,6K @@ -596,9 +596,9 @@ import data from "@/assets/sti-survey.json"; (1|1,5K|27,06)
- 14,8K - 464K - 6,7K + 14,8K + 464K + 6,7K @@ -608,7 +608,7 @@ import data from "@/assets/sti-survey.json"; > R3 - 2,1K + 2,1K
10,8K @@ -621,9 +621,9 @@ import data from "@/assets/sti-survey.json"; (6|207|71,69)
- 5,7K - 407K - 7,6K + 5,7K + 407K + 7,6K @@ -633,7 +633,7 @@ import data from "@/assets/sti-survey.json"; > R4 - 817 + 817
3,3K @@ -646,9 +646,9 @@ import data from "@/assets/sti-survey.json"; (6|198|63,73)
- 1,7K - 107K - 2,7K + 1,7K + 107K + 2,7K @@ -665,7 +665,7 @@ import data from "@/assets/sti-survey.json"; > R1 - 34,3K + 34,3K
170K @@ -678,9 +678,9 @@ import data from "@/assets/sti-survey.json"; (5|16|8,7)
- 136K - 985K - 136K + 136K + 985K + 136K Wikidata [
1, @@ -709,12 +709,12 @@ import data from "@/assets/sti-survey.json"; > R2 - 484K - 2,8M - 7,9M - - - 1,2M - - + 484K + 2,8M + 7,9M + - + 1,2M + - R3 - 484K - 2,8M - 7,9M - - - 1,2M - - + 484K + 2,8M + 7,9M + - + 1,2M + - @@ -738,12 +738,12 @@ import data from "@/assets/sti-survey.json"; > R4 - 484K - 2,8M - 7,9M - - - 1,2M - - + 484K + 2,8M + 7,9M + - + 1,2M + - @@ -760,7 +760,7 @@ import data from "@/assets/sti-survey.json"; > R1 - 180 + 180
802 @@ -773,9 +773,9 @@ import data from "@/assets/sti-survey.json"; (6|15,5K|1,08K)
- 539 - 667K - 56,5K + 539 + 667K + 56,5K
Wikidata @@ -805,7 +805,7 @@ import data from "@/assets/sti-survey.json"; > R2 - 1,7K + 1,7K
5,6K @@ -818,9 +818,9 @@ import data from "@/assets/sti-survey.json"; (5|58|17,73)
- 2,1K - 47,4K - 3,8K + 2,1K + 47,4K + 3,8K Wikidata @@ -832,7 +832,7 @@ import data from "@/assets/sti-survey.json"; > R3 - 7,2KK + 7,2KK
17,9K @@ -845,9 +845,9 @@ import data from "@/assets/sti-survey.json"; (5|21|9,18)
- 7,2K - 58,9K - 10,7K + 7,2K + 58,9K + 10,7K @@ -864,7 +864,7 @@ import data from "@/assets/sti-survey.json"; > R1 - 3,8K + 3,8K
9,9K @@ -877,9 +877,9 @@ import data from "@/assets/sti-survey.json"; (4|8|5,69)
- 240 - 1,4K - 319 + 240 + 1,4K + 319 Wikidata [4, @@ -900,7 +900,7 @@ import data from "@/assets/sti-survey.json"; > R2 HT - 5,1K + 5,1K
13,3K @@ -913,9 +913,9 @@ import data from "@/assets/sti-survey.json"; (4|8|5,57)
- 398 - 1,9K - 348 + 398 + 1,9K + 348 @@ -925,9 +925,9 @@ import data from "@/assets/sti-survey.json"; > R2 2T - 180 - 802 - 195K + 180 + 802 + 195K
97 @@ -940,7 +940,7 @@ import data from "@/assets/sti-survey.json"; 177K
- - + -
Wikipedia @@ -954,12 +954,12 @@ import data from "@/assets/sti-survey.json"; > R3 Biodiv - 50 - 1,2K - 12,9K - 43 - 1,5K - - + 50 + 1,2K + 12,9K + 43 + 1,5K + - @@ -969,9 +969,9 @@ import data from "@/assets/sti-survey.json"; > R3 GitTables - 7,6K - 198K - 841K + 7,6K + 198K + 841K
6,2K @@ -979,8 +979,8 @@ import data from "@/assets/sti-survey.json"; 1K
- - - - + - + -
Wikidata @@ -1004,7 +1004,7 @@ import data from "@/assets/sti-survey.json"; > R1 - 10,4K + 10,4K
26,1K @@ -1017,9 +1017,9 @@ import data from "@/assets/sti-survey.json"; (3|11|5,72)
- - - - - - + - + - + -
Wikidata @@ -1027,7 +1027,7 @@ import data from "@/assets/sti-survey.json"; Schema.org
- - + - @@ -1037,19 +1037,19 @@ import data from "@/assets/sti-survey.json"; > R2 - - - - - - - - - - - - + - + - + - + - + - + -
Schema.org dbpedia
- - + - diff --git a/src/pages/datasets.astro b/src/pages/datasets.astro index 2466999..5155541 100644 --- a/src/pages/datasets.astro +++ b/src/pages/datasets.astro @@ -6,26 +6,1069 @@ import StiTable from "@components/sti-table"; import statistics from "@/assets/statistics.json"; const { approaches } = statistics; + +import data from "@/assets/sti-survey.json"; --- - +
-
-

- Datasets -

- Cooming soon +

+ Datasets +

+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
GS Tables +
+ cols + (min|max|x) +
+
+
+ rows + (min|max|x) +
+
Classes Entities Pred. KG + Used for validation by +
T2Dv2 [112] 234 +
+ 1,2K + (1|30|4,52) +
+
+
+ 2,8K + (1|5K|84,55) +
+
39 - 154 DBpedia + [21, 22, 30, 37, 40, 43, 44 + , 48, 56, 69, 78, 84, 105, 113, + 144, 148]
WebTableStitching [112] 50 +
+ 300 + (6|6|6) +
+
+
+ 717 + (3|83|14,84) +
+
9 400 6 DBpedia + [112] +
Limaye [82]6,5K- - 747 143K 90 Wikipedia, Yago + [21, 22, 30, 40, 44 + , 48, 69, 84, 149, 152]
LimayeAll [149]6,3K28,5K136K-227K- Freebase-
Limaye200 [149]2009034,1K615-361 Freebase[149]
MusicBrainz [149]1,4K9,8K--93,3K7K Freebase[149]
IMDB [149]7,4K7,4K--92,3K-Freebase[149]
Taheriyan [129]29
+ 2,5K + (3|71,3K|529K) +
+ 16K + (1|13,8K|937) +
---Schema.org[129]
Tough Table (2T) [32]180
+ 194K + (1|8|4,46) +
+ 802 + (6|15,5K|108K) +
540667K0Wikidata, DBpedia-
MammoTab [87]980K5,6M2,3M2M2,8M-Wikidata-
SOTAB [77]108K--91-176Schema.org-
Wikary [89]81,7K22,5K63,9K-30,6K188Wikidata-
GitTables [55]962K11,5M13,6M2,4K--Schema.org, DBpedia-
RedTab [119]9K
+ 44,6K + (1|11|4,86) +
+ 148K + (1|353|17,09) +
70-23Music, Literature-
TURL [37]484K2,8M7,9M-1,2M-DBpedia[37]
BiodivTab [5]50
+ 1,2K + (1|43|23,96) +
+ 12,9K + (26|4,9K|261) +
841,2K-Wikidata[5]
TSOTSACorpus [64]16K--20060K-Food Data-
+ SemTab2019 + + R1 + 64
+ 320 + (3|14|5,05) +
+ 9K + (7|586|143) +
1208,4K116DBpedia[20, 28, 91, 97, 122, 133 ]
+ R2 + 11,9K
+ 59,6K + (1|51|5,55) +
+ 29,8K + (1|1,5K|27,06) +
14,8K464K6,7K
+ R3 + 2,1K
+ 10,8K + (4|8|4,51) +
+ 153K + (6|207|71,69) +
5,7K407K7,6K
+ R4 + 817
+ 3,3K + (4|8|4,36) +
+ 51,4K + (6|198|63,73) +
1,7K107K2,7K
+ SemTab2020 + + R1 + 34,3K
+ 170K + (4|8|4,96) +
+ 249K + (5|16|8,7) +
136K985K136KWikidata[1, + 11, + 13, + 23, + 27, + 30, + 59, + 69, + 71, + 99, + 118, + 134, + 143]
+ R2 + 484K2,8M7,9M-1,2M-
+ R3 + 484K2,8M7,9M-1,2M-
+ R4 + 484K2,8M7,9M-1,2M-
+ SemTab2021 + + R1 + 180
+ 802 + (1|8|4,46) +
+ 194K + (6|15,5K|1,08K) +
539667K56,5K +
+ Wikidata + DBpedia +
[2, 3, 9, + 12, + 58, + 100, + 121, + 142 + ]
+ R2 + 1,7K
+ 5,6K + (2|7|3,19) +
+ 29,3K + (5|58|17,73) +
2,1K47,4K3,8KWikidata
+ R3 + 7,2K
+ 17,9K + (2|5|2,48) +
+ 58,9K + (5|21|9,18) +
7,2K58,9K10,7K
+ SemTab2022 + + R1 + 3,8K
+ 9,9K + (2|5|2,56) +
+ 22,4K + (4|8|5,69) +
2401,4K319Wikidata[4, + 24, + 13, + 29, + 57, + 84]
+ R2 HT + 5,1K
+ 13,3K + (2|5|2,56) +
+ 28,5K + (4|8|5,57) +
3981,9K348
+ R2 2T + 180802195K
+ 97 + 111 +
+ 81K + 177K +
-
+ Wikipedia + DBpedia +
+ +
+ R3 Biodiv + 501,2K12,9K431,5K-
+ R3 GitTables + 7,6K198K841K
+ 6,2K + 4,4K + 1K +
--
+ Wikidata + Schema.org + Schema.org +
+ SemTab2023 + + R1 + 10,4K
+ 26,1K + (2|4|2,51) +
+ 49,1K + (3|11|5,72) +
--- +
+ Wikidata + tfood + Schema.org +
-
+ R2 + ------ +
+ Schema.org + dbpedia +
-
+
+
+

+ Datasets infographic +

+
+ +
+
-

- In this page, a comparative analysis of all STI datasets will be - included. -

diff --git a/src/pages/tools.astro b/src/pages/tools.astro index bbf97b3..ccfea22 100644 --- a/src/pages/tools.astro +++ b/src/pages/tools.astro @@ -1,6 +1,8 @@ --- import Layout from "@/layouts/Layout.astro"; import Section from "@components/Section.astro"; +import x from "@/assets/x.svg"; +import check from "@/assets/check.svg"; --- @@ -14,65 +16,413 @@ import Section from "@components/Section.astro"; - - - - - - - - - - - - - + + + + + + + + + + + + + Import of tables - - - - + + + + + + + + + + + + Import of tables via API - - - + + + + + + + + + + + + - + - - - + >Import of ontologies + + + + + + + + + + + + + - - - + >Definition of personalised ontologies + + + + + + + + + + + + + - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Functionalities Karma TableMminer+ Magic MTab MantisTable STAN OpenRefine Trifacta Odalic DataGraft Dagobah SemTUI Functionalities Karma TableMminer+ Magic MTab MantisTable STAN OpenRefine Trifacta Odalic DataGraft Dagobah SemTUI
Semtab2019 R4 0.983 - 0.832
Semtab2020 R4 0.907 0.993 0.997
Semtab2020 2T 0.907 0.728 -
Semtab2021 R3 0.968 0.984 0.993
MammoTab 22 0.853 0.659 - Semi-automatic annotation/HITL
Annotation suggestions
Auto-complete support
Subject column detection
CEA
CTA
CPA (NE columns)
CPA (LIT columns)
Table manipulation
Automatic table extension
Visualisation of annotations
Auto save
Export mapping
Export RDF triplets
Open Source
From b8bc05404fabdb5f6865622c9148735cdd0cec91 Mon Sep 17 00:00:00 2001 From: giulia Date: Wed, 17 Jul 2024 18:07:45 +0200 Subject: [PATCH 7/9] copy --- src/pages/tools.astro | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pages/tools.astro b/src/pages/tools.astro index ccfea22..e1fa21c 100644 --- a/src/pages/tools.astro +++ b/src/pages/tools.astro @@ -11,7 +11,7 @@ import check from "@/assets/check.svg";

Tools

-

In this page you will find the tools

+

In this page you will find a table containing the functionalities associated with the presented tools

From 65210282879673fc7023017f0b2ca40648342f2a Mon Sep 17 00:00:00 2001 From: Marco Date: Thu, 18 Jul 2024 12:35:30 +0200 Subject: [PATCH 8/9] Uodate dataset page --- src/pages/tools.astro | 848 ++++++++++++++++++++++-------------------- 1 file changed, 453 insertions(+), 395 deletions(-) diff --git a/src/pages/tools.astro b/src/pages/tools.astro index e1fa21c..a86fc2b 100644 --- a/src/pages/tools.astro +++ b/src/pages/tools.astro @@ -6,426 +6,484 @@ import check from "@/assets/check.svg"; --- -
-
-

+
+

Tools

-

In this page you will find a table containing the functionalities associated with the presented tools

-
-

- - - - - - - - - - - - - - - - - - - - - + Tools + +

+ On this page you will find a table containing the functionalities + offered by various STI tools

+
+
Functionalities Karma TableMminer+ Magic MTab MantisTable STAN OpenRefine Trifacta Odalic DataGraft Dagobah SemTUI
Import of tables
+ + + + + + + - - - - - - - - - - - - - - + - - - - - - - - - - - - + MantisTable + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - + - - - - - - - - - - - - - + >Import of ontologies + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - + + + + + + + + + + + + + + - - - - - - - - - - - - - - + + + + + + + + + + + + + + - - - - - - - - - - - - - - + + + + + + + + + + + + + + - - - - - - - - - - - - - + >Subject column detection + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + - -
+ Functionalities + Karma + + TableMiner+ + + + + Magic + + + + MTab -
Import of tables via API + -
+ STAN + + + OpenRefine + + + Trifacta + + + + Odalic + + + DataGraft + + + DAGOBAH UI + + + + SemTUI + +
Import of ontologies
Import of tables
Definition of personalised ontologies
Import of tables via API
Semi-automatic annotation/HITL
Annotation suggestions
Definition of personalised ontologies
Auto-complete support
Semi-automatic annotation/HITL
Subject column detection
Annotation suggestions
CEA
Auto-complete support
CTA
CPA (NE columns)
CEA
CPA (LIT columns)
CTA
Table manipulation
CPA (NE columns)
Automatic table extension
CPA (LIT columns)
Visualisation of annotations
Table manipulation
Auto save
Automatic table extension
Export mapping
Visualisation of annotations
Export RDF triplets
Auto save
Open Source
Export mapping
-
- - + + Export RDF triplets + + + + + + + + + + + + + + + Open Source + + + + + + + + + + + + + + + +
+ + + From 133de2f417ab37cb67f866b77b5121526d982f2d Mon Sep 17 00:00:00 2001 From: Marco Date: Thu, 18 Jul 2024 14:56:44 +0200 Subject: [PATCH 9/9] change title --- src/pages/index.astro | 162 ++++++++++++++++++++++-------------------- 1 file changed, 83 insertions(+), 79 deletions(-) diff --git a/src/pages/index.astro b/src/pages/index.astro index 6a4fdfd..081238d 100644 --- a/src/pages/index.astro +++ b/src/pages/index.astro @@ -22,91 +22,95 @@ import HorizontalTimeline from "@components/HorizontalTimeline.astro"; What's Semantic Table Interpretation?

- Semantic Table Interpretation, as defined by the the SemTab challenge, involves annotating relational - tables with information from a Knowledge Graph (KG). This process - includes associating each column in a table with one or more KG types, - known as Column Type Annotation (CTA). Additionally, Cell Entity - Annotation (CEA) is applied to annotate each cell in named entity columns - with a KG entity or mark it as Not In Lexicon (NIL) if it does not exist in the KG. - Columns Property Annotation (CPA) involves annotating pairs of columns - with a KG property. The result of this annotation process is a - table enriched with semantic information -

- -
+ Semantic Table Interpretation, as defined by the SemTab challenge, involves annotating relational tables with information from a + Knowledge Graph (KG). This process includes associating each column in a + table with one or more KG types, known as Column Type Annotation (CTA). + Additionally, Cell Entity Annotation (CEA) is applied to annotate each + cell in named entity columns with a KG entity or mark it as Not In + Lexicon (NIL) if it does not exist in the KG. Columns Property + Annotation (CPA) involves annotating pairs of columns with a KG + property. The result of this annotation process is a table enriched with + semantic information

+ +
+

+ TUTSTI @ISWC2024 +

+

+ Discover the comprehensive world of Semantic Table Interpretation + (STI) in this tutorial, which covers both theoretical and practical + aspects, and trace the evolution of STI from heuristic-based methods + to machine learning (ML) techniques and the latest large language + model (LLM) innovations. By examining the unique characteristics, + advantages, and limitations of each approach you will understand + their optimal contexts of use +

+
+ + +
+
+

+ +

- TUTSTI @ISWC2024 + Our Approaches, Datasets, Tools and UIs

-

- Discover the comprehensive world of Semantic Table Interpretation - (STI) in this tutorial, which covers both theoretical and practical - aspects, and trace the evolution of STI from heuristic-based methods - to machine learning (ML) techniques and the latest large language - model (LLM) innovations. By examining the unique characteristics, - advantages, and limitations of each approach you will understand their - optimal contexts of use -

-
- - -
-
-
- -
-

- Our Approaches, Dataset, Tools and UI -

- -
+ + -
-

- Our Datasets -

-
-
- table illustration -
-
-

Mammotab

-

- MammoTab is a unique dataset consisting of 1 million Wikipedia - tables, extracted from over 20 million Wikipedia pages, and - annotated using Wikidata. This dataset fills a gap in the current - state-of-the-art resources, making it an excellent tool for testing - and training Semantic Table Interpretation approaches. MammoTab is - specifically designed to address several key challenges, including - disambiguation, homonymy, and NIL-mentions, providing a - comprehensive resource for advancing STI research and applications -

-

- +
+

+ Our Datasets +

+
+
+ table illustration +
+
+

Mammotab

+

+ MammoTab is a unique dataset consisting of 1 million Wikipedia + tables, extracted from over 20 million Wikipedia pages, and + annotated using Wikidata. This dataset fills a gap in the current + state-of-the-art resources, making it an excellent tool for + testing and training Semantic Table Interpretation approaches. + MammoTab is specifically designed to address several key + challenges, including disambiguation, homonymy, and NIL-mentions, + providing a comprehensive resource for advancing STI research and + applications +

+

+ +
-
+