The text2sdg package provides functions for detecting SDGs in text, as well as for analyzing and visualization the hits found in text. The following provides a brief overview of the contents of the package.
detect_sdg detects SDGs in text using up to five different
query systems: Aurora, Elsevier, SIRIS, SDSN, and OSDG
detect_any detects SDGs in text using self-specified queries
utilizing the lucene-style syntax of the
corpustools
package.
plot_sdg visualizes the relative frequency of SDG hits across
query systems.
crosstab_sdg calculates cross tables of correlations between
either the query systems or the different SDGs.
projects contain random selection of research project
descriptions from the P3 database of the Swiss National Science Foundation.
aurora_queries, elsevier_queries,
siris_queries, sdsn_queries, auckland_queries and
sdgo_queries contain a mapping of SDGs and search queries
as they are employed in the respective systems.
# \donttest{
# detect SDGs using default systems
hits <- detect_sdg_systems(projects)
#> Running Aurora
#> Running Elsevier
#> Running Auckland
#> Running SIRIS
#' # detect SDGs using all five systems
hits <- detect_sdg_systems(projects,
system = c("Aurora", "Elsevier", "SIRIS", "SDSN", "SDGO")
)
#> Running Aurora
#> Running Elsevier
#> Running SIRIS
#> Running SDSN
#> Running SDGO
# visualize SDG frequencies
plot_sdg(hits)
#> 2511 duplicate hits removed. Set remove_duplicates = FALSE to retain duplicates.
# correlations between systems
crosstab_sdg(hits)
#> Aurora Elsevier SDGO SDSN SIRIS
#> Aurora 1.0000000 0.2434814 0.1386527 0.1218384 0.3028867
#> Elsevier 0.2434814 1.0000000 0.2919052 0.2258820 0.2702591
#> SDGO 0.1386527 0.2919052 1.0000000 0.3531476 0.1854036
#> SDSN 0.1218384 0.2258820 0.3531476 1.0000000 0.1935117
#> SIRIS 0.3028867 0.2702591 0.1854036 0.1935117 1.0000000
# correlations between SDGs
crosstab_sdg(hits, compare = "sdgs")
#> SDG-01 SDG-02 SDG-03 SDG-04 SDG-05 SDG-06
#> SDG-01 1.00000000 0.47243260 0.05377124 0.05960021 0.11694397 0.17689403
#> SDG-02 0.47243260 1.00000000 0.08874120 0.06917626 0.06403653 0.17167897
#> SDG-03 0.05377124 0.08874120 1.00000000 0.22115676 0.17081657 0.04264144
#> SDG-04 0.05960021 0.06917626 0.22115676 1.00000000 0.13771788 0.07550215
#> SDG-05 0.11694397 0.06403653 0.17081657 0.13771788 1.00000000 0.10773742
#> SDG-06 0.17689403 0.17167897 0.04264144 0.07550215 0.10773742 1.00000000
#> SDG-07 0.07842569 0.12861946 0.01594629 0.09176819 0.05098589 0.19088388
#> SDG-08 0.15722789 0.16209480 0.22222210 0.17926297 0.09185875 0.16165248
#> SDG-09 0.32323357 0.29133072 0.17619482 0.14773401 0.14634302 0.18358260
#> SDG-10 0.17956575 0.15225795 0.34461688 0.26668702 0.20000820 0.10939990
#> SDG-11 0.20423511 0.22395873 0.22204222 0.20143305 0.15753089 0.32517901
#> SDG-12 0.23882648 0.27512454 0.09694438 0.05418890 0.06949188 0.29477153
#> SDG-13 0.05496570 0.07877807 -0.02848180 0.04285162 0.01425682 0.20697251
#> SDG-14 0.05442432 0.08850223 0.03394400 0.01954488 0.02335111 0.14939543
#> SDG-15 0.07469163 0.17837071 0.14007452 0.05016042 0.03132997 0.21482130
#> SDG-16 0.13650534 0.11018098 0.16579452 0.26168407 0.33141916 0.13499705
#> SDG-17 -0.01741154 0.01580426 0.25585998 0.24782207 0.04794814 0.04155092
#> SDG-07 SDG-08 SDG-09 SDG-10 SDG-11 SDG-12
#> SDG-01 0.078425692 0.15722789 0.32323357 0.17956575 0.2042351 0.23882648
#> SDG-02 0.128619459 0.16209480 0.29133072 0.15225795 0.2239587 0.27512454
#> SDG-03 0.015946287 0.22222210 0.17619482 0.34461688 0.2220422 0.09694438
#> SDG-04 0.091768192 0.17926297 0.14773401 0.26668702 0.2014330 0.05418890
#> SDG-05 0.050985889 0.09185875 0.14634302 0.20000820 0.1575309 0.06949188
#> SDG-06 0.190883884 0.16165248 0.18358260 0.10939990 0.3251790 0.29477153
#> SDG-07 1.000000000 0.12747932 0.28479413 0.10472055 0.2190218 0.27587686
#> SDG-08 0.127479323 1.00000000 0.35251130 0.33051644 0.2693716 0.13457737
#> SDG-09 0.284794133 0.35251130 1.00000000 0.31469590 0.3145663 0.30658118
#> SDG-10 0.104720552 0.33051644 0.31469590 1.00000000 0.2837277 0.14301861
#> SDG-11 0.219021802 0.26937161 0.31456628 0.28372772 1.0000000 0.31011192
#> SDG-12 0.275876855 0.13457737 0.30658118 0.14301861 0.3101119 1.00000000
#> SDG-13 0.397037368 0.06693026 0.15272320 0.03730426 0.1654065 0.12959628
#> SDG-14 0.154203297 0.08791454 0.09459597 0.08586034 0.1170959 0.09775298
#> SDG-15 0.134668279 0.17971335 0.21069413 0.13487097 0.1896257 0.19043761
#> SDG-16 0.038289774 0.22900007 0.17124607 0.24454931 0.2561869 0.08213455
#> SDG-17 -0.009755392 0.13735910 0.03884005 0.20570856 0.1757141 0.06846304
#> SDG-13 SDG-14 SDG-15 SDG-16 SDG-17
#> SDG-01 0.054965704 0.054424319 0.07469163 0.136505340 -0.017411542
#> SDG-02 0.078778070 0.088502232 0.17837071 0.110180978 0.015804265
#> SDG-03 -0.028481801 0.033943997 0.14007452 0.165794519 0.255859979
#> SDG-04 0.042851617 0.019544879 0.05016042 0.261684065 0.247822074
#> SDG-05 0.014256824 0.023351115 0.03132997 0.331419161 0.047948138
#> SDG-06 0.206972513 0.149395431 0.21482130 0.134997052 0.041550924
#> SDG-07 0.397037368 0.154203297 0.13466828 0.038289774 -0.009755392
#> SDG-08 0.066930264 0.087914542 0.17971335 0.229000069 0.137359096
#> SDG-09 0.152723205 0.094595973 0.21069413 0.171246067 0.038840047
#> SDG-10 0.037304257 0.085860337 0.13487097 0.244549312 0.205708557
#> SDG-11 0.165406506 0.117095907 0.18962575 0.256186926 0.175714122
#> SDG-12 0.129596280 0.097752977 0.19043761 0.082134545 0.068463040
#> SDG-13 1.000000000 0.292688371 0.26688113 0.008503651 -0.003516404
#> SDG-14 0.292688371 1.000000000 0.22901423 -0.006388333 0.010002345
#> SDG-15 0.266881126 0.229014229 1.00000000 0.069125302 0.111535430
#> SDG-16 0.008503651 -0.006388333 0.06912530 1.000000000 0.179953553
#> SDG-17 -0.003516404 0.010002345 0.11153543 0.179953553 1.000000000
# }