```r
rm(list = ls())

Sys.setenv(LANG = \en\)
library(xlsx)
library(readr)
library(readxl)
library(tidyverse)
library(stringr)
library(stringi)
library(gghighlight)
library(countrycode)
library(countries)
library(janitor)
library(sf)

library(janitor)
library(sf)
library(ggthemes)
library(here)
library(viridis)
library(ggplot2)
library(formatR)
library(gtools)
library(nnet) 
library(patchwork)
library(ggh4x)

# Packages for the regression. Move to different script.
#install.packages(\plm\) # a package of \panel data econometrics in R\ (by Croissant and Millo)
#install.packages(\lme4\) # this is the first multilevel (random effects) package we'll use
library(plm)
library(broom)
library(ggalluvial)

library(pals)

<!-- rnb-source-end -->

<!-- rnb-chunk-end -->


<!-- rnb-text-begin -->


# Load data ---------------------------------------------------------------

## Corpus.

<!-- rnb-text-end -->


<!-- rnb-chunk-begin -->


<!-- rnb-source-begin eyJkYXRhIjoiYGBgclxuYGBgclxuc2Nfc2NvcmVzIDwtIHJlYWRfY3N2KFxcLi4vYWdncmVnYXRlZF9kYXRhL3NjX3Njb3Jlcy5jc3ZcXCkgXG5cbnNjX3Njb3JlcyAlPiVcbiAgICBnZ3Bsb3QoKSArIFxuICAgIGdlb21fYm94cGxvdChhZXMoeCA9IG1pZ19qb3VybmFsLCB5ID0gc2NvcmUsIGNvbG9yID0gYXMuZmFjdG9yKG1pZ19qb3VybmFsKSkpICtcbiAgICB0aGVtZShheGlzLnRleHQueD1lbGVtZW50X2JsYW5rKCkpICtcbiAgICBmYWNldF93cmFwKHZhcnMoY29ycHVzX2Nfc2QxKSxcbiAgICAgICAgICAgICAgIGxhYmVsbGVyID0gbGFiZWxsZXIoY29ycHVzX2Nfc2QxID0gYyhcXFRSVUVcXCA9IFxcSW5jbHVkZWQgaW4gY29ycHVzOiBcXG4gPD0gMVNEIGF2ZXJhZ2Ugc2NvcmUgb2YgbWlncmF0aW9uIGpvdXJuYWxzXFwsIFxcRkFMU0VcXCA9IFxcTm90IGluY2x1ZGVkIGluIGNvcnB1czogXFxuID4gMVNEIGF2ZXJhZ2Ugc2NvcmUgb2YgbWlncmF0aW9uIGpvdXJuYWxzXFwpKSkgK1xuICBsYWJzKGNvbG9yID0gXFxKb3VybmFsIGNsYXNzaWZpY2F0aW9uXFwsXG4gICAgICAgICB4ID0gXFxcXCxcbiAgICAgICAgIHkgPSBcXE1pZ3JhdGlvbiByZWxhdGlvbiBzY29yZVxcKSArXG4gIHNjYWxlX2NvbG91cl9kaXNjcmV0ZShsYWJlbHMgPSBjKFxcT3RoZXIgam91cm5hbHNcXCwgXFxNaWdyYXRpb24gam91cm5hbHNcXCkpICtcbiAgdGhlbWVfbWluaW1hbCgpICtcbiAgdGhlbWUoYXhpcy50aXRsZS54PWVsZW1lbnRfYmxhbmsoKSxcbiAgICAgICAgYXhpcy50ZXh0Lng9ZWxlbWVudF9ibGFuaygpLFxuICAgICAgICBheGlzLnRpY2tzLng9ZWxlbWVudF9ibGFuaygpLFxuICAgICAgICBsZWdlbmQucG9zaXRpb24gPSBcXGJvdHRvbVxcKVxuXG5nZ3NhdmUoXFwuLi9vdXRwdXRfZmlndXJlcy9ib3hfc2NvcmVfbWlnX2pvdXJuYWxfc2QxLnBuZ1xcLCB3aWR0aCA9IDcsIGhlaWdodCA9IDcsIGRwaSA9IDUwMCwgbGltaXRzaXplID0gRiwgcGxvdCA9IGxhc3RfcGxvdCgpKVxuYGBgXG5gYGAifQ== -->

```r
```r
sc_scores <- read_csv(\../aggregated_data/sc_scores.csv\) 

sc_scores %>%
    ggplot() + 
    geom_boxplot(aes(x = mig_journal, y = score, color = as.factor(mig_journal))) +
    theme(axis.text.x=element_blank()) +
    facet_wrap(vars(corpus_c_sd1),
               labeller = labeller(corpus_c_sd1 = c(\TRUE\ = \Included in corpus: \n <= 1SD average score of migration journals\, \FALSE\ = \Not included in corpus: \n > 1SD average score of migration journals\))) +
  labs(color = \Journal classification\,
         x = \\,
         y = \Migration relation score\) +
  scale_colour_discrete(labels = c(\Other journals\, \Migration journals\)) +
  theme_minimal() +
  theme(axis.title.x=element_blank(),
        axis.text.x=element_blank(),
        axis.ticks.x=element_blank(),
        legend.position = \bottom\)

ggsave(\../output_figures/box_score_mig_journal_sd1.png\, width = 7, height = 7, dpi = 500, limitsize = F, plot = last_plot())

```

LS0tDQp0aXRsZTogIlIgTm90ZWJvb2siDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQpgYGB7cn0NCnJtKGxpc3QgPSBscygpKQ0KDQpTeXMuc2V0ZW52KExBTkcgPSAiZW4iKQ0KbGlicmFyeSh4bHN4KQ0KbGlicmFyeShyZWFkcikNCmxpYnJhcnkocmVhZHhsKQ0KbGlicmFyeSh0aWR5dmVyc2UpDQpsaWJyYXJ5KHN0cmluZ3IpDQpsaWJyYXJ5KHN0cmluZ2kpDQpsaWJyYXJ5KGdnaGlnaGxpZ2h0KQ0KbGlicmFyeShjb3VudHJ5Y29kZSkNCmxpYnJhcnkoY291bnRyaWVzKQ0KbGlicmFyeShqYW5pdG9yKQ0KbGlicmFyeShzZikNCg0KbGlicmFyeShqYW5pdG9yKQ0KbGlicmFyeShzZikNCmxpYnJhcnkoZ2d0aGVtZXMpDQpsaWJyYXJ5KGhlcmUpDQpsaWJyYXJ5KHZpcmlkaXMpDQpsaWJyYXJ5KGdncGxvdDIpDQpsaWJyYXJ5KGZvcm1hdFIpDQpsaWJyYXJ5KGd0b29scykNCmxpYnJhcnkobm5ldCkgDQpsaWJyYXJ5KHBhdGNod29yaykNCmxpYnJhcnkoZ2doNHgpDQoNCiMgUGFja2FnZXMgZm9yIHRoZSByZWdyZXNzaW9uLiBNb3ZlIHRvIGRpZmZlcmVudCBzY3JpcHQuDQojaW5zdGFsbC5wYWNrYWdlcygicGxtIikgIyBhIHBhY2thZ2Ugb2YgInBhbmVsIGRhdGEgZWNvbm9tZXRyaWNzIGluIFIiIChieSBDcm9pc3NhbnQgYW5kIE1pbGxvKQ0KI2luc3RhbGwucGFja2FnZXMoImxtZTQiKSAjIHRoaXMgaXMgdGhlIGZpcnN0IG11bHRpbGV2ZWwgKHJhbmRvbSBlZmZlY3RzKSBwYWNrYWdlIHdlJ2xsIHVzZQ0KbGlicmFyeShwbG0pDQpsaWJyYXJ5KGJyb29tKQ0KbGlicmFyeShnZ2FsbHV2aWFsKQ0KDQpsaWJyYXJ5KHBhbHMpDQpgYGANCg0KIyBMb2FkIGRhdGEgLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tDQoNCiMjIENvcnB1cy4NCmBgYHtyfQ0Kc2Nfc2NvcmVzIDwtIHJlYWRfY3N2KCIuLi9hZ2dyZWdhdGVkX2RhdGEvc2Nfc2NvcmVzLmNzdiIpIA0KDQpzY19zY29yZXMgJT4lDQogICAgZ2dwbG90KCkgKyANCiAgICBnZW9tX2JveHBsb3QoYWVzKHggPSBtaWdfam91cm5hbCwgeSA9IHNjb3JlLCBjb2xvciA9IGFzLmZhY3RvcihtaWdfam91cm5hbCkpKSArDQogICAgdGhlbWUoYXhpcy50ZXh0Lng9ZWxlbWVudF9ibGFuaygpKSArDQogICAgZmFjZXRfd3JhcCh2YXJzKGNvcnB1c19jX3NkMSksDQogICAgICAgICAgICAgICBsYWJlbGxlciA9IGxhYmVsbGVyKGNvcnB1c19jX3NkMSA9IGMoIlRSVUUiID0gIkluY2x1ZGVkIGluIGNvcnB1czogXG4gPD0gMVNEIGF2ZXJhZ2Ugc2NvcmUgb2YgbWlncmF0aW9uIGpvdXJuYWxzIiwgIkZBTFNFIiA9ICJOb3QgaW5jbHVkZWQgaW4gY29ycHVzOiBcbiA+IDFTRCBhdmVyYWdlIHNjb3JlIG9mIG1pZ3JhdGlvbiBqb3VybmFscyIpKSkgKw0KICBsYWJzKGNvbG9yID0gIkpvdXJuYWwgY2xhc3NpZmljYXRpb24iLA0KICAgICAgICAgeCA9ICIiLA0KICAgICAgICAgeSA9ICJNaWdyYXRpb24gcmVsYXRpb24gc2NvcmUiKSArDQogIHNjYWxlX2NvbG91cl9kaXNjcmV0ZShsYWJlbHMgPSBjKCJPdGhlciBqb3VybmFscyIsICJNaWdyYXRpb24gam91cm5hbHMiKSkgKw0KICB0aGVtZV9taW5pbWFsKCkgKw0KICB0aGVtZShheGlzLnRpdGxlLng9ZWxlbWVudF9ibGFuaygpLA0KICAgICAgICBheGlzLnRleHQueD1lbGVtZW50X2JsYW5rKCksDQogICAgICAgIGF4aXMudGlja3MueD1lbGVtZW50X2JsYW5rKCksDQogICAgICAgIGxlZ2VuZC5wb3NpdGlvbiA9ICJib3R0b20iKQ0KDQpnZ3NhdmUoIi4uL291dHB1dF9maWd1cmVzL2ZpZ3VyZV9zMS5wbmciLCB3aWR0aCA9IDcsIGhlaWdodCA9IDcsIGRwaSA9IDUwMCwgbGltaXRzaXplID0gRiwgcGxvdCA9IGxhc3RfcGxvdCgpKQ0KYGBgDQoNCg0KDQoNCg0KDQoNCg==