diff --git a/analysis.Rmd b/analysis.Rmd index 1fa2d11..3f0d04b 100644 --- a/analysis.Rmd +++ b/analysis.Rmd @@ -287,11 +287,15 @@ point_sizes <- oa_shares_inst_sector %>% filter(n_total >= 100) %>% mutate(point_shape = ifelse(inst_label =="", 1.5, 2)) %>% .$point_shape +point_color <- oa_shares_inst_sector %>% + filter(n_total >= 100) %>% + mutate(point_color = ifelse(inst_label =="", "#56b4e9", "#490206")) %>% + .$point_color oa_shares_inst_sector %>% filter(n_total >= 100) %>% left_join(oa_shares_inst_sector_stats, by = "sector") %>% ggplot(aes(x = n_total, y = oa_share, label = INST_NAME)) + - geom_point(color = "#56b4e9", alpha = .7, shape = point_shapes, size = point_sizes) + + geom_point(color = point_color, alpha = .7, shape = point_shapes, size = point_sizes) + scale_x_log10(labels = scales::number_format(big.mark = ","), expand = expansion(mult = c(0.05, 0.1))) + scale_y_continuous(labels = scales::percent_format(accuracy = 5L), @@ -676,13 +680,14 @@ oa_shares_sector <-pubs_cat %>% values_from = fig_val) %>% mutate(share_sec_cat = ifelse(oa_category == "not_oa", 1-share_sec_cat, share_sec_cat), oa_category = fct_recode(oa_category, all_oa = "not_oa")) %>% - rename(share = share_sec_cat) + rename(share = share_sec_cat) %>% + mutate(text_color = ifelse(share > .3, "black", "#cccccc")) ggplot(oa_shares_sector, aes(x = fct_rev(fct_recode(fct_relevel(fct_reorder(sec_abbr, n_sec), "all_sec"), all = "all_sec")), y = fct_rev(oa_category), size = share, fill = share))+ geom_point(shape = 21, color = "#666666") + - geom_text(aes(label = round(share*100)), color = "#cccccc", size = 4) + + geom_text(aes(label = round(share*100), colour = text_color), size = 4, show_guide = FALSE) + geom_vline(xintercept = 6.5, color = "black") + geom_hline(yintercept = 1.5, color = "black") + scale_size(name = "OA percentage", @@ -695,6 +700,7 @@ ggplot(oa_shares_sector, aes(x = fct_rev(fct_recode(fct_relevel(fct_reorder(sec_ guide = guide_colorbar(frame.colour = "#666666", barwidth = 17)) + labs(x = "Sector", y = "OA Category") + # coord_flip() + + scale_color_manual(values = c("black" = "black", "#cccccc" = "white")) + theme_minimal_grid() + theme(legend.position = "top", legend.justification = "right") + theme(legend.direction = "horizontal", legend.box = "vertical") + diff --git a/analysis.md b/analysis.md index eca2933..bc14fc7 100644 --- a/analysis.md +++ b/analysis.md @@ -30,7 +30,7 @@ following figure displays the number of publications associated with one of the German research institutions we considered and highlights they part that is freely accessible online according to Unpaywall over the considered time period from 2010 until 2018. The total number of -articles over the whole period is 871922 with an overall OA share of 44 +articles over the whole period is 871922 with an overall OA share of 45 %.
@@ -50,12 +50,12 @@ articles. As can be seen, the total number of articles, as well as the part that is OA increases constantly over time. The number of articles that are -not openly available, is quite stable with a slow increase from 54492 in -2010 to 56234 in 2013, and decreasing again continuously from that point -onwards to 52103 publications in 2018. Since the number of OA articles -increases continuously from 28975 publications in 2010 to 54976 in 2018, -the relative proportion of OA articles rises significantly from 34.71 % -in 2010 to 51.34 % in 2018. +not openly available, is quite stable with a slow increase from 52803 in +2010 to 54873 in 2013, and decreasing again continuously from that point +onwards to 51430 publications in 2018. Since the number of OA articles +increases continuously from 30664 publications in 2010 to 55649 in 2018, +the relative proportion of OA articles rises significantly from 36.74 % +in 2010 to 51.97 % in 2018. ### Differences between sectors @@ -151,8 +151,8 @@ different.
-Significance: HGF against all non-research oriented, MPG against all -non-research oriented, FhG against all others Significance groups: +Significance: HGF against all non-research oriented, MPS against all +non-research oriented, FhS against all others Significance groups: research against all others, practise against all others, mixed not well separated from universities (maybe sector\_cat classification should be inst\_cat, i.e. on the level of institutions - would have to be manually diff --git a/analysis_files/figure-gfm/unnamed-chunk-10-1.png b/analysis_files/figure-gfm/unnamed-chunk-10-1.png index d18c9da..b2af057 100644 Binary files a/analysis_files/figure-gfm/unnamed-chunk-10-1.png and b/analysis_files/figure-gfm/unnamed-chunk-10-1.png differ diff --git a/analysis_files/figure-gfm/unnamed-chunk-17-1.png b/analysis_files/figure-gfm/unnamed-chunk-17-1.png index cf00068..7c77a40 100644 Binary files a/analysis_files/figure-gfm/unnamed-chunk-17-1.png and b/analysis_files/figure-gfm/unnamed-chunk-17-1.png differ