Najko Jahn njahn82

## abstract_analytics.md

      
              2 files
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                njahn82
                / abstract_analytics.md
            
            
              Created
              March 27, 2024 10:19
            
              
                Abstract information in Crossref and OpenAlex
              
          
    Abstracts in Crossref

Get abstract counts per year and publisher

SELECT
cr_year,
publisher,
COUNT(DISTINCT doi) AS cr_articles,

  
## 03-manipulating-data.R
#' Manipulating, analyzing and exporting data with tidyverse
#' https://datacarpentry.org/R-ecology-lesson/03-dplyr.html

library(tidyverse)

#' dplyr
#' - the most common data manipulation tasks
#' - https://github.com/rstudio/cheatsheets/raw/master/data-transformation.pdf
#' tidyr
#' - reshape your data

## hoad_dash_beispiel.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                njahn82
                / hoad_dash_beispiel.md
            
            
              Created
              November 15, 2021 11:18
            
              
                hoad_dash_beispiel
              
          
    library(tidyverse)
library(bigrquery)
library(DBI)
Connection


## doi_check.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                njahn82
                / doi_check.md
            
            
              Created
              September 9, 2021 13:21
            
              
                doi check
              
          
    library(tidyverse)
#> Warning: package 'tibble' was built under R version 4.1.1
#> Warning: package 'readr' was built under R version 4.1.1
library(biblids) # install via GitHub https://github.com/subugoe/biblids

tt <- readr::read_csv("~/Downloads/DOIs.txt")
#> Rows: 40479 Columns: 1
#> ── Column specification ────────────────────────────────────────────────────────
#> Delimiter: ","

  
## mag_subject.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                njahn82
                / mag_subject.md
            
            
              Created
              July 27, 2021 07:52
            
              
                mag subjects
              
          
    library(tidyverse)
# raw subject table
subject_mag_raw <- readr::read_csv("data/NPL_DOI_FOS.csv",
  col_types =  cols(.default = "c"))
subject_mag_raw %>%
  # Represents https://academic.microsoft.com/paper/2518129109/
  filter(doi == "10.7717/peerj.2369") %>%
  # Only top level subjects
  filter(is.na(fos_1)) %>%

  
## esac.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                njahn82
                / esac.md
            
            
              Created
              March 30, 2021 14:16
            
              
                Fetch ESAC registry info
              
          
    library(rvest)
library(tidyverse)
library(janitor)
#> 
#> Attaching package: 'janitor'
#> The following objects are masked from 'package:stats':
#> 
#>     chisq.test, fisher.test
esac <-

  
## reprex.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                njahn82
                / reprex.md
            
            
              Created
              March 4, 2021 15:14
            
              
                reprex_doi_validation
              
          
    library(rcrossref)
library(purrr)

my_dois <-
  c(
    "skksks",
    "10.5281/zenodo.4032609",
    "10.1667/rr13708.1",
    "10.1016/s0021-9258(19)52311-0",

  
## open_apc.R
#' Get the most current Open APC snapshot
#'
#' Open APC shares several csv files via GitHub, which contain data about
#' institutional spending for open access articles.
#'
#'
#' @param open_apc_cols character vector representing Open APC collections.
#'   See `open_apc_collections()` for an overview.
#'
#' @importFrom dplyr filter `%>%` inner_join

## vanished_with_r.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                njahn82
                / vanished_with_r.md
            
            
              Created
              September 16, 2020 07:45
            
              
                vanished example
              
          
    # import csv file
tt <- read.delim("~/Downloads/vanished_v2.csv", sep = ";")
# table dimensions
dim(tt)
#> [1] 807  61
# empty rows at bottom like row 635
tt[635,]
#>     Source If.Identified.by.second.source Journal.Name ISSN E.ISSN URL
#> 635                                                                   

  
## ci_wos.R
library(tidyverse)
# Read the CSV export; the path is relative to the working directory.
my_df <- readr::read_csv("data/u4_13_17.csv")

# Keep only the rows whose CA column is missing.
no_group <- my_df %>%
  filter(is.na(CA))

# Reduce to the PY, UT and C1 columns and split C1 on the literal "; ["
# separator. strsplit() returns a list, so `adresses` becomes a list column
# with one character vector per row. The column name (spelling included) is
# kept as-is because the pipeline that follows refers to it.
tt <- no_group %>%
  select(PY, UT, C1) %>%
  mutate(adresses = strsplit(C1, "; \\["))
tt %>%
  unnest() %>%
  tidyr::separate(adresses, sep ="] ", c("authors", "address"), fill = "left") %>%
	#' Manipulating, analyzing and exporting data with tidyverse
	#' https://datacarpentry.org/R-ecology-lesson/03-dplyr.html

	library(tidyverse)

	#' dplyr
	#' - the most common data manipulation tasks
	#' - https://github.com/rstudio/cheatsheets/raw/master/data-transformation.pdf
	#' tidyr
	#' - reshape your data
	#' Get the most current Open APC snapshot
	#'
	#' Open APC shares several csv files via GitHub, which contain data about
	#' institutional spending for open access articles.
	#'
	#'
	#' @param open_apc_cols character vector representing Open APC collections.
	#' See `open_apc_collections()` for an overview.
	#'
	#' @importFrom dplyr filter `%>%` inner_join
	library(tidyverse)
	# Read the CSV export; the path is relative to the working directory.
	my_df <- readr::read_csv("data/u4_13_17.csv")

	# Keep only the rows whose CA column is missing.
	no_group <- my_df %>%
	  filter(is.na(CA))

	# Reduce to the PY, UT and C1 columns and split C1 on the literal "; ["
	# separator. strsplit() returns a list, so `adresses` becomes a list column
	# with one character vector per row. The column name (spelling included) is
	# kept as-is because the pipeline that follows refers to it.
	tt <- no_group %>%
	  select(PY, UT, C1) %>%
	  mutate(adresses = strsplit(C1, "; \\["))
	tt %>%
	unnest() %>%
	tidyr::separate(adresses, sep ="] ", c("authors", "address"), fill = "left") %>%