Name: Rerun update with knitr (2022-09-03 for preprints posted up until 202… · nicholasmfraser/covid19_preprints@c0b1dde · GitHub
Rating: 4.8 (2757 reviews)
nicholasmfraser
diff --git a/‎covid19_preprints.md
+8-3 b/‎covid19_preprints.md
+8-3
diff --git a/‎covid19_preprints_files/figure-gfm/unnamed-chunk-20-1.png
-312 Bytes b/‎covid19_preprints_files/figure-gfm/unnamed-chunk-20-1.png
-312 Bytes
diff --git a/‎covid19_preprints_files/figure-gfm/unnamed-chunk-21-1.png
327 Bytes b/‎covid19_preprints_files/figure-gfm/unnamed-chunk-21-1.png
327 Bytes
diff --git a/‎covid19_preprints_files/figure-gfm/unnamed-chunk-22-1.png
-184 Bytes b/‎covid19_preprints_files/figure-gfm/unnamed-chunk-22-1.png
-184 Bytes
diff --git a/‎covid19_preprints_files/figure-gfm/unnamed-chunk-23-1.png
-193 Bytes b/‎covid19_preprints_files/figure-gfm/unnamed-chunk-23-1.png
-193 Bytes
diff --git a/‎covid19_preprints_files/figure-gfm/unnamed-chunk-24-1.png
-78 Bytes b/‎covid19_preprints_files/figure-gfm/unnamed-chunk-24-1.png
-78 Bytes
diff --git a/‎data/covid19_preprints.csv
+2-2 b/‎data/covid19_preprints.csv
+2-2
diff --git a/‎data/metadata.json
+1-1 b/‎data/metadata.json
+1-1
diff --git a/‎outputs/figures/covid19_preprints_day.png
-11.4 KB b/‎outputs/figures/covid19_preprints_day.png
-11.4 KB
diff --git a/‎outputs/figures/covid19_preprints_day_cumulative_by_month.png
-1.31 KB b/‎outputs/figures/covid19_preprints_day_cumulative_by_month.png
-1.31 KB
diff --git a/‎outputs/figures/covid19_preprints_day_cumulative_by_week.png
-2.05 KB b/‎outputs/figures/covid19_preprints_day_cumulative_by_week.png
-2.05 KB
diff --git a/‎outputs/figures/covid19_preprints_month.png
3.13 KB b/‎outputs/figures/covid19_preprints_month.png
3.13 KB
diff --git a/‎outputs/figures/covid19_preprints_week.png
625 Bytes b/‎outputs/figures/covid19_preprints_week.png
625 Bytes
@@ -440,7 +440,9 @@ processed further to extract the needed information.
 ```r
 parseDataCiteDescription<-function(x) {
 if(length(x) >0) {
-if(x$descriptionType=="Abstract") {
+#descriptionType and description are character vectors, spanning content of description field
+#testing (2022-08) found that selecting on "Abstract" could be omitted
+if("Abstract"%in%x$descriptionType) {
 return(str_to_sentence(str_c(x$description, collapse="; ")))
  } else {
 return(NA_character_)
@@ -459,7 +461,10 @@ parseDataCitePreprints <- function(item) {
 title= map_chr(item$data$attributes$titles, 
 ~ str_to_sentence(str_c(.x$title, collapse="; "))),
 abstract= map_chr(item$data$attributes$descriptions, 
-function(x) parseDataCiteDescription(x)))
+function(x) parseDataCiteDescription(x)),
+abstract_length= map_int(item$data$attributes$descriptions,
+function(x) length(x))
+ )
 }
 
 dc_preprints_df<- map_df(dc_preprints, parseDataCitePreprints) %>%
@@ -620,7 +625,7 @@ covid_preprints_update <- covid_preprints_update %>%
 title= str_squish(title))
 ```
 
-#Remove duplicate records (incl. versions) on same preprint server
+\#Remove duplicate records (incl. versions) on same preprint server
 
 ```r
 covid_preprints_previous<- read_csv("data/covid19_preprints.csv")
 
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3703940a1dd97d45e8f993e278082ece7a168c3ec93b3b957363744b305a879f
-size 122867213
+oid sha256:fb485b21b462512369574a125cc6e4ef79b64cd342d4466bb11959d0d41693fa
+size 123090842
@@ -1,6 +1,6 @@
 {
 "release_date": "2022-09-03",
-"sample_date": "2022-08-31",
+"sample_date": "2022-09-03",
 "posted_date": "2022-08-28",
 "url": "https://github.com/nicholasmfraser/covid19_preprints/blob/master/data/covid19_preprints.csv?raw=true"
 }
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"release_date": "2022-09-03",`
`3`		`-"sample_date": "2022-08-31",`
	`3`	`+"sample_date": "2022-09-03",`
`4`	`4`	`"posted_date": "2022-08-28",`
`5`	`5`	`"url": "https://github.com/nicholasmfraser/covid19_preprints/blob/master/data/covid19_preprints.csv?raw=true"`
`6`	`6`	`}`