---
title: "Datasets information"
output: html_notebook
---

In [None]:
# Run the notebook from the git repository root so that the relative paths
# used below ("config.yml", "annot/...", "output/...") resolve.
root_dir <- rprojroot::is_git_root$find_file()
if (getwd() != root_dir) {
    setwd(root_dir)
}
# Project settings; `config$geo_datasets` is read by the cells below.
config <- yaml::read_yaml("config.yml")

library(magrittr)

## Experimental design

In [None]:
# Display the tab-separated dataset annotation; empty fields are read as NA.
read.delim("annot/datasets.tsv", na.strings = "")

## Choose dataset

In [None]:
# Print the configured datasets as "1: <id>, 2: <id>, ..." so that one can be
# picked by position.
cat(
    paste(seq_along(config$geo_datasets), config$geo_datasets, sep = ": "),
    sep = ", "
)

In [None]:
# Position of the dataset to inspect, as numbered in the listing printed by
# the previous cell. Change this number to switch datasets.
gse_index <- 3
# An out-of-range index would silently produce NA and make the cells below
# look for files named after "NA", so fail early with a clear message.
if (gse_index > length(config$geo_datasets)) {
    stop(
        "Dataset index ", gse_index, " is out of range: config$geo_datasets has ",
        length(config$geo_datasets), " entries",
        call. = FALSE
    )
}
gse_id <- config$geo_datasets[gse_index]
cat("Selected dataset:", gse_id)

## Description
Information retrieved from the NCBI database, the GEO website, and `GEOmetadb`.

In [None]:
# Load the stored metadata list for the selected dataset, keep the descriptive
# fields, and print each one as "FIELD NAME: text" wrapped at 90 characters.
sprintf("output/info/%s.txt", gse_id) %>%
    dget() %>%
    extract(c(
        "title", "summary", "Overall design", "geo_url",
        "article_url", "article_title", "article_abstract"
    )) %>%
    # Multi-element fields are flattened into a single space-separated string.
    lapply(paste, collapse = " ") %>%
    paste(toupper(names(.)), ., sep = ": ") %>%
    stringr::str_wrap(width = 90) %>%
    cat(sep = "\n\n")

## Article highlights
Relevant excerpts from the associated publication.

In [None]:
# Print the article excerpts stored for the selected dataset, one excerpt per
# line of the input file, each wrapped at 90 characters and separated by a
# blank line.
gse_id %>%
    sprintf(fmt = "annot/article/%s.txt") %>%
    # Read whole lines as strings. NOTE(review): "(" is set as the comment
    # character, presumably to drop parenthetical text such as citations;
    # confirm this is intended.
    scan(
        what = character(), sep = "\n", quote = "\"", comment.char = "(",
        quiet = TRUE
    ) %>%
    stringr::str_wrap(width = 90) %>%
    cat(sep = "\n\n")