Simon Anders simon-anders

## smoothing_demo.R

# Make example data
n <- 15
x <- runif( n, 0, 10 )
y <- sin(x) + rnorm( n, sd=.1 )

# Make grid to plot smooth curves
xg <- seq( 0, 10, length.out=1000 )

# Determine knot positions:

## check_c.py
import gzip, random

# Load FASTA file for Chromosome 10 from GRCm38
with gzip.open("data/Mus_musculus.GRCm38.dna.chromosome.10.fa.gz") as f:
    firstline = f.readline()
    assert firstline.startswith(b'>')
    chrom_seq = b"".join(l.rstrip() for l in f)

# This here is the file from papagei:mnt/raid/scnmt_data/CpG_filtered
cpg = scipy.sparse.load_npz( "data/CpG_10.npz" ).tocoo()

## example_figure_size.Rmd
## Beispiel für Plot-Größe

Tidyverse laden:

```{r}
library( tidyverse )
```

Wir benutzen `mtcars`, eine Standard-Beispiel-Tabelle von R mit technischen Daten
für (recht alte) Autos:

## pca.R
library( irlba )

m <- 10000 # nbr of features (rows)
n <- 5000  # nbr of cells (columns)
r <- 5  # nbr of latent components

## The true latent values

# True importance of latent factors
true_importance <- c( 1, .8, .4, .2, .1 )

## rg_flou_simu.R
# Wir haben 300 Stämme
m <- 300

# Die wahre mittlere Fluoreszenz der Stämme ist
true_mu <- exp( rnorm( m, 3, 2) )

# Die mittlere Hintergrund-Fluoreszenz ist
true_bg <- 10

# Die Hintergrund-Fluoreszenz schwankt mit einer Standardabweichung von

## rnorm_example.R
# So zieht man 10000 Werte mit Mittelwert 178 und Standardabweichung 7:

rnorm( 10000, 178, 7 ) -> x


# Und so plottet man das Histogramm aller Werte in x

library( tidyverse)

tibble(x) %>% ggplot + geom_histogram(aes(x))

## test.R
library( jrc )
library( rlc )

# Report a click: builds the message "user clicked on <x>", prints it to the
# console, and returns it invisibly (the return value of print()).
myfun <- function(x) {
  click_message <- paste("user clicked on", x)
  print(click_message)
}

rlc::openPage(useViewer=FALSE)

jrc::allowFunctions( "myfun" )

genes <- c( "gene1", "gene2", "gene3" )

## ll_methods.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                simon-anders
                / ll_methods.md
            
            
              Created
              August 12, 2020 16:06
            
          
    In order to estimate transduction efficiency from sc-RNA-Seq data, we use the following model: We assume that a
non-transduced cell expresses NeoR such that an expected fraction $\mu^{\text{R}}$ of its UMIs maps to this gene.
For each individual cell $j$, the actual expression strength of the gene varies around this expectation with some
coefficient of variation, which we denote $\alpha^{\text{R}}$.

  
## seegene_curves.R
library( tidyverse )

readRDS("~/sds/sd17l002/p/covidTests/data/allCurvesSeegene.rds") %>% ungroup() -> tbl
readRDS("~/sds/sd17l002/p/covidTests/data/testResults.rds" ) -> testres

tbl %>% pull( plateId ) %>% unique()

c( "FAM" = "E", "HEX" = "IC", "Cal Red 610" = "R", "Quasar 670" = "N" ) ->flph2gene

tbl %>%

## covid.R
library( tidyverse )
library( ggplot2 )

# URL of the raw CSV with the time series of confirmed cases in the
# CSSEGISandData/COVID-19 GitHub repository, assembled from its path
# components. paste0() concatenates without a separator, replacing the
# equivalent but less idiomatic paste(..., sep = "").
jhu_url <- paste0(
  "https://raw.githubusercontent.com/CSSEGISandData/",
  "COVID-19/master/csse_covid_19_data/",
  "csse_covid_19_time_series/",
  "time_series_19-covid-Confirmed.csv"
)

seq( 0, by=.211, length.out=300 ) -> a
hsv( a - floor(a), 1, 1 ) -> palette

	# Make example data
	n <- 15
	x <- runif( n, 0, 10 )
	y <- sin(x) + rnorm( n, sd=.1 )

	# Make grid to plot smooth curves
	xg <- seq( 0, 10, length.out=1000 )

	# Determine knot positions:
	import gzip, random

	# Load FASTA file for Chromosome 10 from GRCm38
	with gzip.open("data/Mus_musculus.GRCm38.dna.chromosome.10.fa.gz") as f:
	firstline = f.readline()
	assert firstline.startswith(b'>')
	chrom_seq = b"".join(l.rstrip() for l in f)

	# This here is the file from papagei:mnt/raid/scnmt_data/CpG_filtered
	cpg = scipy.sparse.load_npz( "data/CpG_10.npz" ).tocoo()
	## Beispiel für Plot-Größe

	Tidyverse laden:

	```{r}
	library( tidyverse )
	```

	Wir benutzen `mtcars`, eine Standard-Beispiel-Tabelle von R mit technischen Daten
	für (recht alte) Autos:
	library( irlba )

	m <- 10000 # nbr of features (rows)
	n <- 5000 # nbr of cells (columns)
	r <- 5 # nbr of latent components

	## The true latent values

	# True importance of latent factors
	true_importance <- c( 1, .8, .4, .2, .1 )
	# Wir haben 300 Stämme
	m <- 300

	# Die wahre mittlere Fluoreszenz der Stämme ist
	true_mu <- exp( rnorm( m, 3, 2) )

	# Die mittlere Hintergrund-Fluoreszenz ist
	true_bg <- 10

	# Die Hintergrund-Fluoreszenz schwankt mit einer Standardabweichung von
	# So zieht man 10000 Werte mit Mittelwert 178 und Standardabweichung 7:

	rnorm( 10000, 178, 7 ) -> x


	# Und so plottet man das Histogramm aller Werte in x

	library( tidyverse)

	tibble(x) %>% ggplot + geom_histogram(aes(x))
	library( jrc )
	library( rlc )

	# Report a click: builds the message "user clicked on <x>", prints it to the
	# console, and returns it invisibly (the return value of print()).
	myfun <- function(x) {
	  click_message <- paste("user clicked on", x)
	  print(click_message)
	}

	rlc::openPage(useViewer=FALSE)

	jrc::allowFunctions( "myfun" )

	genes <- c( "gene1", "gene2", "gene3" )
	library( tidyverse )

	readRDS("~/sds/sd17l002/p/covidTests/data/allCurvesSeegene.rds") %>% ungroup() -> tbl
	readRDS("~/sds/sd17l002/p/covidTests/data/testResults.rds" ) -> testres

	tbl %>% pull( plateId ) %>% unique()

	c( "FAM" = "E", "HEX" = "IC", "Cal Red 610" = "R", "Quasar 670" = "N" ) ->flph2gene

	tbl %>%
	library( tidyverse )
	library( ggplot2 )

	# URL of the raw CSV with the time series of confirmed cases in the
	# CSSEGISandData/COVID-19 GitHub repository, assembled from its path
	# components. paste0() concatenates without a separator, replacing the
	# equivalent but less idiomatic paste(..., sep = "").
	jhu_url <- paste0(
	  "https://raw.githubusercontent.com/CSSEGISandData/",
	  "COVID-19/master/csse_covid_19_data/",
	  "csse_covid_19_time_series/",
	  "time_series_19-covid-Confirmed.csv"
	)

	seq( 0, by=.211, length.out=300 ) -> a
	hsv( a - floor(a), 1, 1 ) -> palette