Ricardo Avila ravila4

## parallel.py
# Functions for parallelizing things

def init_spark(nproc=-1, appname="sparksession"):
    """Function to start a Spark executor."""
    from pyspark.sql import SparkSession
    if nproc == -1:
        # Use all CPUs
        spark = SparkSession.builder.master(
                "local[*]").appName(appname).getOrCreate()
    else:

## flatten_json.py
def flatten_json(y):
    out = {}

    def flatten(x, name=''):
        if type(x) is dict:
            for a in x:
                flatten(x[a], name + a + '_')
        elif type(x) is list:
            i = 0
            for a in x:

## HTS_gaussian.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                ravila4
                / HTS_gaussian.ipynb
            
            
              Created
              October 24, 2019 20:38
            
              
                Fitting Gaussian curves to histograms
              
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## align.py
#!/usr/bin/env python

# Sequence alignment using PyMOL
# The purpose of this script is to generate a sequence alignment between
# the original crystal structure of the apo and holo models, and the sequence
# of the finalised, ungapped Rosetta models. This allows us to get a 1 to 1
# correspondence between the residue numberings in both structures.

# USAGE: Run once from the project root.
# "pockets.csv" contains the information about apo holo pairs.

## parse_drugbank_xml.py
import xmltodict
import pandas as pd

with open("full_database.xml") as db:
    doc = xmltodict.parse(db.read())

values = []
for item in doc['drugbank']['drug']:
    logp = None
    try:

## ORA_docking_results.ipynb

      
              1 file
            
          
              1 fork
            
          
              0 comments
            
          
              0 stars
            
          
                ravila4
                / ORA_docking_results.ipynb
            
            
              Created
              April 29, 2018 16:39
            
              
                Orexin docking results
              
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## id_mapping_mygene.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                ravila4
                / id_mapping_mygene.ipynb
            
            
              Created
              November 16, 2020 16:04
                — forked from newgene/id_mapping_mygene.ipynb
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## gist:9aacae443c50a168b4267fca7448d88b
#!/usr/bin/env bash

set -Eeuo pipefail

cd "$(dirname "${BASH_SOURCE[0]}")" >/dev/null 2>&1

trap cleanup SIGINT SIGTERM ERR EXIT

usage() {
  cat <<EOF

## count_taxids.sh
#!/bin/bash

# Genesets aggregated by taxid: one query with a taxid facet
# (facet_size=100) yields both the taxid terms and their counts.
aggs=$(curl -s "https://mygeneset.info/v1/query?q=*&facets=taxid&facet_size=100")
# Feed the JSON to jq through a quoted here-string so the shell neither
# word-splits it nor glob-expands any "*" it may contain.
taxids=$(jq -r '.facets.taxid.terms | map(.term) | @csv' <<<"$aggs")
counts=$(jq -r '.facets.taxid.terms | map(.count) | @csv' <<<"$aggs")

# Query scientific name for each taxid
resp=$(curl -s -X POST -d "q=${taxids}" "http://t.biothings.io/v1/query")
species=$(jq -r 'map(.scientific_name) | @csv' <<<"$resp")

## ROC.ipynb

      
              1 file
            
          
              1 fork
            
          
              0 comments
            
          
              1 star
            
          
                ravila4
                / ROC.ipynb
            
            
              Created
              April 10, 2018 03:32
            
              
                Notebook for ROC/AUC and enrichment factor analysis
              
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
	# Functions for parallelizing things

	def init_spark(nproc=-1, appname="sparksession"):
	"""Function to start a Spark executor."""
	from pyspark.sql import SparkSession
	if nproc == -1:
	# Use all CPUs
	spark = SparkSession.builder.master(
	"local[*]").appName(appname).getOrCreate()
	else:
	def flatten_json(y):
	out = {}

	def flatten(x, name=''):
	if type(x) is dict:
	for a in x:
	flatten(x[a], name + a + '_')
	elif type(x) is list:
	i = 0
	for a in x:
	#!/usr/bin/env python

	# Sequence alignment using PyMOL
	# The purpose of this script is to generate a sequence alignment between
	# the original crystal structure of the apo and holo models, and the sequence
	# of the finalised, ungapped Rosetta models. This allows us to get a 1 to 1
	# correspondence between the residue numberings in both structures.

	# USAGE: Run once from the project root.
	# "pockets.csv" contains the information about apo holo pairs.
	import xmltodict
	import pandas as pd

	with open("full_database.xml") as db:
	doc = xmltodict.parse(db.read())

	values = []
	for item in doc['drugbank']['drug']:
	logp = None
	try:
	#!/usr/bin/env bash

	set -Eeuo pipefail

	cd "$(dirname "${BASH_SOURCE[0]}")" >/dev/null 2>&1

	trap cleanup SIGINT SIGTERM ERR EXIT

	usage() {
	cat <<EOF
	#!/bin/bash

	# Genesets aggregated by taxid
	aggs=`curl -s "https://mygeneset.info/v1/query?q=*&facets=taxid&facet_size=100"`
	taxids=`echo $aggs \| jq -r '.facets.taxid.terms \| map(.term) \| @csv'`
	counts=`echo $aggs \| jq -r '.facets.taxid.terms \| map(.count) \| @csv'`

	# Query scientific name for each taxid
	resp=`curl -s -X POST -d "q=${taxids}" "http://t.biothings.io/v1/query"`
	species=`echo $resp \| jq -r 'map(.scientific_name) \| @csv'`