Ana Trisovic atrisovic

## gist:4e68ebfc1841c60fb87bf83bfb220361
import pandas as pd
from huggingface_hub import HfApi
import datetime
import json

df = pd.read_csv('../../data/llm_leaderboard.csv', index_col=1, header=1)

def get_model_info(model_id):
    api = HfApi()
    try:

## fasse_analytic_data_docs.md

      
              1 file
            
          
              0 forks
            
          
              57 comments
            
          
              0 stars
            
          
                atrisovic
                / fasse_analytic_data_docs.md
            
            
              Last active
              February 20, 2023 15:40
            
              
                Form to document new analytic data on FASSE
              
          
    Step 1: Check analytic data

Is the data you need already on FASSE? Check out the catalog here: https://nsaph.info/analytic.html#analytic-data
If it is not, see step 2.
Step 2: Fill in the form below and add it in the comments here.

The format of the form goes like this:

  
## tree.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                atrisovic
                / tree.md
            
            
              Created
              June 21, 2022 21:06
            
          
     |-hospital
 | |-zip.rds
 | |-zip2.rds
 | |-SA_COPD2.Rmd
 | |-review.R
 | |-SA_MI-New.Rmd
 | |-SA_CHF2.Rmd
 | |-SA_LungCancer2.Rmd
 | |-SA_LungCancer-New.Rmd


## whanhee.py
import pandas as pd
import numpy as np
import json
from simplejson import loads


def get_outcomes():
    """ Get and return ICD codes """""
    f = open('icd_codes.json')
    outcomes_ = json.load(f)

## gist:0e8f592ed950112f1427f7ee4996cf33
{
    "aki": {
        "icd10": [
            "N17"
        ],
        "icd9": [
            "584"
        ]
    },
    "all_kidney": {

## gist:3d45cf9a37b7853597c5a258e2aa1908
# Before running, activate env:

# export CONDA_ENVS_PATH=/nfs/projects/n/nsaph_common/conda/envs/
# export CONDA_PKGS_PATH=/nfs/projects/n/nsaph_common/conda/pkgs/
# source activate nsaph


## Code to ID hospitalizations

library(data.table)

## sample_file_summaries.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                atrisovic
                / sample_file_summaries.md
            
            
              Last active
              March 9, 2022 02:50
            
              
                sample file summaries in R
              
          
    Get data sample

To get the data sample, we take the first 25k rows and the last 25k rows from the sample of 59 million rows in bash:
>> tail -n25000 /2016/mbsf_abcd_summary_res000017155_req008183_2016.dat \
        > sample_mbsf_abcd_summary_res000017155_req008183_2016.dat
>> head -n25000 /2016/mbsf_abcd_summary_res000017155_req008183_2016.dat \
        >> sample_mbsf_abcd_summary_res000017155_req008183_2016.dat
# word count:

  
## rewriting_history_process.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                atrisovic
                / rewriting_history_process.md
            
            
              Last active
              March 3, 2022 15:35
            
              
                Rewriting git history for data_requests
              
          
    Rewriting git history for data_requests

What happened

Beneficiary ID numbers were shared in a private GitHub repository, in the following directories:
data_requests/request_projects/medicaid_duplicate_check_2019_09_27


## dataverse_SQL_for_DOI_and_mime.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                atrisovic
                / dataverse_SQL_for_DOI_and_mime.md
            
            
              Last active
              May 3, 2021 21:11
            
          
    Dataset stats from Dataverse

in the format DOI, release_year, mime_type

SQL DB query:
SELECT p.authority, p.identifier, f.contenttype, p.publicationdate 
FROM datafile f, dvobject o, dataset s, dvobject p 
WHERE f.id = o.id AND o.owner_id = s.id AND s.id = p.id AND s.harvestingclient_id IS NULL


## app.py
from flask import Flask, redirect, url_for
from celery import Celery
from celery import Task
from subprocess import PIPE, Popen
import logging, os
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Running locally:
	import pandas as pd
	from huggingface_hub import HfApi
	import datetime
	import json

	df = pd.read_csv('../../data/llm_leaderboard.csv', index_col=1, header=1)

	def get_model_info(model_id):
	api = HfApi()
	try:
	import pandas as pd
	import numpy as np
	import json
	from simplejson import loads


	def get_outcomes():
	""" Get and return ICD codes """""
	f = open('icd_codes.json')
	outcomes_ = json.load(f)
	# Before running, activate env:

	# export CONDA_ENVS_PATH=/nfs/projects/n/nsaph_common/conda/envs/
	# export CONDA_PKGS_PATH=/nfs/projects/n/nsaph_common/conda/pkgs/
	# source activate nsaph


	## Code to ID hospitalizations

	library(data.table)
	from flask import Flask, redirect, url_for
	from celery import Celery
	from celery import Task
	from subprocess import PIPE, Popen
	import logging, os
	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger(__name__)

	# Running locally: