Sérgio Spagnuolo sergiospagnuolo

## product_generator.rb
#------------------------------------------------------------------------
# encoding: utf-8
# @(#)product_generator.rb	1.00 29-Nov-2011 16:38
#
# Copyright (c) 2011 Jim Pravetz. All Rights Reserved.
# Licensed under the MIT license (http://www.opensource.org/licenses/mit-license.php)
#
# Description:  A generator that creates product, products and
#		ingredients pages for jekyll sites.  Uses a JSON data
#		file as the database file from which to read and

## estados-cidades.json
{
  "estados": [
    {
      "sigla": "AC",
      "nome": "Acre",
      "cidades": [
        "Acrelândia",
        "Assis Brasil",
        "Brasiléia",
        "Bujari",

## LICENSE
This is free and unencumbered software released into the public domain.

Anyone is free to copy, modify, publish, use, compile, sell, or
distribute this software, either in source code form or as a compiled
binary, for any purpose, commercial or non-commercial, and by any
means.

In jurisdictions that recognize copyright laws, the author or authors
of this software dedicate any and all copyright interest in the
software to the public domain. We make this dedication for the benefit

## PDF-2-text-or-CSV.r
# Here are a few methods for getting text from PDF files. Do read through
# the instructions carefully! Note that this code is written for Windows 7,
# slight adjustments may be needed for other OSs

# Folder that holds the PDFs to process (edit to point at your own directory).
dest <- "G:/somehere/with/many/PDFs"

# Build a vector of full paths to the PDF files found in `dest`.
# `pattern` is a regular expression, so it is anchored on the extension:
# a bare "pdf" would also match names such as "pdf_notes.txt" or
# "report.pdf.bak". `ignore.case = TRUE` also picks up ".PDF" extensions.
myfiles <- list.files(
  path = dest,
  pattern = "\\.pdf$",
  ignore.case = TRUE,
  full.names = TRUE
)

## import_json_appsscript.js
/**
 * Retrieves all the rows in the active spreadsheet that contain data and logs the
 * values for each row.
 * For more information on using the Spreadsheet API, see
 * https://developers.google.com/apps-script/service_spreadsheet
 */
function readRows() {
  var sheet = SpreadsheetApp.getActiveSheet();
  var rows = sheet.getDataRange();
  var numRows = rows.getNumRows();

## normalize_string.py
import unicodedata

def normalize_string(string):
    """Return a lower-cased, ASCII-only version of ``string``.

    The text is lower-cased and decomposed with Unicode NFKD normalization,
    then encoded to ASCII with unencodable characters dropped, which strips
    accents (e.g. "Acrelândia" -> "acrelandia").

    Args:
        string: The value to normalize.

    Returns:
        The normalized ``str``, or ``None`` when ``string`` is not a ``str``.
    """
    # Non-string input is not normalized; the caller gets None back.
    if not isinstance(string, str):
        return None

    decomposed = unicodedata.normalize('NFKD', string.lower())
    # 'ignore' discards everything that has no ASCII representation,
    # including the combining marks produced by the NFKD decomposition.
    ascii_bytes = decomposed.encode('ASCII', 'ignore')
    return ascii_bytes.decode('utf-8')

## api-similarweb.R
library(httr)
library(jsonlite)

# https://dataseolabs.com
# Doc : https://www.similarweb.com/corp/developer/
# Create your key here : https://pro.similarweb.com/#/account/api-management
# You can have freely 3 Months of Web Traffic Data

# Configuration: character vector of website domains.
myList <- c(
  "cuisineaz.com",
  "marmiton.org",
  "odelices.com",
  "allrecipes.fr"
)

## gist:0cf27d994e39700663551b2d14387b08
hack_datasus <- function(sistema, modalidade, tipo_arquivo, ano, UF, mes){

  #Função gera dataframe a partir de ftp feita na página do datasus

  #sistema ex:'SIHSUS' Verificar os sistemas disponíveis em http://www2.datasus.gov.br/DATASUS/index.php?area=0901&item=1
  #modalidade  'dados'
  #tipo_arquivo ex: 'RD'#Varia conforme o sistema
  #ano ex: 17 Dois últimos dígitos do ano
  #UF ex:'AL' Sigla de UF Brasileira
  #mes ex:'12' strings entre 01 e 12

## verba_ministerio_saude.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              12 stars
            
          
                nportinari
                / verba_ministerio_saude.ipynb
            
            
              Last active
              March 12, 2020 17:40
            
              
                Verba - Ministério da Saúde
              
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## notas.md

      
              2 files
            
          
              0 forks
            
          
              0 comments
            
          
              6 stars
            
          
                sergiospagnuolo
                / notas.md
            
            
              Last active
              April 29, 2020 01:33
            
              
                Buscas no Twitter por minuto
              
          
    Análise de buscas no Twitter no calor do momento

Este caderno contém funções para que seja possível medir o interesse de buscas no Twitter, com a finalidade de saber se algum assunto está realmente popular na rede social em certo momento. Por conta de limitações na API gratuita do Twitter, recomenda-se a utilização dessa metodologia para saber se um tópico foi popular no último dia ou período do dia.
Um exemplo de como isso foi usado pode ser visto neste tweet
Esta metodologia utiliza as bibliotecas de R Tidyverse e TwitteR para acessar os dados do Twitter.
Você também vai precisar de uma conta de desenvolvedor, a fim de conseguir todas as chaves de API para fazer as buscas (caso não tenha, garanto que é bem fácil).
	#------------------------------------------------------------------------
	# encoding: utf-8
	# @(#)product_generator.rb 1.00 29-Nov-2011 16:38
	#
	# Copyright (c) 2011 Jim Pravetz. All Rights Reserved.
	# Licensed under the MIT license (http://www.opensource.org/licenses/mit-license.php)
	#
	# Description: A generator that creates product, products and
	# ingredients pages for jekyll sites. Uses a JSON data
	# file as the database file from which to read and
	{
	"estados": [
	{
	"sigla": "AC",
	"nome": "Acre",
	"cidades": [
	"Acrelândia",
	"Assis Brasil",
	"Brasiléia",
	"Bujari",
	This is free and unencumbered software released into the public domain.

	Anyone is free to copy, modify, publish, use, compile, sell, or
	distribute this software, either in source code form or as a compiled
	binary, for any purpose, commercial or non-commercial, and by any
	means.

	In jurisdictions that recognize copyright laws, the author or authors
	of this software dedicate any and all copyright interest in the
	software to the public domain. We make this dedication for the benefit
	# Here are a few methods for getting text from PDF files. Do read through
	# the instructions carefully! Note that this code is written for Windows 7,
	# slight adjustments may be needed for other OSs

	# Tell R what folder contains your 1000s of PDFs
	dest <- "G:/somehere/with/many/PDFs"

	# make a vector of PDF file names
	myfiles <- list.files(path = dest, pattern = "pdf", full.names = TRUE)
	/**
	* Retrieves all the rows in the active spreadsheet that contain data and logs the
	* values for each row.
	* For more information on using the Spreadsheet API, see
	* https://developers.google.com/apps-script/service_spreadsheet
	*/
	function readRows() {
	var sheet = SpreadsheetApp.getActiveSheet();
	var rows = sheet.getDataRange();
	var numRows = rows.getNumRows();
	import unicodedata

	def normalize_string(string):
	if isinstance(string, str):
	nfkd_form = unicodedata.normalize('NFKD', string.lower())
	return nfkd_form.encode('ASCII', 'ignore').decode('utf-8')
	library(httr)
	library(jsonlite)

	# https://dataseolabs.com
	# Doc : https://www.similarweb.com/corp/developer/
	# Create your key here : https://pro.similarweb.com/#/account/api-management
	# You can have freely 3 Months of Web Traffic Data

	# conf
	myList <- c("cuisineaz.com","marmiton.org","odelices.com","allrecipes.fr")
	hack_datasus <- function(sistema, modalidade, tipo_arquivo, ano, UF, mes){

	#Função gera dataframe a partir de ftp feita na página do datasus

	#sistema ex:'SIHSUS' Verificar os sistemas disponíveis em http://www2.datasus.gov.br/DATASUS/index.php?area=0901&item=1
	#modalidade 'dados'
	#tipo_arquivo ex: 'RD'#Varia conforme o sistema
	#ano ex: 17 Dois últimos dígitos do ano
	#UF ex:'AL' Sigla de UF Brasileira
	#mes ex:'12' strings entre 01 e 12