Mikhail Popov bearloga

## wdqs-cocktails.R
cocktails <- WikidataQueryServiceR::query_wikidata('
SELECT DISTINCT ?cocktailLabel ?ingredientLabel ?instanceOfLabel ?subclassLabel
WHERE
{
  ?cocktail wdt:P31/wdt:P279* wd:Q134768 .
  ?cocktail wdt:P186 ?ingredient .
  OPTIONAL {
    ?ingredient wdt:P279 ?subclass .
  }
  OPTIONAL {

## mkrproj.sh
#!/bin/bash

# Usage: mkproj [projectname]
# projectname defaults to name of current directory

template="Version: 1.0\nRestoreWorkspace: Default\nSaveWorkspace: Default\nAlwaysSaveHistory: Default\n\nEnableCodeIndexing: Yes\nUseSpacesForTab: Yes\nNumSpacesForTab: 4\nEncoding: UTF-8\n\nRnwWeave: knitr\nLaTeX: pdfLaTeX"

# Default project name: the last path component of the current directory.
# The inner command substitution is quoted so that a directory path containing
# spaces is passed to basename as a single operand instead of being word-split.
wd=$(basename "$(pwd)")

if [ -z $1 ]; then

## dl2csv.R
# Attach rvest; it is the only package loaded before read_html() is called.
library(rvest)

# Sample input: an HTML description list (<dl>) holding two pairs of a
# term (<dt>) followed by its description (<dd>).
x <- "<dl>
  <dt>Coffee</dt>
  <dd>Black hot drink</dd>
  <dt>Milk</dt>
  <dd>White cold drink</dd>
</dl>"

# Parse the HTML string held in `x`; the parsed result is kept in `y`.
y <- read_html(x)

## druid-csv-spec_country-all.json
{
  "type": "index_hadoop",
  "spec": {
    "ioConfig": {
      "type": "hadoop",
      "inputSpec": {
        "paths": "hdfs://analytics-hadoop/tmp/gsc-all.csv.gz",
        "type": "static"
      }
    },

## pavement.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                bearloga
                / pavement.ipynb
            
            
              Created
              January 9, 2019 03:23
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## pavement-r.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                bearloga
                / pavement-r.ipynb
            
            
              Created
              January 10, 2019 15:03
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## logarithmic-time.R
# daily_stats has 5 columns used by this code: date, time_spent_10/25/50/75/90

ggplot(daily_stats) +
    geom_segment(aes(x = date, xend = date, y = time_spent_10, yend = time_spent_90),
                 size = 1, color = "#00af89") +
    geom_segment(aes(x = date, xend = date, y = time_spent_25, yend = time_spent_75),
                 size = 2, color = "#14866d") +
    # geom_ribbon(aes(x = date, ymin = time_spent_lower, ymax = time_spent_upper), alpha = 0.3) +
    # geom_line(aes(x = date, y = time_spent_middle)) +
    geom_label(

## sql-murder-mystery-solution.md

      
              1 file
            
          
              2 forks
            
          
              2 comments
            
          
              6 stars
            
          
                bearloga
                / sql-murder-mystery-solution.md
            
            
              Created
              October 13, 2019 01:42
            
              
                A walkthrough of the solution to SQL Murder Mystery by Northwestern University Knight Lab. Solution by Mikhail Popov (@bearloga)
              
          
    Solution to SQL Murder Mystery

A walkthrough of the solution to SQL Murder Mystery by Northwestern University Knight Lab. Solution by Mikhail Popov
Prompt


A crime has taken place and the detective needs your help. The detective gave you the crime scene report, but you somehow lost it. You vaguely remember that the crime was a murder that occurred sometime on Jan.15, 2018 and that it took place in SQL City. Start by retrieving the corresponding crime scene report from the police department’s database.

Witness reports


## engines.Rmd
---
title: "Printing chunk engine via hook"
output: github_document
---

```{r setup, include=FALSE}
library(knitr)
opts_chunk$set(echo = TRUE, warning = FALSE, message = FALSE)

print_engine_hook <- function(before, options, envir) {

## waxer-demo.ipynb

      
              1 file
            
          
              0 forks
            
          
              1 comment
            
          
              0 stars
            
          
                bearloga
                / waxer-demo.ipynb
            
            
              Created
              July 23, 2020 14:15
            
              
                Demo of using {waxer} R package in a Jupyter Notebook to fetch different Wikipedia languages' pageviews with different access methods
              
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
	cocktails <- WikidataQueryServiceR::query_wikidata('
	SELECT DISTINCT ?cocktailLabel ?ingredientLabel ?instanceOfLabel ?subclassLabel
	WHERE
	{
	?cocktail wdt:P31/wdt:P279* wd:Q134768 .
	?cocktail wdt:P186 ?ingredient .
	OPTIONAL {
	?ingredient wdt:P279 ?subclass .
	}
	OPTIONAL {
	#!/bin/bash

	# Usage: mkproj [projectname]
	# projectname defaults to name of current directory

	template="Version: 1.0\nRestoreWorkspace: Default\nSaveWorkspace: Default\nAlwaysSaveHistory: Default\n\nEnableCodeIndexing: Yes\nUseSpacesForTab: Yes\nNumSpacesForTab: 4\nEncoding: UTF-8\n\nRnwWeave: knitr\nLaTeX: pdfLaTeX"

	# Default project name: the last path component of the current directory.
	# The inner command substitution is quoted so that a directory path containing
	# spaces is passed to basename as a single operand instead of being word-split.
	wd=$(basename "$(pwd)")

	if [ -z $1 ]; then
	# Attach rvest; it is the only package loaded before read_html() is called.
	library(rvest)

	# Sample input: an HTML description list (<dl>) holding two pairs of a
	# term (<dt>) followed by its description (<dd>).
	x <- "<dl>
	<dt>Coffee</dt>
	<dd>Black hot drink</dd>
	<dt>Milk</dt>
	<dd>White cold drink</dd>
	</dl>"

	# Parse the HTML string held in `x`; the parsed result is kept in `y`.
	y <- read_html(x)
	{
	"type": "index_hadoop",
	"spec": {
	"ioConfig": {
	"type": "hadoop",
	"inputSpec": {
	"paths": "hdfs://analytics-hadoop/tmp/gsc-all.csv.gz",
	"type": "static"
	}
	},
	# daily_stats has 5 columns used by this code: date, time_spent_10/25/50/75/90

	ggplot(daily_stats) +
	geom_segment(aes(x = date, xend = date, y = time_spent_10, yend = time_spent_90),
	size = 1, color = "#00af89") +
	geom_segment(aes(x = date, xend = date, y = time_spent_25, yend = time_spent_75),
	size = 2, color = "#14866d") +
	# geom_ribbon(aes(x = date, ymin = time_spent_lower, ymax = time_spent_upper), alpha = 0.3) +
	# geom_line(aes(x = date, y = time_spent_middle)) +
	geom_label(
	---
	title: "Printing chunk engine via hook"
	output: github_document
	---

	```{r setup, include=FALSE}
	library(knitr)
	opts_chunk$set(echo = TRUE, warning = FALSE, message = FALSE)

	print_engine_hook <- function(before, options, envir) {