Skip to content

Instantly share code, notes, and snippets.

View BERENZ's full-sized avatar

Maciej Beręsewicz BERENZ

View GitHub Profile
@BERENZ
BERENZ / misclass-example.R
Created June 21, 2024 07:19
Example code for misclassification and misclassGLM
library("misclassGLM")
library("data.table")
library("simex")
## population definition
set.seed(2024)
N <- 100000
## Draw age and ethnicity independently for each of the N units.
## `prob` is passed by name in both calls (the age call previously relied on
## positional fall-through), and `TRUE` is spelled out because `T` is an
## ordinary variable that can be reassigned.
pop_data <- data.table(
  age = sample(
    c("Young", "Middle-aged", "Old"),
    size = N,
    replace = TRUE,
    prob = c(0.40, 0.35, 0.25)
  ),
  ethnic = sample(
    c("Native", "Nonnative"),
    size = N,
    replace = TRUE,
    prob = c(0.85, 0.15)
  )
)
@BERENZ
BERENZ / example-code-hnsw-rnn.R
Created May 5, 2024 20:16
RcppHNSW vs rnndescent
library(RcppHNSW)
library(rnndescent)
library(tokenizers)
library(text2vec)
library(igraph)
## read the census and cis CSV files from the
## djvanderlaan/tutorial-reclin-uros2021 repository
census <- read.csv(
  file = "https://raw.githubusercontent.com/djvanderlaan/tutorial-reclin-uros2021/main/data/census.csv"
)
cis <- read.csv(
  file = "https://raw.githubusercontent.com/djvanderlaan/tutorial-reclin-uros2021/main/data/cis.csv"
)
@BERENZ
BERENZ / symulacja.R
Created April 11, 2024 11:11
Przykład z overlap
library(nonprobsvy)
seed_for_sim <- 2024
set.seed(seed_for_sim)
## population and sample sizes
N <- 1e5 ## population
n_a <- 0.7 * N ## big-data sample covering 70% of the population
n_b <- 1e4 ## large random sample
n_a1 <- n_a * 0.7
{
"ogolem": 51.5,
"wiek": {
"18-29-lat": 38.6,
"30-39-lat": 49.5,
"40-49-lat": 55.1,
"50-59-lat": 62.4,
"60-i-wiecej-lat": 51.4
},
"plec": {
{
"NR": {
"PIS": {
"support": 1
},
"KONF": {
"support": 2
},
"TRZE": {
"support": 3
{
"126101": {
"community": "Kraków",
"county": "",
"voivodeship": "",
"frequence": 50.1,
"result": [
{
"name": "Aleksander Miszalski",
"support": 39.4,
{
"support": {
"PIS": 33.7,
"KO": 31.9,
"TRZE": 13.5,
"KONF": 7.5,
"LEW": 6.8,
"BEZP": 2.7
},
"country": {
{
"country": {
"frequence": 51.5
},
"voivods": {
"dolnoslaskie": {
"frequence": 48.3
},
"kujawsko-pomorskie": {
"frequence": 50.6
{
"support": {
"PIS": 33.7,
"KONF": 7.5,
"TRZE": 13.5,
"LEW": 6.8,
"KO": 31.9,
"BEZP": 2.7,
"INNE": 3.9
},
@BERENZ
BERENZ / 2024-ipsos-wykresy.R
Created April 7, 2024 19:56
IPSOS exit poll 2024 (wykresy)
library(jsonlite)
library(ggplot2)
library(tidyverse)
library(data.table)
library(ggrepel)
## download the exit-poll results JSON from the gist and parse it into a list
exit_poll <- jsonlite::read_json(
  path = "https://gist.githubusercontent.com/BERENZ/d9c193c63d432f55bf7e9d3f6ec2f9fd/raw/e32e15c006563895a0d471068a17acc7c76c3546/2024-ipsos-wyniki.json"
)
bind_rows(