## mfansler/read_ad_df.R

## read_ad_df.R
library(rhdf5)
library(tidyverse)

#' Read a dataframe-encoded HDF5 group into a tibble
#'
#' Reads the group `name` from the HDF5 file `file`, keeps the index column
#' followed by the columns listed in the group's `column-order` attribute, and
#' converts every column that has an entry under `__categories` into a factor
#' whose levels are the stored categories, in stored order.
#'
#' @param file Path to the HDF5 file (passed through to rhdf5).
#' @param name Name of the group inside `file` holding the dataframe.
#' @return A tibble with the index column first, then the ordered columns.
read_ad_df <- function (file, name) {
    x_attrs <- h5readAttributes(file, name)

    ## check requested entry is a dataframe; isTRUE() also rejects a missing
    ## attribute, which a bare `==` lets through since NULL == "x" is logical(0)
    ## TODO: do we need to check encoding-version?
    stopifnot(isTRUE(x_attrs[['encoding-type']] == "dataframe"))

    ## rownames and columns in order
    idx_cols <- unlist(x_attrs[c("_index", "column-order")], use.names=FALSE)

    ## load the whole group once
    ## NOTE(review): relies on h5read() returning nested groups (here
    ## `__categories`) as nested lists when given a group -- confirm
    x_raw <- h5read(file, name)

    ## factor levels; NULL when the dataframe has no categorical columns
    x_levels <- x_raw[["__categories"]]

    ## turn 0-based integer codes into a factor over the stored levels
    decode_codes <- function (codes, lvls) {
        lvls <- as.vector(lvls)
        pos <- as.integer(codes) + 1L
        ## negative codes (presumably the missing-value marker) must become NA:
        ## index 0 would be dropped silently and shorten the column
        pos[which(pos < 1L)] <- NA_integer_
        factor(lvls[pos], levels = lvls)
    }

    x_cols <- x_raw[idx_cols]

    ## replace categorical columns with proper factors
    cat_cols <- idx_cols[idx_cols %in% names(x_levels)]
    if (length(cat_cols) > 0L) {
        x_cols[cat_cols] <- Map(decode_codes, x_cols[cat_cols], x_levels[cat_cols])
    }

    as_tibble(x_cols)
}
	library(rhdf5)
	library(tidyverse)

	#' Read a dataframe-encoded HDF5 group into a tibble
	#'
	#' Reads the group `name` from the HDF5 file `file`, keeps the index column
	#' followed by the columns listed in the group's `column-order` attribute,
	#' and converts every column that has an entry under `__categories` into a
	#' factor whose levels are the stored categories, in stored order.
	#'
	#' @param file Path to the HDF5 file (passed through to rhdf5).
	#' @param name Name of the group inside `file` holding the dataframe.
	#' @return A tibble with the index column first, then the ordered columns.
	read_ad_df <- function (file, name) {
		x_attrs <- h5readAttributes(file, name)

		## check requested entry is a dataframe; isTRUE() also rejects a missing
		## attribute, which a bare `==` lets through since NULL == "x" is logical(0)
		## TODO: do we need to check encoding-version?
		stopifnot(isTRUE(x_attrs[['encoding-type']] == "dataframe"))

		## rownames and columns in order
		idx_cols <- unlist(x_attrs[c("_index", "column-order")], use.names=FALSE)

		## load the whole group once
		## NOTE(review): relies on h5read() returning nested groups (here
		## `__categories`) as nested lists when given a group -- confirm
		x_raw <- h5read(file, name)

		## factor levels; NULL when the dataframe has no categorical columns
		x_levels <- x_raw[["__categories"]]

		## turn 0-based integer codes into a factor over the stored levels
		decode_codes <- function (codes, lvls) {
			lvls <- as.vector(lvls)
			pos <- as.integer(codes) + 1L
			## negative codes (presumably the missing-value marker) must become
			## NA: index 0 would be dropped silently and shorten the column
			pos[which(pos < 1L)] <- NA_integer_
			factor(lvls[pos], levels = lvls)
		}

		x_cols <- x_raw[idx_cols]

		## replace categorical columns with proper factors
		cat_cols <- idx_cols[idx_cols %in% names(x_levels)]
		if (length(cat_cols) > 0L) {
			x_cols[cat_cols] <- Map(decode_codes, x_cols[cat_cols], x_levels[cat_cols])
		}

		as_tibble(x_cols)
	}