toolero is an R package designed to help researchers
implement best practices for their coding projects. It provides a small
set of opinionated, practical functions that reduce friction at the
start of a project and during day-to-day data work.
You can install toolero from GitHub with:
# install.packages("pak")
pak::pak("erwinlares/toolero")init_project()Creates a new R project with a standard folder structure suited for
research workflows. Optionally initializes renv for package
management and git for version control.
library(toolero)
# Create a project with the standard folder structure
init_project("~/Documents/my-project")
# Add extra folders
init_project("~/Documents/my-project", extra_folders = c("notebooks", "presentations"))
# Skip renv and git
init_project("~/Documents/my-project", use_renv = FALSE, use_git = FALSE)The default folder structure includes: data/,
data-raw/, R/, scripts/,
plots/, images/, results/, and
docs/.
read_clean_csv()Reads a CSV file and cleans the column names in one step, producing a tidyverse-friendly tibble.
library(toolero)
data <- read_clean_csv("path/to/file.csv")
# Show column type messages
data <- read_clean_csv("path/to/file.csv", verbose = TRUE)detect_execution_context()Identifies which of three execution environments the code is
currently running in: an interactive R session, a
quarto render call, or a plain Rscript
invocation. Returns one of "interactive",
"quarto", or "rscript".
library(toolero)
context <- detect_execution_context()
input_file <- switch(context,
interactive = "data/sample.csv",
quarto = params$input_file,
rscript = commandArgs(trailingOnly = TRUE)[1]
)create_qmd()Scaffolds a new Quarto document from a reproducible template, including a sample dataset and UW-Madison branded assets. Optionally pre-populates the YAML header from a user-supplied YAML config file.
library(toolero)
# Create with placeholder YAML
create_qmd(path = "~/Documents/my-project")
# Create with a custom filename
create_qmd(path = "~/Documents/my-project", filename = "report.qmd")
# Pre-populate YAML from a personal config file
create_qmd(path = "~/Documents/my-project", yaml_data = "~/my_config.yml")write_by_group()Splits a data frame by a single grouping column and writes each group
to a separate CSV file. Filenames are derived from sanitized group
values. Optionally writes a manifest.csv listing output
files, group values, and row counts.
library(toolero)
# Load the bundled sample dataset
sample_path <- system.file("templates", "sample.csv", package = "toolero")
penguins <- read_clean_csv(sample_path)
# Split by species
write_by_group(penguins, group_col = "species", output_dir = tempdir())
# Also write a manifest
write_by_group(penguins, group_col = "species",
output_dir = tempdir(), manifest = TRUE)To cite toolero in publications:
citation("toolero")MIT © Erwin Lares