{
  "_id": "6a2280dacd65a98ecbd518f7",
  "Package": "leakr",
  "Type": "Package",
  "Title": "Data Leakage Detection Tools for Machine Learning",
  "Version": "0.1.0",
  "Authors@R": "person(given = c(\"Cheryl\", \"Isabella\"), family = \"Lim\", role = c(\"aut\", \"cre\"), email =\n\"cheryl.academic@gmail.com\")",
  "Description": "Provides utilities to detect common data leakage patterns\nincluding train/test contamination, temporal leakage, and data\nduplication, enhancing model reliability and reproducibility in\nmachine learning workflows. Generates diagnostic reports and\nvisual summaries to support data validation. Methods based on\nbest practices from Hastie, Tibshirani, and Friedman (2009,\nISBN:978-0387848570).",
  "License": "MIT + file LICENSE",
  "Encoding": "UTF-8",
  "Roxygen": "list(markdown = TRUE)",
  "RoxygenNote": "7.3.3",
  "VignetteBuilder": "knitr",
  "Config/pak/sysreqs": "cmake libicu-dev libssl-dev",
  "Repository": "https://cherylisabella.r-universe.dev",
  "Date/Publication": "2025-12-07 17:00:19 UTC",
  "RemoteUrl": "https://github.com/cherylisabella/leakr",
  "RemoteRef": "HEAD",
  "RemoteSha": "51d111855cb9161856cfe0aa09a282ff43147774",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-06-05 07:44:55 UTC",
    "User": "root"
  },
  "Author": "Cheryl Isabella Lim [aut, cre]",
  "Maintainer": "Cheryl Isabella Lim <cheryl.academic@gmail.com>",
  "MD5sum": "4ff1b2184fcbbe7056ae803ec50cc2ae",
  "_user": "cherylisabella",
  "_type": "src",
  "_file": "leakr_0.1.0.tar.gz",
  "_fileid": "7f5e40d8e37fb538cab88ee7994e36b311f921d7f36c6e7ec51d5d651d1bc3f8",
  "_filesize": 327143,
  "_sha256": "7f5e40d8e37fb538cab88ee7994e36b311f921d7f36c6e7ec51d5d651d1bc3f8",
  "_created": "2026-06-05T07:44:55.000Z",
  "_published": "2026-06-05T07:55:06.494Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 79685761935,
      "time": 171,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "NOTE",
      "artifact": "7431463971"
    },
    {
      "job": 79685761932,
      "time": 149,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "7431456896"
    },
    {
      "job": 79685761933,
      "time": 265,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "NOTE",
      "artifact": "7431572280"
    },
    {
      "job": 79685761937,
      "time": 140,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "7431533339"
    },
    {
      "job": 79685233275,
      "time": 223,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7431411576"
    },
    {
      "job": 79685761925,
      "time": 139,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7431453503"
    },
    {
      "job": 79685761926,
      "time": 110,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "NOTE",
      "artifact": "7431444856"
    },
    {
      "job": 79685761936,
      "time": 101,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "NOTE",
      "artifact": "7431442476"
    },
    {
      "job": 79685761951,
      "time": 87,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "7431438288"
    }
  ],
  "_buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/cherylisabella/leakr",
  "_commit": {
    "id": "51d111855cb9161856cfe0aa09a282ff43147774",
    "author": "cherylisabella <104558827+cherylisabella@users.noreply.github.com>",
    "committer": "GitHub <noreply@github.com>",
    "message": "Update R-CMD-check.yaml",
    "time": 1765126819
  },
  "_maintainer": {
    "name": "Cheryl Isabella Lim",
    "email": "cheryl.academic@gmail.com",
    "login": "cherylisabella",
    "description": "",
    "uuid": 104558827
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "ggplot2",
      "role": "Imports"
    },
    {
      "package": "arrow",
      "role": "Imports"
    },
    {
      "package": "data.table",
      "role": "Imports"
    },
    {
      "package": "digest",
      "role": "Imports"
    },
    {
      "package": "htmltools",
      "role": "Imports"
    },
    {
      "package": "openxlsx",
      "role": "Imports"
    },
    {
      "package": "readxl",
      "role": "Imports"
    },
    {
      "package": "stringr",
      "role": "Imports"
    },
    {
      "package": "workflows",
      "role": "Imports"
    },
    {
      "package": "jsonlite",
      "role": "Imports"
    },
    {
      "package": "testthat",
      "version": ">= 3.0.0",
      "role": "Suggests"
    },
    {
      "package": "caret",
      "role": "Suggests"
    },
    {
      "package": "mlr3",
      "role": "Suggests"
    },
    {
      "package": "tidymodels",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    }
  ],
  "_owner": "cherylisabella",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2025-44",
      "n": 1
    },
    {
      "week": "2025-45",
      "n": 2
    },
    {
      "week": "2025-46",
      "n": 2
    },
    {
      "week": "2025-49",
      "n": 4
    }
  ],
  "_tags": [
    {
      "name": "v0.1.0",
      "date": "2025-10-28"
    }
  ],
  "_topics": [
    "data-science",
    "machine-learning",
    "ml"
  ],
  "_stars": 1,
  "_contributors": [
    {
      "user": "cherylisabella",
      "count": 9,
      "uuid": 104558827
    }
  ],
  "_userbio": {
    "uuid": 104558827,
    "type": "user",
    "name": "cherylisabella"
  },
  "_downloads": {
    "count": 137,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/leakr"
  },
  "_devurl": "https://github.com/cherylisabella/leakr",
  "_searchresults": 9,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/leakr.html",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/cherylisabella/leakr",
  "_realowner": "cherylisabella",
  "_cranurl": true,
  "_releases": [
    {
      "version": "0.1.0",
      "date": "2025-10-26"
    }
  ],
  "_exports": [
    "%||%",
    "compile_report",
    "format_detector_name",
    "generate_diagnostic_plots",
    "generate_recommendations",
    "get_detector_info",
    "leakr_audit",
    "leakr_create_snapshot",
    "leakr_export_data",
    "leakr_from_caret",
    "leakr_from_mlr3",
    "leakr_from_tidymodels",
    "leakr_import",
    "leakr_list_snapshots",
    "leakr_load_snapshot",
    "leakr_plot",
    "leakr_quick_import",
    "leakr_summarise",
    "list_registered_detectors",
    "new_temporal_detector",
    "new_train_test_detector",
    "prepare_audit_data",
    "register_detector",
    "run_detector",
    "run_detectors",
    "stratified_sample",
    "validate_and_preprocess_data"
  ],
  "_help": [
    {
      "page": "compile_report",
      "title": "Enhanced report compilation with numeric severity scores",
      "topics": [
        "compile_report"
      ]
    },
    {
      "page": "format_detector_name",
      "title": "Format detector names for display.",
      "topics": [
        "format_detector_name"
      ]
    },
    {
      "page": "grapes-or-or-grapes",
      "title": "Null-coalescing operator for clean default value handling",
      "topics": [
        "%||%",
        "grapes-or-or-grapes"
      ]
    },
    {
      "page": "leakr",
      "title": "leakr: Data Leakage Detection for Machine Learning in R",
      "topics": [
        "leakr-package",
        "leakr"
      ]
    },
    {
      "page": "leakr_audit",
      "title": "Audit dataset for data leakage",
      "topics": [
        "leakr_audit"
      ]
    },
    {
      "page": "leakr_create_snapshot",
      "title": "Create data snapshots with improved metadata handling",
      "topics": [
        "leakr_create_snapshot"
      ]
    },
    {
      "page": "leakr_export_data",
      "title": "Export data in various formats",
      "topics": [
        "leakr_export_data"
      ]
    },
    {
      "page": "leakr_from_caret",
      "title": "Convert caret training objects to standard format",
      "topics": [
        "leakr_from_caret"
      ]
    },
    {
      "page": "leakr_from_mlr3",
      "title": "Convert mlr3 Task objects to standard format",
      "topics": [
        "leakr_from_mlr3"
      ]
    },
    {
      "page": "leakr_from_tidymodels",
      "title": "Convert tidymodels workflow to standard format",
      "topics": [
        "leakr_from_tidymodels"
      ]
    },
    {
      "page": "leakr_import",
      "title": "Import data from various sources for leakage analysis",
      "topics": [
        "leakr_import"
      ]
    },
    {
      "page": "leakr_list_snapshots",
      "title": "List available snapshots with enhanced information",
      "topics": [
        "leakr_list_snapshots"
      ]
    },
    {
      "page": "leakr_load_snapshot",
      "title": "Load data snapshot with enhanced validation",
      "topics": [
        "leakr_load_snapshot"
      ]
    },
    {
      "page": "leakr_plot",
      "title": "Plot leakage detection results",
      "topics": [
        "leakr_plot"
      ]
    },
    {
      "page": "leakr_quick_import",
      "title": "Fast import with default preprocessing",
      "topics": [
        "leakr_quick_import"
      ]
    },
    {
      "page": "leakr_summarise",
      "title": "Enhanced summarise with better formatting",
      "topics": [
        "leakr_summarise"
      ]
    },
    {
      "page": "list_registered_detectors",
      "title": "List Registered Detectors",
      "topics": [
        "list_registered_detectors"
      ]
    },
    {
      "page": "new_temporal_detector",
      "title": "Create a new temporal detector",
      "topics": [
        "new_temporal_detector"
      ]
    },
    {
      "page": "new_train_test_detector",
      "title": "Create a new train-test detector",
      "topics": [
        "new_train_test_detector"
      ]
    },
    {
      "page": "plot.detector_result",
      "title": "Plot a detector_result object",
      "topics": [
        "plot.detector_result"
      ]
    },
    {
      "page": "plot.udld_report",
      "title": "Plot a udld_report object",
      "topics": [
        "plot.udld_report"
      ]
    },
    {
      "page": "register_detector",
      "title": "Register a new detector",
      "topics": [
        "register_detector"
      ]
    },
    {
      "page": "run_detector",
      "title": "Run a detector on data",
      "topics": [
        "run_detector"
      ]
    }
  ],
  "_readme": "https://github.com/cherylisabella/leakr/raw/HEAD/README.md",
  "_rundeps": [
    "arrow",
    "assertthat",
    "base64enc",
    "bit",
    "bit64",
    "cellranger",
    "class",
    "cli",
    "clock",
    "codetools",
    "cpp11",
    "crayon",
    "data.table",
    "diagram",
    "digest",
    "dplyr",
    "farver",
    "fastmap",
    "future",
    "future.apply",
    "generics",
    "ggplot2",
    "globals",
    "glue",
    "gower",
    "gtable",
    "hardhat",
    "hms",
    "htmltools",
    "ipred",
    "isoband",
    "jsonlite",
    "KernSmooth",
    "labeling",
    "lattice",
    "lava",
    "lifecycle",
    "listenv",
    "lubridate",
    "magrittr",
    "MASS",
    "Matrix",
    "modelenv",
    "nnet",
    "numDeriv",
    "openxlsx",
    "parallelly",
    "parsnip",
    "pillar",
    "pkgconfig",
    "prettyunits",
    "prodlim",
    "progress",
    "progressr",
    "purrr",
    "R6",
    "RColorBrewer",
    "Rcpp",
    "readxl",
    "recipes",
    "rematch",
    "rlang",
    "rpart",
    "S7",
    "scales",
    "shape",
    "sparsevctrs",
    "SQUAREM",
    "stringi",
    "stringr",
    "survival",
    "tibble",
    "tidyr",
    "tidyselect",
    "timechange",
    "timeDate",
    "tzdb",
    "utf8",
    "vctrs",
    "viridisLite",
    "withr",
    "workflows",
    "zip"
  ],
  "_vignettes": [
    {
      "source": "advanced-detection.Rmd",
      "filename": "advanced-detection.html",
      "title": "Advanced Leakage Detection with leakr",
      "author": "Cheryl Isabella Lim",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Understanding leakr's Detection Capabilities",
        "Advanced Target Leakage Scenarios",
        "Medical Diagnosis Example",
        "Financial Data with Temporal Issues",
        "Advanced Duplication Detection",
        "Near-Duplicate Detection in Customer Data",
        "Configuration and Customisation",
        "Custom Configuration Options",
        "Working with Large Datasets",
        "Stratified Sampling for Balanced Analysis",
        "Advanced Reporting and Analysis",
        "Detailed Report Analysis",
        "Best Practices for Advanced Usage",
        "1. Multi-Stage Validation",
        "2. Domain-Specific Validation",
        "Summary"
      ],
      "created": "2025-10-28 00:31:19",
      "modified": "2025-10-28 00:31:19",
      "commits": 1
    },
    {
      "source": "framework-integration.Rmd",
      "filename": "framework-integration.html",
      "title": "Framework Integration with leakr",
      "author": "Cheryl Isabella Lim",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Integration with caret",
        "Basic caret Integration",
        "Advanced caret Integration with Preprocessing",
        "Integration with mlr3",
        "Basic mlr3 Integration",
        "Advanced mlr3 Integration with Pipelines",
        "Integration with tidymodels",
        "Basic tidymodels Integration",
        "Advanced tidymodels Integration with Feature Engineering",
        "Data Import and Export Integration",
        "Import with Automatic Auditing",
        "Export with Audit Reports",
        "Snapshot and Version Control Integration",
        "Creating Data Snapshots",
        "Workflow Integration Patterns",
        "Pattern 1: Pre-Training Validation",
        "Pattern 2: Post-Training Audit",
        "Pattern 3: Continuous Monitoring",
        "Performance Considerations",
        "Memory-Efficient Processing",
        "Best Practices for Framework Integration",
        "1. Integration Timing",
        "2. Configuration Management",
        "3. Error Handling and Logging",
        "Summary"
      ],
      "created": "2025-10-28 00:31:19",
      "modified": "2025-10-28 00:31:19",
      "commits": 1
    },
    {
      "source": "getting-started.Rmd",
      "filename": "getting-started.html",
      "title": "Getting Started with leakr",
      "author": "Cheryl Isabella Lim",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Basic Usage: The leakr_audit() Function",
        "Simple Example with iris Dataset",
        "Understanding the Output",
        "Working with Train/Test Splits",
        "Detecting Specific Leakage Patterns",
        "Target Leakage Detection",
        "Duplication Detection",
        "Configuration and Customisation",
        "Visualising Results",
        "Working with Large Datasets",
        "Next Steps",
        "Summary"
      ],
      "created": "2025-10-28 00:31:19",
      "modified": "2025-10-28 00:31:19",
      "commits": 1
    }
  ],
  "_score": 4.778151250383644,
  "_indexed": true,
  "_nocasepkg": "leakr",
  "_universes": [
    "cherylisabella"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.1.0",
      "date": "2026-06-05T07:47:35.000Z",
      "distro": "noble",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "23f787ccb40ba4f96c4b337b26f9e579102e85b41566ddda643d6ed4a394fc50",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.1.0",
      "date": "2026-06-05T07:47:14.000Z",
      "distro": "noble",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "e8a2e99115c03c90c4a79ba822cedcc02e9e5a404f91a1b48949221fffb826a3",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.1.0",
      "date": "2026-06-05T07:53:30.000Z",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "914fffcf35babd06149f4ecb5af9f9d87a39bd7043d299b0fa980097a530ae2b",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.1.0",
      "date": "2026-06-05T07:51:32.000Z",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "e524e443eaaa5a7cacf6d8d6cf0a1965af3e15403413c5b7d6430e3eb4fc982f",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.1.0",
      "date": "2026-06-05T07:47:29.000Z",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "cfe029a1c22fd3c29456d92208beafb0873f341e3ff6a3911f5de5fe6648491a",
      "status": "success",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.1.0",
      "date": "2026-06-05T07:46:23.000Z",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "29a905eeb92a644c686f6de20c7640f50ac20c6c879afe591601adbd75d938a3",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.1.0",
      "date": "2026-06-05T07:46:17.000Z",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "029ba57bd922d40fb371cff86f5984452939f7b3097afd7d6839e19c2c11f530",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.1.0",
      "date": "2026-06-05T07:46:09.000Z",
      "commit": "51d111855cb9161856cfe0aa09a282ff43147774",
      "fileid": "1db9bd1848ed8725a9e992f613b17f57ce04e7488c9549b3968811ae97b74c65",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/cherylisabella/actions/runs/27002236845"
    }
  ]
}