{
  "_id": "6a27d73b24555f66ed5464a1",
  "Package": "rsdv",
  "Type": "Package",
  "Title": "Synthetic Tabular Data Generation with Gaussian Copulas",
  "Version": "0.2.0",
  "Authors@R": "person(given = \"Kailas\",\nfamily = \"Venkitasubramanian\",\nemail = \"kailasv@gmail.com\",\nrole = c(\"aut\", \"cre\"))",
  "Description": "Generates synthetic tabular data from real datasets using\nGaussian copula models, with parametric marginal selection for\nnumerical columns and a cumulative-frequency embedding that\nbrings categorical and boolean columns into the same joint\ncopula. Includes a metadata system with column types and\nprimary keys, declarative constraints enforced via rejection\nsampling, conditional sampling, and quality, validity and\nprivacy reports modeled on those of the 'SDMetrics' library.\nInspired by the Python 'SDV' (Synthetic Data Vault) library by\n'DataCebo'; see Patki, Wedge and Veeramachaneni (2016) \"The\nSynthetic Data Vault\" <doi:10.1109/DSAA.2016.49>.",
  "License": "MIT + file LICENSE",
  "Encoding": "UTF-8",
  "Language": "en-US",
  "Roxygen": "list(markdown = TRUE)",
  "RoxygenNote": "7.3.3",
  "URL": "https://kvenkita.github.io/rsdv/, https://github.com/kvenkita/rsdv",
  "BugReports": "https://github.com/kvenkita/rsdv/issues",
  "Config/testthat/edition": "3",
  "VignetteBuilder": "knitr",
  "LazyData": "true",
  "Config/pak/sysreqs": "libgsl0-dev",
  "Repository": "https://kvenkita.r-universe.dev",
  "Date/Publication": "2026-06-08 18:42:50 UTC",
  "RemoteUrl": "https://github.com/kvenkita/rsdv",
  "RemoteRef": "HEAD",
  "RemoteSha": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-06-09 09:01:52 UTC",
    "User": "root"
  },
  "Author": "Kailas Venkitasubramanian [aut, cre]",
  "Maintainer": "Kailas Venkitasubramanian <kailasv@gmail.com>",
  "MD5sum": "af4545337b8fcb9ead43e3d0c6e752e6",
  "_user": "kvenkita",
  "_type": "src",
  "_file": "rsdv_0.2.0.tar.gz",
  "_fileid": "97ba3ca6308f85673bfb88d48e51abb11d9a59af8042bb9695d8f4def737ee1c",
  "_filesize": 588751,
  "_sha256": "97ba3ca6308f85673bfb88d48e51abb11d9a59af8042bb9695d8f4def737ee1c",
  "_created": "2026-06-09T09:01:52.000Z",
  "_published": "2026-06-09T09:04:59.050Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 80286020002,
      "time": 142,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7503188472"
    },
    {
      "job": 80286020050,
      "time": 152,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7503192558"
    },
    {
      "job": 80286019926,
      "time": 145,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7503181705"
    },
    {
      "job": 80286019913,
      "time": 133,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7503177169"
    },
    {
      "job": 80285237329,
      "time": 259,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7503134800"
    },
    {
      "job": 80286019896,
      "time": 112,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7503176501"
    },
    {
      "job": 80286020006,
      "time": 127,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7503182397"
    },
    {
      "job": 80286020058,
      "time": 112,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7503177272"
    },
    {
      "job": 80286019918,
      "time": 84,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7503166731"
    }
  ],
  "_buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/kvenkita/rsdv",
  "_commit": {
    "id": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
    "author": "Kailas Venkitasubramanian <kailasv@gmail.com>",
    "committer": "GitHub <noreply@github.com>",
    "message": "Merge pull request #20 from kvenkita/chore/rhub-setup\n\nci: add R-hub v2 workflow for pre-CRAN platform checks",
    "time": 1780944170
  },
  "_maintainer": {
    "name": "Kailas Venkitasubramanian",
    "email": "kailasv@gmail.com",
    "login": "kvenkita",
    "description": "",
    "uuid": 26449590
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 4.3.0",
      "role": "Depends"
    },
    {
      "package": "copula",
      "version": ">= 1.1-0",
      "role": "Imports"
    },
    {
      "package": "generics",
      "version": ">= 0.1.3",
      "role": "Imports"
    },
    {
      "package": "jsonlite",
      "version": ">= 1.8.0",
      "role": "Imports"
    },
    {
      "package": "ggplot2",
      "version": ">= 3.4.0",
      "role": "Imports"
    },
    {
      "package": "tibble",
      "version": ">= 3.2.0",
      "role": "Imports"
    },
    {
      "package": "FNN",
      "version": ">= 1.1.3",
      "role": "Imports"
    },
    {
      "package": "rpart",
      "version": ">= 4.1.0",
      "role": "Imports"
    },
    {
      "package": "scales",
      "version": ">= 1.2.0",
      "role": "Imports"
    },
    {
      "package": "stats",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "testthat",
      "version": ">= 3.0.0",
      "role": "Suggests"
    },
    {
      "package": "withr",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "version": ">= 1.40",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "version": ">= 2.20",
      "role": "Suggests"
    }
  ],
  "_owner": "kvenkita",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2026-22",
      "n": 49
    },
    {
      "week": "2026-23",
      "n": 5
    },
    {
      "week": "2026-24",
      "n": 5
    }
  ],
  "_tags": [
    {
      "name": "v0.1.0",
      "date": "2026-05-29"
    },
    {
      "name": "v0.1.1",
      "date": "2026-05-29"
    },
    {
      "name": "v0.2.0",
      "date": "2026-06-08"
    }
  ],
  "_stars": 1,
  "_contributors": [
    {
      "user": "kvenkita",
      "count": 84,
      "uuid": 26449590
    }
  ],
  "_userbio": {
    "uuid": 26449590,
    "type": "user",
    "name": "Kailas Venkitasubramanian"
  },
  "_downloads": {
    "count": 0,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/rsdv"
  },
  "_devurl": "https://github.com/kvenkita/rsdv",
  "_pkgdown": "https://kvenkita.github.io/rsdv/",
  "_searchresults": 0,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/rsdv.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/kvenkita/rsdv",
  "_realowner": "kvenkita",
  "_cranurl": true,
  "_releases": [
    {
      "version": "0.1.0",
      "date": "2026-06-08"
    }
  ],
  "_exports": [
    "add_constraint",
    "attribute_disclosure_risk",
    "check_constraint",
    "check_constraints",
    "contingency_similarity",
    "correlation_similarity",
    "custom_constraint",
    "diagnostic_report",
    "equality_constraint",
    "fit",
    "fixed_combinations_constraint",
    "gaussian_copula_synthesizer",
    "inequality_constraint",
    "is_fitted",
    "ks_similarity",
    "load_metadata",
    "metadata",
    "metadata_from_json",
    "metadata_to_json",
    "ml_efficacy",
    "nndr",
    "privacy_report",
    "quality_report",
    "sample",
    "sample_conditions",
    "save_metadata",
    "set_column_type",
    "set_primary_key",
    "tvd_similarity",
    "validate_data"
  ],
  "_datasets": [
    {
      "name": "adult_income",
      "title": "Adult Income dataset (500-row sample)",
      "object": "adult_income",
      "class": [
        "tbl_df",
        "tbl",
        "data.frame"
      ],
      "fields": [
        "id",
        "age",
        "workclass",
        "fnlwgt",
        "education",
        "education_num",
        "marital_status",
        "occupation",
        "relationship",
        "race",
        "sex",
        "capital_gain",
        "capital_loss",
        "hours_per_week",
        "native_country",
        "income"
      ],
      "rows": 500,
      "table": true,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "add_constraint",
      "title": "Add a constraint to metadata",
      "topics": [
        "add_constraint"
      ]
    },
    {
      "page": "adult_income",
      "title": "Adult Income dataset (500-row sample)",
      "topics": [
        "adult_income"
      ]
    },
    {
      "page": "attribute_disclosure_risk",
      "title": "Attribute disclosure risk",
      "topics": [
        "attribute_disclosure_risk"
      ]
    },
    {
      "page": "autoplot.rsdv_diagnostic_report",
      "title": "Plot a diagnostic report",
      "topics": [
        "autoplot.rsdv_diagnostic_report"
      ]
    },
    {
      "page": "autoplot.rsdv_privacy_report",
      "title": "Plot a privacy report",
      "topics": [
        "autoplot.rsdv_privacy_report"
      ]
    },
    {
      "page": "autoplot.rsdv_quality_report",
      "title": "Plot a quality report",
      "topics": [
        "autoplot.rsdv_quality_report"
      ]
    },
    {
      "page": "check_constraint",
      "title": "Check a single constraint against each row of a data frame",
      "topics": [
        "check_constraint"
      ]
    },
    {
      "page": "check_constraints",
      "title": "Check all constraints in metadata against a data frame",
      "topics": [
        "check_constraints"
      ]
    },
    {
      "page": "contingency_similarity",
      "title": "Contingency similarity between real and synthetic categorical column pairs",
      "topics": [
        "contingency_similarity"
      ]
    },
    {
      "page": "correlation_similarity",
      "title": "Correlation similarity between real and synthetic numerical column pairs",
      "topics": [
        "correlation_similarity"
      ]
    },
    {
      "page": "custom_constraint",
      "title": "Constraint: arbitrary row-wise predicate",
      "topics": [
        "custom_constraint"
      ]
    },
    {
      "page": "diagnostic_report",
      "title": "Generate a diagnostic (validity) report for synthetic data",
      "topics": [
        "diagnostic_report"
      ]
    },
    {
      "page": "equality_constraint",
      "title": "Constraint: two columns must be equal row-wise",
      "topics": [
        "equality_constraint"
      ]
    },
    {
      "page": "fixed_combinations_constraint",
      "title": "Constraint: only observed column combinations are valid",
      "topics": [
        "fixed_combinations_constraint"
      ]
    },
    {
      "page": "gaussian_copula_synthesizer",
      "title": "Create a Gaussian Copula synthesizer",
      "topics": [
        "gaussian_copula_synthesizer"
      ]
    },
    {
      "page": "inequality_constraint",
      "title": "Constraint: col_a must be less than / greater than col_b",
      "topics": [
        "inequality_constraint"
      ]
    },
    {
      "page": "is_fitted",
      "title": "Check whether a synthesizer has been fitted",
      "topics": [
        "is_fitted"
      ]
    },
    {
      "page": "ks_similarity",
      "title": "Kolmogorov-Smirnov similarity score per numerical column",
      "topics": [
        "ks_similarity"
      ]
    },
    {
      "page": "load_metadata",
      "title": "Load metadata from a JSON file",
      "topics": [
        "load_metadata"
      ]
    },
    {
      "page": "metadata",
      "title": "Create a metadata object describing a dataset's column types",
      "topics": [
        "metadata"
      ]
    },
    {
      "page": "metadata_from_json",
      "title": "Deserialize metadata from a JSON string",
      "topics": [
        "metadata_from_json"
      ]
    },
    {
      "page": "metadata_to_json",
      "title": "Serialize metadata to a JSON string",
      "topics": [
        "metadata_to_json"
      ]
    },
    {
      "page": "ml_efficacy",
      "title": "ML efficacy: train-on-synthetic / test-on-real accuracy ratio (TSTR)",
      "topics": [
        "ml_efficacy"
      ]
    },
    {
      "page": "nndr",
      "title": "Nearest-Neighbor Distance Ratio privacy score",
      "topics": [
        "nndr"
      ]
    },
    {
      "page": "print.custom_constraint",
      "title": "Print method for a custom_constraint",
      "topics": [
        "print.custom_constraint"
      ]
    },
    {
      "page": "print.equality_constraint",
      "title": "Print method for an equality_constraint",
      "topics": [
        "print.equality_constraint"
      ]
    },
    {
      "page": "print.fixed_combinations_constraint",
      "title": "Print method for a fixed_combinations_constraint",
      "topics": [
        "print.fixed_combinations_constraint"
      ]
    },
    {
      "page": "print.inequality_constraint",
      "title": "Print method for an inequality_constraint",
      "topics": [
        "print.inequality_constraint"
      ]
    },
    {
      "page": "print.rsdv_diagnostic_report",
      "title": "Print method for rsdv_diagnostic_report",
      "topics": [
        "print.rsdv_diagnostic_report"
      ]
    },
    {
      "page": "print.rsdv_metadata",
      "title": "Print method for rsdv_metadata",
      "topics": [
        "print.rsdv_metadata"
      ]
    },
    {
      "page": "print.rsdv_privacy_report",
      "title": "Print method for rsdv_privacy_report",
      "topics": [
        "print.rsdv_privacy_report"
      ]
    },
    {
      "page": "print.rsdv_quality_report",
      "title": "Print method for rsdv_quality_report",
      "topics": [
        "print.rsdv_quality_report"
      ]
    },
    {
      "page": "privacy_report",
      "title": "Generate a privacy report comparing real and synthetic data",
      "topics": [
        "privacy_report"
      ]
    },
    {
      "page": "quality_report",
      "title": "Generate a quality report comparing real and synthetic data",
      "topics": [
        "quality_report"
      ]
    },
    {
      "page": "sample",
      "title": "Sample synthetic rows from a fitted synthesizer",
      "topics": [
        "sample"
      ]
    },
    {
      "page": "sample_conditions",
      "title": "Sample synthetic rows that match fixed column values (conditional sampling)",
      "topics": [
        "sample_conditions"
      ]
    },
    {
      "page": "save_metadata",
      "title": "Save metadata to a JSON file",
      "topics": [
        "save_metadata"
      ]
    },
    {
      "page": "set_column_type",
      "title": "Set the type of a column in metadata",
      "topics": [
        "set_column_type"
      ]
    },
    {
      "page": "set_primary_key",
      "title": "Set the primary key column of the metadata",
      "topics": [
        "set_primary_key"
      ]
    },
    {
      "page": "tvd_similarity",
      "title": "Total variation distance similarity score per categorical column",
      "topics": [
        "tvd_similarity"
      ]
    },
    {
      "page": "validate_data",
      "title": "Validate that a data frame is compatible with metadata",
      "topics": [
        "validate_data"
      ]
    }
  ],
  "_readme": "https://github.com/kvenkita/rsdv/raw/HEAD/README.md",
  "_rundeps": [
    "ADGofTest",
    "cli",
    "cluster",
    "colorspace",
    "copula",
    "cpp11",
    "farver",
    "FNN",
    "generics",
    "ggplot2",
    "glue",
    "gsl",
    "gtable",
    "isoband",
    "jsonlite",
    "labeling",
    "lattice",
    "lifecycle",
    "magrittr",
    "Matrix",
    "mvtnorm",
    "numDeriv",
    "pcaPP",
    "pillar",
    "pkgconfig",
    "pspline",
    "R6",
    "RColorBrewer",
    "rlang",
    "rpart",
    "S7",
    "scales",
    "stabledist",
    "tibble",
    "utf8",
    "vctrs",
    "viridisLite",
    "withr"
  ],
  "_vignettes": [
    {
      "source": "getting-started.Rmd",
      "filename": "getting-started.html",
      "title": "Getting Started with rsdv: A Practitioner's Guide to Synthetic Data Generation",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "The R Synthetic Data Ecosystem",
        "Where rsdv fits",
        "The Gaussian Copula: A Practitioner's Introduction",
        "Getting Started",
        "Installation",
        "A five-line synthesis",
        "Describing Your Data: The Metadata System",
        "Fitting and Sampling",
        "Choosing marginal distributions",
        "Conditional Sampling",
        "Evaluating Quality",
        "Column-level similarity",
        "Correlation structure",
        "Marginal distributions",
        "Diagnostic checks",
        "Evaluating Privacy",
        "Adding Constraints",
        "Handling Missing Data",
        "What rsdv does by default",
        "When to pre-impute",
        "Considerations and Caveats",
        "Citation",
        "References"
      ],
      "created": "2026-05-25 14:53:09",
      "modified": "2026-06-08 18:23:02",
      "commits": 9
    },
    {
      "source": "migrating-from-synthpop.Rmd",
      "filename": "migrating-from-synthpop.html",
      "title": "Migrating from synthpop",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Why switch?",
        "Side-by-side comparison",
        "synthpop workflow",
        "rsdv workflow",
        "Key differences"
      ],
      "created": "2026-05-25 14:53:09",
      "modified": "2026-05-27 02:32:34",
      "commits": 2
    }
  ],
  "_score": 4.477121254719663,
  "_indexed": true,
  "_nocasepkg": "rsdv",
  "_universes": [
    "kvenkita"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.2.0",
      "date": "2026-06-09T09:04:05.000Z",
      "distro": "noble",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "9384a0843503b8ae1e6bf5d18c695ff3fee59335ff52106c45ebce57f2f122bb",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.2.0",
      "date": "2026-06-09T09:04:13.000Z",
      "distro": "noble",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "93527d9d97e67fb7ca51958ff04e8298ac375b989a97259534d63a60e2ebd55c",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.2.0",
      "date": "2026-06-09T09:03:57.000Z",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "a611b2db3fe71a10bc4396c8a2585b42c5f9d7d243a780dbe19ed66b59b9206a",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.2.0",
      "date": "2026-06-09T09:03:44.000Z",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "0e4f7cd90a65967d520298e5e6489cc02db0925f2403532c8807718efc226f45",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.2.0",
      "date": "2026-06-09T09:04:03.000Z",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "de74778eecfcb009dfc7a6912f4b023f683917e94424fe168b9524e801388aec",
      "status": "success",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.2.0",
      "date": "2026-06-09T09:03:44.000Z",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "bf1c3eeda2b770cd8dabd137a6c651173129eda17e4f68177f79e0d84b92c303",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.2.0",
      "date": "2026-06-09T09:03:26.000Z",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "9246c8062e2cb78da91737ed01645fe7153fffde2b667c431867da9090afdef7",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.2.0",
      "date": "2026-06-09T09:03:02.000Z",
      "commit": "0f20dbd496c7a9bc143bd5a569313ce1d65aa060",
      "fileid": "a0b02e0016fb50decc3d70a12d4f20c45aa659462e7d6419a9ffafe0d5ba3ae3",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/kvenkita/actions/runs/27195275889"
    }
  ]
}