{
  "_id": "6a1ef8ccb401979e73417e53",
  "Package": "funModeling",
  "Type": "Package",
  "Title": "Exploratory Data Analysis and Data Preparation Tool-Box",
  "Description": "Around 10% of almost any predictive modeling project is\nspent in predictive modeling, 'funModeling' and the book Data\nScience Live Book (<https://livebook.datascienceheroes.com/>)\nare intended to cover remaining 90%: data preparation,\nprofiling, selecting best variables 'dataViz', assessing model\nperformance and other functions.",
  "Version": "1.9.6",
  "Date": "2026-02-17",
  "Authors@R": "person(\"Pablo\", \"Casas\", role = c(\"aut\", \"cre\"), email = \"pcasas.biz@gmail.com\")",
  "Maintainer": "Pablo Casas <pcasas.biz@gmail.com>",
  "License": "GPL-2",
  "BugReports": "https://github.com/pablo14/funModeling/issues",
  "URL": "https://livebook.datascienceheroes.com",
  "LazyData": "true",
  "Encoding": "UTF-8",
  "VignetteBuilder": "knitr",
  "RoxygenNote": "7.1.0",
  "Config/pak/sysreqs": "cmake make libicu-dev libuv1-dev",
  "Repository": "https://pablo14.r-universe.dev",
  "Date/Publication": "2026-02-17 23:58:55 UTC",
  "RemoteUrl": "https://github.com/pablo14/funmodeling",
  "RemoteRef": "HEAD",
  "RemoteSha": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-19 05:57:02 UTC",
    "User": "root"
  },
  "Author": "Pablo Casas [aut, cre]",
  "MD5sum": "6a43c4bee73e2584344fe70a17ee3635",
  "_user": "pablo14",
  "_type": "src",
  "_file": "funModeling_1.9.6.tar.gz",
  "_fileid": "e189914c3190f5a9d0461eccd5d87dca3927eaf66b5ddf0eb5d969d90d42b43a",
  "_filesize": 1973532,
  "_sha256": "e189914c3190f5a9d0461eccd5d87dca3927eaf66b5ddf0eb5d969d90d42b43a",
  "_created": "2026-05-19T05:57:02.000Z",
  "_published": "2026-06-02T15:37:48.040Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 79110000316,
      "time": 166,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7075956975"
    },
    {
      "job": 79110000231,
      "time": 141,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7075951257"
    },
    {
      "job": 79110001172,
      "time": 231,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7075955591"
    },
    {
      "job": 79110000401,
      "time": 162,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7075950496"
    },
    {
      "job": 79110000354,
      "time": 222,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7075918017"
    },
    {
      "job": 79109999574,
      "time": 137,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7362494108"
    },
    {
      "job": 79110000445,
      "time": 114,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7075944643"
    },
    {
      "job": 79110000904,
      "time": 100,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7075941451"
    },
    {
      "job": 79110000484,
      "time": 109,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7075943656"
    }
  ],
  "_buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/pablo14/funmodeling",
  "_commit": {
    "id": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
    "author": "pablo14 <pcasas.biz@gmail.com>",
    "committer": "pablo14 <pcasas.biz@gmail.com>",
    "message": "Update Twitter link to X.com in vignette\n",
    "time": 1771372735
  },
  "_maintainer": {
    "name": "Pablo Casas",
    "email": "pcasas.biz@gmail.com",
    "login": "pablo14",
    "description": "Data Science | Machine Learning | AI - Deep Learning",
    "uuid": 9369685
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.4.0",
      "role": "Depends"
    },
    {
      "package": "Hmisc",
      "version": ">= 3.17.1",
      "role": "Depends"
    },
    {
      "package": "ROCR",
      "role": "Imports"
    },
    {
      "package": "ggplot2",
      "role": "Imports"
    },
    {
      "package": "gridExtra",
      "role": "Imports"
    },
    {
      "package": "pander",
      "role": "Imports"
    },
    {
      "package": "reshape2",
      "role": "Imports"
    },
    {
      "package": "scales",
      "role": "Imports"
    },
    {
      "package": "dplyr",
      "role": "Imports"
    },
    {
      "package": "rlang",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "RColorBrewer",
      "role": "Imports"
    },
    {
      "package": "moments",
      "role": "Imports"
    },
    {
      "package": "entropy",
      "role": "Imports"
    },
    {
      "package": "cli",
      "role": "Imports"
    },
    {
      "package": "stringr",
      "role": "Imports"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    }
  ],
  "_owner": "pablo14",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2026-08",
      "n": 2
    }
  ],
  "_tags": [],
  "_stars": 100,
  "_contributors": [
    {
      "user": "pablo14",
      "count": 142,
      "uuid": 9369685
    },
    {
      "user": "sicarul",
      "count": 6,
      "uuid": 4952116
    },
    {
      "user": "choonghyunryu",
      "count": 2,
      "uuid": 1195558
    },
    {
      "user": "fede654",
      "count": 1,
      "uuid": 116310534
    }
  ],
  "_userbio": {
    "uuid": 9369685,
    "type": "user",
    "name": "Pablo Casas",
    "description": "Data Science | Machine Learning | AI - Deep Learning"
  },
  "_downloads": {
    "count": 1156,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/funModeling"
  },
  "_mentions": 2,
  "_devurl": "https://github.com/pablo14/funmodeling",
  "_searchresults": 737,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/funModeling.html",
    "extra/readme.html",
    "extra/readme.md",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/pablo14/funmodeling",
  "_realowner": "pablo14",
  "_cranurl": true,
  "_releases": [
    {
      "version": "1.0",
      "date": "2016-02-07"
    },
    {
      "version": "1.1",
      "date": "2016-03-14"
    },
    {
      "version": "1.2",
      "date": "2016-08-10"
    },
    {
      "version": "1.3",
      "date": "2016-10-07"
    },
    {
      "version": "1.4",
      "date": "2016-10-11"
    },
    {
      "version": "1.5",
      "date": "2016-11-12"
    },
    {
      "version": "1.6",
      "date": "2017-01-12"
    },
    {
      "version": "1.6.1",
      "date": "2017-02-26"
    },
    {
      "version": "1.6.2",
      "date": "2017-03-16"
    },
    {
      "version": "1.6.3",
      "date": "2017-06-03"
    },
    {
      "version": "1.6.4",
      "date": "2017-06-17"
    },
    {
      "version": "1.6.5",
      "date": "2017-07-09"
    },
    {
      "version": "1.6.6",
      "date": "2017-12-18"
    },
    {
      "version": "1.6.7",
      "date": "2018-01-21"
    },
    {
      "version": "1.6.8",
      "date": "2018-07-31"
    },
    {
      "version": "1.7",
      "date": "2019-02-13"
    },
    {
      "version": "1.8",
      "date": "2019-08-01"
    },
    {
      "version": "1.9",
      "date": "2019-08-26"
    },
    {
      "version": "1.9.2",
      "date": "2019-09-08"
    },
    {
      "version": "1.9.3",
      "date": "2019-10-09"
    },
    {
      "version": "1.9.4",
      "date": "2020-06-15"
    },
    {
      "version": "1.9.5",
      "date": "2024-04-01"
    },
    {
      "version": "1.9.6",
      "date": "2026-02-18"
    }
  ],
  "_exports": [
    "auto_grouping",
    "categ_analysis",
    "compare_df",
    "concatenate_n_vars",
    "convert_df_to_categoric",
    "coord_plot",
    "correlation_table",
    "cross_plot",
    "data_integrity",
    "data_integrity_model",
    "desc_groups",
    "desc_groups_rank",
    "df_status",
    "discretize_df",
    "discretize_get_bins",
    "discretize_rgr",
    "entropy_2",
    "equal_freq",
    "export_plot",
    "fibonacci",
    "freq",
    "gain_lift",
    "gain_ratio",
    "get_sample",
    "hampel_outlier",
    "infor_magic",
    "information_gain",
    "plot_num",
    "plotar",
    "prep_outliers",
    "profiling_num",
    "range01",
    "status",
    "tukey_outlier",
    "v_compare",
    "var_rank_info"
  ],
  "_datasets": [
    {
      "name": "data_country",
      "title": "People with flu data",
      "object": "data_country",
      "class": [
        "data.frame"
      ],
      "fields": [
        "person",
        "country",
        "has_flu"
      ],
      "rows": 910,
      "table": true,
      "tojson": true
    },
    {
      "name": "data_golf",
      "title": "Play golf",
      "object": "data_golf",
      "class": [
        "data.frame"
      ],
      "fields": [
        "outlook",
        "temperature",
        "humidity",
        "windy",
        "play_golf"
      ],
      "rows": 14,
      "table": true,
      "tojson": true
    },
    {
      "name": "heart_disease",
      "title": "Heart Disease Data",
      "object": "heart_disease",
      "class": [
        "data.frame"
      ],
      "fields": [
        "age",
        "gender",
        "chest_pain",
        "resting_blood_pressure",
        "serum_cholestoral",
        "fasting_blood_sugar",
        "resting_electro",
        "max_heart_rate",
        "exer_angina",
        "oldpeak",
        "slope",
        "num_vessels_flour",
        "thal",
        "heart_disease_severity",
        "exter_angina",
        "has_heart_disease"
      ],
      "rows": 303,
      "table": true,
      "tojson": true
    },
    {
      "name": "metadata_models",
      "title": "Metadata models data integrity",
      "object": "metadata_models",
      "class": [
        "tbl_df",
        "tbl",
        "data.frame"
      ],
      "fields": [
        "name",
        "allow_NA",
        "max_unique",
        "allow_factor",
        "allow_character",
        "only_numeric"
      ],
      "rows": 11,
      "table": true,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "funModeling-package",
      "title": "funModeling: Exploratory data analysis, data preparation and model performance",
      "topics": [
        "funModeling-package",
        "funModeling"
      ]
    },
    {
      "page": "auto_grouping",
      "title": "Reduce cardinality in categorical variable by automatic grouping",
      "topics": [
        "auto_grouping"
      ]
    },
    {
      "page": "categ_analysis",
      "title": "Profiling analysis of categorical vs. target variable",
      "topics": [
        "categ_analysis"
      ]
    },
    {
      "page": "compare_df",
      "title": "Compare two data frames by keys",
      "topics": [
        "compare_df"
      ]
    },
    {
      "page": "concatenate_n_vars",
      "title": "Concatenate 'N' variables",
      "topics": [
        "concatenate_n_vars"
      ]
    },
    {
      "page": "convert_df_to_categoric",
      "title": "Convert every column in a data frame to character",
      "topics": [
        "convert_df_to_categoric"
      ]
    },
    {
      "page": "coord_plot",
      "title": "Coordinate plot",
      "topics": [
        "coord_plot"
      ]
    },
    {
      "page": "correlation_table",
      "title": "Get correlation against target variable",
      "topics": [
        "correlation_table"
      ]
    },
    {
      "page": "cross_plot",
      "title": "Cross-plotting input variable vs. target variable",
      "topics": [
        "cross_plot"
      ]
    },
    {
      "page": "data_country",
      "title": "People with flu data",
      "topics": [
        "data_country"
      ]
    },
    {
      "page": "data_golf",
      "title": "Play golf",
      "topics": [
        "data_golf"
      ]
    },
    {
      "page": "data_integrity",
      "title": "Data integrity",
      "topics": [
        "data_integrity"
      ]
    },
    {
      "page": "data_integrity_model",
      "title": "Check data integrity model",
      "topics": [
        "data_integrity_model"
      ]
    },
    {
      "page": "desc_groups",
      "title": "Profiling categorical variable",
      "topics": [
        "desc_groups"
      ]
    },
    {
      "page": "desc_groups_rank",
      "title": "Profiling categorical variable (rank)",
      "topics": [
        "desc_groups_rank"
      ]
    },
    {
      "page": "df_status",
      "title": "Get a summary for the given data frame (o vector).",
      "topics": [
        "df_status"
      ]
    },
    {
      "page": "discretize_df",
      "title": "Discretize a data frame",
      "topics": [
        "discretize_df"
      ]
    },
    {
      "page": "discretize_get_bins",
      "title": "Get the data frame thresholds for discretization",
      "topics": [
        "discretize_get_bins"
      ]
    },
    {
      "page": "discretize_rgr",
      "title": "Variable discretization by gain ratio maximization",
      "topics": [
        "discretize_rgr"
      ]
    },
    {
      "page": "entropy_2",
      "title": "Computes the entropy between two variables",
      "topics": [
        "entropy_2"
      ]
    },
    {
      "page": "equal_freq",
      "title": "Equal frequency binning",
      "topics": [
        "equal_freq"
      ]
    },
    {
      "page": "export_plot",
      "title": "Export plot to jpeg file",
      "topics": [
        "export_plot"
      ]
    },
    {
      "page": "fibonacci",
      "title": "Fibonacci series",
      "topics": [
        "fibonacci"
      ]
    },
    {
      "page": "freq",
      "title": "Frequency table for categorical variables",
      "topics": [
        "freq"
      ]
    },
    {
      "page": "gain_lift",
      "title": "Generates lift and cumulative gain performance table and plot",
      "topics": [
        "gain_lift"
      ]
    },
    {
      "page": "gain_ratio",
      "title": "Gain ratio",
      "topics": [
        "gain_ratio"
      ]
    },
    {
      "page": "get_sample",
      "title": "Sampling training and test data",
      "topics": [
        "get_sample"
      ]
    },
    {
      "page": "hampel_outlier",
      "title": "Hampel Outlier Threshold",
      "topics": [
        "hampel_outlier"
      ]
    },
    {
      "page": "heart_disease",
      "title": "Heart Disease Data",
      "topics": [
        "heart_disease"
      ]
    },
    {
      "page": "infor_magic",
      "title": "Computes several information theory metrics between two vectors",
      "topics": [
        "infor_magic"
      ]
    },
    {
      "page": "information_gain",
      "title": "Information gain",
      "topics": [
        "information_gain"
      ]
    },
    {
      "page": "metadata_models",
      "title": "Metadata models data integrity",
      "topics": [
        "metadata_models"
      ]
    },
    {
      "page": "plot_num",
      "title": "Plotting numerical data",
      "topics": [
        "plot_num"
      ]
    },
    {
      "page": "plotar",
      "title": "Correlation plots",
      "topics": [
        "plotar"
      ]
    },
    {
      "page": "prep_outliers",
      "title": "Outliers Data Preparation",
      "topics": [
        "prep_outliers"
      ]
    },
    {
      "page": "profiling_num",
      "title": "Profiling numerical data",
      "topics": [
        "profiling_num"
      ]
    },
    {
      "page": "range01",
      "title": "Transform a variable into the [0-1] range",
      "topics": [
        "range01"
      ]
    },
    {
      "page": "status",
      "title": "Get a summary for the given data frame (o vector).",
      "topics": [
        "status"
      ]
    },
    {
      "page": "tukey_outlier",
      "title": "Tukey Outlier Threshold",
      "topics": [
        "tukey_outlier"
      ]
    },
    {
      "page": "v_compare",
      "title": "Compare two vectors",
      "topics": [
        "v_compare"
      ]
    },
    {
      "page": "var_rank_info",
      "title": "Importance variable ranking based on information theory",
      "topics": [
        "var_rank_info"
      ]
    }
  ],
  "_readme": "https://github.com/pablo14/funmodeling/raw/HEAD/README.md",
  "_rundeps": [
    "backports",
    "base64enc",
    "bitops",
    "bslib",
    "cachem",
    "caTools",
    "checkmate",
    "cli",
    "cluster",
    "colorspace",
    "cpp11",
    "data.table",
    "digest",
    "dplyr",
    "entropy",
    "evaluate",
    "farver",
    "fastmap",
    "fontawesome",
    "foreign",
    "Formula",
    "fs",
    "generics",
    "ggplot2",
    "glue",
    "gplots",
    "gridExtra",
    "gtable",
    "gtools",
    "highr",
    "Hmisc",
    "htmlTable",
    "htmltools",
    "htmlwidgets",
    "isoband",
    "jquerylib",
    "jsonlite",
    "KernSmooth",
    "knitr",
    "labeling",
    "lifecycle",
    "magrittr",
    "memoise",
    "mime",
    "moments",
    "nnet",
    "pander",
    "pillar",
    "pkgconfig",
    "plyr",
    "R6",
    "rappdirs",
    "RColorBrewer",
    "Rcpp",
    "reshape2",
    "rlang",
    "rmarkdown",
    "ROCR",
    "rpart",
    "rstudioapi",
    "S7",
    "sass",
    "scales",
    "stringi",
    "stringr",
    "tibble",
    "tidyselect",
    "tinytex",
    "utf8",
    "vctrs",
    "viridisLite",
    "withr",
    "xfun",
    "yaml"
  ],
  "_vignettes": [
    {
      "source": "funModeling_quickstart.Rmd",
      "filename": "funModeling_quickstart.html",
      "title": "funModeling quick-start",
      "author": "Pablo Casas",
      "engine": "knitr::rmarkdown",
      "headings": [
        "funModeling quick-start",
        "Blog posts based on funModeling:",
        "Opening the black-box",
        "About this quick-start",
        "Exploratory data analysis",
        "status: Dataset health status (2nd version)",
        "data_integrity: Dataset health status (2nd version)",
        "plot_num: Plotting distributions for numerical variables",
        "profiling_num: Calculating several statistics for numerical variables",
        "freq: Getting frequency distributions for categoric variables",
        "Correlation",
        "correlation_table: Calculates R statistic",
        "var_rank_info: Correlation based on information theory",
        "cross_plot: Distribution plot between input and target variable",
        "plotar: Boxplot and density histogram between input and target variables",
        "categ_analysis: Quantitative analysis for binary outcome",
        "Data preparation",
        "Data discretization",
        "discretize_get_bins + discretize_df: Convert numeric variables to categoric",
        "equal_freq: Convert numeric variable to categoric",
        "discretize_rgr: Variable discretization based on gain ratio maximization",
        "range01: Scales variable into the 0 to 1 range",
        "Outliers data preparation",
        "hampel_outlier and  tukey_outlier: Gets outliers threshold",
        "prep_outliers: Prepare outliers in a data frame",
        "Predictive model performance",
        "gain_lift: Gain and lift performance curve",
        "coord_plot: Coordinate plot (clustering models)"
      ],
      "created": "2018-01-17 22:43:59",
      "modified": "2026-02-17 23:58:55",
      "commits": 15
    }
  ],
  "_score": 8.407546576663226,
  "_indexed": true,
  "_nocasepkg": "funmodeling",
  "_universes": [
    "pablo14"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.9.6",
      "date": "2026-05-19T05:59:27.000Z",
      "distro": "noble",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "a71681b3d093384657fb4e16e576e68bea10c3cf60f661ac15874506a0749f07",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "1.9.6",
      "date": "2026-05-19T05:59:16.000Z",
      "distro": "noble",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "4b743ebe26ab5745ee62e80561ce705bcc713e6012028d2e3690a1613ad9f57b",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "1.9.6",
      "date": "2026-05-19T05:59:35.000Z",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "b9011c3d12a12f1695be78cf9b8abc27fdb973c2bbf06cedec3340f288455256",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "1.9.6",
      "date": "2026-05-19T05:59:15.000Z",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "a637fe74a8a5d6afe1966c282c8cf60ea056c72dc0d2445adb496b13cbae8579",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "1.9.6",
      "date": "2026-05-19T05:58:31.000Z",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "5675c52ce629130738d9b2058bc969e90198ddc25eaf912269e0d76ed86abb0a",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "1.9.6",
      "date": "2026-05-19T05:58:17.000Z",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "adaeca98f589a4d17574e2f403d1be942f22ca94569a73d7ceb90586c17c935e",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "1.9.6",
      "date": "2026-05-19T05:58:23.000Z",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "e7df7083da3db3016e35737c30462f54b596d3e097115590ec5fbffc815005be",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.9.6",
      "date": "2026-06-02T15:37:15.000Z",
      "commit": "2f5ac63c8a8da17455aef2de8a625650462d1ab2",
      "fileid": "6fc6786dda7d8e79912ff8b0e7778b567ca75698c232bb86dc9afa26c80f94bf",
      "status": "success",
      "buildurl": "https://github.com/r-universe/pablo14/actions/runs/26079052405"
    }
  ]
}