{
  "_id": "6a3a52466265ec60d620eeab",
  "Package": "llmclean",
  "Type": "Package",
  "Title": "LLM-Assisted Data Cleaning with Multi-Provider Support",
  "Version": "0.1.1",
  "Date": "2026-06-01",
  "Authors@R": "c(\nperson(\"Sadikul\", \"Islam\",\nemail   = \"sadikul.islamiasri@gmail.com\",\nrole    = c(\"aut\", \"cre\"),\ncomment = c(ORCID = \"0000-0003-2924-7122\")),\nperson(\"Rajesh\", \"Kaushal\",\nrole    = \"aut\"))",
  "Maintainer": "Sadikul Islam <sadikul.islamiasri@gmail.com>",
  "Description": "Detects and suggests fixes for semantic inconsistencies in\ndata frames by calling large language models (LLMs) through a\nunified, provider-agnostic interface. Supported providers\ninclude 'OpenAI' ('GPT-4o', 'GPT-4o-mini')\n<https://platform.openai.com>, 'Anthropic' ('Claude')\n<https://www.anthropic.com>, 'Google' ('Gemini')\n<https://ai.google.dev>, 'Groq' (free-tier 'LLaMA' and\n'Mixtral') <https://groq.com>, and local 'Ollama' models\n<https://ollama.com>. The package identifies issues that\nrule-based tools cannot detect: abbreviation variants,\ntypographic errors, case inconsistencies, and malformed values.\nResults are returned as tidy data frames with column, row\nindex, detected value, issue type, suggested fix, and\nconfidence score. An offline fallback using statistical and\nfuzzy-matching methods is provided for use without any\napplication programming interface (API) key. Interactive fix\napplication with human review is supported via 'apply_fixes()'.\nMethods follow de Jonge and van der Loo (2013)\n<https://cran.r-project.org/doc/contrib/de_Jonge+van_der_Loo-Introduction_to_data_cleaning_with_R.pdf>\nand Chaudhuri et al. (2003) <doi:10.1145/872757.872796>.",
  "License": "GPL-3",
  "VignetteBuilder": "knitr",
  "Encoding": "UTF-8",
  "LazyData": "true",
  "RoxygenNote": "7.3.3",
  "Config/testthat/edition": "3",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-06-23 09:26:50 UTC",
    "User": "root"
  },
  "Author": "Sadikul Islam [aut, cre] (ORCID:\n<https://orcid.org/0000-0003-2924-7122>), Rajesh Kaushal [aut]",
  "Repository": "https://sadikulislamiasri-hub.r-universe.dev",
  "Date/Publication": "2026-06-09 15:30:34 UTC",
  "RemoteUrl": "https://github.com/cran/llmclean",
  "RemoteRef": "HEAD",
  "RemoteSha": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
  "MD5sum": "f8b8ca257206efcb578f045c296cc147",
  "_user": "sadikulislamiasri-hub",
  "_type": "src",
  "_file": "llmclean_0.1.1.tar.gz",
  "_fileid": "86a74bebf9b00a6ae0d508eefa83dd7e7bca92c32da17ad917bdbb425b43565a",
  "_filesize": 205526,
  "_sha256": "86a74bebf9b00a6ae0d508eefa83dd7e7bca92c32da17ad917bdbb425b43565a",
  "_created": "2026-06-23T09:26:50.000Z",
  "_published": "2026-06-23T09:30:46.017Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 82921313594,
      "time": 131,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7816815122"
    },
    {
      "job": 82921313585,
      "time": 121,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7816811879"
    },
    {
      "job": 82921313623,
      "time": 207,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7816837851"
    },
    {
      "job": 82921313575,
      "time": 122,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7816805824"
    },
    {
      "job": 82920781804,
      "time": 164,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7816763072"
    },
    {
      "job": 82921313565,
      "time": 109,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7816806980"
    },
    {
      "job": 82921313599,
      "time": 114,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7816809220"
    },
    {
      "job": 82921313601,
      "time": 138,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7816818965"
    },
    {
      "job": 82921313586,
      "time": 111,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7816807554"
    }
  ],
  "_buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/cran/llmclean",
  "_commit": {
    "id": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
    "author": "Sadikul Islam <sadikul.islamiasri@gmail.com>",
    "committer": "cran-robot <csardi.gabor+cran@gmail.com>",
    "message": "version 0.1.1\n",
    "time": 1781019034
  },
  "_maintainer": {
    "name": "Sadikul Islam",
    "email": "sadikul.islamiasri@gmail.com",
    "login": "sadikulislamiasri-hub",
    "description": "",
    "uuid": 295794536,
    "orcid": "0000-0003-2924-7122"
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 4.1.0",
      "role": "Depends"
    },
    {
      "package": "stats",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "dplyr",
      "version": ">= 1.0.0",
      "role": "Imports"
    },
    {
      "package": "rlang",
      "version": ">= 1.0.0",
      "role": "Imports"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "version": ">= 3.0.0",
      "role": "Suggests"
    },
    {
      "package": "httr2",
      "version": ">= 1.0.0",
      "role": "Suggests"
    },
    {
      "package": "jsonlite",
      "version": ">= 1.8.0",
      "role": "Suggests"
    }
  ],
  "_owner": "cran",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2026-17",
      "n": 1
    },
    {
      "week": "2026-24",
      "n": 1
    }
  ],
  "_tags": [
    {
      "name": "0.1.0",
      "date": "2026-04-22"
    },
    {
      "name": "0.1.1",
      "date": "2026-06-09"
    }
  ],
  "_stars": 0,
  "_contributors": [
    {
      "user": "sadikulislamiasri-hub",
      "count": 2,
      "uuid": 295794536
    }
  ],
  "_userbio": {
    "uuid": 295794536,
    "type": "user",
    "name": "sadikulislamiasri-hub",
    "followers": 0
  },
  "_downloads": {
    "count": 382,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/llmclean"
  },
  "_searchresults": 0,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/llmclean.html",
    "manual.pdf"
  ],
  "_realowner": "sadikulislamiasri-hub",
  "_cranurl": false,
  "_releases": [
    {
      "version": "0.1.0",
      "date": "2026-04-22"
    },
    {
      "version": "0.1.1",
      "date": "2026-06-09"
    }
  ],
  "_exports": [
    "apply_fixes",
    "detect_issues",
    "get_llm_provider",
    "llmclean_report",
    "offline_detect",
    "set_llm_provider",
    "suggest_fixes"
  ],
  "_datasets": [
    {
      "name": "messy_employees",
      "title": "Hypothetical Messy Employee Records Dataset",
      "object": "messy_employees",
      "class": [
        "data.frame"
      ],
      "fields": [
        "emp_id",
        "name",
        "department",
        "email",
        "age",
        "salary",
        "status",
        "hire_date"
      ],
      "rows": 20,
      "table": true,
      "tojson": true
    },
    {
      "name": "messy_survey",
      "title": "Hypothetical Messy Survey Response Dataset",
      "object": "messy_survey",
      "class": [
        "data.frame"
      ],
      "fields": [
        "respondent_id",
        "country",
        "satisfaction",
        "age_group",
        "income_usd"
      ],
      "rows": 15,
      "table": true,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "llmclean-package",
      "title": "llmclean: LLM-Assisted Data Cleaning with Multi-Provider Support",
      "topics": [
        "llmclean-package",
        "llmclean"
      ]
    },
    {
      "page": "apply_fixes",
      "title": "Apply Suggested Fixes to a Data Frame",
      "topics": [
        "apply_fixes"
      ]
    },
    {
      "page": "detect_issues",
      "title": "Detect Semantic Inconsistencies in a Data Frame Using an LLM",
      "topics": [
        "detect_issues"
      ]
    },
    {
      "page": "get_llm_provider",
      "title": "Get Current LLM Provider Configuration",
      "topics": [
        "get_llm_provider"
      ]
    },
    {
      "page": "llmclean_report",
      "title": "Generate a Summary Report of LLM-Assisted Data Cleaning",
      "topics": [
        "llmclean_report"
      ]
    },
    {
      "page": "messy_employees",
      "title": "Hypothetical Messy Employee Records Dataset",
      "topics": [
        "messy_employees"
      ]
    },
    {
      "page": "messy_survey",
      "title": "Hypothetical Messy Survey Response Dataset",
      "topics": [
        "messy_survey"
      ]
    },
    {
      "page": "offline_detect",
      "title": "Offline Detection of Data Inconsistencies Without an LLM",
      "topics": [
        "offline_detect"
      ]
    },
    {
      "page": "set_llm_provider",
      "title": "Configure the LLM Provider for Data Cleaning",
      "topics": [
        "set_llm_provider"
      ]
    },
    {
      "page": "suggest_fixes",
      "title": "Request Enriched Fix Suggestions for Detected Issues",
      "topics": [
        "suggest_fixes"
      ]
    }
  ],
  "_rundeps": [
    "cli",
    "dplyr",
    "generics",
    "glue",
    "lifecycle",
    "magrittr",
    "pillar",
    "pkgconfig",
    "R6",
    "rlang",
    "tibble",
    "tidyselect",
    "utf8",
    "vctrs",
    "withr"
  ],
  "_vignettes": [
    {
      "source": "llmclean-intro.Rmd",
      "filename": "llmclean-intro.html",
      "title": "LLM-Assisted Data Cleaning with llmclean",
      "author": "Sadikul Islam",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Supported Providers",
        "Quick Start",
        "Step 1 — Configure the provider",
        "Step 2 — Inspect the built-in messy datasets",
        "Stage 1 — Detect Issues",
        "Issue type breakdown",
        "Case inconsistencies",
        "Typos and near-duplicates (Levenshtein)",
        "Malformed email addresses",
        "Numeric outliers (Tukey outer fence)",
        "Stage 2 — Suggest Fixes",
        "Stage 3 — Apply Fixes",
        "Dry run mode",
        "Stage 4 — Offline Detection (No API Key)",
        "Stage 5 — Summary Report",
        "Complete Workflow (One Pipeline)",
        "API Key Storage Best Practice",
        "Session Information",
        "References"
      ],
      "created": "2026-04-22 14:14:02",
      "modified": "2026-04-22 14:14:02",
      "commits": 1
    }
  ],
  "_score": 2.3010299956639813,
  "_indexed": true,
  "_nocasepkg": "llmclean",
  "_universes": [
    "sadikulislamiasri-hub"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.1.1",
      "date": "2026-06-23T09:28:52.000Z",
      "distro": "noble",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "1ffc5e40e6b5c96d621dd62b7991db8fa3005fb0d59ecd82ab95bf050a60092a",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.1.1",
      "date": "2026-06-23T09:28:47.000Z",
      "distro": "noble",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "779ca707e3edd10dad09c5559125f3598f8daca714c54e788720cb6ceae577e3",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.1.1",
      "date": "2026-06-23T09:29:53.000Z",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "37cf03371024d9a5b7e64cf2ffccad3a698964a9001605c91276d3a0681ec425",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.1.1",
      "date": "2026-06-23T09:28:36.000Z",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "e95596afcb6dd79df682ee883523563a9f16c094b971b728759e6f9b087853fe",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.1.1",
      "date": "2026-06-23T09:28:53.000Z",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "dc19fb64bc611c9f3f0810b9915581c711b7bf2bcd81e08bb730d8ee93ba5b2a",
      "status": "success",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.1.1",
      "date": "2026-06-23T09:28:32.000Z",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "74cf7bf4450a01ad8bbc55d2170c509a14ff9049b096057e0c1724ba4d917c20",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.1.1",
      "date": "2026-06-23T09:28:59.000Z",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "0cf9f33afdf3e7e59afa5d9a073109b6a503297c256f399e53feefabe4e94474",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.1.1",
      "date": "2026-06-23T09:28:31.000Z",
      "commit": "03c9478b9ff1f61b55ad539f936e09675ec728b3",
      "fileid": "e62bc1374a9a64c81b62d079bd8949ad71a0d793aac10034225dcd1fef511eab",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/sadikulislamiasri-hub/actions/runs/28016115268"
    }
  ]
}