{
  "_id": "6a4797e52f27a93436c0f88e",
  "Package": "textclean",
  "Title": "Text Cleaning Tools",
  "Version": "0.9.8",
  "Authors@R": "c( \nperson(\"Tyler\", \"Rinker\", email = \"tyler.rinker@gmail.com\", role = c(\"aut\", \"cre\")),\nperson(\"ctwheels\", \"StackOverflow\", role = \"ctb\"),\nperson(\"Surin\", \"Space\", role = \"ctb\")\n)",
  "Maintainer": "Tyler Rinker <tyler.rinker@gmail.com>",
  "Description": "Tools to clean and process text.  Tools are geared at\nchecking for substrings that are not optimal for analysis and\nreplacing or removing them (normalizing) with more analysis\nfriendly substrings (see Sproat, Black, Chen, Kumar, Ostendorf,\n& Richards (2001) <doi:10.1006/csla.2001.0169>) or extracting\nthem into new variables. For example, emoticons are often used\nin text but not always easily handled by analysis algorithms.\nThe replace_emoticon() function replaces emoticons with word\nequivalents.",
  "License": "GPL-2",
  "LazyData": "TRUE",
  "RoxygenNote": "7.3.3",
  "Encoding": "UTF-8",
  "URL": "https://github.com/trinker/textclean",
  "BugReports": "https://github.com/trinker/textclean/issues",
  "Collate": "'add_comma_space.R' 'add_missing_endmark.R' 'utils.R'\n'replace_html.R' 'check_text_logicals.R' 'check_text.R'\n'drop_element.R' 'drop_row.R' 'fgsub.R' 'fix_mdyyyy.R'\n'glue-reexports.R' 'has_endmark.R' 'like.R' 'make_plural.R'\n'match_tokens.R' 'mgsub.R' 'replace_contraction.R'\n'replace_date.R' 'replace_email.R' 'replace_emoji.R'\n'replace_emoticon.R' 'replace_grade.R' 'replace_hash.R'\n'replace_incomplete.R' 'replace_internet_slang.R'\n'replace_kerning.R' 'replace_misspelling.R' 'replace_money.R'\n'replace_names.R' 'replace_non_ascii.R' 'replace_number.R'\n'replace_ordinal.R' 'replace_rating.R' 'replace_symbol.R'\n'replace_tag.R' 'replace_time.R' 'replace_to.R'\n'replace_tokens.R' 'replace_url.R' 'replace_white.R'\n'replace_word_elongation.R' 'strip.R' 'sub_holder.R' 'swap.R'\n'textclean-package.R'",
  "Config/pak/sysreqs": "libicu-dev",
  "Repository": "https://trinker.r-universe.dev",
  "Date/Publication": "2026-03-05 04:56:58 UTC",
  "RemoteUrl": "https://github.com/trinker/textclean",
  "RemoteRef": "HEAD",
  "RemoteSha": "80a30ed4677900c976cc301b9c4f26069ca824fe",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-07-03 08:06:46 UTC",
    "User": "root"
  },
  "Author": "Tyler Rinker [aut, cre],\nctwheels StackOverflow [ctb],\nSurin Space [ctb]",
  "_user": "trinker",
  "_type": "src",
  "_file": "textclean_0.9.8.tar.gz",
  "_fileid": "https://r2.ropensci.org/7b934f59c5e739b2a97ee84ee95010df22d6edf9bf9057cfea3db4923ce91e74",
  "_filesize": 2175957,
  "_sha256": "7b934f59c5e739b2a97ee84ee95010df22d6edf9bf9057cfea3db4923ce91e74",
  "_expires": "2026-10-11T11:07:17.000Z",
  "_created": "2026-07-03T08:06:46.000Z",
  "_published": "2026-07-03T11:07:17.822Z",
  "_jobs": [
    {
      "job": 84986980801,
      "time": 139,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "8061231255"
    },
    {
      "job": 84986981068,
      "time": 133,
      "config": "linux-release-x86_64",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8061228961"
    },
    {
      "job": 84986980627,
      "time": 125,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "8061226318"
    },
    {
      "job": 84986980821,
      "time": 166,
      "config": "macos-release-arm64",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8061239950"
    },
    {
      "job": 84986980196,
      "time": 196,
      "config": "source",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8061183906"
    },
    {
      "job": 84986980746,
      "time": 151,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "8061234393"
    },
    {
      "job": 84986980717,
      "time": 94,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "8061216722"
    },
    {
      "job": 84986980922,
      "time": 92,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "8061216105"
    },
    {
      "job": 84986980992,
      "time": 93,
      "config": "windows-release",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8061216413"
    }
  ],
  "_host": "GitHub-Actions",
  "_buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814",
  "_status": "success",
  "_upstream": "https://github.com/trinker/textclean",
  "_commit": {
    "id": "80a30ed4677900c976cc301b9c4f26069ca824fe",
    "author": "Tyler Rinker <tyler.rinker@kangarootime.com>",
    "committer": "Tyler Rinker <tyler.rinker@kangarootime.com>",
    "message": "Fixing a number of cran warnings and errors.\n",
    "time": 1772686618
  },
  "_maintainer": {
    "name": "Tyler Rinker",
    "email": "tyler.rinker@gmail.com",
    "login": "trinker",
    "description": "Director, Data Scientist, open-source developer , #python/#rstats enthusiast, #dataviz geek, and #nlp buff",
    "uuid": 1763278
  },
  "_distro": "resolute",
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.4.0",
      "role": "Depends"
    },
    {
      "package": "data.table",
      "role": "Imports"
    },
    {
      "package": "english",
      "version": ">= 1.0-2",
      "role": "Imports"
    },
    {
      "package": "glue",
      "version": ">= 1.3.0",
      "role": "Imports"
    },
    {
      "package": "lexicon",
      "version": ">= 1.0.0",
      "role": "Imports"
    },
    {
      "package": "mgsub",
      "version": ">= 1.5.0",
      "role": "Imports"
    },
    {
      "package": "qdapRegex",
      "role": "Imports"
    },
    {
      "package": "stringi",
      "role": "Imports"
    },
    {
      "package": "textshape",
      "version": ">= 1.0.1",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "hunspell",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "role": "Suggests"
    }
  ],
  "_owner": "trinker",
  "_selfowned": true,
  "_usedby": 26,
  "_updates": [
    {
      "week": "2026-10",
      "n": 5
    }
  ],
  "_tags": [],
  "_topics": [
    "data-munging",
    "emoticons",
    "regex",
    "text-analysis",
    "text-cleaning"
  ],
  "_stars": 258,
  "_contributors": [
    {
      "user": "trinker",
      "count": 177,
      "uuid": 1763278
    },
    {
      "user": "tylerrinker-dev",
      "count": 4,
      "uuid": 237491193
    },
    {
      "user": "foehammer-419",
      "count": 2,
      "uuid": 44418830
    },
    {
      "user": "eliocamp",
      "count": 1,
      "uuid": 8617595
    },
    {
      "user": "kguidonimartins",
      "count": 1,
      "uuid": 8163542
    },
    {
      "user": "tonyelhabr",
      "count": 1,
      "uuid": 15663460
    }
  ],
  "_userbio": {
    "uuid": 1763278,
    "type": "user",
    "name": "Tyler Rinker",
    "followers": 623,
    "description": "Director, Data Scientist, open-source developer , #python/#rstats enthusiast, #dataviz geek, and #nlp buff"
  },
  "_downloads": {
    "count": 4639,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/textclean"
  },
  "_mentions": 1,
  "_devurl": "https://github.com/trinker/textclean",
  "_searchresults": 996,
  "_rbuild": "4.6.1",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/textclean.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/trinker/textclean",
  "_realowner": "trinker",
  "_cranurl": true,
  "_releases": [
    {
      "version": "0.2.0",
      "date": "2017-01-10"
    },
    {
      "version": "0.3.0",
      "date": "2017-01-25"
    },
    {
      "version": "0.3.1",
      "date": "2017-02-22"
    },
    {
      "version": "0.5.1",
      "date": "2017-12-12"
    },
    {
      "version": "0.6.3",
      "date": "2018-01-14"
    },
    {
      "version": "0.7.2",
      "date": "2018-04-19"
    },
    {
      "version": "0.7.3",
      "date": "2018-04-24"
    },
    {
      "version": "0.9.2",
      "date": "2018-06-09"
    },
    {
      "version": "0.9.3",
      "date": "2018-07-23"
    },
    {
      "version": "0.9.7",
      "date": "2026-03-05"
    }
  ],
  "_exports": [
    "%like%",
    "%LIKE%",
    "%slike%",
    "%SLIKE%",
    "add_comma_space",
    "add_missing_endmark",
    "as_ordinal",
    "available_checks",
    "check_text",
    "drop_element",
    "drop_element_fixed",
    "drop_element_regex",
    "drop_empty_row",
    "drop_NA",
    "drop_row",
    "fgsub",
    "fix_mdyyyy",
    "glue",
    "glue_collapse",
    "has_endmark",
    "is_it",
    "keep_element",
    "keep_element_fixed",
    "keep_element_regex",
    "keep_row",
    "make_plural",
    "match_tokens",
    "mgsub",
    "mgsub_fixed",
    "mgsub_regex",
    "mgsub_regex_safe",
    "replace_contraction",
    "replace_curly_quote",
    "replace_date",
    "replace_email",
    "replace_emoji",
    "replace_emoji_identifier",
    "replace_emoticon",
    "replace_from",
    "replace_grade",
    "replace_hash",
    "replace_html",
    "replace_incomplete",
    "replace_internet_slang",
    "replace_kern",
    "replace_misspelling",
    "replace_money",
    "replace_names",
    "replace_non_ascii",
    "replace_non_ascii2",
    "replace_number",
    "replace_ordinal",
    "replace_rating",
    "replace_symbol",
    "replace_tag",
    "replace_time",
    "replace_to",
    "replace_tokens",
    "replace_url",
    "replace_white",
    "replace_word_elongation",
    "strip",
    "sub_holder",
    "swap",
    "which_are"
  ],
  "_datasets": [
    {
      "name": "DATA",
      "title": "Fictitious Classroom Dialogue",
      "object": "DATA",
      "class": [
        "data.frame"
      ],
      "fields": [
        "person",
        "sex",
        "adult",
        "state",
        "code"
      ],
      "rows": 11,
      "table": true,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "like",
      "title": "SQL Style LIKE",
      "topics": [
        "%LIKE%",
        "%like%",
        "%SLIKE%",
        "%slike%"
      ]
    },
    {
      "page": "add_comma_space",
      "title": "Ensure Space After Comma",
      "topics": [
        "add_comma_space"
      ]
    },
    {
      "page": "add_missing_endmark",
      "title": "Add Missing Endmarks",
      "topics": [
        "add_missing_endmark"
      ]
    },
    {
      "page": "check_text",
      "title": "Check Text For Potential Problems",
      "topics": [
        "available_checks",
        "check_text"
      ]
    },
    {
      "page": "DATA",
      "title": "Fictitious Classroom Dialogue",
      "topics": [
        "DATA"
      ]
    },
    {
      "page": "drop_element",
      "title": "Filter Elements in a Vector",
      "topics": [
        "drop_element",
        "drop_element_fixed",
        "drop_element_regex",
        "keep_element",
        "keep_element_fixed",
        "keep_element_regex"
      ]
    },
    {
      "page": "drop_row",
      "title": "Filter Rows That Contain Markers",
      "topics": [
        "drop_empty_row",
        "drop_NA",
        "drop_row",
        "keep_row"
      ]
    },
    {
      "page": "fgsub",
      "title": "Replace a Regex with a Functional Operation on the Regex Match",
      "topics": [
        "fgsub"
      ]
    },
    {
      "page": "fix_mdyyyy",
      "title": "Coerce Character m/d/yyyy to Date",
      "topics": [
        "fix_mdyyyy"
      ]
    },
    {
      "page": "has_endmark",
      "title": "Test for Incomplete Sentences",
      "topics": [
        "has_endmark"
      ]
    },
    {
      "page": "make_plural",
      "title": "Make Plural (or Verb to Singular) Versions of Words",
      "topics": [
        "make_plural"
      ]
    },
    {
      "page": "match_tokens",
      "title": "Find Tokens that Match a Regex",
      "topics": [
        "match_tokens"
      ]
    },
    {
      "page": "mgsub",
      "title": "Multiple 'gsub'",
      "topics": [
        "mgsub",
        "mgsub_fixed",
        "mgsub_regex",
        "mgsub_regex_safe"
      ]
    },
    {
      "page": "print.check_text",
      "title": "Prints a check_text Object",
      "topics": [
        "print.check_text"
      ]
    },
    {
      "page": "print.sub_holder",
      "title": "Prints a sub_holder object",
      "topics": [
        "print.sub_holder"
      ]
    },
    {
      "page": "print.which_are_locs",
      "title": "Prints a which_are_locs Object",
      "topics": [
        "print.which_are_locs"
      ]
    },
    {
      "page": "replace_contraction",
      "title": "Replace Contractions",
      "topics": [
        "replace_contraction"
      ]
    },
    {
      "page": "replace_date",
      "title": "Replace Dates With Words",
      "topics": [
        "replace_date"
      ]
    },
    {
      "page": "replace_email",
      "title": "Replace Email Addresses",
      "topics": [
        "replace_email"
      ]
    },
    {
      "page": "replace_emoji",
      "title": "Replace Emojis With Words/Identifier",
      "topics": [
        "replace_emoji",
        "replace_emoji_identifier"
      ]
    },
    {
      "page": "replace_emoticon",
      "title": "Replace Emoticons With Words",
      "topics": [
        "replace_emoticon"
      ]
    },
    {
      "page": "replace_grade",
      "title": "Replace Grades With Words",
      "topics": [
        "replace_grade"
      ]
    },
    {
      "page": "replace_hash",
      "title": "Replace Hashes",
      "topics": [
        "replace_hash"
      ]
    },
    {
      "page": "replace_html",
      "title": "Replace HTML Markup",
      "topics": [
        "replace_html"
      ]
    },
    {
      "page": "replace_incomplete",
      "title": "Denote Incomplete End Marks With \"|\"",
      "topics": [
        "replace_incomplete"
      ]
    },
    {
      "page": "replace_internet_slang",
      "title": "Replace Internet Slang",
      "topics": [
        "replace_internet_slang"
      ]
    },
    {
      "page": "replace_kern",
      "title": "Replace Kerned (Spaced) with No Space Version",
      "topics": [
        "replace_kern"
      ]
    },
    {
      "page": "replace_misspelling",
      "title": "Replace Misspelled Words",
      "topics": [
        "replace_misspelling"
      ]
    },
    {
      "page": "replace_money",
      "title": "Replace Money With Words",
      "topics": [
        "replace_money"
      ]
    },
    {
      "page": "replace_names",
      "title": "Replace First/Last Names",
      "topics": [
        "replace_names"
      ]
    },
    {
      "page": "replace_non_ascii",
      "title": "Replace Common Non-ASCII Characters",
      "topics": [
        "replace_curly_quote",
        "replace_non_ascii",
        "replace_non_ascii2"
      ]
    },
    {
      "page": "replace_number",
      "title": "Replace Numbers With Text Representation",
      "topics": [
        "as_ordinal",
        "replace_number"
      ]
    },
    {
      "page": "replace_ordinal",
      "title": "Replace Mixed Ordinal Numbers With Text Representation",
      "topics": [
        "replace_ordinal"
      ]
    },
    {
      "page": "replace_rating",
      "title": "Replace Ratings With Words",
      "topics": [
        "replace_rating"
      ]
    },
    {
      "page": "replace_symbol",
      "title": "Replace Symbols With Word Equivalents",
      "topics": [
        "replace_symbol"
      ]
    },
    {
      "page": "replace_tag",
      "title": "Replace Handle Tags",
      "topics": [
        "replace_tag"
      ]
    },
    {
      "page": "replace_time",
      "title": "Replace Time Stamps With Words",
      "topics": [
        "replace_time"
      ]
    },
    {
      "page": "replace_to",
      "title": "Grab Begin/End of String to/from Character",
      "topics": [
        "replace_from",
        "replace_to"
      ]
    },
    {
      "page": "replace_tokens",
      "title": "Replace Tokens",
      "topics": [
        "replace_tokens"
      ]
    },
    {
      "page": "replace_url",
      "title": "Replace URLs",
      "topics": [
        "replace_url"
      ]
    },
    {
      "page": "replace_white",
      "title": "Remove White Space Characters",
      "topics": [
        "replace_white"
      ]
    },
    {
      "page": "replace_word_elongation",
      "title": "Replace Word Elongations",
      "topics": [
        "replace_word_elongation"
      ]
    },
    {
      "page": "strip",
      "title": "Strip Text",
      "topics": [
        "strip",
        "strip.character",
        "strip.default",
        "strip.factor",
        "strip.list"
      ]
    },
    {
      "page": "sub_holder",
      "title": "Hold the Place of Characters Prior to Subbing",
      "topics": [
        "sub_holder"
      ]
    },
    {
      "page": "swap",
      "title": "Swap Two Patterns Simultaneously",
      "topics": [
        "swap"
      ]
    },
    {
      "page": "which_are",
      "title": "Detect/Locate Potential Non-Normalized Text",
      "topics": [
        "is_it",
        "which_are"
      ]
    }
  ],
  "_readme": "https://github.com/trinker/textclean/raw/HEAD/README.md",
  "_rundeps": [
    "cli",
    "cpp11",
    "data.table",
    "dplyr",
    "dtt",
    "english",
    "generics",
    "glue",
    "lattice",
    "lexicon",
    "lifecycle",
    "magrittr",
    "mgsub",
    "NLP",
    "pillar",
    "pkgconfig",
    "purrr",
    "qdapRegex",
    "R6",
    "rlang",
    "slam",
    "stringi",
    "stringr",
    "syuzhet",
    "textshape",
    "tibble",
    "tidyr",
    "tidyselect",
    "utf8",
    "vctrs",
    "withr",
    "zoo"
  ],
  "_score": 10.366338028268206,
  "_indexed": true,
  "_nocasepkg": "textclean",
  "_universes": [
    "trinker"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.9.8",
      "date": "2026-07-03T08:09:07.000Z",
      "distro": "resolute",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/e981b52220764e9655a8f56c7c542a4bbb9e6a9c56fae85b14b3653ea573cae6",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    },
    {
      "r": "4.6.1",
      "os": "linux",
      "version": "0.9.8",
      "date": "2026-07-03T08:09:02.000Z",
      "distro": "resolute",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/bd5a30d7f8479268f93ac7389d44dcd158f9c5219af044c4e0c72ce1d785bc07",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.9.8",
      "date": "2026-07-03T08:08:46.000Z",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/a47a9320b51a9c00fd4371aea83ae2605b3f6350fe48a1f289daca18243059e1",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    },
    {
      "r": "4.6.1",
      "os": "mac",
      "version": "0.9.8",
      "date": "2026-07-03T08:09:22.000Z",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/3ad11962642155620bd93f910fe03260b62b7afa981cb61ab6d02f7bf5c6f23a",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.9.8",
      "date": "2026-07-03T08:09:36.000Z",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/f906b6860520084989da0156e36bcc1a0860408f6b494cd503a59bccf6d8de33",
      "status": "success",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.9.8",
      "date": "2026-07-03T08:08:09.000Z",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/a0df3723874f842d462c4e60f0f7b0e1535387bb8867807ee10114a1bda03972",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.9.8",
      "date": "2026-07-03T08:08:08.000Z",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/ff0afc71f952360774bebd0b56f5686e995f91153e7f48ed409178880322b083",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    },
    {
      "r": "4.6.1",
      "os": "win",
      "version": "0.9.8",
      "date": "2026-07-03T08:08:12.000Z",
      "commit": "80a30ed4677900c976cc301b9c4f26069ca824fe",
      "fileid": "https://r2.ropensci.org/3c350540f7ee43e1ddfe0bb0b2ee93343bd2ac4a7a3322af374c92a228ee845d",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/trinker/actions/runs/28647171814"
    }
  ]
}