{
  "_id": "6a1d3d4c1d7bb097a0a3fd69",
  "Package": "grafzahl",
  "Title": "Supervised Machine Learning for Textual Data Using Transformers\nand 'Quanteda'",
  "Version": "0.0.12",
  "Authors@R": "person(\"Chung-hong\", \"Chan\", , \"chainsawtiney@gmail.com\", role = c(\"aut\", \"cre\"),\ncomment = c(ORCID = \"0000-0002-6232-7530\"))",
  "Description": "Duct tape the 'quanteda' ecosystem (Benoit et al., 2018)\n<doi:10.21105/joss.00774> to modern Transformer-based text\nclassification models (Wolf et al., 2020)\n<doi:10.18653/v1/2020.emnlp-demos.6>, in order to facilitate\nsupervised machine learning for textual data. This package\nmimics the behaviors of 'quanteda.textmodels' and provides a\nfunction to setup the 'Python' environment to use the\npretrained models from 'Hugging Face'\n<https://huggingface.co/>. More information:\n<doi:10.5117/CCR2023.1.003.CHAN>.",
  "License": "GPL (>= 3)",
  "Encoding": "UTF-8",
  "Roxygen": "list(markdown = TRUE)",
  "RoxygenNote": "7.3.2",
  "URL": "https://gesistsa.github.io/grafzahl/,\nhttps://github.com/gesistsa/grafzahl",
  "BugReports": "https://github.com/gesistsa/grafzahl/issues",
  "Config/testthat/edition": "3",
  "LazyData": "true",
  "VignetteBuilder": "knitr",
  "Config/Needs/website": "gesistsa/tsatemplate",
  "Config/pak/sysreqs": "libicu-dev libpng-dev libxml2-dev python3",
  "Repository": "https://gesistsa.r-universe.dev",
  "Date/Publication": "2025-09-02 11:50:44 UTC",
  "RemoteUrl": "https://github.com/gesistsa/grafzahl",
  "RemoteRef": "HEAD",
  "RemoteSha": "904066193116b1e0646640d432a0c15a10da5c8d",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-06-01 08:01:52 UTC",
    "User": "root"
  },
  "Author": "Chung-hong Chan [aut, cre] (ORCID:\n<https://orcid.org/0000-0002-6232-7530>)",
  "Maintainer": "Chung-hong Chan <chainsawtiney@gmail.com>",
  "MD5sum": "31f50b5c0d4456af4ea3ca7be592fb2b",
  "_user": "gesistsa",
  "_type": "src",
  "_file": "grafzahl_0.0.12.tar.gz",
  "_fileid": "0a39aa4c804516d6730f023917f38dce42bdf5d06737c9b462af1b0dff3de556",
  "_filesize": 997990,
  "_sha256": "0a39aa4c804516d6730f023917f38dce42bdf5d06737c9b462af1b0dff3de556",
  "_created": "2026-06-01T08:01:52.000Z",
  "_published": "2026-06-01T08:05:32.494Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 78810341093,
      "time": 183,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7326320711"
    },
    {
      "job": 78810341181,
      "time": 164,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7326315437"
    },
    {
      "job": 78810341145,
      "time": 110,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7326297770"
    },
    {
      "job": 78810341125,
      "time": 129,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7326303580"
    },
    {
      "job": 78809846232,
      "time": 196,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7326261801"
    },
    {
      "job": 78810341147,
      "time": 121,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7326301464"
    },
    {
      "job": 78810341225,
      "time": 122,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7326302199"
    },
    {
      "job": 78810341194,
      "time": 97,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7326293516"
    },
    {
      "job": 78810341233,
      "time": 77,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7326286850"
    }
  ],
  "_buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/gesistsa/grafzahl",
  "_commit": {
    "id": "904066193116b1e0646640d432a0c15a10da5c8d",
    "author": "Arthur Mühl <arthur.muehl@gesis.org>",
    "committer": "GitHub <noreply@github.com>",
    "message": "Update methodshub.qmd (#46)\n\nRemoving an outdated section, that does not need to be in the methodshub.qmd-file anymore to prepare for the methods hub launch.",
    "time": 1756813844
  },
  "_maintainer": {
    "name": "Chung-hong Chan",
    "email": "chainsawtiney@gmail.com",
    "login": "chainsawriot",
    "orcid": "0000-0002-6232-7530",
    "description": "",
    "uuid": 637269
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.5",
      "role": "Depends"
    },
    {
      "package": "jsonlite",
      "role": "Imports"
    },
    {
      "package": "lime",
      "role": "Imports"
    },
    {
      "package": "quanteda",
      "role": "Imports"
    },
    {
      "package": "reticulate",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "stats",
      "role": "Imports"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "quanteda.textmodels",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "version": ">= 3.0.0",
      "role": "Suggests"
    },
    {
      "package": "withr",
      "role": "Suggests"
    }
  ],
  "_owner": "gesistsa",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2025-25",
      "n": 1
    },
    {
      "week": "2025-32",
      "n": 1
    },
    {
      "week": "2025-33",
      "n": 1
    },
    {
      "week": "2025-36",
      "n": 1
    }
  ],
  "_tags": [],
  "_stars": 43,
  "_contributors": [
    {
      "user": "chainsawriot",
      "count": 109,
      "uuid": 637269
    },
    {
      "user": "arthurmuehl",
      "count": 3,
      "uuid": 223466305
    },
    {
      "user": "bachl",
      "count": 2,
      "uuid": 6176704
    }
  ],
  "_userbio": {
    "uuid": 143654576,
    "type": "organization",
    "name": "Transparent Social Analytics",
    "description": "Open Science Tools and more maintained by Transparent Social Analytics Team, GESIS"
  },
  "_downloads": {
    "count": 176,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/grafzahl"
  },
  "_devurl": "https://github.com/gesistsa/grafzahl",
  "_pkgdown": "https://gesistsa.github.io/grafzahl/",
  "_searchresults": 5,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/grafzahl.html",
    "extra/readme.html",
    "extra/readme.md",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/gesistsa/grafzahl",
  "_realowner": "gesistsa",
  "_cranurl": true,
  "_releases": [
    {
      "version": "0.0.5",
      "date": "2023-01-20"
    },
    {
      "version": "0.0.8",
      "date": "2023-04-12"
    },
    {
      "version": "0.0.11",
      "date": "2024-03-26"
    },
    {
      "version": "0.0.12",
      "date": "2025-06-18"
    }
  ],
  "_exports": [
    "detect_conda",
    "detect_cuda",
    "get_amharic_data",
    "grafzahl",
    "hydrate",
    "setup_grafzahl",
    "textmodel_transformer",
    "use_nonconda"
  ],
  "_datasets": [
    {
      "name": "ecosent",
      "title": "A Corpus Of Dutch News Headlines",
      "object": "ecosent",
      "class": [
        "data.frame"
      ],
      "fields": [
        "id",
        "headline",
        "value",
        "gold"
      ],
      "rows": 6322,
      "table": true,
      "tojson": true
    },
    {
      "name": "supported_model_types",
      "title": "Supported model types",
      "object": "supported_model_types",
      "class": [
        "character"
      ],
      "fields": [],
      "table": false,
      "tojson": true
    },
    {
      "name": "unciviltweets",
      "title": "A Corpus Of Tweets With Incivility Labels",
      "object": "unciviltweets",
      "class": [
        "corpus",
        "character"
      ],
      "fields": [],
      "table": false,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "detect_cuda",
      "title": "Detecting Miniconda And Cuda",
      "topics": [
        "detect_conda",
        "detect_cuda"
      ]
    },
    {
      "page": "ecosent",
      "title": "A Corpus Of Dutch News Headlines",
      "topics": [
        "ecosent"
      ]
    },
    {
      "page": "get_amharic_data",
      "title": "Download The Amharic News Text Classification Dataset",
      "topics": [
        "get_amharic_data"
      ]
    },
    {
      "page": "grafzahl",
      "title": "Fine tune a pretrained Transformer model for texts",
      "topics": [
        "grafzahl",
        "grafzahl.character",
        "grafzahl.corpus",
        "grafzahl.default",
        "textmodel_transformer"
      ]
    },
    {
      "page": "hydrate",
      "title": "Create a grafzahl S3 object from the output_dir",
      "topics": [
        "hydrate"
      ]
    },
    {
      "page": "predict.grafzahl",
      "title": "Prediction from a fine-tuned grafzahl object",
      "topics": [
        "predict.grafzahl"
      ]
    },
    {
      "page": "setup_grafzahl",
      "title": "Setup grafzahl",
      "topics": [
        "setup_grafzahl"
      ]
    },
    {
      "page": "supported_model_types",
      "title": "Supported model types",
      "topics": [
        "supported_model_types"
      ]
    },
    {
      "page": "unciviltweets",
      "title": "A Corpus Of Tweets With Incivility Labels",
      "topics": [
        "unciviltweets"
      ]
    },
    {
      "page": "use_nonconda",
      "title": "Set up grafzahl to be used on Google Colab or similar environments",
      "topics": [
        "use_nonconda"
      ]
    }
  ],
  "_readme": "https://github.com/gesistsa/grafzahl/raw/HEAD/README.md",
  "_rundeps": [
    "assertthat",
    "cli",
    "codetools",
    "cpp11",
    "farver",
    "fastmatch",
    "foreach",
    "ggplot2",
    "glmnet",
    "glue",
    "gower",
    "gtable",
    "here",
    "isoband",
    "ISOcodes",
    "iterators",
    "jsonlite",
    "labeling",
    "lattice",
    "lifecycle",
    "lime",
    "magrittr",
    "Matrix",
    "png",
    "quanteda",
    "R6",
    "rappdirs",
    "RColorBrewer",
    "Rcpp",
    "RcppEigen",
    "RcppTOML",
    "reticulate",
    "rlang",
    "rprojroot",
    "S7",
    "scales",
    "shape",
    "SnowballC",
    "stopwords",
    "stringi",
    "survival",
    "vctrs",
    "viridisLite",
    "withr",
    "xml2",
    "yaml"
  ],
  "_vignettes": [
    {
      "source": "grafzahl.Rmd",
      "filename": "grafzahl.html",
      "title": "Setup Guide",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Google Colab and similar services",
        "Default Python",
        "Use conda, but not the grafzahl's default",
        "With Cuda",
        "Without Cuda",
        "Explanation: Important options and envvars"
      ],
      "created": "2024-03-25 09:17:41",
      "modified": "2024-03-25 09:17:41",
      "commits": 1
    }
  ],
  "_score": 6.235528446907549,
  "_indexed": true,
  "_nocasepkg": "grafzahl",
  "_universes": [
    "gesistsa",
    "chainsawriot"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.0.12",
      "date": "2026-06-01T08:04:30.000Z",
      "distro": "noble",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "8a2f1b11519cc9764753ff21d3bd7b57e5d6a5f14305b6a73e548e9d519d85bb",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.0.12",
      "date": "2026-06-01T08:04:13.000Z",
      "distro": "noble",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "59f08db86bf6d332dc1ac95fcb41930fa68a62e540140c08aa3fa65afb2bf4ef",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.0.12",
      "date": "2026-06-01T08:03:34.000Z",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "05ab1e6d041724521526c68374eafdf835b5fa22494daca30c5149a30371d520",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.0.12",
      "date": "2026-06-01T08:03:42.000Z",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "777c5a1840e51c7de4f764367be4715977a0a8e1f9e92800ae4cc45bc5714bed",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.0.12",
      "date": "2026-06-01T08:04:12.000Z",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "b414b7e3872907469b5ce51d312837386ac6a788b42acd062370a5c7b933afda",
      "status": "success",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.0.12",
      "date": "2026-06-01T08:03:27.000Z",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "23f7e07a07d7cf56eee06e8b7c9750a8431c6ed5f1f8466ea276858503f1ef4c",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.0.12",
      "date": "2026-06-01T08:03:07.000Z",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "0f55f6466dc3107cd03a2aed6ff340eccd5c12ea12cf1442e360daa76a0721b9",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.0.12",
      "date": "2026-06-01T08:02:58.000Z",
      "commit": "904066193116b1e0646640d432a0c15a10da5c8d",
      "fileid": "ae44556c65472a934c9f3af0feaa425bd99c4dc638eef9916dda8669969ad3d7",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/gesistsa/actions/runs/26742537427"
    }
  ]
}