{
  "_id": "6a2e70d53efcd9bda4313e6a",
  "Package": "mallet",
  "Type": "Package",
  "Title": "An R Wrapper for the Java Mallet Topic Modeling Toolkit",
  "Version": "1.3.0",
  "Date": "2022-07-19",
  "Authors@R": "c(\nperson(\"Måns\", \"Magnusson\", email = \"mons.magnusson@gmail.com\", role = c(\"cre\", \"aut\"),\ncomment = c(ORCID = \"0000-0002-0296-2719\")),\nperson(\"David\", \"Mimno\", role = c(\"aut\", \"cph\"),\ncomment = c(ORCID = \"0000-0001-7510-9404\"))\n)",
  "Maintainer": "Måns Magnusson <mons.magnusson@gmail.com>",
  "Description": "An R interface for the Java Machine Learning for Language\nToolkit (mallet) <http://mallet.cs.umass.edu/> to estimate\nprobabilistic topic models, such as Latent Dirichlet\nAllocation. We can use the R package to read textual data into\nmallet from R objects, run the Java implementation of mallet\ndirectly in R, and extract results as R objects. The Mallet\ntoolkit has many functions, this wrapper focuses on the topic\nmodeling sub-package written by David Mimno. The package uses\nthe rJava package to connect to a JVM.",
  "License": "MIT + file LICENSE",
  "URL": "https://github.com/mimno/RMallet",
  "BugReports": "https://github.com/mimno/RMallet/issues",
  "SystemRequirements": "java",
  "Encoding": "UTF-8",
  "VignetteBuilder": "rmarkdown, knitr",
  "RoxygenNote": "7.2.0",
  "LazyData": "TRUE",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-06-14 09:10:59 UTC",
    "User": "root"
  },
  "Author": "Måns Magnusson [cre, aut]\n(<https://orcid.org/0000-0002-0296-2719>), David Mimno [aut,\ncph] (<https://orcid.org/0000-0001-7510-9404>)",
  "Config/pak/sysreqs": "default-jdk",
  "Repository": "https://cran.r-universe.dev",
  "Date/Publication": "2022-07-20 14:50:05 UTC",
  "RemoteUrl": "https://github.com/cran/mallet",
  "RemoteRef": "HEAD",
  "RemoteSha": "41b08030341198b4ce78a347f548f407ccfb62c2",
  "MD5sum": "4711f9979e64b7bd066b1200c8dc6334",
  "_user": "cran",
  "_type": "src",
  "_file": "mallet_1.3.0.tar.gz",
  "_fileid": "655c1a09dc79e1a8cd49ede32997623a6e22d47d42598d280ef85e73b24d5477",
  "_filesize": 4027734,
  "_sha256": "655c1a09dc79e1a8cd49ede32997623a6e22d47d42598d280ef85e73b24d5477",
  "_created": "2026-06-14T09:10:59.000Z",
  "_published": "2026-06-14T09:13:57.650Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 81265209945,
      "time": 140,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7619518337"
    },
    {
      "job": 81265209939,
      "time": 133,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7619517460"
    },
    {
      "job": 81264997633,
      "time": 181,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7619498076"
    },
    {
      "job": 81265209935,
      "time": 116,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7619514733"
    }
  ],
  "_buildurl": "https://github.com/r-universe/cran/actions/runs/27494156793",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/cran/mallet",
  "_commit": {
    "id": "41b08030341198b4ce78a347f548f407ccfb62c2",
    "author": "Måns Magnusson <mons.magnusson@gmail.com>",
    "committer": "cran-robot <csardi.gabor+cran@gmail.com>",
    "message": "version 1.3.0\n",
    "time": 1658328605
  },
  "_maintainer": {
    "name": "Måns Magnusson",
    "email": "mons.magnusson@gmail.com",
    "login": "mansmeg",
    "description": "",
    "uuid": 2458198,
    "orcid": "0000-0002-0296-2719"
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.6.3",
      "role": "Depends"
    },
    {
      "package": "rJava",
      "role": "Imports"
    },
    {
      "package": "checkmate",
      "role": "Imports"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "dplyr",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "role": "Suggests"
    }
  ],
  "_owner": "cran",
  "_selfowned": false,
  "_usedby": 0,
  "_updates": [],
  "_tags": [],
  "_stars": 0,
  "_contributors": [
    {
      "user": "mimno",
      "count": 1,
      "uuid": 2292538
    },
    {
      "user": "mansmeg",
      "count": 1,
      "uuid": 2458198
    }
  ],
  "_userbio": {
    "uuid": 6899542,
    "type": "organization",
    "name": "cran",
    "followers": 606,
    "description": "Unofficial read-only mirror of all CRAN R packages"
  },
  "_downloads": {
    "count": 5107,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/mallet"
  },
  "_mentions": 2,
  "_devurl": "https://github.com/mimno/rmallet",
  "_searchresults": 167,
  "_topics": [
    "openjdk"
  ],
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/mallet.html",
    "LICENSE",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/mimno/rmallet",
  "_realowner": "mimno",
  "_cranurl": false,
  "_releases": [
    {
      "version": "1.0",
      "date": "2013-08-09"
    },
    {
      "version": "1.3.0",
      "date": "2022-07-20"
    }
  ],
  "_exports": [
    "load.mallet.instances",
    "load.mallet.state",
    "mallet_jar",
    "mallet_stoplist_file_path",
    "mallet_supported_stoplists",
    "mallet.doc.topics",
    "mallet.import",
    "mallet.jar",
    "mallet.read.dir",
    "mallet.stoplist.file.path",
    "mallet.subset.topic.words",
    "mallet.supported.stoplists",
    "mallet.top.words",
    "mallet.topic.hclust",
    "mallet.topic.labels",
    "mallet.topic.model.load",
    "mallet.topic.model.read",
    "mallet.topic.model.save",
    "mallet.topic.model.write",
    "mallet.topic.words",
    "mallet.word.freqs",
    "MalletLDA",
    "save.mallet.instances",
    "save.mallet.state"
  ],
  "_datasets": [
    {
      "name": "sotu",
      "title": "State of the Union Adresses.",
      "object": "sotu",
      "class": [
        "data.frame"
      ],
      "fields": [
        "year",
        "paragraph",
        "text"
      ],
      "rows": 6816,
      "table": true,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "mallet-package",
      "title": "An R Wrapper for the Java Mallet Topic Modeling Toolkit",
      "topics": [
        "mallet-package"
      ]
    },
    {
      "page": "load.mallet.state",
      "title": "Load a Mallet state into Mallet",
      "topics": [
        "load.mallet.state"
      ]
    },
    {
      "page": "mallet_jar",
      "title": "Return the mallet jar filename(s)",
      "topics": [
        "mallet.jar",
        "mallet_jar"
      ]
    },
    {
      "page": "mallet_stoplist_file_path",
      "title": "Return the file path to the mallet stoplists",
      "topics": [
        "mallet.stoplist.file.path",
        "mallet_stoplist_file_path"
      ]
    },
    {
      "page": "mallet_supported_stoplists",
      "title": "Mallet supported stoplists",
      "topics": [
        "mallet.supported.stoplists",
        "mallet_supported_stoplists"
      ]
    },
    {
      "page": "mallet.doc.topics",
      "title": "Retrieve a matrix of topic weights for every document",
      "topics": [
        "mallet.doc.topics"
      ]
    },
    {
      "page": "mallet.import",
      "title": "Import text documents into Mallet format",
      "topics": [
        "mallet.import"
      ]
    },
    {
      "page": "mallet.read.dir",
      "title": "Import documents from a directory into Mallet format",
      "topics": [
        "mallet.read.dir"
      ]
    },
    {
      "page": "mallet.subset.topic.words",
      "title": "Estimate topic-word distributions from a sub-corpus",
      "topics": [
        "mallet.subset.topic.words"
      ]
    },
    {
      "page": "mallet.top.words",
      "title": "Get the most probable words and their probabilities for one topic",
      "topics": [
        "mallet.top.words"
      ]
    },
    {
      "page": "mallet.topic.hclust",
      "title": "Return a hierarchical clustering of topics",
      "topics": [
        "mallet.topic.hclust"
      ]
    },
    {
      "page": "mallet.topic.labels",
      "title": "Get strings containing the most probable words for each topic",
      "topics": [
        "mallet.topic.labels"
      ]
    },
    {
      "page": "mallet.topic.model.read",
      "title": "Load (read) and save (write) a topic from a file",
      "topics": [
        "mallet.topic.model.load",
        "mallet.topic.model.read",
        "mallet.topic.model.save",
        "mallet.topic.model.write"
      ]
    },
    {
      "page": "mallet.topic.words",
      "title": "Retrieve a matrix of words weights for topics",
      "topics": [
        "mallet.topic.words"
      ]
    },
    {
      "page": "mallet.word.freqs",
      "title": "Descriptive statistics of word frequencies",
      "topics": [
        "mallet.word.freqs"
      ]
    },
    {
      "page": "MalletLDA",
      "title": "Create a Mallet topic model trainer",
      "topics": [
        "MalletLDA"
      ]
    },
    {
      "page": "save.mallet.instances",
      "title": "Load and save mallet instances from/to file",
      "topics": [
        "load.mallet.instances",
        "save.mallet.instances"
      ]
    },
    {
      "page": "save.mallet.state",
      "title": "Save a Mallet state to file",
      "topics": [
        "save.mallet.state"
      ]
    },
    {
      "page": "sotu",
      "title": "State of the Union Adresses.",
      "topics": [
        "sotu"
      ]
    }
  ],
  "_rundeps": [
    "backports",
    "checkmate",
    "rJava"
  ],
  "_sysdeps": [
    {
      "shlib": "libjvm",
      "package": "openjdk-21-jre-headless",
      "headers": "openjdk-21-jre-headless",
      "source": "openjdk",
      "version": "21.0.11+10-1~24.04.2",
      "name": "openjdk",
      "homepage": "https://openjdk.java.net/",
      "description": "OpenJDK Java runtime, using Hotspot JIT (headless)"
    }
  ],
  "_vignettes": [
    {
      "source": "mallet.Rmd",
      "filename": "mallet.html",
      "title": "Introduction to R mallet",
      "author": "David Mimno and Måns Magnusson",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Installation",
        "Usage",
        "Reading data into R",
        "Training topic models",
        "Analysis of a topic model",
        "Save and load topic states",
        "Save and load topic models"
      ],
      "created": "2022-07-20 14:50:05",
      "modified": "2022-07-20 14:50:05",
      "commits": 1
    }
  ],
  "_score": 4.231912324667104,
  "_indexed": false,
  "_nocasepkg": "mallet",
  "_universes": [
    "cran"
  ],
  "_indexurl": "https://mimno.r-universe.dev/mallet",
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.3.0",
      "date": "2026-06-14T09:13:17.000Z",
      "distro": "noble",
      "commit": "41b08030341198b4ce78a347f548f407ccfb62c2",
      "fileid": "8fea046b2f1253951eaae42f110a97613d7bfdb0cbf4d92e4005c4e82f1197c9",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/cran/actions/runs/27494156793"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "1.3.0",
      "date": "2026-06-14T09:13:11.000Z",
      "distro": "noble",
      "commit": "41b08030341198b4ce78a347f548f407ccfb62c2",
      "fileid": "50c4a2a5069517c929530f38d5442723f74157a66a8b6feb1db42edab878ff84",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/cran/actions/runs/27494156793"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.3.0",
      "date": "2026-06-14T09:13:09.000Z",
      "commit": "41b08030341198b4ce78a347f548f407ccfb62c2",
      "fileid": "fe6e86817b7451675a00b86671616b06b846afbd8663f0abe7d708749ede1404",
      "status": "success",
      "buildurl": "https://github.com/r-universe/cran/actions/runs/27494156793"
    }
  ]
}