{
  "_id": "6a101b5bacfb0bcc41c870c5",
  "Package": "MantaID",
  "Title": "A Machine-Learning Based Tool to Automate the Identification of\nBiological Database IDs",
  "Version": "1.0.4",
  "Authors@R": "c(person(\"Zhengpeng\", \"Zeng\",email = \"molaison@foxmail.com\", role = c(\"aut\",\"cre\",\"ctb\"),comment = c(ORCID = \"0000-0001-7919-209X\")),\nperson(\"Longfei\",\"Mao\",email = \"longfeimao99@gmail.com\",role = c(\"aut\",\"cph\"),comment = c(ORCID = \"0000-0003-0759-0501\")),\nperson(\"Feng\",\"Yu\",email = \"feng_yu@hnu.edu.cn\",role = c(\"aut\"), comment = c(ORCID = \"0000-0002-5221-281X\")),\nperson(\"Jiamin\",\"Hu\",email = \"Jiamin-Hu@hotmail.com\",role = c(\"ctb\"), comment = c(ORCID = \"0000-0003-3030-2117\")),\nperson(\"Xiting\",\"Wang\",email = \"XitingWang2023@outlook.com\",role = c(\"ctb\"), comment = c(ORCID = \"0009-0009-5235-0006\")))",
  "Description": "The number of biological databases is growing rapidly, but\ndifferent databases use different IDs to refer to the same\nbiological entity. The inconsistency in IDs impedes the\nintegration of various types of biological data. To resolve the\nproblem, we developed 'MantaID', a data-driven,\nmachine-learning based approach that automates identifying IDs\non a large scale. The 'MantaID' model's prediction accuracy was\nproven to be 99%, and it correctly and effectively predicted\n100,000 ID entries within two minutes. 'MantaID' supports the\ndiscovery and exploitation of ID patterns from large quantities\nof databases. (e.g., up to 542 biological databases). An\neasy-to-use freely available open-source software R package, a\nuser-friendly web application, and API were also developed for\n'MantaID' to improve applicability. To our knowledge, 'MantaID'\nis the first tool that enables an automatic, quick, accurate,\nand comprehensive identification of large quantities of IDs,\nand can therefore be used as a starting point to facilitate the\ncomplex assimilation and aggregation of biological data across\ndiverse databases.",
  "License": "GPL (>= 3)",
  "Encoding": "UTF-8",
  "Roxygen": "list(markdown = TRUE)",
  "RoxygenNote": "7.3.2",
  "LazyData": "true",
  "URL": "https://molaison.github.io/MantaID/",
  "Config/pak/sysreqs": "cmake libglpk-dev make libicu-dev libpng-dev\nlibxml2-dev libssl-dev python3 zlib1g-dev",
  "Repository": "https://molaison.r-universe.dev",
  "Date/Publication": "2024-09-18 09:16:30 UTC",
  "RemoteUrl": "https://github.com/molaison/mantaid",
  "RemoteRef": "HEAD",
  "RemoteSha": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-14 09:18:16 UTC",
    "User": "root"
  },
  "Author": "Zhengpeng Zeng [aut, cre, ctb] (ORCID:\n<https://orcid.org/0000-0001-7919-209X>),\nLongfei Mao [aut, cph] (ORCID: <https://orcid.org/0000-0003-0759-0501>),\nFeng Yu [aut] (ORCID: <https://orcid.org/0000-0002-5221-281X>),\nJiamin Hu [ctb] (ORCID: <https://orcid.org/0000-0003-3030-2117>),\nXiting Wang [ctb] (ORCID: <https://orcid.org/0009-0009-5235-0006>)",
  "Maintainer": "Zhengpeng Zeng <molaison@foxmail.com>",
  "MD5sum": "c3cfec614916629476b0f3c6fc3f46af",
  "_user": "molaison",
  "_type": "src",
  "_file": "MantaID_1.0.4.tar.gz",
  "_fileid": "405578957aea5c7de9c147b3c829429a1881b492c5eb0bc5328e21119aaefc5b",
  "_filesize": 76660196,
  "_sha256": "405578957aea5c7de9c147b3c829429a1881b492c5eb0bc5328e21119aaefc5b",
  "_created": "2026-05-14T09:18:16.000Z",
  "_published": "2026-05-22T09:01:15.921Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 77348363105,
      "time": 282,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "NOTE",
      "artifact": "6991243215"
    },
    {
      "job": 77348362924,
      "time": 291,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "6991245712"
    },
    {
      "job": 77348362722,
      "time": 255,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "NOTE",
      "artifact": "6991228367"
    },
    {
      "job": 77348363094,
      "time": 194,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "6991213865"
    },
    {
      "job": 77348362554,
      "time": 258,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6991163603"
    },
    {
      "job": 77348362354,
      "time": 152,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7156730164"
    },
    {
      "job": 77348362938,
      "time": 232,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "NOTE",
      "artifact": "6991229325"
    },
    {
      "job": 77348362973,
      "time": 220,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "NOTE",
      "artifact": "6991225856"
    },
    {
      "job": 77348362886,
      "time": 214,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "6991224744"
    }
  ],
  "_buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/molaison/mantaid",
  "_commit": {
    "id": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
    "author": "Cindy-Wg <xitingwang2023@outlook.com>",
    "committer": "Cindy-Wg <xitingwang2023@outlook.com>",
    "message": "Add parameter\n",
    "time": 1726650990
  },
  "_maintainer": {
    "name": "Zhengpeng Zeng",
    "email": "molaison@foxmail.com",
    "orcid": "0000-0001-7919-209X"
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 4.4.0",
      "role": "Depends"
    },
    {
      "package": "biomaRt",
      "role": "Depends"
    },
    {
      "package": "xgboost",
      "role": "Depends"
    },
    {
      "package": "caret",
      "role": "Depends"
    },
    {
      "package": "data.table",
      "role": "Depends"
    },
    {
      "package": "dplyr",
      "role": "Depends"
    },
    {
      "package": "ggplot2",
      "role": "Depends"
    },
    {
      "package": "keras",
      "role": "Depends"
    },
    {
      "package": "magrittr",
      "role": "Depends"
    },
    {
      "package": "mlr3tuning",
      "role": "Depends"
    },
    {
      "package": "mlr3",
      "role": "Depends"
    },
    {
      "package": "mlr3learners",
      "role": "Depends"
    },
    {
      "package": "purrr",
      "role": "Depends"
    },
    {
      "package": "reshape2",
      "role": "Depends"
    },
    {
      "package": "scutr",
      "role": "Depends"
    },
    {
      "package": "stringr",
      "role": "Depends"
    },
    {
      "package": "tibble",
      "role": "Depends"
    },
    {
      "package": "tidyr",
      "role": "Depends"
    },
    {
      "package": "tidyselect",
      "role": "Depends"
    },
    {
      "package": "paradox",
      "role": "Depends"
    },
    {
      "package": "RColorBrewer",
      "role": "Depends"
    },
    {
      "package": "ggcorrplot",
      "role": "Depends"
    },
    {
      "package": "ranger",
      "role": "Depends"
    },
    {
      "package": "rpart",
      "role": "Depends"
    },
    {
      "package": "mlr3hyperband",
      "role": "Depends"
    }
  ],
  "_owner": "molaison",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [],
  "_tags": [],
  "_stars": 0,
  "_contributors": [
    {
      "user": "molaison",
      "count": 72,
      "uuid": 83850708
    },
    {
      "user": "xitingwang-ida",
      "count": 28,
      "uuid": 147379893
    },
    {
      "user": "caomiyuan",
      "count": 13,
      "uuid": 112462814
    },
    {
      "user": "melany-hu",
      "count": 9,
      "uuid": 109413600
    }
  ],
  "_userbio": {
    "uuid": 83850708,
    "type": "user",
    "name": "ZengZhengPeng",
    "description": "Postgraduate of Hunan university;\r\nStudy in National Institute of Biological Sciences, Beijing."
  },
  "_downloads": {
    "count": 153,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/MantaID"
  },
  "_devurl": "https://github.com/molaison/mantaid",
  "_pkgdown": "https://molaison.github.io/MantaID/",
  "_searchresults": 2,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/MantaID.html",
    "extra/readme.html",
    "extra/readme.md",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/molaison/mantaid",
  "_realowner": "molaison",
  "_cranurl": true,
  "_releases": [
    {
      "version": "1.0.1",
      "date": "2022-10-17"
    },
    {
      "version": "1.0.2",
      "date": "2022-10-18"
    },
    {
      "version": "1.0.3",
      "date": "2024-08-27"
    },
    {
      "version": "1.0.4",
      "date": "2024-09-09"
    }
  ],
  "_exports": [
    "mi",
    "mi_balance_data",
    "mi_clean_data",
    "mi_filter_feat",
    "mi_get_confusion",
    "mi_get_ID",
    "mi_get_ID_attr",
    "mi_get_miss",
    "mi_get_padlen",
    "mi_plot_cor",
    "mi_plot_heatmap",
    "mi_predict_new",
    "mi_run_bmr",
    "mi_split_col",
    "mi_split_str",
    "mi_to_numer",
    "mi_train_BP",
    "mi_train_rg",
    "mi_train_rp",
    "mi_train_xgb",
    "mi_tune_rg",
    "mi_tune_rp",
    "mi_tune_xgb",
    "mi_unify_mod"
  ],
  "_datasets": [
    {
      "name": "Example",
      "title": "ID example dataset.",
      "object": "Example",
      "class": [
        "data.frame"
      ],
      "fields": [
        "ID",
        "class"
      ],
      "rows": 5000,
      "table": true,
      "tojson": true
    },
    {
      "name": "mi_data_attributes",
      "title": "ID-related datasets in biomart.",
      "object": "mi_data_attributes",
      "class": [
        "data.frame"
      ],
      "fields": [
        "name",
        "description",
        "page"
      ],
      "rows": 65,
      "table": true,
      "tojson": true
    },
    {
      "name": "mi_data_procID",
      "title": "Processed ID data.",
      "object": "mi_data_procID",
      "class": [
        "tbl_df",
        "tbl",
        "data.frame"
      ],
      "fields": [
        "pos1",
        "pos2",
        "pos3",
        "pos4",
        "pos5",
        "pos6",
        "pos7",
        "pos8",
        "pos9",
        "pos10",
        "pos11",
        "pos12",
        "pos13",
        "pos14",
        "pos15",
        "pos16",
        "pos17",
        "pos18",
        "pos19",
        "pos20",
        "class"
      ],
      "rows": 4997,
      "table": true,
      "tojson": true
    },
    {
      "name": "mi_data_rawID",
      "title": "ID dataset for testing.",
      "object": "mi_data_rawID",
      "class": [
        "tbl_df",
        "tbl",
        "data.frame"
      ],
      "fields": [
        "ID",
        "class"
      ],
      "rows": 5000,
      "table": true,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "Example",
      "title": "ID example dataset.",
      "topics": [
        "Example"
      ]
    },
    {
      "page": "mi",
      "title": "A wrapper function that executes MantaID workflow.",
      "topics": [
        "mi"
      ]
    },
    {
      "page": "mi_balance_data",
      "title": "Data balance. Most classes adopt random undersampling, while a few classes adopt smote method to oversample to obtain relatively balanced data;",
      "topics": [
        "mi_balance_data"
      ]
    },
    {
      "page": "mi_clean_data",
      "title": "Reshape data and delete meaningless rows.",
      "topics": [
        "mi_clean_data"
      ]
    },
    {
      "page": "mi_data_attributes",
      "title": "ID-related datasets in biomart.",
      "topics": [
        "mi_data_attributes"
      ]
    },
    {
      "page": "mi_data_procID",
      "title": "Processed ID data.",
      "topics": [
        "mi_data_procID"
      ]
    },
    {
      "page": "mi_data_rawID",
      "title": "ID dataset for testing.",
      "topics": [
        "mi_data_rawID"
      ]
    },
    {
      "page": "mi_filter_feat",
      "title": "Performing feature selection in a automatic way based on correlation and feature importance.",
      "topics": [
        "mi_filter_feat"
      ]
    },
    {
      "page": "mi_get_confusion",
      "title": "Compute the confusion matrix for the predicted result.",
      "topics": [
        "mi_get_confusion"
      ]
    },
    {
      "page": "mi_get_ID",
      "title": "Get ID data from the 'Biomart' database using 'attributes'.",
      "topics": [
        "mi_get_ID"
      ]
    },
    {
      "page": "mi_get_ID_attr",
      "title": "Get ID attributes from the 'Biomart' database.",
      "topics": [
        "mi_get_ID_attr"
      ]
    },
    {
      "page": "mi_get_miss",
      "title": "Observe the distribution of the false response of the test set.",
      "topics": [
        "mi_get_miss"
      ]
    },
    {
      "page": "mi_get_padlen",
      "title": "Get max length of ID data.",
      "topics": [
        "mi_get_padlen"
      ]
    },
    {
      "page": "mi_plot_cor",
      "title": "Plot correlation heatmap.",
      "topics": [
        "mi_plot_cor"
      ]
    },
    {
      "page": "mi_plot_heatmap",
      "title": "Plot heatmap for result confusion matrix.",
      "topics": [
        "mi_plot_heatmap"
      ]
    },
    {
      "page": "mi_predict_new",
      "title": "Predict new data with a trained learner.",
      "topics": [
        "mi_predict_new"
      ]
    },
    {
      "page": "mi_run_bmr",
      "title": "Compare classification models with small samples.",
      "topics": [
        "mi_run_bmr"
      ]
    },
    {
      "page": "mi_split_col",
      "title": "Cut the string of ID column character by character and divide it into multiple columns.",
      "topics": [
        "mi_split_col"
      ]
    },
    {
      "page": "mi_split_str",
      "title": "Split the string into individual characters and complete the character vector to the maximum length.",
      "topics": [
        "mi_split_str"
      ]
    },
    {
      "page": "mi_to_numer",
      "title": "Convert data to numeric, and for the ID column convert with fixed levels.",
      "topics": [
        "mi_to_numer"
      ]
    },
    {
      "page": "mi_train_BP",
      "title": "Train a three layers neural network model.",
      "topics": [
        "mi_train_BP"
      ]
    },
    {
      "page": "mi_train_rg",
      "title": "Random Forest Model Training.",
      "topics": [
        "mi_train_rg"
      ]
    },
    {
      "page": "mi_train_rp",
      "title": "Classification tree model training.",
      "topics": [
        "mi_train_rp"
      ]
    },
    {
      "page": "mi_train_xgb",
      "title": "Xgboost model training",
      "topics": [
        "mi_train_xgb"
      ]
    },
    {
      "page": "mi_tune_rg",
      "title": "Tune the Random Forest model by hyperband.",
      "topics": [
        "mi_tune_rg"
      ]
    },
    {
      "page": "mi_tune_rp",
      "title": "Tune the Decision Tree model by hyperband.",
      "topics": [
        "mi_tune_rp"
      ]
    },
    {
      "page": "mi_tune_xgb",
      "title": "Tune the Xgboost model by hyperband.",
      "topics": [
        "mi_tune_xgb"
      ]
    },
    {
      "page": "mi_unify_mod",
      "title": "Predict with four models and unify results by the sub-model's specificity score to the four possible classes.",
      "topics": [
        "mi_unify_mod"
      ]
    }
  ],
  "_pkglogo": "https://github.com/molaison/mantaid/raw/HEAD/logo.svg",
  "_readme": "https://github.com/molaison/mantaid/raw/HEAD/README.md",
  "_rundeps": [
    "AnnotationDbi",
    "askpass",
    "backports",
    "base64enc",
    "bbotk",
    "Biobase",
    "BiocFileCache",
    "BiocGenerics",
    "biomaRt",
    "Biostrings",
    "bit",
    "bit64",
    "blob",
    "cachem",
    "caret",
    "checkmate",
    "class",
    "cli",
    "clock",
    "codetools",
    "config",
    "cpp11",
    "crayon",
    "curl",
    "data.table",
    "DBI",
    "dbplyr",
    "dbscan",
    "diagram",
    "digest",
    "dplyr",
    "e1071",
    "evaluate",
    "farver",
    "fastmap",
    "filelock",
    "FNN",
    "foreach",
    "future",
    "future.apply",
    "generics",
    "ggcorrplot",
    "ggplot2",
    "globals",
    "glue",
    "gower",
    "gtable",
    "hardhat",
    "here",
    "hms",
    "httr",
    "httr2",
    "igraph",
    "ipred",
    "IRanges",
    "isoband",
    "iterators",
    "jsonlite",
    "KEGGREST",
    "keras",
    "KernSmooth",
    "labeling",
    "lattice",
    "lava",
    "lgr",
    "lifecycle",
    "listenv",
    "lubridate",
    "magrittr",
    "MASS",
    "Matrix",
    "mclust",
    "memoise",
    "mime",
    "mirai",
    "mlbench",
    "mlr3",
    "mlr3hyperband",
    "mlr3learners",
    "mlr3measures",
    "mlr3misc",
    "mlr3tuning",
    "ModelMetrics",
    "nanonext",
    "nlme",
    "nnet",
    "numDeriv",
    "openssl",
    "palmerpenguins",
    "paradox",
    "parallelly",
    "pillar",
    "pkgconfig",
    "plyr",
    "png",
    "prettyunits",
    "pROC",
    "processx",
    "prodlim",
    "progress",
    "progressr",
    "proxy",
    "PRROC",
    "ps",
    "purrr",
    "R6",
    "ranger",
    "rappdirs",
    "RColorBrewer",
    "Rcpp",
    "RcppEigen",
    "RcppTOML",
    "recipes",
    "reshape2",
    "reticulate",
    "rlang",
    "rpart",
    "rprojroot",
    "RSQLite",
    "rstudioapi",
    "S4Vectors",
    "S7",
    "scales",
    "scutr",
    "Seqinfo",
    "shape",
    "smotefamily",
    "sparsevctrs",
    "SQUAREM",
    "stringi",
    "stringr",
    "survival",
    "sys",
    "tensorflow",
    "tfautograph",
    "tfruns",
    "tibble",
    "tidyr",
    "tidyselect",
    "timechange",
    "timeDate",
    "tzdb",
    "utf8",
    "uuid",
    "vctrs",
    "viridisLite",
    "whisker",
    "withr",
    "xgboost",
    "xml2",
    "XVector",
    "yaml",
    "zeallot"
  ],
  "_score": 3.1760912590556813,
  "_indexed": true,
  "_nocasepkg": "mantaid",
  "_universes": [
    "molaison"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.0.4",
      "date": "2026-05-14T09:21:36.000Z",
      "distro": "noble",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "bba3f75d91b676b1389c13e337ee99115db3fe81f13bb5ae7a713bf08c94b017",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "1.0.4",
      "date": "2026-05-14T09:21:35.000Z",
      "distro": "noble",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "4e11ec2ff30356293204efe725935f900382ad45cde0bb76c15dc1a7181c4ae6",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "1.0.4",
      "date": "2026-05-14T09:21:13.000Z",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "82c7bf52b679b5378905be7705351ce536f2fc7aec5698dac0da7a357a207a91",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "1.0.4",
      "date": "2026-05-14T09:20:46.000Z",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "a066843e994deb12924534784fe74ab4fd4a786ea562e0af85577954a0e768ee",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "1.0.4",
      "date": "2026-05-14T09:20:30.000Z",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "4eb91581b035f525d29d1d5021b1e9cb7703ba912775db68e34e78692a51b935",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "1.0.4",
      "date": "2026-05-14T09:20:25.000Z",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "6e397bcc9effc84d40946d214c031b7b45691d663e0be8a9fd67581c4839092c",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "1.0.4",
      "date": "2026-05-14T09:20:18.000Z",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "da4638ca33366b89b420cca1da0eb07d75e17a3321ab0a3a651cbae3f21dd83c",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.0.4",
      "date": "2026-05-22T08:59:58.000Z",
      "commit": "1b1adb3c7aca9749cd601f43640fd9fa4e10a67a",
      "fileid": "108ae924529d74c68ab7390ad954decdf94f03760d3c3ee5e11aa6afaf2d1256",
      "status": "success",
      "buildurl": "https://github.com/r-universe/molaison/actions/runs/25852018116"
    }
  ]
}