{
  "_id": "6a1c15881d7bb097a0a2f403",
  "Package": "ViralEntropR",
  "Title": "A Computational Pipeline for Entropy-Informed Detection of\nEmerging Viral Variants",
  "Version": "0.6.2",
  "Authors@R": "c(\nperson(\"Vadim\", \"Tyuryaev\", ,\"vadim.tyuryaev@gmail.com\",\nrole = c(\"aut\", \"cre\"),\ncomment = c(ORCID = \"0009-0008-1361-6265\")),\nperson(\"Jane\", \"Heffernan\", , \"jmheffer@yorku.ca\",\nrole = c(\"aut\")),\nperson(\"Hanna\", \"Jankowski\", , \"hkj@yorku.ca\",\nrole = c(\"aut\"))\n)",
  "Description": "Implements an entropy-informed pipeline for detecting\nemerging variants in viral amino acid sequence data, extending\nprior clustering-based approaches including hemagglutinin\nclustering methods (Li et al., 2015)\n<doi:10.1142/9789814667944_0018>. Provides a fully vectorized\nFASTA preprocessing toolkit covering header parsing, two-pass\ndate and country extraction, ambiguous-residue filtering, and\ninteger encoding under a 25-symbol amino acid alphabet.\nComputes per-site Shannon entropy across user-defined\ncumulative, sliding, or disjoint temporal partitions and\nclusters per-site entropy values using Gaussian mixture models\nvia 'mclust' (Scrucca et al., 2016) <doi:10.32614/RJ-2016-021>.\nQuantifies temporal distributional shifts between partitions\nusing the Hellinger distance (van der Vaart, 1998)\n<doi:10.1017/CBO9780511802256>, and detects temporal change\npoints non-parametrically using energy statistics (Matteson and\nJames, 2014) <doi:10.1080/01621459.2013.849605> via 'ecp' or\nwild binary segmentation (Fryzlewicz, 2014)\n<doi:10.1214/14-AOS1245> via 'HDcpDetect'. Per-site amino-acid\nfrequency tables and entropy trajectory plots characterize\nsequence composition and evolutionary dynamics across time. A\nconfigurable multi-variant simulation engine generates\nsynthetic sequence time series with known ground truth for\nbenchmarking detection pipelines. A curated dataset of\nSARS-CoV-2 Variants of Concern and Variants of Interest with\nassociated lineage and surveillance metadata is included, along\nwith a bundled National Center for Biotechnology Information\n(NCBI) Spike protein sample and vignettes demonstrating the\nfull workflow.",
  "License": "MIT + file LICENSE",
  "Language": "en-GB",
  "Date": "2026-05-07",
  "URL": "https://github.com/vadimtyuryaev/ViralEntropR,\nhttps://doi.org/10.5281/zenodo.19040165,\nhttps://vadimtyuryaev.github.io/ViralEntropR/",
  "BugReports": "https://github.com/vadimtyuryaev/ViralEntropR/issues",
  "Encoding": "UTF-8",
  "LazyData": "true",
  "Roxygen": "list(markdown = TRUE)",
  "RoxygenNote": "7.3.3",
  "Config/testthat/edition": "3",
  "VignetteBuilder": "knitr, R.rsp",
  "Config/pak/sysreqs": "cmake libfontconfig1-dev libfreetype6-dev\nlibfribidi-dev make libharfbuzz-dev libicu-dev libpng-dev\nlibuv1-dev libxml2-dev",
  "Repository": "https://vadimtyuryaev.r-universe.dev",
  "Date/Publication": "2026-05-31 07:23:55 UTC",
  "RemoteUrl": "https://github.com/vadimtyuryaev/viralentropr",
  "RemoteRef": "HEAD",
  "RemoteSha": "405acdac3ec36c078f7ca963dc047b1961de2674",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-31 10:59:31 UTC",
    "User": "root"
  },
  "Author": "Vadim Tyuryaev [aut, cre] (ORCID:\n<https://orcid.org/0009-0008-1361-6265>),\nJane Heffernan [aut],\nHanna Jankowski [aut]",
  "Maintainer": "Vadim Tyuryaev <vadim.tyuryaev@gmail.com>",
  "MD5sum": "1b5797a7e7d8b1fbe2a9c1f3d1a986a6",
  "_user": "vadimtyuryaev",
  "_type": "src",
  "_file": "ViralEntropR_0.6.2.tar.gz",
  "_fileid": "5c4cf33fd2e6c3dc8e9fbe5a427ba36167156ab26eb14336efe314cf28e54fa3",
  "_filesize": 2139485,
  "_sha256": "5c4cf33fd2e6c3dc8e9fbe5a427ba36167156ab26eb14336efe314cf28e54fa3",
  "_created": "2026-05-31T10:59:31.000Z",
  "_published": "2026-05-31T11:03:36.216Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 78720473815,
      "time": 186,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7316182916"
    },
    {
      "job": 78720473805,
      "time": 179,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7316182181"
    },
    {
      "job": 78720473824,
      "time": 183,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7316179147"
    },
    {
      "job": 78720473813,
      "time": 145,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7316176443"
    },
    {
      "job": 78720125122,
      "time": 361,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7316162369"
    },
    {
      "job": 78720473803,
      "time": 137,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7316177621"
    },
    {
      "job": 78720473832,
      "time": 110,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7316175015"
    },
    {
      "job": 78720473821,
      "time": 105,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7316174398"
    },
    {
      "job": 78720473841,
      "time": 128,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7316177163"
    }
  ],
  "_buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/vadimtyuryaev/viralentropr",
  "_commit": {
    "id": "405acdac3ec36c078f7ca963dc047b1961de2674",
    "author": "Vadim Tyuryaev <vadimtyu@yorku.ca>",
    "committer": "Vadim Tyuryaev <vadimtyu@yorku.ca>",
    "message": "update README\n",
    "time": 1780212235
  },
  "_maintainer": {
    "name": "Vadim Tyuryaev",
    "email": "vadim.tyuryaev@gmail.com",
    "login": "vadimtyu",
    "description": "",
    "uuid": 95932875
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.5.0",
      "role": "Depends"
    },
    {
      "package": "ggplot2",
      "version": ">= 3.4.0",
      "role": "Imports"
    },
    {
      "package": "grDevices",
      "role": "Imports"
    },
    {
      "package": "HDcpDetect",
      "role": "Imports"
    },
    {
      "package": "ecp",
      "role": "Imports"
    },
    {
      "package": "kableExtra",
      "role": "Imports"
    },
    {
      "package": "lubridate",
      "role": "Imports"
    },
    {
      "package": "magrittr",
      "role": "Imports"
    },
    {
      "package": "mclust",
      "role": "Imports"
    },
    {
      "package": "rlang",
      "role": "Imports"
    },
    {
      "package": "stats",
      "role": "Imports"
    },
    {
      "package": "stringr",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "zoo",
      "role": "Imports"
    },
    {
      "package": "Biostrings",
      "role": "Suggests"
    },
    {
      "package": "DT",
      "role": "Suggests"
    },
    {
      "package": "dplyr",
      "role": "Suggests"
    },
    {
      "package": "here",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "readxl",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "R.rsp",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "version": ">= 3.0.0",
      "role": "Suggests"
    }
  ],
  "_owner": "vadimtyuryaev",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2026-08",
      "n": 4
    },
    {
      "week": "2026-09",
      "n": 7
    },
    {
      "week": "2026-10",
      "n": 2
    },
    {
      "week": "2026-11",
      "n": 1
    },
    {
      "week": "2026-12",
      "n": 3
    },
    {
      "week": "2026-13",
      "n": 1
    },
    {
      "week": "2026-15",
      "n": 4
    },
    {
      "week": "2026-16",
      "n": 4
    },
    {
      "week": "2026-18",
      "n": 5
    },
    {
      "week": "2026-19",
      "n": 55
    },
    {
      "week": "2026-21",
      "n": 17
    },
    {
      "week": "2026-22",
      "n": 5
    }
  ],
  "_tags": [
    {
      "name": "v0.5.1",
      "date": "2026-05-07"
    },
    {
      "name": "v0.6.2",
      "date": "2026-05-27"
    }
  ],
  "_topics": [
    "bioinformatics",
    "change-point-detection",
    "clustering",
    "computational-biology",
    "covid-19",
    "fasta",
    "functional-data-analysis",
    "gaussian-mixture-models",
    "genomic-surveillance",
    "gisaid",
    "hellinger-distance",
    "molecular-epidemiology",
    "ncbi",
    "sars-cov-2",
    "shannon-entropy",
    "spike-protein",
    "variant-detection",
    "viral-evolution",
    "viral-genomics"
  ],
  "_stars": 0,
  "_contributors": [
    {
      "user": "vadimtyuryaev",
      "count": 110,
      "uuid": 112499209
    }
  ],
  "_userbio": {
    "uuid": 112499209,
    "type": "user",
    "name": "Vadim Tyuryaev",
    "description": "I am a PhD candidate in Statistics at York University. My research specializes in big data clustering of genomic data, math modeling, and machine learning."
  },
  "_downloads": {
    "count": 0,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/ViralEntropR"
  },
  "_devurl": "https://github.com/vadimtyuryaev/viralentropr",
  "_pkgdown": "https://vadimtyuryaev.github.io/ViralEntropR/",
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/ViralEntropR.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/vadimtyuryaev/viralentropr",
  "_realowner": "vadimtyuryaev",
  "_cranurl": true,
  "_releases": [
    {
      "version": "0.6.2",
      "date": "2026-05-30"
    }
  ],
  "_exports": [
    "calculate_entropy",
    "calculate_hellinger_matrix",
    "cluster_sites_by_entropy",
    "decode_aa_sequence",
    "detect_changepoints_ecp",
    "detect_changepoints_hdcp",
    "encode_aa_sequence",
    "extract_fasta_countries",
    "extract_fasta_dates",
    "fasta_to_char_matrix",
    "filter_ambiguous_sequences",
    "partition_time_windows",
    "plot_entropy_trajectories",
    "plot_site_class_trajectory",
    "relabel_entropy_classes",
    "simulate_variant_evolution",
    "tabulate_site_evolution"
  ],
  "_datasets": [
    {
      "name": "sarscov2_variants",
      "title": "SARS-CoV-2 VOC/VOI Curated Variant Metadata",
      "object": "sarscov2_variants",
      "class": [
        "list"
      ],
      "fields": [],
      "table": false,
      "tojson": true
    }
  ],
  "_help": [
    {
      "page": "calculate_entropy",
      "title": "Calculate Shannon Entropy",
      "topics": [
        "calculate_entropy"
      ]
    },
    {
      "page": "calculate_hellinger_matrix",
      "title": "Calculate Hellinger Distance Matrix",
      "topics": [
        "calculate_hellinger_matrix"
      ]
    },
    {
      "page": "cluster_sites_by_entropy",
      "title": "Cluster a Univariate Numeric Vector by Gaussian Mixture Model",
      "topics": [
        "cluster_sites_by_entropy"
      ]
    },
    {
      "page": "decode_aa_sequence",
      "title": "Decode Amino Acid Sequences",
      "topics": [
        "decode_aa_sequence"
      ]
    },
    {
      "page": "detect_changepoints_ecp",
      "title": "Detect Temporal Change Points (ECP)",
      "topics": [
        "detect_changepoints_ecp"
      ]
    },
    {
      "page": "detect_changepoints_hdcp",
      "title": "Detect Temporal Change Points (HDcpDetect)",
      "topics": [
        "detect_changepoints_hdcp"
      ]
    },
    {
      "page": "encode_aa_sequence",
      "title": "Encode Amino Acid Sequences",
      "topics": [
        "encode_aa_sequence"
      ]
    },
    {
      "page": "extract_fasta_countries",
      "title": "Extract Countries from FASTA Sequence Names",
      "topics": [
        "extract_fasta_countries"
      ]
    },
    {
      "page": "extract_fasta_dates",
      "title": "Extract Dates from FASTA Sequence Names",
      "topics": [
        "extract_fasta_dates"
      ]
    },
    {
      "page": "fasta_to_char_matrix",
      "title": "Convert FASTA Object to Character Matrix",
      "topics": [
        "fasta_to_char_matrix"
      ]
    },
    {
      "page": "filter_ambiguous_sequences",
      "title": "Remove Sequences Containing Ambiguous Residues",
      "topics": [
        "filter_ambiguous_sequences"
      ]
    },
    {
      "page": "partition_time_windows",
      "title": "Partition Data into Time Windows",
      "topics": [
        "partition_time_windows"
      ]
    },
    {
      "page": "plot_entropy_trajectories",
      "title": "Plot Shannon Entropy Trajectories",
      "topics": [
        "plot_entropy_trajectories"
      ]
    },
    {
      "page": "plot_site_class_trajectory",
      "title": "Plot GMM Entropy Class Trajectory for a Single Site",
      "topics": [
        "plot_site_class_trajectory"
      ]
    },
    {
      "page": "relabel_entropy_classes",
      "title": "Relabel Entropy Classes",
      "topics": [
        "relabel_entropy_classes"
      ]
    },
    {
      "page": "sarscov2_sample",
      "title": "SARS-CoV-2 Surface Glycoprotein Sequences - NCBI Demo Sample",
      "topics": [
        "sarscov2_sample"
      ]
    },
    {
      "page": "sarscov2_variants",
      "title": "SARS-CoV-2 VOC/VOI Curated Variant Metadata",
      "topics": [
        "sarscov2_variants"
      ]
    },
    {
      "page": "simulate_variant_evolution",
      "title": "Simulate Viral Variant Evolution",
      "topics": [
        "simulate_variant_evolution"
      ]
    },
    {
      "page": "tabulate_site_evolution",
      "title": "Tabulate Site Frequency Evolution",
      "topics": [
        "tabulate_site_evolution"
      ]
    }
  ],
  "_readme": "https://github.com/vadimtyuryaev/viralentropr/raw/HEAD/README.md",
  "_rundeps": [
    "base64enc",
    "bslib",
    "cachem",
    "cli",
    "cpp11",
    "digest",
    "ecp",
    "evaluate",
    "farver",
    "fastmap",
    "fontawesome",
    "fs",
    "generics",
    "ggplot2",
    "glue",
    "gtable",
    "HDcpDetect",
    "highr",
    "htmltools",
    "isoband",
    "jquerylib",
    "jsonlite",
    "kableExtra",
    "knitr",
    "labeling",
    "lattice",
    "lifecycle",
    "lubridate",
    "magrittr",
    "mclust",
    "memoise",
    "mime",
    "R6",
    "rappdirs",
    "RColorBrewer",
    "Rcpp",
    "rlang",
    "rmarkdown",
    "rstudioapi",
    "S7",
    "sass",
    "scales",
    "stringi",
    "stringr",
    "svglite",
    "systemfonts",
    "textshaping",
    "timechange",
    "tinytex",
    "vctrs",
    "viridisLite",
    "withr",
    "xfun",
    "xml2",
    "yaml",
    "zoo"
  ],
  "_vignettes": [
    {
      "source": "detecting_variants_simulation.html.asis",
      "filename": "detecting_variants_simulation.html",
      "title": "Entropy Clustering, Hellinger Distance, and Change Point Analysis for Emerging Viral Variant Detection: A Simulation Study",
      "engine": "R.rsp::asis",
      "headings": [],
      "created": "2026-05-05 03:45:10",
      "modified": "2026-05-08 02:45:29",
      "commits": 2
    },
    {
      "source": "preprocessing_pipeline.html.asis",
      "filename": "preprocessing_pipeline.html",
      "title": "NCBI SARS-CoV-2 Spike Protein Sequence Preprocessing: From Raw FASTA to an Analysis-Ready Integer-Encoded Matrix",
      "engine": "R.rsp::asis",
      "headings": [],
      "created": "2026-05-05 03:45:10",
      "modified": "2026-05-08 02:45:29",
      "commits": 2
    },
    {
      "source": "clustering_accuracy.html.asis",
      "filename": "clustering_accuracy.html",
      "title": "Unsupervised Recovery of SARS-CoV-2 Variant Structure via Entropy-Driven Site Selection and PAM Clustering: Precision, Recall, and F1 Evaluation Across Wild-Type and Delta-Dominated Surveillance Periods",
      "engine": "R.rsp::asis",
      "headings": [],
      "created": "2026-05-05 03:45:10",
      "modified": "2026-05-08 02:45:29",
      "commits": 2
    }
  ],
  "_score": 5.2552725051033065,
  "_indexed": true,
  "_nocasepkg": "viralentropr",
  "_universes": [
    "vadimtyuryaev",
    "vadimtyu"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.6.2",
      "date": "2026-05-31T11:02:37.000Z",
      "distro": "noble",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "caeab467ba80c3ba4a4014cf00d7c19f09c77b25418ff3fb04bac845ad5e1c11",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.6.2",
      "date": "2026-05-31T11:02:32.000Z",
      "distro": "noble",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "98cb5c4d12aa17a842657919aab8a7647fbffd3626422946ed88d97b640b46ec",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.6.2",
      "date": "2026-05-31T11:02:16.000Z",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "21d4800922cd68fcbe1f863d9f7929c242bd3ea1fe4dd0547cc8e834ea19cb42",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.6.2",
      "date": "2026-05-31T11:01:52.000Z",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "0cd1ae6aaf9a1a0d48adecc64f2cc5bd15ff0975906453077ca0185960dbe753",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.6.2",
      "date": "2026-05-31T11:02:25.000Z",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "d347f50bffe9eafbcf1b6fc572db0c09dc284b783c16a418b35938b00d1847ab",
      "status": "success",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.6.2",
      "date": "2026-05-31T11:01:13.000Z",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "9d19e64e9452dc9f44a9ce0553c01dc8e69d1f773012c317e0228b7006ad2e58",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.6.2",
      "date": "2026-05-31T11:01:07.000Z",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "ffbc73801cc0b90785b2610ee5c59ae9bc8fd27ccbe8091f978c79dbea447985",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.6.2",
      "date": "2026-05-31T11:01:32.000Z",
      "commit": "405acdac3ec36c078f7ca963dc047b1961de2674",
      "fileid": "5e83b282cdf39c8b9bb093eec7dfd7ecf8d388be36ddb1ebd99097b96e0eb313",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/vadimtyuryaev/actions/runs/26710626088"
    }
  ]
}