Resource List
List all resources, or create a new resource.
GET /api/t/?dataFormatID=%22format_1929%22&format=api
{ "count": 869, "next": "?page=2", "previous": null, "list": [ { "name": "snp-dists", "description": "Pairwise SNP distance matrix from a FASTA sequence alignment", "homepage": "https://github.com/tseemann/snp-dists", "biotoolsID": "snp-dists", "biotoolsCURIE": "biotools:snp-dists", "version": [ "v1.2.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0260", "term": "Sequence alignment conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0870", "term": "Sequence distance matrix" }, "format": [] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" }, { "uri": "http://edamontology.org/topic_0091", "term": "Bioinformatics" }, { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" } ], "operatingSystem": [], "language": [ "C", "Shell" ], "license": "GPL-3.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [], "credit": [ { "name": "Torsten Seemann", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null }, { "name": "Fabian Klötzl", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null }, { "name": "Andrew J Page", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null } ], "owner": "Pub2Tools", "additionDate": "2026-06-15T13:34:04.978536Z", "lastUpdate": "2026-06-15T13:34:04.980765Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "Phylo-Movies", "description": "Phylo-Movies is an open-source React and Flask web application, also available as a desktop app, for inspecting ordered phylogenetic tree series. It computes and visualizes subtree-prune-and-regraft transition frames between consecutive trees, helping users see which taxa or subtrees move across sliding-window analyses, bootstrap replicates, and curated tree-series comparisons. The viewer includes timeline playback, tree comparison, MSA context, coloring, analytics, image export, and recording tools.", "homepage": "https://enesberksakalli.github.io/phylo-movies/", "biotoolsID": "phylo-movies", "biotoolsCURIE": "biotools:phylo-movies", "version": [ "0.98.1" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0567", "term": "Phylogenetic tree visualisation" }, { "uri": "http://edamontology.org/operation_0324", "term": "Phylogenetic tree analysis" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0872", "term": "Phylogenetic tree" }, "format": [ { "uri": "http://edamontology.org/format_1910", "term": "newick" } ] }, { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0872", "term": "Phylogenetic tree" }, "format": [ { "uri": "http://edamontology.org/format_1910", "term": "newick" }, { "uri": "http://edamontology.org/format_3464", "term": "JSON" } ] } ], "note": "Visualizes ordered phylogenetic tree series as animated transition movies with comparison, MSA context, movement analytics, image export, and recording support.", "cmd": null } ], "toolType": [ "Desktop application", "Web application" ], "topic": [ { "uri": "http://edamontology.org/topic_3293", "term": "Phylogenetics" }, { "uri": "http://edamontology.org/topic_0092", "term": "Data visualisation" } ], "operatingSystem": [ "Windows", "Mac", "Linux" ], "language": [ "Python", "JavaScript", "TypeScript" ], "license": "MIT", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/enesBerkSakalli/phylo-movies", "type": [ "Repository" ], "note": "Source code repository." }, { "url": "https://enesberksakalli.github.io/phylo-movies/demo/", "type": [ "Service" ], "note": "Static browser demo with precomputed example movies." }, { "url": "https://github.com/enesBerkSakalli/phylo-movies/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [ { "url": "https://github.com/enesBerkSakalli/phylo-movies", "type": "Source code", "note": "Source checkout for full web application and backend workflows.", "version": "0.98.1" }, { "url": "https://github.com/enesBerkSakalli/phylo-movies/releases/tag/v0.98.1", "type": "Binaries", "note": "Desktop convenience builds for macOS, Windows, and Linux.", "version": "0.98.1" } ], "documentation": [ { "url": "https://enesberksakalli.github.io/phylo-movies/manual/", "type": [ "User manual" ], "note": "Researcher-facing manual." }, { "url": "https://github.com/enesBerkSakalli/phylo-movies/blob/main/README.md", "type": [ "General" ], "note": "Project overview, installation, usage, citation, and links." }, { "url": "https://github.com/enesBerkSakalli/phylo-movies/blob/main/docs/getting-started.md", "type": [ "Installation instructions" ], "note": "Local source-checkout setup instructions." }, { "url": "https://github.com/enesBerkSakalli/phylo-movies/blob/main/docs/api.md", "type": [ "API documentation" ], "note": "Backend API documentation." } ], "publication": [ { "doi": "10.64898/2026.04.01.715821", "pmid": null, "pmcid": null, "type": [ "Primary" ], "version": null, "note": "bioRxiv preprint describing the Phylo-Movies method and examples.", "metadata": null }, { "doi": "10.5281/zenodo.20488923", "pmid": null, "pmcid": null, "type": [ "Primary" ], "version": "0.98.1", "note": "Archived software release on Zenodo.", "metadata": null } ], "credit": [ { "name": "Enes Berk Sakalli", "email": "enes@lbi-netmed.at", "url": "https://github.com/enesBerkSakalli", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer", "Primary contact" ], "note": "Corresponding software contact." }, { "name": "Simon E. Haendeler", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null }, { "name": "Arndt von Haeseler", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null }, { "name": "Heiko A. Schmidt", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null } ], "owner": "enes", "additionDate": "2026-06-14T08:34:19.506926Z", "lastUpdate": "2026-06-14T08:36:42.066838Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "nallo", "description": "Nallo is a bioinformatics analysis pipeline for long-reads from both PacBio and (targeted) ONT-data, focused on rare-disease. The pipeline detects a wide range of genetic variants, performs genome assembly,\nand reports CpG methylation. It also enables annotation and ranking of variants based on their predicted functional\nconsequences.", "homepage": "https://github.com/genomic-medicine-sweden/nallo", "biotoolsID": "nallo", "biotoolsCURIE": "biotools:nallo", "version": [ "0.12.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3227", "term": "Variant calling" }, { "uri": "http://edamontology.org/operation_0331", "term": "Variant effect prediction" }, { "uri": "http://edamontology.org/operation_0525", "term": "Genome assembly" }, { "uri": "http://edamontology.org/operation_3226", "term": "Variant prioritisation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_3752", "term": "CSV" }, { "uri": "http://edamontology.org/format_2572", "term": "BAM" }, { "uri": "http://edamontology.org/format_2545", "term": "FASTQ-like format" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_3462", "term": "CRAM" }, { "uri": "http://edamontology.org/format_2572", "term": "BAM" }, { "uri": "http://edamontology.org/format_3327", "term": "BAI" } ] } ], "note": null, "cmd": null } ], "toolType": [], "topic": [ { "uri": "http://edamontology.org/topic_0769", "term": "Workflows" }, { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" }, { "uri": "http://edamontology.org/topic_3673", "term": "Whole genome sequencing" }, { "uri": "http://edamontology.org/topic_0749", "term": "Transcription factors and regulatory sites" }, { "uri": "http://edamontology.org/topic_3295", "term": "Epigenetics" } ], "operatingSystem": [], "language": [ "Groovy", "Java" ], "license": "MIT", "collectionID": [], "maturity": null, "cost": "Free of charge", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/genomic-medicine-sweden/nallo", "type": [ "Repository" ], "note": null } ], "download": [], "documentation": [ { "url": "https://genomic-medicine-sweden.github.io/nallo/latest/", "type": [ "User manual" ], "note": null } ], "publication": [ { "doi": "10.1093/BIOINFORMATICS/BTAG086", "pmid": "41712762", "pmcid": "PMC12988770", "type": [], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Lars Feuk", "email": "lars.feuk@igp.uu.se", "url": null, "orcidid": "https://orcid.org/0000-0003-2355-2919", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null } ], "owner": "juan_camilo", "additionDate": "2026-06-12T12:09:48.272845Z", "lastUpdate": "2026-06-12T14:03:07.797466Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "FlavoTyper", "description": "FlavoTyper is a bioinformatics tool that performs in silico serotyping of Flavobacterium psychrophilum genome assemblies.", "homepage": "https://forge.inrae.fr/eric.duchaud/flavotyper", "biotoolsID": "flavotyper", "biotoolsCURIE": "biotools:flavotyper", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0346", "term": "Sequence similarity search" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0925", "term": "Sequence assembly" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [], "note": null, "cmd": null } ], "toolType": [ "Command-line tool", "Web service" ], "topic": [ { "uri": "http://edamontology.org/topic_3673", "term": "Whole genome sequencing" }, { "uri": "http://edamontology.org/topic_0625", "term": "Genotype and phenotype" }, { "uri": "http://edamontology.org/topic_3301", "term": "Microbiology" }, { "uri": "http://edamontology.org/topic_3397", "term": "Veterinary medicine" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "Python" ], "license": "Apache-2.0", "collectionID": [], "maturity": "Emerging", "cost": null, "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [ { "url": "https://flavotyper-125bcf.pages-forge.inrae.fr/", "type": [ "User manual" ], "note": null } ], "publication": [], "credit": [], "owner": "Salmam2", "additionDate": "2026-06-10T15:44:24.553891Z", "lastUpdate": "2026-06-10T17:14:53.654094Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "NOVOPlasty", "description": "NOVOPlasty - The organelle assembler and heteroplasmy caller.\n\nNOVOPlasty is a de novo assembler and heteroplasmy/variance caller for short circular genomes..", "homepage": "https://github.com/ndierckx/NOVOPlasty", "biotoolsID": "NOVOPlasty", "biotoolsCURIE": "biotools:NOVOPlasty", "version": [ "NOVOPlasty4.3.5" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0524", "term": "De-novo assembly" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0925", "term": "Sequence assembly" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3227", "term": "Variant calling" } ], "input": [], "output": [], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" } ], "operatingSystem": [], "language": [ "Perl" ], "license": "Other", "collectionID": [], "maturity": "Mature", "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/ndierckx/NOVOPlasty", "type": [ "Repository" ], "note": null }, { "url": "https://github.com/ndierckx/NOVOPlasty/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [], "documentation": [ { "url": "https://github.com/ndierckx/NOVOPlasty/wiki", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1093/nar/gkw955", "pmid": "28204566", "pmcid": "PMC5389512", "type": [ "Primary" ], "version": null, "note": "Primary publication for the tool.", "metadata": null }, { "doi": "10.1093/nargab/lqz011", "pmid": "33575563", "pmcid": "PMC7671380", "type": [ "Primary" ], "version": null, "note": "Primary publication for the heteroplasmy or variance calling option.", "metadata": null } ], "credit": [ { "name": "Nicolas Dierckxsens", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0001-8051-6602", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null } ], "owner": "aniehues", "additionDate": "2026-06-04T09:56:48.749854Z", "lastUpdate": "2026-06-04T09:56:48.751987Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "VerityMap", "description": "VerityMap is a tool for mapping long reads to assemblies of extra-long tandem repeats, producing SAM files and identifying potential heterozygous sites and assembly errors through analysis of rare k-mers. It supports PacBio HiFi and ONT reads and generates interactive HTML plots for variant analysis.", "homepage": "https://github.com/ablab/VerityMap", "biotoolsID": "VerityMap", "biotoolsCURIE": "biotools:VerityMap", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0523", "term": "Mapping assembly" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_2572", "term": "BAM" }, { "uri": "http://edamontology.org/format_3003", "term": "BED" } ] } ], "note": null, "cmd": null } ], "toolType": [], "topic": [ { "uri": "http://edamontology.org/topic_0102", "term": "Mapping" }, { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" } ], "operatingSystem": [], "language": [ "C", "CUDA", "Python", "C++" ], "license": "GPL-3.0", "collectionID": [], "maturity": "Mature", "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/ablab/tandemQUAST/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [], "documentation": [], "publication": [ { "doi": "10.1093/bioinformatics/btaa440", "pmid": "32657355", "pmcid": "PMC7355294", "type": [], "version": null, "note": null, "metadata": null } ], "credit": [], "owner": "n.m.palmblad@lumc.nl", "additionDate": "2026-06-04T08:25:03.738887Z", "lastUpdate": "2026-06-04T08:25:03.740814Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "screen_assembly", "description": "Screen a bacterial assembly (contigs/CDS or proteins) for nucleotide or protein sequences.\n\nPipeline that screens for presence of genes of interest (GOI) in bacterial assemblies. Generates multiple CSVs and plots that describe which genes are present and how variable their sequence is. Can use DNA or protein query sequences (GOIs) and DNA contigs/fastas or protein fastas as database (db) to search in.", "homepage": "https://github.com/shimbalama/screen_assembly", "biotoolsID": "screen_assembly", "biotoolsCURIE": "biotools:screen_assembly", "version": [ "v1" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_2403", "term": "Sequence analysis" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0925", "term": "Sequence assembly" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [] }, { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [] } ], "note": null, "cmd": null } ], "toolType": [ "Script", "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" } ], "operatingSystem": [], "language": [ "Python" ], "license": "MIT", "collectionID": [], "maturity": "Mature", "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/shimbalama/screen_assembly", "type": [ "Repository" ], "note": null } ], "download": [], "documentation": [ { "url": "https://github.com/shimbalama/screen_assembly/wiki", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1038/s41588-019-0417-8", "pmid": "31133745", "pmcid": "PMC6650292", "type": [ "Primary" ], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Mark R. Davies", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0001-6141-5179", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null } ], "owner": "aniehues", "additionDate": "2026-06-04T08:08:16.771951Z", "lastUpdate": "2026-06-04T08:08:16.774426Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "RepeatAfterMe", "description": "RepeatAfterMe is a package for the extension of repetitive DNA cores. The tool automatically extends a multiple sequence alignment that may represent only a fragment of a longer repetitive sequence family.", "homepage": "https://github.com/Dfam-consortium/RepeatAfterMe", "biotoolsID": "repeatafterme", "biotoolsCURIE": "biotools:repeatafterme", "version": [ "v0.0.7" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0495", "term": "Local alignment" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_3009", "term": "2bit" } ] }, { "data": { "uri": "http://edamontology.org/data_1017", "term": "Sequence range" }, "format": [ { "uri": "http://edamontology.org/format_3585", "term": "bed6" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": "./RAMExtend -ranges test/extension-test2.tsv -twobit test/extension-test2.2bit" } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "C" ], "license": "CC0-1.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [], "credit": [ { "name": "Robert Hubley", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null } ], "owner": "Pub2Tools", "additionDate": "2026-05-08T10:33:02.567199Z", "lastUpdate": "2026-05-08T10:33:02.569259Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "GenErode", "description": "Workflow for whole genome sequencing analysis, including patterns of genome erosion. Written in Snakemake workflow language.", "homepage": "https://github.com/NBISweden/GenErode", "biotoolsID": "generode", "biotoolsCURIE": "biotools:generode", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0368", "term": "Sequence masking" }, { "uri": "http://edamontology.org/operation_3211", "term": "Genome indexing" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_3003", "term": "BED" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3198", "term": "Read mapping" }, { "uri": "http://edamontology.org/operation_3192", "term": "Sequence trimming" }, { "uri": "http://edamontology.org/operation_2478", "term": "Nucleic acid sequence analysis" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_2572", "term": "BAM" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3218", "term": "Sequencing quality control" }, { "uri": "http://edamontology.org/operation_3227", "term": "Variant calling" }, { "uri": "http://edamontology.org/operation_3196", "term": "Genotyping" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_2572", "term": "BAM" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3498", "term": "Sequence variations" }, "format": [ { "uri": "http://edamontology.org/format_3016", "term": "VCF" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Workflow" ], "topic": [ { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" } ], "operatingSystem": [], "language": [ "Other" ], "license": "GPL-3.0", "collectionID": [], "maturity": "Mature", "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [ { "url": "https://github.com/NBISweden/GenErode", "type": [ "General" ], "note": null }, { "url": "https://github.com/NBISweden/GenErode/wiki", "type": [ "User manual" ], "note": null } ], "publication": [ { "doi": "10.1186/s12859-022-04757-0", "pmid": "35698034", "pmcid": "PMC9195343", "type": [ "Method" ], "version": null, "note": null, "metadata": null } ], "credit": [], "owner": "johangustafsson", "additionDate": "2026-05-06T23:40:03.794540Z", "lastUpdate": "2026-05-06T23:40:03.797298Z", "editPermission": { "type": "public", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "fastahack", "description": "fastahack is a library for indexing and extracting sequences and subsequences from FASTA files. The library provides a FASTA reader and indexer that can be embedded into applications which would benefit from directly reading subsequences from FASTA files. The library automatically handles index file generation and use.", "homepage": "https://github.com/ekg/fastahack", "biotoolsID": "fastahack", "biotoolsCURIE": "biotools:fastahack", "version": [ "1.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0227", "term": "Indexing" }, { "uri": "http://edamontology.org/operation_2422", "term": "Data retrieval" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_2200", "term": "FASTA-like (text)" }, { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] }, { "data": { "uri": "http://edamontology.org/data_0955", "term": "Data index" }, "format": [] } ], "note": null, "cmd": null } ], "toolType": [ "Library" ], "topic": [ { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" } ], "operatingSystem": [ "Windows", "Linux", "Mac" ], "language": [ "C++" ], "license": "MIT", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/ekg/fastahack", "type": [ "Repository" ], "note": null } ], "download": [], "documentation": [ { "url": "https://github.com/ekg/fastahack/blob/master/README", "type": [ "General" ], "note": null } ], "publication": [], "credit": [ { "name": "Erik Garrison", "email": "erik.garrison@bc.edu", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null } ], "owner": "VKasalica", "additionDate": "2026-05-05T19:32:21.089812Z", "lastUpdate": "2026-05-05T19:57:38.785597Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "Verkko", "description": "Verkko is a hybrid genome assembly pipeline for telomere-to-telomere assembly of long reads.", "homepage": "https://github.com/marbl/verkko", "biotoolsID": "verkko", "biotoolsCURIE": "biotools:verkko", "version": [ "2.3.2" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3216", "term": "Scaffolding" }, { "uri": "http://edamontology.org/operation_0310", "term": "Sequence assembly" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_3181", "term": "Sequence assembly report" }, "format": [ { "uri": "http://edamontology.org/format_3752", "term": "CSV" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" }, { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" }, { "uri": "http://edamontology.org/topic_4056", "term": "Long-read sequencing" } ], "operatingSystem": [ "Linux" ], "language": [ "Perl", "Python", "Bash" ], "license": "Freeware", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [ { "doi": "10.1038/s41587-023-01662-6", "pmid": "36797493", "pmcid": "PMC10427740", "type": [ "Primary" ], "version": null, "note": null, "metadata": null }, { "doi": "10.1101/gr.280383.124", "pmid": "40389285", "pmcid": "PMC12212074", "type": [ "Primary" ], "version": "2.0.0", "note": null, "metadata": null } ], "credit": [], "owner": "n.m.palmblad@lumc.nl", "additionDate": "2026-05-01T11:37:56.074227Z", "lastUpdate": "2026-05-01T11:37:56.076538Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "bwa-meth", "description": "bwa-meth is a tool for alignment of Bisulfite sequencing reads.", "homepage": "https://github.com/brentp/bwa-meth", "biotoolsID": "bwa-meth", "biotoolsCURIE": "biotools:bwa-meth", "version": [ "0.2.9" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0292", "term": "Sequence alignment" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1383", "term": "Nucleic acid sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_2573", "term": "SAM" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0102", "term": "Mapping" }, { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" } ], "operatingSystem": [ "Linux" ], "language": [ "Python" ], "license": "MIT", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [ { "doi": "10.48550/arXiv.1401.1129", "pmid": null, "pmcid": null, "type": [ "Preprint" ], "version": null, "note": null, "metadata": null } ], "credit": [], "owner": "n.m.palmblad@lumc.nl", "additionDate": "2026-05-01T10:45:51.114755Z", "lastUpdate": "2026-05-01T10:45:51.117070Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "shic", "description": "shic is a collection of shims for use in automated workflow composition", "homepage": "https://github.com/magnuspalmblad/shic", "biotoolsID": "shic", "biotoolsCURIE": "biotools:shic", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0896", "term": "Protein report" }, "format": [ { "uri": "http://edamontology.org/format_3747", "term": "protXML" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2872", "term": "ID list" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2536", "term": "Mass spectrometry data" }, "format": [ { "uri": "http://edamontology.org/format_3651", "term": "MGF" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2536", "term": "Mass spectrometry data" }, "format": [ { "uri": "http://edamontology.org/format_3651", "term": "MGF" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0870", "term": "Sequence distance matrix" }, "format": [ { "uri": "http://edamontology.org/format_1912", "term": "Nexus format" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0870", "term": "Sequence distance matrix" }, "format": [ { "uri": "http://edamontology.org/format_1991", "term": "mega" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3021", "term": "UniProt accession" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0945", "term": "Peptide identification" }, "format": [ { "uri": "http://edamontology.org/format_3655", "term": "pepXML" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0945", "term": "Peptide identification" }, "format": [ { "uri": "http://edamontology.org/format_3247", "term": "mzIdentML" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0972", "term": "Text mining report" }, "format": [ { "uri": "http://edamontology.org/format_2332", "term": "XML" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1174", "term": "ChEBI ID" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0945", "term": "Peptide identification" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0945", "term": "Peptide identification" }, "format": [ { "uri": "http://edamontology.org/format_3247", "term": "mzIdentML" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0896", "term": "Protein report" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2872", "term": "ID list" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0945", "term": "Peptide identification" }, "format": [ { "uri": "http://edamontology.org/format_3655", "term": "pepXML" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1009", "term": "Protein name" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0945", "term": "Peptide identification" }, "format": [ { "uri": "http://edamontology.org/format_3655", "term": "pepXML" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2764", "term": "Protein name (UniProt)" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Script" ], "topic": [], "operatingSystem": [], "language": [], "license": "MIT", "collectionID": [], "maturity": null, "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [ "Proteomics", "Galaxy", "Metabolomics" ], "link": [ { "url": "https://github.com/magnuspalmblad/shic", "type": [ "Repository" ], "note": null } ], "download": [], "documentation": [ { "url": "https://github.com/magnuspalmblad/shic/blob/main/README.md", "type": [ "General" ], "note": null } ], "publication": [], "credit": [ { "name": "Magnus Palmblad", "email": "magnus.palmblad@gmail.com", "url": null, "orcidid": "https://orcid.org/0000-0002-5865-8994", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [ "Primary contact" ], "note": null }, { "name": "Veit Schwämmle", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0002-9708-6722", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Dirk Winkelhardt", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0001-8770-2221", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Vedran Kasalica", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0002-0097-1056", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Anna-Lena Lamprecht", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0003-1953-5606", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null } ], "owner": "n.m.palmblad@lumc.nl", "additionDate": "2023-08-30T13:03:57.407598Z", "lastUpdate": "2026-04-17T13:21:28.211937Z", "editPermission": { "type": "group", "authors": [ "VKasalica", "veits@bmb.sdu.dk" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "pathotypr", "description": "A fast, offline, pathogen-agnostic toolkit for lineage classification and marker-driven genotyping from whole-genome sequencing data. Bring your own SNP marker panel for any microbial pathogen — pathotypr handles the rest. Ships with curated panels for Mycobacterium tuberculosis complex (MTBC): 3,707 lineage-defining SNPs and over 102,000 resistance-associated mutations. Works with assembled genomes (FASTA) and raw reads (FASTQ). Available as command-line interface and cross-platform desktop GUI (Tauri).", "homepage": "https://github.com/PathoGenOmics-Lab/pathotypr", "biotoolsID": "pathotypr", "biotoolsCURIE": "biotools:pathotypr", "version": [ "1.0.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3196", "term": "Genotyping" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0920", "term": "Genotype/phenotype report" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": "train — Build a Random Forest classifier from labeled genomes.", "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3225", "term": "Variant classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0920", "term": "Genotype/phenotype report" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": "predict — Assign lineages to genomes using a pre-trained Random Forest model.", "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3196", "term": "Genotyping" }, { "uri": "http://edamontology.org/operation_3225", "term": "Variant classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0920", "term": "Genotype/phenotype report" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": "classify — Call known SNP markers in assembled genomes against a user-defined marker panel.", "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3196", "term": "Genotyping" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0920", "term": "Genotype/phenotype report" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": "split-fastq — Alignment-free genotyping directly from raw reads using k-mer matching.", "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_0346", "term": "Sequence similarity search" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0920", "term": "Genotype/phenotype report" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": "match — Find the closest reference genome from a set of references for raw reads.", "cmd": null } ], "toolType": [ "Command-line tool", "Desktop application" ], "topic": [ { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" }, { "uri": "http://edamontology.org/topic_3301", "term": "Microbiology" }, { "uri": "http://edamontology.org/topic_0625", "term": "Genotype and phenotype" }, { "uri": "http://edamontology.org/topic_3168", "term": "Sequencing" }, { "uri": "http://edamontology.org/topic_3305", "term": "Public health and epidemiology" }, { "uri": "http://edamontology.org/topic_3474", "term": "Machine learning" } ], "operatingSystem": [], "language": [ "Rust" ], "license": "AGPL-3.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [ { "url": "https://github.com/PathoGenOmics-Lab/pathotypr/releases", "type": "Binaries", "note": null, "version": null }, { "url": "https://github.com/PathoGenOmics-Lab/pathotypr", "type": "Source code", "note": null, "version": null } ], "documentation": [ { "url": "https://github.com/PathoGenOmics-Lab/pathotypr/tree/main/docs", "type": [ "User manual" ], "note": null } ], "publication": [ { "doi": "10.64898/2026.03.24.714002", "pmid": null, "pmcid": null, "type": [ "Primary" ], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Paula Ruiz-Rodriguez", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0003-0727-5974", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer", "Maintainer" ], "note": null }, { "name": "Mireia Coscolla", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0003-0752-0538", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null }, { "name": "I2SysBio (CSIC - Universitat de València)", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null }, { "name": "PathoGenOmics Lab", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Division", "typeRole": [ "Provider" ], "note": null } ], "owner": "paururo", "additionDate": "2026-04-02T11:29:54.022786Z", "lastUpdate": "2026-04-02T11:29:54.029869Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "MHCcluster", "description": "Functional cluster of MHC class I molecules (MHCI) based on their predicted binding specificity.", "homepage": "http://cbs.dtu.dk/services/MHCcluster/", "biotoolsID": "mhccluster", "biotoolsCURIE": "biotools:mhccluster", "version": [ "2.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3459", "term": "Functional clustering" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_1353", "term": "Sequence motif" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0872", "term": "Phylogenetic tree" }, "format": [ { "uri": "http://edamontology.org/format_2006", "term": "Phylogenetic tree format" } ] }, { "data": { "uri": "http://edamontology.org/data_1636", "term": "Heat map" }, "format": [ { "uri": "http://edamontology.org/format_2333", "term": "Binary format" } ] } ], "note": "provides heat-map and graphical tree-based visualizations of the functional relationship between MHC class I and class II variants", "cmd": null } ], "toolType": [ "Web application" ], "topic": [ { "uri": "http://edamontology.org/topic_2830", "term": "Immunoproteins, genes and antigens" } ], "operatingSystem": [ "Linux", "Windows", "Mac" ], "language": [], "license": "Other", "collectionID": [], "maturity": "Emerging", "cost": "Free of charge (with restrictions)", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "http://cbs.dtu.dk/services", "type": [ "Software catalogue" ], "note": null } ], "download": [], "documentation": [ { "url": "http://www.cbs.dtu.dk/services/MHCcluster-2.0/instructions.php", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1007/s00251-013-0714-9", "pmid": "23775223", "pmcid": "PMC3750724", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "MHCcluster, a method for functional clustering of MHC molecules", "abstract": "The identification of peptides binding to major histocompatibility complexes (MHC) is a critical step in the understanding of T cell immune responses. The human MHC genomic region (HLA) is extremely polymorphic comprising several thousand alleles, many encoding a distinct molecule. The potentially unique specificities remain experimentally uncharacterized for the vast majority of HLA molecules. Likewise, for nonhuman species, only a minor fraction of the known MHC molecules have been characterized. Here, we describe a tool, MHCcluster, to functionally cluster MHC molecules based on their predicted binding specificity. The method has a flexible web interface that allows the user to include any MHC of interest in the analysis. The output consists of a static heat map and graphical tree-based visualizations of the functional relationship between MHC variants and a dynamic TreeViewer interface where both the functional relationship and the individual binding specificities of MHC molecules are visualized. We demonstrate that conventional sequence-based clustering will fail to identify the functional relationship between molecules, when applied to MHC system, and only through the use of the predicted binding specificity can a correct clustering be found. Clustering of prevalent HLA-A and HLA-B alleles using MHCcluster confirms the presence of 12 major specificity groups (supertypes) some however with highly divergent specificities. Importantly, some HLA molecules are shown not to fit any supertype classification. Also, we use MHCcluster to show that chimpanzee MHC class I molecules have a reduced functional diversity compared to that of HLA class I molecules. MHCcluster is available at www.cbs.dtu.dk/services/MHCcluster-2.0. © 2013 Springer-Verlag Berlin Heidelberg.", "date": "2013-09-01T00:00:00Z", "citationCount": 60, "authors": [ { "name": "Thomsen M." }, { "name": "Lundegaard C." }, { "name": "Buus S." }, { "name": "Lund O." }, { "name": "Nielsen M." } ], "journal": "Immunogenetics" } } ], "credit": [ { "name": "CBS", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null }, { "name": "Morten Nielsen", "email": "mniel@cbs.dtu.dk", "url": null, "orcidid": "http://orcid.org/0000-0001-7885-4311", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "liuyang", "additionDate": "2015-01-21T13:29:32Z", "lastUpdate": "2026-03-20T11:08:19.028012Z", "editPermission": { "type": "private", "authors": [] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "HTSlib", "description": "The main purpose of HTSlib is to provide access to genomic information files, both alignment data (SAM, BAM, and CRAM formats) and variant data (VCF and BCF formats). The library also provides interfaces to access and index genome reference data in FASTA format and tab-delimited files with genomic coordinates. It is utilized and incorporated into both SAMtools and BCFtools.", "homepage": "http://www.htslib.org/", "biotoolsID": "htslib", "biotoolsCURIE": "biotools:htslib", "version": [ "1.0", "1.1", "1.2", "1.2.1", "1.3", "1.3.1", "1.3.2", "1.4", "1.4.1", "1.5", "1.6", "1.7", "1.8", "1.9", "1.10", "1.10.1", "1.10.2", "1.11", "1.12", "1.13", "1.14", "1.15", "1.15.1", "1.16", "1.17", "1.18", "1.19", "1.20", "1.21.1", "1.22", "1.22.1", "1.22.2", "1.23", "1.23.1" ], "otherID": [], "relation": [ { "biotoolsID": "samtools", "type": "usedBy" }, { "biotoolsID": "bcftools", "type": "usedBy" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_2409", "term": "Data handling" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0924", "term": "Sequence trace" }, "format": [ { "uri": "http://edamontology.org/format_3462", "term": "CRAM" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_2573", "term": "SAM" }, { "uri": "http://edamontology.org/format_2572", "term": "BAM" }, { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_3498", "term": "Sequence variations" }, "format": [ { "uri": "http://edamontology.org/format_3020", "term": "BCF" }, { "uri": "http://edamontology.org/format_3016", "term": "VCF" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0924", "term": "Sequence trace" }, "format": [ { "uri": "http://edamontology.org/format_3462", "term": "CRAM" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_2573", "term": "SAM" }, { "uri": "http://edamontology.org/format_2572", "term": "BAM" }, { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_3498", "term": "Sequence variations" }, "format": [ { "uri": "http://edamontology.org/format_3020", "term": "BCF" }, { "uri": "http://edamontology.org/format_3016", "term": "VCF" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Library" ], "topic": [ { "uri": "http://edamontology.org/topic_3071", "term": "Data management" } ], "operatingSystem": [ "Windows", "Linux", "Mac" ], "language": [ "C" ], "license": "MIT", "collectionID": [ "Animal and Crop Genomics" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/samtools/htslib", "type": [ "Repository" ], "note": null }, { "url": "http://www.htslib.org/support/#lists", "type": [ "Mailing list" ], "note": null }, { "url": "https://github.com/samtools/htslib/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [ { "url": "http://www.htslib.org/download/", "type": "Downloads page", "note": null, "version": null } ], "documentation": [ { "url": "http://www.htslib.org/doc/#manual-pages", "type": [ "User manual" ], "note": null } ], "publication": [ { "doi": "10.1093/gigascience/giab007", "pmid": "33594436", "pmcid": "PMC7931820", "type": [ "Primary" ], "version": null, "note": "HTSlib: C library for reading/writing high-throughput sequencing data.", "metadata": null } ], "credit": [ { "name": "Wellcome Sanger Institute", "email": "samtools@sanger.ac.uk", "url": "https://www.sanger.ac.uk/", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider", "Primary contact" ], "note": null }, { "name": "Samtools Help mailing list", "email": null, "url": "https://lists.sourceforge.net/lists/listinfo/samtools-help", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Project", "typeRole": [ "Support" ], "note": null } ], "owner": "awhitwham", "additionDate": "2017-08-20T16:07:58Z", "lastUpdate": "2026-03-18T17:33:38.200309Z", "editPermission": { "type": "group", "authors": [ "animalandcropgenomics", "smoe" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "QUAST", "description": "QUAST stands for QUality ASsessment Tool. \nIt evaluates a quality of genome assemblies by computing various metrics and providing nice reports.", "homepage": "http://quast.sourceforge.net/quast", "biotoolsID": "quast", "biotoolsCURIE": "biotools:quast", "version": [ "v.5.3.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0337", "term": "Visualisation" }, { "uri": "http://edamontology.org/operation_3180", "term": "Sequence assembly validation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [], "note": "# Running quast on a eukaryotic genome", "cmd": "quast -ek assembly.fa --out output_prefix" } ], "toolType": [ "Workflow" ], "topic": [ { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" } ], "operatingSystem": [ "Linux", "Mac" ], "language": [ "Perl", "Python", "C" ], "license": "GPL-2.0", "collectionID": [ "ONTeater" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/ablab/quast", "type": [ "Repository" ], "note": null }, { "url": "https://github.com/ablab/quast/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [], "documentation": [ { "url": "http://quast.bioinf.spbau.ru/", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1093/bioinformatics/btt086", "pmid": "23422339", "pmcid": "PMC3624806", "type": [], "version": null, "note": null, "metadata": { "title": "QUAST: Quality assessment tool for genome assemblies", "abstract": "Limitations of genome sequencing techniques have led to dozens of assembly algorithms, none of which is perfect. A number of methods for comparing assemblers have been developed, but none is yet a recognized benchmark. Further, most existing methods for comparing assemblies are only applicable to new assemblies of finished genomes; the problem of evaluating assemblies of previously unsequenced species has not been adequately considered. Here, we present QUAST - a quality assessment tool for evaluating and comparing genome assemblies. This tool improves on leading assembly comparison software with new ideas and quality metrics. QUAST can evaluate assemblies both with a reference genome, as well as without a reference. QUAST produces many reports, summary tables and plots to help scientists in their research and in their publications. In this study, we used QUAST to compare several genome assemblers on three datasets. QUAST tables and plots for all of them are available in the Supplementary Material, and interactive versions of these reports are on the QUAST website. © 2013 The Author.", "date": "2013-04-15T00:00:00Z", "citationCount": 6872, "authors": [ { "name": "Gurevich A." }, { "name": "Saveliev V." }, { "name": "Vyahhi N." }, { "name": "Tesler G." } ], "journal": "Bioinformatics" } } ], "credit": [ { "name": "QUAST Support", "email": "quast.support@cab.spbu.ru", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "seqwiki_import", "additionDate": "2017-01-13T13:16:01Z", "lastUpdate": "2026-03-13T09:39:06.494933Z", "editPermission": { "type": "group", "authors": [ "ELIXIR-CZ", "Keiler_Collier", "rathor2611" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "Mapler", "description": "Mapler is a pipeline for assessing assembly quality in taxonomically rich metagenomes sequenced with HiFi reads. It incorporates state-of-the-art metrics and facilitates the comparison of assembly strategies.", "homepage": "https://github.com/Nimauric/Mapler", "biotoolsID": "mapler", "biotoolsCURIE": "biotools:mapler", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0310", "term": "Sequence assembly" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0924", "term": "Sequence trace" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3180", "term": "Sequence assembly validation" }, { "uri": "http://edamontology.org/operation_3731", "term": "Sample comparison" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3914", "term": "Quality control report" }, "format": [ { "uri": "http://edamontology.org/format_3751", "term": "DSV" }, { "uri": "http://edamontology.org/format_2330", "term": "Textual format" }, { "uri": "http://edamontology.org/format_2331", "term": "HTML" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3798", "term": "Read binning" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Workflow", "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_3174", "term": "Metagenomics" }, { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" } ], "operatingSystem": [], "language": [ "Bash", "Python" ], "license": "AGPL-3.0", "collectionID": [], "maturity": null, "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/Nimauric/Mapler", "type": [ "Repository" ], "note": null } ], "download": [], "documentation": [], "publication": [ { "doi": "10.1093/BIOINFORMATICS/BTAF334", "pmid": "40478660", "pmcid": "PMC12205171", "type": [], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Nicolas Maurice", "email": "nicolas.maurice@inria.fr", "url": null, "orcidid": "https://orcid.org/0009-0009-9615-2765", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null }, { "name": "Claire Lemaitre", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0001-8675-170X", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Riccardo Vicedomini", "email": null, "url": null, "orcidid": "https://orcid.org/0000-0002-7706-0998", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Clémence Frioux", "email": "clemence.frioux@inria.fr", "url": null, "orcidid": "https://orcid.org/0000-0003-2114-0697", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null } ], "owner": "nimauric", "additionDate": "2026-02-22T14:20:37.167505Z", "lastUpdate": "2026-03-10T15:44:03.311515Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "NetPhos", "description": "Neural network predictions for serine, threonine and tyrosine phosphorylation sites in eukaryotic proteins.", "homepage": "http://cbs.dtu.dk/services/NetPhos/", "biotoolsID": "netphos", "biotoolsCURIE": "biotools:netphos", "version": [ "2.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3092", "term": "Protein feature detection" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1277", "term": "Protein features" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] }, { "data": { "uri": "http://edamontology.org/data_2955", "term": "Sequence report" }, "format": [ { "uri": "http://edamontology.org/format_2333", "term": "Binary format" } ] } ], "note": "produces neural network predictions for serine, threonine and tyrosine phosphorylation sites in eukaryotic proteins", "cmd": null } ], "toolType": [ "Command-line tool", "Web application", "Web service" ], "topic": [ { "uri": "http://edamontology.org/topic_0160", "term": "Sequence sites, features and motifs" } ], "operatingSystem": [ "Linux", "Windows", "Mac" ], "language": [], "license": "Other", "collectionID": [], "maturity": "Emerging", "cost": "Free of charge (with restrictions)", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "http://cbs.dtu.dk/services", "type": [ "Software catalogue" ], "note": null } ], "download": [], "documentation": [ { "url": "http://www.cbs.dtu.dk/services/NetPhos/instructions.php", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1006/jmbi.1999.3310", "pmid": "10600390", "pmcid": null, "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "Sequence and structure-based prediction of eukaryotic protein phosphorylation sites", "abstract": "Protein phosphorylation at serine, threonine or tyrosine residues affects a multitude of cellular signaling processes. How is specificity in substrate recognition and phosphorylation by protein kinases achieved? Here, we present an artificial neural network method that predicts phosphorylation sites in independent sequences with a sensitivity in the range from 69% to 96%. As an example, we predict novel phosphorylation sites in the p300/CBP protein that may regulate interaction with transcription factors and histone acetyltransferase activity. In addition, serine and threonine residues in p300/CBP that can be modified by O-linked glycosylation with N-acetylglucosamine are identified. Glycosylation may prevent phosphorplation at these sites, a mechanism named yin-yang regulation. The prediction server is available on the Internet at http://www.cbs.dtu.dk/services/NetPhos/or via e-mail to NetPhos@@@cbs.dtu.dk.", "date": "1999-12-17T00:00:00Z", "citationCount": 2373, "authors": [ { "name": "Blom N." }, { "name": "Gammeltoft S." }, { "name": "Brunak S." } ], "journal": "Journal of Molecular Biology" } } ], "credit": [ { "name": "CBS", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null }, { "name": null, "email": null, "url": "http://www.bioinformatics.dtu.dk/english/Service/Contact", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null }, { "name": "Nicolaj Blom", "email": "nblom@kt.dtu.dk", "url": null, "orcidid": "http://orcid.org/0000-0001-7787-7853", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null } ], "owner": "CBS", "additionDate": "2015-06-29T10:13:32Z", "lastUpdate": "2026-03-05T12:16:41.386128Z", "editPermission": { "type": "group", "authors": [ "I3raf", "Rubika" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "BigSeqKit", "description": "The Next Generation Sequencing (NGS) raw data are stored in FASTA and FASTQ text-based file formats. Common operations on FASTA/Q files include searching, filtering, sampling, deduplication and sorting, among others. We can find several tools in the literature for FASTA/Q file manipulation but none of them are well fitted for large files of tens of GB (likely TBs in the near future) since mostly they are based on sequential processing. The exception is seqkit that allows some routines to use a few threads but, in any case, the scalability is very limited. To deal with this issue, we introduce BigSeqKit, a parallel toolkit to manipulate FASTA/Q files at scale with speed and scalability at its core. BigSeqKit takes advantage of an HPC-Big Data framework (IgnisHPC) to parallelize and optimize the commands included in seqkit. In this way, in most cases it is from tens to hundreds of times faster than other state-of-the-art tools such as seqkit, samtools and pyfastx.", "homepage": "https://github.com/citiususc/BigSeqKit", "biotoolsID": "bigseqkit", "biotoolsCURIE": "biotools:bigseqkit", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3192", "term": "Sequence trimming" }, { "uri": "http://edamontology.org/operation_0372", "term": "DNA transcription" }, { "uri": "http://edamontology.org/operation_0371", "term": "DNA translation" }, { "uri": "http://edamontology.org/operation_0233", "term": "Sequence conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Library", "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" } ], "operatingSystem": [ "Linux" ], "language": [ "Python" ], "license": "GPL-3.0", "collectionID": [], "maturity": null, "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [], "credit": [], "owner": "cesarpomar", "additionDate": "2023-05-22T15:10:32.141196Z", "lastUpdate": "2026-03-01T11:28:15.208151Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "PLAST", "description": "PLAST is a heuristical method to search for highest scoring local alignments between a DNA sequence query and a graphical pangenome. It takes as input a plain DNA sequence and a pangenome which may either be a set of (multiple) FASTA or FASTQ files or a sequence graph constructed by the tool Bifrost. It then outputs statistically meaningful (gapped) alignments in the style of the NCBI BLAST standard output format. Alignments are calculated based on a \"seed-and-extend approach\" while traversing the sequence graph. Biologically meaningful alignments are filtered by using an alignment statistic explicitly developed for sequence-to-graph alignments involving graphical pangenomes.", "homepage": "https://github.com/tischulz1/plast", "biotoolsID": "pangenome-blast", "biotoolsCURIE": "biotools:pangenome-blast", "version": [ "0.0.1-0.2.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0495", "term": "Local alignment" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1211", "term": "unambiguous pure nucleotide" } ] }, { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_3975", "term": "GFA 1" }, { "uri": "http://edamontology.org/format_2333", "term": "Binary format" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1383", "term": "Nucleic acid sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1333", "term": "BLAST results" } ] } ], "note": "In order to search for alignments within the pangenome graph, \nA pangenome graph used to search for alignments consists of (1) a file in GFA format containing all sequences of the graph, (2) a binary file produced by the tool itself or the software \"Bifrost\" and (3) a program-specific index data structure in binary format.", "cmd": "PLAST Search -i pangenomeGraphCommonFilePrefix -q fileContainingOneQueryPerLine" }, { "operation": [ { "uri": "http://edamontology.org/operation_0227", "term": "Indexing" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0850", "term": "Sequence set" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0850", "term": "Sequence set" }, "format": [ { "uri": "http://edamontology.org/format_3975", "term": "GFA 1" }, { "uri": "http://edamontology.org/format_2333", "term": "Binary format" } ] } ], "note": "If a pangenome graph already exists and only an index has to be built, FASTA/FASTQ files are not needed.", "cmd": "PLAST Build -i pangenomeGraphCommonFilePrefix -R *.fasta" } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0797", "term": "Comparative genomics" }, { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" } ], "operatingSystem": [ "Linux", "Mac", "Windows" ], "language": [ "C++" ], "license": "GPL-3.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://gitlab.ub.uni-bielefeld.de/gi/plast", "type": [ "Repository" ], "note": null }, { "url": "https://github.com/tischulz1/plast", "type": [ "Mirror" ], "note": null } ], "download": [], "documentation": [ { "url": "https://gitlab.ub.uni-bielefeld.de/gi/plast/-/blob/master/README.md", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1093/bioinformatics/btab077", "pmid": "33532821", "pmcid": "PMC8388040", "type": [ "Primary", "Method", "Benchmarking study" ], "version": null, "note": null, "metadata": { "title": "Detecting high-scoring local alignments in pangenome graphs", "abstract": "Motivation: Increasing amounts of individual genomes sequenced per species motivate the usage of pangenomic approaches. Pangenomes may be represented as graphical structures, e.g. compacted colored de Bruijn graphs, which offer a low memory usage and facilitate reference-free sequence comparisons. While sequence-to-graph mapping to graphical pangenomes has been studied for some time, no local alignment search tool in the vein of BLAST has been proposed yet. Results: We present a new heuristic method to find maximum scoring local alignments of a DNA query sequence to a pangenome represented as a compacted colored de Bruijn graph. Our approach additionally allows a comparison of similarity among sequences within the pangenome. We show that local alignment scores follow an exponential-tail distribution similar to BLAST scores, and we discuss how to estimate its parameters to separate local alignments representing sequence homology from spurious findings. An implementation of our method is presented, and its performance and usability are shown. Our approach scales sublinearly in running time and memory usage with respect to the number of genomes under consideration. This is an advantage over classical methods that do not make use of sequence similarity within the pangenome.", "date": "2021-08-15T00:00:00Z", "citationCount": 6, "authors": [ { "name": "Schulz T." }, { "name": "Wittler R." }, { "name": "Rahmann S." }, { "name": "Hach F." }, { "name": "Stoye J." } ], "journal": "Bioinformatics" } } ], "credit": [ { "name": "Bielefeld University", "email": null, "url": "https://www.uni-bielefeld.de/", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null }, { "name": "Genome Informatics", "email": null, "url": "https://gi.cebitec.uni-bielefeld.de/", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null }, { "name": "Tizian Schulz", "email": "plast-service@cebitec.uni-bielefeld.de", "url": null, "orcidid": "https://orcid.org/0000-0003-0744-7078", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null } ], "owner": "tizian", "additionDate": "2021-05-06T06:18:52Z", "lastUpdate": "2026-02-26T11:22:02.485629Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "cuffcompare", "description": "Compare assembled transcripts to a reference annotation and track Cufflinks transcripts across multiple experiments.", "homepage": "http://cole-trapnell-lab.github.io/cufflinks/", "biotoolsID": "cuffcompare", "biotoolsCURIE": "biotools:cuffcompare", "version": [ "2.2.1.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0492", "term": "Multiple sequence alignment" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_1975", "term": "GFF3" }, { "uri": "http://edamontology.org/format_2306", "term": "GTF" } ] }, { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] }, { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_2306", "term": "GTF" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Web application" ], "topic": [ { "uri": "http://edamontology.org/topic_3168", "term": "Sequencing" } ], "operatingSystem": [ "Linux", "Windows", "Mac" ], "language": [ "C++" ], "license": null, "collectionID": [ "Cufflinks", "galaxyPasteur" ], "maturity": "Mature", "cost": null, "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://galaxy.pasteur.fr/tool_runner?tool_id=toolshed.pasteur.fr/repos/fmareuil/cuffcompare/cuffcompare/2.2.1.0", "type": [ "Galaxy service" ], "note": null } ], "download": [], "documentation": [ { "url": "http://cole-trapnell-lab.github.io/cufflinks/cuffcompare/", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1038/nbt.1621", "pmid": "20436464", "pmcid": "PMC3146043", "type": [ "Primary" ], "version": null, "note": null, "metadata": null }, { "doi": "10.1093/nar/gkw343", "pmid": "27137889", "pmcid": "PMC4987906", "type": [ "Other" ], "version": null, "note": null, "metadata": null }, { "doi": "10.7490/f1000research.1114334.1", "pmid": null, "pmcid": null, "type": [ "Other" ], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Galaxy Support Team", "email": "galaxy@pasteur.fr", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "hmenager", "additionDate": "2016-12-19T14:29:34Z", "lastUpdate": "2026-02-26T11:14:58.790920Z", "editPermission": { "type": "private", "authors": [] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "fur", "description": "The program fur takes as input a set of target genome sequences and a set of related genome sequences, the neighbors. It returns the sequence regions common to all targets that are absent form the neighbors. Such regions can be used as candidate genetic markers.", "homepage": "https://github.com/evolbioinf/fur", "biotoolsID": "fur", "biotoolsCURIE": "biotools:fur", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_2998", "term": "Nucleic acid comparison" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2887", "term": "Nucleic acid sequence record" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": null } ], "toolType": [], "topic": [ { "uri": "http://edamontology.org/topic_3344", "term": "Biomedical science" } ], "operatingSystem": [], "language": [ "Go" ], "license": null, "collectionID": [], "maturity": null, "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [], "credit": [], "owner": "bebatut", "additionDate": "2026-02-16T08:19:06.415244Z", "lastUpdate": "2026-02-16T08:19:06.417279Z", "editPermission": { "type": "public", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "metabuli", "description": "Metabuli: specific and sensitive metagenomic classification via joint analysis of DNA and amino acid", "homepage": "https://metabuli.steineggerlab.com", "biotoolsID": "metabuli", "biotoolsCURIE": "biotools:metabuli", "version": [], "otherID": [], "relation": [ { "biotoolsID": "mmseqs2", "type": "uses" }, { "biotoolsID": "gtdb", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool", "Desktop application" ], "topic": [ { "uri": "http://edamontology.org/topic_0637", "term": "Taxonomy" } ], "operatingSystem": [ "Windows", "Mac", "Linux" ], "language": [ "C++" ], "license": "GPL-3.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/steineggerlab/Metabuli/issues", "type": [ "Issue tracker" ], "note": null }, { "url": "https://github.com/steineggerlab/Metabuli", "type": [ "Repository" ], "note": "github repository" } ], "download": [], "documentation": [], "publication": [ { "doi": "10.1038/s41592-024-02273-y", "pmid": "38769467", "pmcid": null, "type": [], "version": null, "note": null, "metadata": null } ], "credit": [], "owner": "milot-mirdita", "additionDate": "2023-06-07T03:22:25.847061Z", "lastUpdate": "2026-02-12T14:21:25.897853Z", "editPermission": { "type": "group", "authors": [ "vashokan" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "Bakta", "description": "Rapid & standardized annotation of bacterial genomes, MAGs & plasmids", "homepage": "https://github.com/oschwengers/bakta", "biotoolsID": "bakta", "biotoolsCURIE": "biotools:bakta", "version": [ "v1.12.0" ], "otherID": [], "relation": [ { "biotoolsID": "diamond", "type": "uses" }, { "biotoolsID": "hmmer3", "type": "uses" }, { "biotoolsID": "infernal", "type": "uses" }, { "biotoolsID": "trnascan-se", "type": "uses" }, { "biotoolsID": "blast", "type": "uses" }, { "biotoolsID": "aragorn", "type": "uses" }, { "biotoolsID": "pilercr", "type": "uses" }, { "biotoolsID": "deepsig", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0362", "term": "Genome annotation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0925", "term": "Sequence assembly" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_2914", "term": "Sequence features metadata" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] }, { "data": { "uri": "http://edamontology.org/data_2012", "term": "Sequence coordinates" }, "format": [ { "uri": "http://edamontology.org/format_1975", "term": "GFF3" } ] }, { "data": { "uri": "http://edamontology.org/data_2886", "term": "Protein sequence record" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_1364", "term": "Hidden Markov model" }, "format": [ { "uri": "http://edamontology.org/format_3329", "term": "HMMER3" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1270", "term": "Feature table" }, "format": [ { "uri": "http://edamontology.org/format_1936", "term": "GenBank format" }, { "uri": "http://edamontology.org/format_1975", "term": "GFF3" }, { "uri": "http://edamontology.org/format_3464", "term": "JSON" }, { "uri": "http://edamontology.org/format_1927", "term": "EMBL format" }, { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] }, { "data": { "uri": "http://edamontology.org/data_2886", "term": "Protein sequence record" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_2887", "term": "Nucleic acid sequence record" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_2884", "term": "Plot" }, "format": [ { "uri": "http://edamontology.org/format_3604", "term": "SVG" }, { "uri": "http://edamontology.org/format_3603", "term": "PNG" } ] }, { "data": { "uri": "http://edamontology.org/data_1772", "term": "Score" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": "bakta --db <db-path> --prefix <prefix> --output <output-path> genome.fasta" } ], "toolType": [ "Web application", "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" }, { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" }, { "uri": "http://edamontology.org/topic_0091", "term": "Bioinformatics" } ], "operatingSystem": [ "Linux", "Mac" ], "language": [ "Python" ], "license": "GPL-3.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [ "Tools" ], "elixirNode": [ "Germany" ], "elixirCommunity": [], "link": [ { "url": "https://github.com/oschwengers/bakta", "type": [ "Repository" ], "note": null }, { "url": "https://github.com/oschwengers/bakta/issues", "type": [ "Issue tracker" ], "note": null }, { "url": "https://bioconda.github.io/recipes/bakta/README.html", "type": [ "Other" ], "note": null }, { "url": "https://bakta.computational.bio", "type": [ "Service" ], "note": null } ], "download": [ { "url": "https://zenodo.org/records/14916843", "type": "Other", "note": "Mandatory annotation database", "version": "v6.0" } ], "documentation": [ { "url": "https://github.com/oschwengers/bakta/blob/main/README.md", "type": [ "General" ], "note": null }, { "url": "https://github.com/oschwengers/bakta/blob/main/CONTRIBUTION.md", "type": [ "Contributions policy" ], "note": null }, { "url": "https://github.com/oschwengers/bakta/blob/main/CODE_OF_CONDUCT.md", "type": [ "Code of conduct" ], "note": null }, { "url": "https://bakta.readthedocs.io/", "type": [ "User manual" ], "note": null } ], "publication": [ { "doi": "10.1099/mgen.0.000685", "pmid": "34739369", "pmcid": "PMC8743544", "type": [ "Primary" ], "version": "1.1", "note": null, "metadata": null }, { "doi": "10.1093/nar/gkaf335", "pmid": "40271661", "pmcid": "PMC12230652", "type": [ "Primary" ], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Oliver Schwengers", "email": "oliver.schwengers@cb.jlug.de", "url": "https://github.com/oschwengers", "orcidid": "https://orcid.org/0000-0003-4216-2721", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact", "Developer", "Maintainer" ], "note": null }, { "name": "Justus Liebig University Giessen", "email": null, "url": "https://www.uni-giessen.de", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null } ], "owner": "oschwengers", "additionDate": "2021-05-08T17:25:21Z", "lastUpdate": "2026-01-29T12:11:19.042627Z", "editPermission": { "type": "group", "authors": [ "ELIXIR-CZ", "bebatut" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "MetaPhlAn", "description": "Computational tool for profiling the composition of microbial communities from metagenomic shotgun sequencing data.", "homepage": "http://segatalab.cibio.unitn.it/tools/metaphlan/index.html", "biotoolsID": "metaphlan", "biotoolsCURIE": "biotools:metaphlan", "version": [], "otherID": [], "relation": [ { "biotoolsID": "gtdb", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_2573", "term": "SAM" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [ { "uri": "http://edamontology.org/format_3751", "term": "DSV" } ] } ], "note": null, "cmd": "metaphlan <fastq_input> --input_type fastq -o <output>" }, { "operation": [ { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [ { "uri": "http://edamontology.org/format_3751", "term": "DSV" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [ { "uri": "http://edamontology.org/format_3751", "term": "DSV" } ] } ], "note": "Convert SGB-based profile to GTDB taxonomy", "cmd": "sgb_to_gtdb_profile.py -i <metaphlan_output> -o <gtdb_metaphlan_output>" } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_3174", "term": "Metagenomics" }, { "uri": "http://edamontology.org/topic_0194", "term": "Phylogenomics" } ], "operatingSystem": [ "Linux", "Mac", "Windows" ], "language": [ "Python" ], "license": "MIT", "collectionID": [ "Animal and Crop Genomics" ], "maturity": null, "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [ { "url": "https://github.com/biobakery/MetaPhlAn", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1038/nmeth.2066", "pmid": "22688413", "pmcid": "PMC3443552", "type": [ "Primary" ], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": null, "email": null, "url": "https://groups.google.com/forum/#!forum/metaphlan-users", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "admin", "additionDate": "2017-08-20T15:57:59Z", "lastUpdate": "2026-01-28T10:35:56.506019Z", "editPermission": { "type": "group", "authors": [ "animalandcropgenomics", "ELIXIR-CZ", "bebatut", "vashokan" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "kraken2", "description": "Kraken 2 is the newest version of Kraken, a taxonomic classification system using exact k-mer matches to achieve high accuracy and fast classification speeds. This classifier matches each k-mer within a query sequence to the lowest common ancestor (LCA) of all genomes containing the given k-mer. The k-mer assignments inform the classification algorithm.\nAny assumption that Kraken’s raw read assignments can be directly translated into species or strain-level abundance estimates is flawed. Bracken (Bayesian Reestimation of Abundance after Classification with KrakEN), estimates species abundances in metagenomics samples by probabilistically re-distributing reads in the taxonomic tree. (Lu, Jennifer et al. “Bracken: estimating species abundance in metagenomics data.”)", "homepage": "https://github.com/DerrickWood/kraken2", "biotoolsID": "kraken2", "biotoolsCURIE": "biotools:kraken2", "version": [ "2.0.8-beta" ], "otherID": [], "relation": [ { "biotoolsID": "kraken", "type": "isNewVersionOf" }, { "biotoolsID": "bracken", "type": "usedBy" }, { "biotoolsID": "gtdb", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": "`kraken2 --db <kraken2_database> <input.fastq>`" } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0637", "term": "Taxonomy" }, { "uri": "http://edamontology.org/topic_3174", "term": "Metagenomics" }, { "uri": "http://edamontology.org/topic_3697", "term": "Microbial ecology" }, { "uri": "http://edamontology.org/topic_3301", "term": "Microbiology" } ], "operatingSystem": [], "language": [ "Perl", "C++" ], "license": "MIT", "collectionID": [ "ONTeater" ], "maturity": null, "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/DerrickWood/kraken2", "type": [ "Repository" ], "note": null }, { "url": "https://github.com/DerrickWood/kraken2/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [ { "url": "https://github.com/DerrickWood/kraken2/archive/v2.0.8-beta.tar.gz", "type": "Source code", "note": null, "version": "2.0.8-beta" } ], "documentation": [ { "url": "https://github.com/DerrickWood/kraken2/wiki/Manual", "type": [ "User manual" ], "note": null }, { "url": "https://benlangmead.github.io/aws-indexes/k2", "type": [ "User manual" ], "note": "Links to multiple Kraken 2 and bracken databases and indexes" } ], "publication": [ { "doi": "10.1101/762302", "pmid": null, "pmcid": null, "type": [], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Derrick E. Wood", "email": null, "url": null, "orcidid": "http://orcid.org/0000-0002-7429-1854", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null }, { "name": "Jennifer Lu", "email": null, "url": null, "orcidid": "http://orcid.org/0000-0001-9167-2002", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null }, { "name": "Ben Langmead", "email": "langmea@cs.jhu.edu", "url": null, "orcidid": "http://orcid.org/0000-0003-2437-1976", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null } ], "owner": "anand-anshu", "additionDate": "2019-09-13T12:51:16Z", "lastUpdate": "2026-01-28T10:34:30.102754Z", "editPermission": { "type": "group", "authors": [ "vashokan", "Keiler_Collier" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "SingleM", "description": "Novelty-inclusive microbial community profiling of shotgun metagenomes", "homepage": "https://wwood.github.io/singlem/", "biotoolsID": "singlem", "biotoolsCURIE": "biotools:singlem", "version": [], "otherID": [], "relation": [ { "biotoolsID": "gtdb", "type": "uses" }, { "biotoolsID": "globdb", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [ { "uri": "http://edamontology.org/format_3752", "term": "CSV" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_3174", "term": "Metagenomics" } ], "operatingSystem": [ "Linux" ], "language": [ "Python" ], "license": "GPL-3.0", "collectionID": [], "maturity": null, "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [ { "url": "https://wwood.github.io/singlem/", "type": [ "General", "Command-line options", "Installation instructions" ], "note": null } ], "publication": [ { "doi": "10.1101/2024.01.30.578060", "pmid": null, "pmcid": null, "type": [], "version": null, "note": null, "metadata": null } ], "credit": [], "owner": "benjwoodcroft", "additionDate": "2024-03-23T21:36:23.370696Z", "lastUpdate": "2026-01-28T10:30:54.345544Z", "editPermission": { "type": "group", "authors": [ "vashokan" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "globalamfungi", "description": "The GlobalAMFungi Database is an open-access, global repository of arbuscular mycorrhizal (AM) fungal occurrence data compiled from high-throughput sequencing studies. It aggregates millions of DNA sequence observations of AM fungi from thousands of geographically referenced environmental samples, together with rich metadata on sampling location and environmental context, to map the global distribution and diversity of these key plant symbionts. The resource is designed to be community-driven and FAIR (Findable, Accessible, Interoperable, Reusable), supporting research into AM fungal ecology, biogeography, and how environmental factors shape their diversity.", "homepage": "https://globalamfungi.com/", "biotoolsID": "globalamfungi", "biotoolsCURIE": "biotools:globalamfungi", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3431", "term": "Data deposition" }, { "uri": "http://edamontology.org/operation_0226", "term": "Annotation" }, { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0857", "term": "Sequence search results" }, "format": [ { "uri": "http://edamontology.org/format_2310", "term": "FASTA-HTML" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Database portal", "Web application" ], "topic": [ { "uri": "http://edamontology.org/topic_3050", "term": "Biodiversity" }, { "uri": "http://edamontology.org/topic_3697", "term": "Microbial ecology" }, { "uri": "http://edamontology.org/topic_3810", "term": "Agricultural science" } ], "operatingSystem": [], "language": [ "R" ], "license": "CC-BY-4.0", "collectionID": [ "ELIXIR-CZ", "Czech Republic" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [ "Data" ], "elixirNode": [ "Czech Republic" ], "elixirCommunity": [ "Plant Sciences" ], "link": [ { "url": "https://globalamfungi.com/", "type": [ "Helpdesk", "Repository", "Service" ], "note": null } ], "download": [], "documentation": [ { "url": "https://globalamfungi.com/", "type": [ "User manual", "Citation instructions", "Quick start guide", "Contributions policy", "General" ], "note": null } ], "publication": [ { "doi": "10.1111/nph.19283", "pmid": null, "pmcid": null, "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": null, "abstract": null, "date": null, "citationCount": 0, "authors": [], "journal": null } } ], "credit": [ { "name": "Tomas Vetrovsky", "email": "vetrovsky@biomed.cas.cz", "url": null, "orcidid": "https://orcid.org/0000-0002-0831-486X", "gridid": null, "rorid": "02p1jz666", "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact", "Developer", "Contributor" ], "note": null }, { "name": "ELIXIR-CZ", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Consortium", "typeRole": [], "note": null } ], "owner": "TomasVetrovsky", "additionDate": "2025-12-16T11:00:25.334832Z", "lastUpdate": "2025-12-16T11:00:25.337448Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "ASAFind", "description": "ASAFind is a software that predicts the intracellular location of proteins in cells with four membrane-bound complex plastids of red algal origin. \nThese plastids evolved via eukaryote-eukaryote endosymbiosis and for example can be found in diatoms and cryptophytes. ASAFind uses protein sequence data and external predictions of signal peptides (by the tools SignalP and TargetP), and predicts plastid proteins, and proteins that are targeted to the periplastidic compartment from these data; optionally, a graphical output can generated.", "homepage": "https://asafind.jcu.cz/", "biotoolsID": "asafind", "biotoolsCURIE": "biotools:asafind", "version": [ "2.0" ], "otherID": [], "relation": [ { "biotoolsID": "signalp", "type": "uses" }, { "biotoolsID": "targetp", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_2489", "term": "Subcellular localisation prediction" }, { "uri": "http://edamontology.org/operation_0239", "term": "Sequence motif recognition" }, { "uri": "http://edamontology.org/operation_0422", "term": "Protein cleavage site prediction" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2886", "term": "Protein sequence record" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_1270", "term": "Feature table" }, "format": [] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1277", "term": "Protein features" }, "format": [] }, { "data": { "uri": "http://edamontology.org/data_2884", "term": "Plot" }, "format": [] } ], "note": null, "cmd": null } ], "toolType": [ "Script", "Command-line tool", "Web service" ], "topic": [ { "uri": "http://edamontology.org/topic_2229", "term": "Cell biology" }, { "uri": "http://edamontology.org/topic_0078", "term": "Proteins" }, { "uri": "http://edamontology.org/topic_0780", "term": "Plant biology" }, { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "Python" ], "license": "CC-BY-SA-4.0", "collectionID": [ "ELIXIR-CZ", "Czech Republic" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [ "Tools" ], "elixirNode": [ "Czech Republic" ], "elixirCommunity": [ "Plant Sciences", "Marine Metagenomics", "Microbial Biotechnology" ], "link": [ { "url": "https://asafind.jcu.cz", "type": [ "Service" ], "note": "Web Service" }, { "url": "https://github.com/ASAFind/ASAFind-2", "type": [ "Repository" ], "note": "Information and source code, for local installation or development" } ], "download": [ { "url": "https://asafind.jcu.cz/download-page/", "type": "Downloads page", "note": "Download page on web-service, links to repository", "version": "2.0" } ], "documentation": [ { "url": "https://asafind.jcu.cz/download-page/", "type": [ "Installation instructions" ], "note": null } ], "publication": [ { "doi": "10.1111/tpj.70138", "pmid": "40464854", "pmcid": "PMC12136025", "type": [ "Primary" ], "version": "2.0", "note": "Publication of the current version of ASAFind (2.0)", "metadata": { "title": "ASAFind 2.0: multi-class protein targeting prediction for diatoms and algae with complex plastids", "abstract": "", "date": "2025-06-01T00:00:00Z", "citationCount": 0, "authors": [], "journal": "Plant Journal" } }, { "doi": "10.1111/tpj.12734", "pmid": "25438865", "pmcid": "PMC4329603", "type": [ "Other" ], "version": "1.0", "note": "Publication of the first version of ASAFind", "metadata": { "title": "Plastid proteome prediction for diatoms and other algae with secondary plastids of the red lineage", "abstract": "", "date": "2015-02-01T00:00:00Z", "citationCount": 138, "authors": [], "journal": "Plant Journal" } }, { "doi": "10.48550/arXiv.2303.02509", "pmid": null, "pmcid": null, "type": [ "Benchmarking study" ], "version": "1.0", "note": "Benchmarking of the performance of the first version of ASAFind", "metadata": null } ], "credit": [ { "name": "Marta Vohnoutová", "email": "mvohnoutova@jcu.cz", "url": "https://www.jcu.cz/cz/univerzita/lide/clovek?identita=Vohnoutova_Marta_61699", "orcidid": "https://orcid.org/0000-0002-8915-8626", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Contributor", "Developer", "Maintainer" ], "note": null }, { "name": "Ansgar Gruber", "email": "agruber@prf.jcu.cz", "url": "https://www.jcu.cz/cz/univerzita/lide/clovek?identita=Gruber_Ansgar_118401", "orcidid": "https://orcid.org/0000-0002-5876-4391", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact", "Developer", "Documentor" ], "note": null } ], "owner": "martavohnoutova", "additionDate": "2025-12-15T14:17:14.627791Z", "lastUpdate": "2025-12-15T17:36:43.189214Z", "editPermission": { "type": "group", "authors": [ "agruber" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "metagWGS", "description": "metagWGS is a workflow dedicated to the analysis of metagenomic data. It allows assembly, taxonomic annotation, and functional annotation of predicted genes. Since release 2.3, binning step with the possibility of cross-alignment is included. It has been developed in collaboration with several CATI BIOS4biol agents. Funded by Antiselfish Project (Labex Ecofect), ExpoMicoPig project (France Futur elevage) and SeqOccIn project (CPER - Occitanie Toulouse / FEDER), ATB_Biofilm funded by PNREST Anses, France genomique (ANR-10-INBS-09-08) and Resalab Ouest.", "homepage": "https://forgemia.inra.fr/genotoul-bioinfo/metagwgs", "biotoolsID": "metagwgs", "biotoolsCURIE": "biotools:metagwgs", "version": [ "2.3", "2.5.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [ { "uri": "http://edamontology.org/format_1915", "term": "Format" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_3672", "term": "Gene functional annotation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3917", "term": "Count matrix" }, "format": [ { "uri": "http://edamontology.org/format_1915", "term": "Format" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_0524", "term": "De-novo assembly" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Workflow" ], "topic": [ { "uri": "http://edamontology.org/topic_3174", "term": "Metagenomics" } ], "operatingSystem": [ "Linux" ], "language": [ "Python" ], "license": "GPL-3.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [ "France" ], "elixirCommunity": [], "link": [ { "url": "https://forge.inrae.fr/genotoul-bioinfo/metagwgs", "type": [ "Repository" ], "note": "See documentation, source code and functionnal test documentation." } ], "download": [ { "url": "https://forgemia.inra.fr/genotoul-bioinfo/metagwgs-test-datasets", "type": "Test data", "note": "Functional tests data and script", "version": null } ], "documentation": [ { "url": "https://genotoul-bioinfo.pages-forge.inrae.fr/metagwgs/master/index.html", "type": [ "User manual" ], "note": "We provide up to date installation documentation, usage documentation, output description and functionnal test datasets and procedure." } ], "publication": [], "credit": [ { "name": "Claire Hoede", "email": "claire.hoede@inrae.fr", "url": null, "orcidid": "https://orcid.org/0000-0001-5054-7731", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null }, { "name": "GenoToul bioinformatics facility", "email": null, "url": "http://bioinfo.genotoul.fr/", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Division", "typeRole": [ "Provider" ], "note": null } ], "owner": "choede", "additionDate": "2022-04-19T09:32:41.303637Z", "lastUpdate": "2025-12-11T14:51:44.804907Z", "editPermission": { "type": "group", "authors": [ "pbordron" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "Jalview", "description": "Jalview is a free cross-platform program for multiple sequence alignment editing, visualisation and analysis. Use it to align, view and edit sequence alignments, analyse them with phylogenetic trees and principal components analysis (PCA) plots and explore molecular structures and annotation.", "homepage": "https://www.jalview.org/", "biotoolsID": "Jalview", "biotoolsCURIE": "biotools:Jalview", "version": [ "2.11.5.1" ], "otherID": [], "relation": [ { "biotoolsID": "jabaws", "type": "uses" }, { "biotoolsID": "chimera", "type": "uses" }, { "biotoolsID": "chimerax", "type": "uses" }, { "biotoolsID": "pymol", "type": "uses" }, { "biotoolsID": "bioconda", "type": "includedIn" }, { "biotoolsID": "3d-beacons", "type": "uses" }, { "biotoolsID": "uniprot", "type": "uses" }, { "biotoolsID": "pfam", "type": "uses" }, { "biotoolsID": "ensembl", "type": "uses" }, { "biotoolsID": "pdb", "type": "uses" }, { "biotoolsID": "rfam", "type": "uses" }, { "biotoolsID": "3d-beacons", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3081", "term": "Sequence alignment editing" }, { "uri": "http://edamontology.org/operation_0324", "term": "Phylogenetic tree analysis" }, { "uri": "http://edamontology.org/operation_0564", "term": "Sequence visualisation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1948", "term": "nbrf/pir" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_1984", "term": "FASTA-aln" }, { "uri": "http://edamontology.org/format_3015", "term": "Pileup" }, { "uri": "http://edamontology.org/format_1938", "term": "GFF2-seq" }, { "uri": "http://edamontology.org/format_3313", "term": "BLC" }, { "uri": "http://edamontology.org/format_3311", "term": "RNAML" }, { "uri": "http://edamontology.org/format_1915", "term": "Format" }, { "uri": "http://edamontology.org/format_3774", "term": "BioJSON (Jalview)" }, { "uri": "http://edamontology.org/format_1982", "term": "ClustalW format" }, { "uri": "http://edamontology.org/format_1477", "term": "mmCIF" }, { "uri": "http://edamontology.org/format_1997", "term": "PHYLIP format" }, { "uri": "http://edamontology.org/format_3016", "term": "VCF" }, { "uri": "http://edamontology.org/format_1961", "term": "Stockholm format" }, { "uri": "http://edamontology.org/format_1939", "term": "GFF3-seq" }, { "uri": "http://edamontology.org/format_1947", "term": "GCG MSF" } ] }, { "data": { "uri": "http://edamontology.org/data_0886", "term": "Structure alignment" }, "format": [ { "uri": "http://edamontology.org/format_1476", "term": "PDB" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1948", "term": "nbrf/pir" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_3015", "term": "Pileup" }, { "uri": "http://edamontology.org/format_3313", "term": "BLC" }, { "uri": "http://edamontology.org/format_3774", "term": "BioJSON (Jalview)" }, { "uri": "http://edamontology.org/format_1982", "term": "ClustalW format" }, { "uri": "http://edamontology.org/format_3464", "term": "JSON" }, { "uri": "http://edamontology.org/format_1997", "term": "PHYLIP format" }, { "uri": "http://edamontology.org/format_1961", "term": "Stockholm format" }, { "uri": "http://edamontology.org/format_1947", "term": "GCG MSF" } ] }, { "data": { "uri": "http://edamontology.org/data_2884", "term": "Plot" }, "format": [ { "uri": "http://edamontology.org/format_3466", "term": "EPS" }, { "uri": "http://edamontology.org/format_1915", "term": "Format" }, { "uri": "http://edamontology.org/format_2331", "term": "HTML" }, { "uri": "http://edamontology.org/format_3604", "term": "SVG" }, { "uri": "http://edamontology.org/format_3603", "term": "PNG" } ] } ], "note": "Other Input formats:\nAMSA (.amsa);\nJnetFile (.concise, .jnet);\nPFAM (.pfam);\nSubstitution matrix (.matrix);\nJalview Project File (.jvp);\nJalview Feature File (.features, .jvfeatures);\nJalview Annotations File (.annotations, .jvannotations);\nPredicted Aligned Error (PAE) Matrix File (.json)\n...\nOther Output formats:\nPFAM (.pfam);\nBioJS (.biojs) (interactive HTML/Javascript);\nJalview Project File (.jvp);", "cmd": null } ], "toolType": [ "Desktop application", "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" }, { "uri": "http://edamontology.org/topic_0092", "term": "Data visualisation" } ], "operatingSystem": [ "Mac", "Linux", "Windows" ], "language": [], "license": "GPL-3.0", "collectionID": [ "ELIXIR-UK" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [ "Tools", "Interoperability" ], "elixirNode": [ "UK" ], "elixirCommunity": [], "link": [ { "url": "https://discourse.jalview.org/", "type": [ "Discussion forum" ], "note": null }, { "url": "https://issues.jalview.org/", "type": [ "Issue tracker" ], "note": null }, { "url": "https://www.jalview.org/development/jalview_develop/", "type": [ "Other" ], "note": "Latest development version" }, { "url": "https://gitlab.jalview.org/jalview/jalview.git", "type": [ "Repository" ], "note": null }, { "url": "https://twitter.com/Jalview", "type": [ "Social media" ], "note": "Twitter feed" }, { "url": "https://www.youtube.com/channel/UCIjpnvZB770yz7ftbrJ0tfw", "type": [ "Social media" ], "note": "YouTube training videos" }, { "url": "https://www.linkedin.com/company/104771886/", "type": [ "Social media" ], "note": null } ], "download": [ { "url": "https://www.jalview.org/download", "type": "Downloads page", "note": null, "version": null }, { "url": "https://www.jalview.org/download/source/", "type": "Source code", "note": null, "version": null }, { "url": "https://www.jalview.org/download/?os=all", "type": "Binaries", "note": "Binaries for all platforms", "version": null }, { "url": "https://www.jalview.org/favicon.svg", "type": "Icon", "note": null, "version": null }, { "url": "https://www.jalview.org/download/other/jar/", "type": "Binaries", "note": "Executable JAR file", "version": null } ], "documentation": [ { "url": "https://www.jalview.org/about/citation", "type": [ "Citation instructions" ], "note": null }, { "url": "https://www.jalview.org/training/", "type": [ "Training material" ], "note": "Hands-on exercises, Training courses and Training videos" }, { "url": "https://www.jalview.org/help/faq", "type": [ "FAQ" ], "note": null }, { "url": "https://www.jalview.org/help/documentation/", "type": [ "User manual" ], "note": null } ], "publication": [ { "doi": "10.1093/bioinformatics/btp033", "pmid": "19151095", "pmcid": "PMC2672624", "type": [], "version": null, "note": null, "metadata": { "title": "Jalview Version 2-A multiple sequence alignment editor and analysis workbench", "abstract": "", "date": "2009-05-07T00:00:00Z", "citationCount": 7717, "authors": [], "journal": "Bioinformatics" } } ], "credit": [ { "name": "Jim Procter", "email": null, "url": "http://www.lifesci.dundee.ac.uk/people/jim-procter", "orcidid": "https://orcid.org/0000-0002-7865-7382", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null }, { "name": "Geoff Barton", "email": null, "url": "https://www.lifesci.dundee.ac.uk/people/geoff-barton", "orcidid": "https://orcid.org/0000-0002-9014-5355", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null } ], "owner": "ben_s", "additionDate": "2019-02-13T17:01:40Z", "lastUpdate": "2025-12-11T14:16:30.074724Z", "editPermission": { "type": "group", "authors": [ "ben_s", "jimprocter" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "emapper2gbk", "description": "creation of genbank files from Eggnog-mapper annotation outputs", "homepage": "https://github.com/AuReMe/emapper2gbk", "biotoolsID": "emapper2gbk", "biotoolsCURIE": "biotools:emapper2gbk", "version": [ "0.3.2" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3434", "term": "Conversion" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0925", "term": "Sequence assembly" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_1233", "term": "Sequence set (protein)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_2012", "term": "Sequence coordinates" }, "format": [ { "uri": "http://edamontology.org/format_2305", "term": "GFF" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1270", "term": "Feature table" }, "format": [ { "uri": "http://edamontology.org/format_2205", "term": "GenBank-like format (text)" } ] } ], "note": "Genomic -single mode", "cmd": "genomes -fn genome.fna -fp proteome.faa -gff genome.gff -n \"Escherichia coli\"" } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_4011", "term": "Data rescue" } ], "operatingSystem": [ "Linux" ], "language": [ "Python" ], "license": "LGPL-3.0", "collectionID": [ "AuReMe" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/AuReMe/emapper2gbk", "type": [ "Repository" ], "note": null }, { "url": "https://pypi.org/project/emapper2gbk/", "type": [ "Software catalogue" ], "note": "Access to Python library" } ], "download": [ { "url": "https://github.com/AuReMe/emapper2gbk.git", "type": "Source code", "note": null, "version": "0.3.2" }, { "url": "https://pypi.org/project/emapper2gbk/#files", "type": "Software package", "note": null, "version": "0.3.2" } ], "documentation": [ { "url": "https://github.com/AuReMe/emapper2gbk", "type": [ "Installation instructions", "User manual" ], "note": null } ], "publication": [], "credit": [ { "name": "Arnaud", "email": null, "url": "https://github.com/ArnaudBelcour", "orcidid": "https://orcid.org/0000-0003-1170-0785", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null } ], "owner": "Noe_Robert", "additionDate": "2025-12-10T13:18:28.703003Z", "lastUpdate": "2025-12-10T16:49:05.332576Z", "editPermission": { "type": "group", "authors": [ "jgot" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "South Green Genome Hubs", "description": "The South Green Genome Hub is a suite of crop-specific community portals to manage genomic datasets with focus on tropical and Mediterranean plants. Currently developed on Banana, Cacao, Coffee, Grass, Rice, Vanilla, Citrus and Sugarcane, genome hubs provide access to multiple datasets (e.g. assemblies, gene product information, metabolic pathways, gene families, transcriptomics and genetic markers).", "homepage": "https://banana-genome-hub.southgreen.fr/", "biotoolsID": "South_Green_Genome_Hubs", "biotoolsCURIE": "biotools:South_Green_Genome_Hubs", "version": [], "otherID": [], "relation": [ { "biotoolsID": "tripal", "type": "uses" }, { "biotoolsID": "banana_genome_hub", "type": "includes" }, { "biotoolsID": "coffee_genome_hub", "type": "includes" }, { "biotoolsID": "cocoa_genome_hub", "type": "includes" }, { "biotoolsID": "rice_genome_hub", "type": "includes" }, { "biotoolsID": "sugarcane_genome_hub", "type": "includes" }, { "biotoolsID": "southgreen", "type": "includedIn" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3208", "term": "Genome visualisation" }, { "uri": "http://edamontology.org/operation_0338", "term": "Sequence database search" }, { "uri": "http://edamontology.org/operation_2403", "term": "Sequence analysis" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0968", "term": "Keyword" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [] } ], "note": null, "cmd": null } ], "toolType": [ "Database portal" ], "topic": [ { "uri": "http://edamontology.org/topic_3810", "term": "Agricultural science" }, { "uri": "http://edamontology.org/topic_0622", "term": "Genomics" }, { "uri": "http://edamontology.org/topic_3308", "term": "Transcriptomics" }, { "uri": "http://edamontology.org/topic_0797", "term": "Comparative genomics" }, { "uri": "http://edamontology.org/topic_0621", "term": "Model organisms" } ], "operatingSystem": [], "language": [ "JavaScript", "PHP" ], "license": "GPL-2.0", "collectionID": [ "Genome Hub" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": null, "elixirPlatform": [ "Data", "Tools" ], "elixirNode": [ "France" ], "elixirCommunity": [], "link": [ { "url": "https://github.com/SouthGreenPlatform/genomehubs", "type": [ "Issue tracker" ], "note": null } ], "download": [], "documentation": [ { "url": "https://banana-genome-hub.southgreen.fr/content/term-service", "type": [ "Terms of use" ], "note": null } ], "publication": [ { "doi": "10.1093/database/bat035", "pmid": "23707967", "pmcid": "PMC3662865", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "The banana genome hub", "abstract": "", "date": "2013-12-01T00:00:00Z", "citationCount": 150, "authors": [], "journal": "Database" } }, { "doi": "10.1093/nar/gku1108", "pmid": "25392413", "pmcid": "PMC4383925", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "The coffee genome hub: A resource for coffee genomes", "abstract": "", "date": "2015-01-28T00:00:00Z", "citationCount": 52, "authors": [], "journal": "Nucleic Acids Research" } }, { "doi": "10.1093/hr/uhac221", "pmid": "36479579", "pmcid": "PMC9720444", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "The banana genome hub: a community database for genomics in the Musaceae", "abstract": "", "date": "2022-01-01T00:00:00Z", "citationCount": 29, "authors": [], "journal": "Horticulture Research" } }, { "doi": "10.1016/j.xplc.2022.100330", "pmid": "35617961", "pmcid": "PMC9482989", "type": [ "Usage" ], "version": null, "note": null, "metadata": { "title": "A chromosome-level, haplotype-phased Vanilla planifolia genome highlights the challenge of partial endoreplication for accurate whole-genome assembly", "abstract": "", "date": "2022-09-12T00:00:00Z", "citationCount": 26, "authors": [], "journal": "Plant Communications" } } ], "credit": [ { "name": "Gaetan Droc", "email": "droc@cirad.fr", "url": null, "orcidid": "https://orcid.org/0000-0003-1849-1269", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact", "Developer", "Documentor", "Provider", "Support" ], "note": null }, { "name": "Alexis Dereeper", "email": "alexis.dereeper@ird.fr", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Mathieu Rouard", "email": "m.rouard@cgiar.org", "url": null, "orcidid": "https://orcid.org/0000-0003-1849-1269", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [ "Primary contact", "Maintainer", "Support" ], "note": null }, { "name": "Valentin Guignon", "email": "v.guignon@cgiar.org", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Chrisitine Tranchant", "email": "christine.tranchant@ird.fr", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null }, { "name": "Stéphanie Bocs", "email": "stephanie.sidibe-bocs@cirad.fr", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": null, "typeRole": [], "note": null } ], "owner": "mrouard", "additionDate": "2020-02-26T09:24:43Z", "lastUpdate": "2025-11-27T09:14:28.500250Z", "editPermission": { "type": "group", "authors": [ "gdroc", "Droc" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "trimAl", "description": "Tool for the automated removal of spurious sequences or poorly aligned regions from a multiple sequence alignment.", "homepage": "https://trimal.readthedocs.io", "biotoolsID": "trimal", "biotoolsCURIE": "biotools:trimal", "version": [ "1.5.1", "2.0-RC" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0492", "term": "Multiple sequence alignment" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1916", "term": "Alignment" }, "format": [ { "uri": "http://edamontology.org/format_1998", "term": "phylipnon" }, { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_1982", "term": "ClustalW format" }, { "uri": "http://edamontology.org/format_1997", "term": "PHYLIP format" } ] }, { "data": { "uri": "http://edamontology.org/data_2048", "term": "Report" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" }, { "uri": "http://edamontology.org/topic_3168", "term": "Sequencing" }, { "uri": "http://edamontology.org/topic_0160", "term": "Sequence sites, features and motifs" } ], "operatingSystem": [ "Mac", "Windows", "Linux" ], "language": [ "C++" ], "license": null, "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/inab/trimal", "type": [ "Repository" ], "note": null } ], "download": [ { "url": "https://github.com/inab/trimal", "type": "Source code", "note": null, "version": "1.5.1" }, { "url": "https://github.com/inab/trimal/tree/2.0_RC", "type": "Source code", "note": null, "version": "2.0-RC" } ], "documentation": [ { "url": "http://trimal.cgenomics.org/", "type": [ "General" ], "note": "Old versions" }, { "url": "https://trimal.readthedocs.io", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1093/bioinformatics/btp348", "pmid": "19505945", "pmcid": "PMC2712344", "type": [], "version": null, "note": null, "metadata": { "title": "trimAl: A tool for automated alignment trimming in large-scale phylogenetic analyses", "abstract": "", "date": "2009-08-01T00:00:00Z", "citationCount": 8679, "authors": [], "journal": "Bioinformatics" } } ], "credit": [ { "name": "Salvador Capella-Gutierrez", "email": "salcagu@gmail.com", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null }, { "name": null, "email": "tgabaldon@crg.es", "url": "http://gabaldonlab.crg.es/", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "scapella", "additionDate": "2017-04-15T08:42:53Z", "lastUpdate": "2025-11-26T09:30:50.611915Z", "editPermission": { "type": "group", "authors": [ "nico_bsc", "sergitobara" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "prolfquapp", "description": "A command-line tool for differential expression analysis in quantitative proteomics", "homepage": "https://github.com/prolfqua/prolfquapp", "biotoolsID": "prolfquapp", "biotoolsCURIE": "biotools:prolfquapp", "version": [ "0.1.6" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3741", "term": "Differential protein expression profiling" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2603", "term": "Expression data" }, "format": [ { "uri": "http://edamontology.org/format_3752", "term": "CSV" }, { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] }, { "data": { "uri": "http://edamontology.org/data_2044", "term": "Sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2603", "term": "Expression data" }, "format": [ { "uri": "http://edamontology.org/format_3620", "term": "xlsx" }, { "uri": "http://edamontology.org/format_2331", "term": "HTML" } ] } ], "note": null, "cmd": "./prolfqua_dea.sh -i data_dir/ -d annotation.xlsx -y config.yaml -w NameOfAnalysis -s DIANN\n# and again you run the version within the docker container with\n# ./prolfquapp_docker.sh prolfqua_dea.sh -i data_dir/ -d annotation.xlsx -y config.yaml -w NameOfAnalysis -s DIANN" }, { "operation": [ { "uri": "http://edamontology.org/operation_2428", "term": "Validation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2603", "term": "Expression data" }, "format": [ { "uri": "http://edamontology.org/format_3620", "term": "xlsx" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3914", "term": "Quality control report" }, "format": [ { "uri": "http://edamontology.org/format_2331", "term": "HTML" } ] } ], "note": null, "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_0571", "term": "Expression data visualisation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2603", "term": "Expression data" }, "format": [ { "uri": "http://edamontology.org/format_3752", "term": "CSV" }, { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] }, { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2603", "term": "Expression data" }, "format": [ { "uri": "http://edamontology.org/format_2331", "term": "HTML" }, { "uri": "http://edamontology.org/format_3508", "term": "PDF" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0121", "term": "Proteomics" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "R" ], "license": "MIT", "collectionID": [], "maturity": "Emerging", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/prolfqua/prolfquapp", "type": [ "Repository" ], "note": null }, { "url": "https://github.com/prolfqua/prolfquapp/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [ { "url": "https://github.com/prolfqua/prolfquapp/releases/tag/0.1.6", "type": "Downloads page", "note": null, "version": "0.1.6" } ], "documentation": [ { "url": "https://github.com/prolfqua/prolfquapp/blob/master/README.md", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1021/acs.jproteome.4c00911", "pmid": null, "pmcid": null, "type": [ "Primary" ], "version": "0.0.6", "note": null, "metadata": { "title": "prolfquapp ─ A User-Friendly Command-Line Tool Simplifying Differential Expression Analysis in Quantitative Proteomics", "abstract": "", "date": "2025-02-07T00:00:00Z", "citationCount": 1, "authors": [], "journal": "Journal of Proteome Research" } } ], "credit": [], "owner": "n.m.palmblad@lumc.nl", "additionDate": "2025-02-28T15:04:33.594183Z", "lastUpdate": "2025-11-06T14:37:12.116175Z", "editPermission": { "type": "group", "authors": [ "thatmariia" ] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "PeptideShaker", "description": "PeptideShaker is a search engine independent platform for interpretation of proteomics identification results from multiple search engines, currently supporting X!Tandem, MS-GF+, MS Amanda, OMSSA, MyriMatch, Comet, Tide, Mascot, Andromeda and mzIdentML. By combining the results from multiple search engines, while re-calculating PTM localization scores and redoing the protein inference, PeptideShaker attempts to give you the best possible understanding of your proteomics data", "homepage": "http://compomics.github.io/projects/peptide-shaker.html", "biotoolsID": "peptideshaker", "biotoolsCURIE": "biotools:peptideshaker", "version": [ "3.0.11" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3694", "term": "Mass spectrum visualisation" }, { "uri": "http://edamontology.org/operation_3631", "term": "Peptide identification" }, { "uri": "http://edamontology.org/operation_2428", "term": "Validation" }, { "uri": "http://edamontology.org/operation_3755", "term": "PTM localisation" }, { "uri": "http://edamontology.org/operation_3501", "term": "Enrichment analysis" }, { "uri": "http://edamontology.org/operation_0570", "term": "Structure visualisation" }, { "uri": "http://edamontology.org/operation_3767", "term": "Protein identification" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_0945", "term": "Peptide identification" }, "format": [ { "uri": "http://edamontology.org/format_3247", "term": "mzIdentML" } ] }, { "data": { "uri": "http://edamontology.org/data_2536", "term": "Mass spectrometry data" }, "format": [ { "uri": "http://edamontology.org/format_3651", "term": "MGF" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2992", "term": "Protein structure image" }, "format": [ { "uri": "http://edamontology.org/format_3579", "term": "JPG" }, { "uri": "http://edamontology.org/format_3604", "term": "SVG" } ] }, { "data": { "uri": "http://edamontology.org/data_3754", "term": "GO-term enrichment data" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] }, { "data": { "uri": "http://edamontology.org/data_2969", "term": "Sequence image" }, "format": [ { "uri": "http://edamontology.org/format_3547", "term": "Image format" } ] }, { "data": { "uri": "http://edamontology.org/data_0896", "term": "Protein report" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Desktop application", "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0121", "term": "Proteomics" }, { "uri": "http://edamontology.org/topic_3520", "term": "Proteomics experiment" }, { "uri": "http://edamontology.org/topic_0644", "term": "Proteome" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "Java" ], "license": "Apache-2.0", "collectionID": [ "de.NBI", "Proteomics", "BioInfra.Prot" ], "maturity": null, "cost": null, "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [ { "url": "https://github.com/compomics/peptide-shaker", "type": "Source code", "note": null, "version": null } ], "documentation": [ { "url": "http://compomics.github.io/projects/peptide-shaker.html#read-me", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1038/nbt.3109", "pmid": "25574629", "pmcid": null, "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "PeptideShaker enables reanalysis of MS-derived proteomics data sets: To the editor", "abstract": "", "date": "2015-01-01T00:00:00Z", "citationCount": 449, "authors": [], "journal": "Nature Biotechnology" } } ], "credit": [ { "name": "BioInfra.Prot", "email": null, "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null }, { "name": "Dominik Kopczynsk", "email": "dominik.kopczynski@isas.de", "url": "http://compomics.github.io/projects/peptide-shaker.html", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "BioInfra.Prot", "additionDate": "2016-10-20T10:31:19Z", "lastUpdate": "2025-11-01T15:59:45.423975Z", "editPermission": { "type": "group", "authors": [ "proteomics.bio.tools", "veits@bmb.sdu.dk" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "NGP", "description": "Simulation of next-generation proteomics (NGP) based on single-molecule sequencing.", "homepage": "https://github.com/magnuspalmblad/NGP", "biotoolsID": "ngp", "biotoolsCURIE": "biotools:ngp", "version": [], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_2426", "term": "Modelling and simulation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3869", "term": "Simulation" }, "format": [ { "uri": "http://edamontology.org/format_3752", "term": "CSV" }, { "uri": "http://edamontology.org/format_3508", "term": "PDF" } ] } ], "note": null, "cmd": null } ], "toolType": [], "topic": [], "operatingSystem": [], "language": [], "license": null, "collectionID": [], "maturity": null, "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [ { "doi": "10.1021/acs.jproteome.1c00136", "pmid": "33904308", "pmcid": "PMC8185883", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "Theoretical Considerations for Next-Generation Proteomics", "abstract": "", "date": "2021-06-04T00:00:00Z", "citationCount": 5, "authors": [], "journal": "Journal of Proteome Research" } } ], "credit": [], "owner": "n.m.palmblad@lumc.nl", "additionDate": "2025-10-29T16:12:04.796577Z", "lastUpdate": "2025-10-29T16:12:04.798957Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "NetStart", "description": "Prediction of eukaryotic translation initiation sites using a protein language model.\n\nNetStart 2.0 is a deep learning-based model that predicts canonical translation initiation sites in mRNA transcripts in species across the eukaryotic domain, including vertebrates, invertebrates, plants, fungi, and protists. \n\nThe model integrates the ESM-2 protein language model for assessing transitions from non-coding to coding regions with local start codon sequence context and taxonomical information. It has been trained on sequences from 60 phylogenetically diverse eukaryotic species.\n\nIf you need help with the bioinformatics programs, see the \"Getting Help\" section at the server site at the link.", "homepage": "https://services.healthtech.dtu.dk/services/NetStart-2.0/", "biotoolsID": "netstart_2.0", "biotoolsCURIE": "biotools:netstart_2.0", "version": [ "2.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3767", "term": "Protein identification" }, { "uri": "http://edamontology.org/operation_0362", "term": "Genome annotation" }, { "uri": "http://edamontology.org/operation_0477", "term": "Protein modelling" }, { "uri": "http://edamontology.org/operation_0439", "term": "Translation initiation site prediction" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3495", "term": "RNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1772", "term": "Score" }, "format": [] } ], "note": null, "cmd": null } ], "toolType": [], "topic": [ { "uri": "http://edamontology.org/topic_3512", "term": "Gene transcripts" }, { "uri": "http://edamontology.org/topic_0108", "term": "Protein expression" }, { "uri": "http://edamontology.org/topic_0203", "term": "Gene expression" }, { "uri": "http://edamontology.org/topic_0621", "term": "Model organisms" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "Python" ], "license": null, "collectionID": [], "maturity": null, "cost": null, "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/lsandvad/netstart2", "type": [ "Repository" ], "note": "GitHub with code and instructions and to download and run the program locally" }, { "url": "https://services.healthtech.dtu.dk/services/NetStart-2.0/", "type": [ "Service" ], "note": "NetStart 2.0 server where sequences can be uploaded directly without having to download the program (hosted by DTU Health Tech)." } ], "download": [], "documentation": [], "publication": [ { "doi": "10.1186/S12859-025-06220-2", "pmid": "40830753", "pmcid": "PMC12366053", "type": [ "Method" ], "version": "2.0", "note": null, "metadata": { "title": "NetStart 2.0: prediction of eukaryotic translation initiation sites using a protein language model", "abstract": "", "date": "2025-12-01T00:00:00Z", "citationCount": 0, "authors": [], "journal": "BMC Bioinformatics" } } ], "credit": [ { "name": "Line Sandvad Nielsen", "email": "line.s.nielsen@bio.ku.dk", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null }, { "name": "Henrik Nielsen", "email": "henni@dtu.dk", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null } ], "owner": "linesandvad", "additionDate": "2025-10-27T16:27:24.014603Z", "lastUpdate": "2025-10-28T17:34:39.042070Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "MS Annika", "description": "MS Annika is a crosslink search engine based on MS Amanda, aimed at identifying crosslinks of cleavable and non-cleavable crosslinkers from MS2 and MS3 spectra. It can deal with a wide variety of cross-linkers and provides robust and transparent FDR control based on a target-decoy approach. MS Annika is available free of charge as a plug-in for Proteome Discoverer.", "homepage": "https://github.com/hgb-bin-proteomics/MSAnnika", "biotoolsID": "ms_annika", "biotoolsCURIE": "biotools:ms_annika", "version": [ "Proteome Discoverer 3.2: MS Annika 3.0 v3.0.7", "Proteome Discoverer 3.1: MS Annika 3.0 v3.0.7", "Proteome Discoverer 3.0: MS Annika 2.0 v1.1.4fix", "Proteome Discoverer 2.5: MS Annika 2.0 v1.1.3", "Proteome Discoverer 2.4: MS Annika v1.0.0", "Proteome Discoverer 2.3: MS Annika v1.0.0" ], "otherID": [], "relation": [ { "biotoolsID": "ms_amanda", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3631", "term": "Peptide identification" }, { "uri": "http://edamontology.org/operation_3646", "term": "Peptide database search" }, { "uri": "http://edamontology.org/operation_3755", "term": "PTM localisation" }, { "uri": "http://edamontology.org/operation_3645", "term": "PTM identification" }, { "uri": "http://edamontology.org/operation_3649", "term": "Target-Decoy" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0943", "term": "Mass spectrum" }, "format": [ { "uri": "http://edamontology.org/format_3651", "term": "MGF" }, { "uri": "http://edamontology.org/format_3712", "term": "Thermo RAW" } ] }, { "data": { "uri": "http://edamontology.org/data_2886", "term": "Protein sequence record" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0857", "term": "Sequence search results" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Plug-in" ], "topic": [ { "uri": "http://edamontology.org/topic_0130", "term": "Protein folding, stability and design" }, { "uri": "http://edamontology.org/topic_0736", "term": "Protein folds and structural domains" }, { "uri": "http://edamontology.org/topic_0128", "term": "Protein interactions" }, { "uri": "http://edamontology.org/topic_0121", "term": "Proteomics" }, { "uri": "http://edamontology.org/topic_0091", "term": "Bioinformatics" } ], "operatingSystem": [ "Windows" ], "language": [ "C#" ], "license": "Freeware", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/hgb-bin-proteomics/MSAnnika", "type": [ "Repository" ], "note": "MS Annika version archive" } ], "download": [ { "url": "https://github.com/hgb-bin-proteomics/MSAnnika/raw/master/releases/latest/PD3.2/latest.zip", "type": "Software package", "note": "Latest MS Annika version for Proteome Disoverer 3.2", "version": "PD3.2:latest" }, { "url": "https://github.com/hgb-bin-proteomics/MSAnnika/raw/master/releases/latest/PD3.1/latest.zip", "type": "Software package", "note": "Latest MS Annika version for Proteome Disoverer 3.1", "version": "PD3.1:latest" }, { "url": "https://github.com/hgb-bin-proteomics/MSAnnika/raw/master/releases/latest/PD3.0/latest.zip", "type": "Software package", "note": "Latest MS Annika version for Proteome Disoverer 3.0", "version": "PD3.0:latest" }, { "url": "https://github.com/hgb-bin-proteomics/MSAnnika/raw/master/releases/latest/PD2.5/latest.zip", "type": "Software package", "note": "Latest MS Annika version for Proteome Disoverer 2.5", "version": "PD2.5:latest" } ], "documentation": [ { "url": "https://hgb-bin-proteomics.github.io/MSAnnika/", "type": [ "General" ], "note": null }, { "url": "https://github.com/hgb-bin-proteomics/MSAnnika/raw/master/MS_Annika_3.0_UserManual.pdf", "type": [ "User manual" ], "note": null }, { "url": "https://github.com/hgb-bin-proteomics/MSAnnika/raw/master/tutorial/MS_Annika_3.0_Tutorial.pdf", "type": [ "Training material" ], "note": "Detailed tutorial how to use MS Annika" }, { "url": "https://www.youtube.com/watch?v=L1lVt35PYv4", "type": [ "Training material" ], "note": "Detailed tutorial how to use MS Annika" } ], "publication": [ { "doi": "10.1021/acs.jproteome.0c01000", "pmid": "33852321", "pmcid": "PMC8155564", "type": [ "Primary" ], "version": "1.0", "note": "MS Annika for cleavable crosslink identification from MS2 spectra", "metadata": { "title": "MS Annika: A New Cross-Linking Search Engine", "abstract": "", "date": "2021-05-07T00:00:00Z", "citationCount": 22, "authors": [], "journal": "Journal of Proteome Research" } }, { "doi": "10.1021/acs.jproteome.3c00325", "pmid": "37566781", "pmcid": "PMC10476269", "type": [ "Primary" ], "version": "2.0", "note": "MS Annika 2.0 for cleavable crosslink identification from MS3 spectra", "metadata": { "title": "MS Annika 2.0 Identifies Cross-Linked Peptides in MS2-MS3-Based Workflows at High Sensitivity and Specificity", "abstract": "", "date": "2023-09-01T00:00:00Z", "citationCount": 5, "authors": [], "journal": "Journal of Proteome Research" } }, { "doi": "10.1038/s42004-024-01386-x", "pmid": "39702463", "pmcid": "PMC11659399", "type": [ "Primary" ], "version": "3.0", "note": "MS Annika 3.0 for non-cleavable crosslink identification", "metadata": { "title": "Proteome-wide non-cleavable crosslink identification with MS Annika 3.0 reveals the structure of the C. elegans Box C/D complex", "abstract": "", "date": "2024-12-01T00:00:00Z", "citationCount": 2, "authors": [], "journal": "Communications Chemistry" } } ], "credit": [ { "name": "Viktoria Dorfer", "email": "viktoria.dorfer@fh-hagenberg.at", "url": "http://bioinformatics.fh-hagenberg.at/", "orcidid": "https://orcid.org/0000-0002-5332-5701", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null }, { "name": "Micha Birklbauer", "email": "micha.birklbauer@fh-hagenberg.at", "url": "http://bioinformatics.fh-hagenberg.at/", "orcidid": "https://orcid.org/0009-0005-1051-179X", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null } ], "owner": "michabirklbauer", "additionDate": "2023-07-26T14:40:01.768324Z", "lastUpdate": "2025-10-26T02:38:48.643054Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "EPIK", "description": "Precise and scalable evolutionary placement with informative k-mers.", "homepage": "https://github.com/phylo42/EPIK", "biotoolsID": "epik", "biotoolsCURIE": "biotools:epik", "version": [ "0.2.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0323", "term": "Phylogenetic inference" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_2976", "term": "Protein sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_0955", "term": "Data index" }, "format": [ { "uri": "http://edamontology.org/format_2333", "term": "Binary format" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0872", "term": "Phylogenetic tree" }, "format": [ { "uri": "http://edamontology.org/format_3464", "term": "JSON" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0084", "term": "Phylogeny" } ], "operatingSystem": [ "Linux", "Mac" ], "language": [ "C++", "Python" ], "license": "MIT", "collectionID": [], "maturity": "Emerging", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [], "download": [], "documentation": [], "publication": [ { "doi": "10.1093/BIOINFORMATICS/BTAD692", "pmid": "37975872", "pmcid": "PMC10701097", "type": [], "version": "0.2.0", "note": null, "metadata": { "title": "EPIK: Precise and scalable evolutionary placement with informative k-mers", "abstract": "", "date": "2023-12-01T00:00:00Z", "citationCount": 2, "authors": [], "journal": "Bioinformatics" } } ], "credit": [ { "name": "Nikolai Romashchenko", "email": "nromashchenko@lirmm.fr", "url": null, "orcidid": "https://orcid.org/0000-0002-2264-5219", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null }, { "name": "Eric Rivals", "email": "rivals@lirmm.fr", "url": null, "orcidid": "https://orcid.org/0000-0003-3791-3973", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [], "note": null } ], "owner": "nromashchenko", "additionDate": "2024-05-03T08:43:04.841443Z", "lastUpdate": "2025-10-02T12:41:03.856493Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "SQUARNA", "description": "SQUARNA is a tool for RNA secondary structure prediction. It can take a single RNA sequence or an alignment of sequences as input. SQUARNA handles pseudoknots and can predict alternative structures. SQUARNA allows structural restraints and chemical probing data as additional input and is available at https://github.com/febos/SQUARNA.", "homepage": "https://github.com/febos/SQUARNA", "biotoolsID": "squarna", "biotoolsCURIE": "biotools:squarna", "version": [ "2.3" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0278", "term": "RNA secondary structure prediction" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3495", "term": "RNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_1961", "term": "Stockholm format" }, { "uri": "http://edamontology.org/format_1982", "term": "ClustalW format" } ] }, { "data": { "uri": "http://edamontology.org/data_1383", "term": "Nucleic acid sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" }, { "uri": "http://edamontology.org/format_1961", "term": "Stockholm format" }, { "uri": "http://edamontology.org/format_1982", "term": "ClustalW format" } ] }, { "data": { "uri": "http://edamontology.org/data_0889", "term": "Structural profile" }, "format": [] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0880", "term": "RNA secondary structure" }, "format": [ { "uri": "http://edamontology.org/format_2546", "term": "FASTA-like" } ] }, { "data": { "uri": "http://edamontology.org/data_1772", "term": "Score" }, "format": [] } ], "note": "Input can be a single or several RNA sequences or an alignment of RNA sequences along with structural restraints and/or chemical probing data on base reactivities", "cmd": "SQUARNA i=inputfile [OPTIONS]" } ], "toolType": [ "Command-line tool", "Script", "Library" ], "topic": [ { "uri": "http://edamontology.org/topic_3307", "term": "Computational biology" }, { "uri": "http://edamontology.org/topic_0077", "term": "Nucleic acids" }, { "uri": "http://edamontology.org/topic_0081", "term": "Structure analysis" }, { "uri": "http://edamontology.org/topic_0097", "term": "Nucleic acid structure analysis" }, { "uri": "http://edamontology.org/topic_0082", "term": "Structure prediction" }, { "uri": "http://edamontology.org/topic_0099", "term": "RNA" }, { "uri": "http://edamontology.org/topic_0659", "term": "Functional, regulatory and non-coding RNA" }, { "uri": "http://edamontology.org/topic_3511", "term": "Nucleic acid sites, features and motifs" } ], "operatingSystem": [ "Mac", "Linux", "Windows" ], "language": [ "Python" ], "license": "Apache-2.0", "collectionID": [ "3D-BioInfo-Nucleic-Acid" ], "maturity": "Emerging", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/febos/SQUARNA", "type": [ "Repository" ], "note": "GitHub repository" }, { "url": "https://pypi.org/project/SQUARNA/", "type": [ "Software catalogue" ], "note": "PyPi repository page" } ], "download": [ { "url": "https://doi.org/10.5281/zenodo.8292325", "type": "Downloads page", "note": null, "version": "2.3" }, { "url": "https://pypi.org/project/SQUARNA/", "type": "Software package", "note": "pip install SQUARNA", "version": "2.3" } ], "documentation": [ { "url": "https://github.com/febos/SQUARNA/blob/main/README.md", "type": [ "User manual" ], "note": null }, { "url": "https://pypi.org/project/SQUARNA/", "type": [ "Installation instructions" ], "note": "pip install SQUARNA" } ], "publication": [ { "doi": "10.1101/2023.08.28.555103", "pmid": null, "pmcid": null, "type": [], "version": null, "note": "biorxiv preprint", "metadata": null } ], "credit": [ { "name": "Eugene F Baulin", "email": "efbaulin@gmail.com", "url": "https://scholar.google.com/citations?user=sjfDaUwAAAAJ&hl=en", "orcidid": "https://orcid.org/0000-0003-4694-9783", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer", "Primary contact", "Support" ], "note": "https://imol.institute/leaders/baulin-group/" } ], "owner": "febos", "additionDate": "2023-09-05T09:39:45.613658Z", "lastUpdate": "2025-09-26T10:35:19.637909Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "REPET", "description": "The REPET package integrates bioinformatics pipelines dedicated to detect, annotate and analyze transposable elements (TEs) in genomic sequences. The main pipelines are (i) TEdenovo, which search for interspersed repeats, build consensus sequences and classify them according to TE features, and (ii)\n TEannot, which mines a genome with a library of TE sequences, for instance the one produced by the TEdenovo pipeline, to provide TE annotations exported into GFF3 files.", "homepage": "https://urgi.versailles.inrae.fr/Tools/REPET", "biotoolsID": "repet", "biotoolsCURIE": "biotools:repet", "version": [ "v3.0" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0379", "term": "Repeat sequence detection" }, { "uri": "http://edamontology.org/operation_0237", "term": "Repeat sequence analysis" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_1270", "term": "Feature table" }, "format": [ { "uri": "http://edamontology.org/format_2206", "term": "Sequence feature table format (text)" } ] }, { "data": { "uri": "http://edamontology.org/data_3002", "term": "Annotation track" }, "format": [ { "uri": "http://edamontology.org/format_1939", "term": "GFF3-seq" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0157", "term": "Sequence composition, complexity and repeats" }, { "uri": "http://edamontology.org/topic_0654", "term": "DNA" }, { "uri": "http://edamontology.org/topic_0097", "term": "Nucleic acid structure analysis" } ], "operatingSystem": [ "Linux", "Mac" ], "language": [ "C++", "Python" ], "license": "CECILL-2.0", "collectionID": [ "REPET", "elixir-fr-sdp-2019", "URGI" ], "maturity": "Legacy", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [ "Tools" ], "elixirNode": [ "France" ], "elixirCommunity": [], "link": [ { "url": "https://urgi.versailles.inrae.fr/download/repet/", "type": [ "Repository" ], "note": null } ], "download": [ { "url": "https://urgi.versailles.inrae.fr/download/repet/REPET_linux-x64-3.0.tar.gz", "type": "Source code", "note": null, "version": "v3.0" } ], "documentation": [ { "url": "https://urgi.versailles.inrae.fr/Tools/REPET", "type": [ "General" ], "note": "see also https://urgi.versailles.inrae.fr/Tools/REPET/README" }, { "url": "https://urgi.versailles.inrae.fr/Tools/REPET/INSTALL", "type": [ "Installation instructions" ], "note": null }, { "url": "https://urgi.versailles.inrae.fr/Tools/REPET/TEdenovo-tuto", "type": [ "User manual" ], "note": "See also https://urgi.versailles.inra.fr/Tools/REPET/TEannot-tuto" }, { "url": "https://forgemia.inra.fr/urgi-anagen/wiki-repet/-/wikis/REPET-V3.0-tutorial", "type": [ "Training material" ], "note": null } ], "publication": [ { "doi": "10.1371/journal.pone.0091929", "pmid": "24786468", "pmcid": "PMC4008368", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "PASTEC: An automatic transposable element classification tool", "abstract": "", "date": "2014-05-02T00:00:00Z", "citationCount": 226, "authors": [], "journal": "PLoS ONE" } }, { "doi": "10.1371/journal.pone.0016526", "pmid": "21304975", "pmcid": "PMC3031573", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "Considering transposable element diversification in de novo annotation approaches", "abstract": "", "date": "2011-02-09T00:00:00Z", "citationCount": 355, "authors": [], "journal": "PLoS ONE" } }, { "doi": "10.1371/journal.pcbi.0010022", "pmid": "16110336", "pmcid": "PMC1185648", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "Combined evidence annotation of transposable elements in genome sequences", "abstract": "", "date": "2005-01-01T00:00:00Z", "citationCount": 279, "authors": [], "journal": "PLoS Computational Biology" } }, { "doi": "10.1007/s00239-003-0007-2", "pmid": "15008403", "pmcid": null, "type": [ "Method" ], "version": null, "note": null, "metadata": { "title": "Detection of New Transposable Element Families in Drosophila melanogaster and Anopheles gambiae Genomes", "abstract": "", "date": "2003-12-29T00:00:00Z", "citationCount": 65, "authors": [], "journal": "Journal of Molecular Evolution" } }, { "doi": "10.1109/JPROC.2016.2590833", "pmid": null, "pmcid": null, "type": [ "Method" ], "version": null, "note": null, "metadata": { "title": "De Novo Annotation of Transposable Elements: Tackling the Fat Genome Issue", "abstract": "", "date": "2017-03-01T00:00:00Z", "citationCount": 18, "authors": [], "journal": "Proceedings of the IEEE" } } ], "credit": [ { "name": "URGI", "email": "urgi-repet@versailles.inrae.fr", "url": "http://urgi.versailles.inrae.fr/", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Developer", "Contributor", "Maintainer", "Provider", "Support", "Documentor" ], "note": "This tool has a \"Numero de depot APP\": FR 001 480007 000 R P 2008 000 31 235" } ], "owner": "Institut Francais de Bioinform", "additionDate": "2016-03-24T16:22:28Z", "lastUpdate": "2025-09-09T08:10:41.737859Z", "editPermission": { "type": "group", "authors": [ "vjamilloux", "johann_confais", "raphael.flores", "cmichotey" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "fqcleaner", "description": "Mini workflow for preprocessing fastq files, it includes quality trimming, duplicate and artefacts filters for FASTQ read files.", "homepage": "https://gensoft.pasteur.fr/docs/fqCleanER/21.10/", "biotoolsID": "fqcleaner", "biotoolsCURIE": "biotools:fqcleaner", "version": [ "0.4.1.1" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3192", "term": "Sequence trimming" }, { "uri": "http://edamontology.org/operation_3695", "term": "Data filtering" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_0863", "term": "Sequence alignment" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_1932", "term": "FASTQ-sanger" } ] }, { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_1932", "term": "FASTQ-sanger" } ] }, { "data": { "uri": "http://edamontology.org/data_0006", "term": "Data" }, "format": [ { "uri": "http://edamontology.org/format_1932", "term": "FASTQ-sanger" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Web application" ], "topic": [ { "uri": "http://edamontology.org/topic_3168", "term": "Sequencing" }, { "uri": "http://edamontology.org/topic_3572", "term": "Data quality management" }, { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" } ], "operatingSystem": [], "language": [], "license": null, "collectionID": [ "galaxyPasteur", "Institut Pasteur", "fqtools" ], "maturity": "Mature", "cost": null, "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://galaxy.pasteur.fr/tool_runner?tool_id=toolshed.pasteur.fr/repos/odoppelt/fqcleaner/fqCleaner/0.4.1.1", "type": [ "Galaxy service" ], "note": null } ], "download": [], "documentation": [], "publication": [ { "doi": "10.1093/nar/gkw343", "pmid": null, "pmcid": null, "type": [ "Other" ], "version": null, "note": null, "metadata": { "title": "The Galaxy platform for accessible, reproducible and collaborative biomedical analyses: 2016 update", "abstract": "High-throughput data production technologies, particularly ‘next-generation’ DNA sequencing, have ushered in widespread and disruptive changes to biomedical research. Making sense of the large datasets produced by these technologies requires sophisticated statistical and computational methods, as well as substantial computational power. This has led to an acute crisis in life sciences, as researchers without informatics training attempt to perform computation-dependent analyses. Since 2005, the Galaxy project has worked to address this problem by providing a framework that makes advanced computational tools usable by non experts. Galaxy seeks to make data-intensive research more accessible, transparent and reproducible by providing a Web-based environment in which users can perform computational analyses and have all of the details automatically tracked for later inspection, publication, or reuse. In this report we highlight recently added features enabling biomedical analyses on a large scale.", "date": "2016-07-08T00:00:00Z", "citationCount": 1477, "authors": [ { "name": "Afgan E." }, { "name": "Baker D." }, { "name": "van den Beek M." }, { "name": "Blankenberg D." }, { "name": "Bouvier D." }, { "name": "Cech M." }, { "name": "Chilton J." }, { "name": "Clements D." }, { "name": "Coraor N." }, { "name": "Eberhard C." }, { "name": "Gruning B." }, { "name": "Guerler A." }, { "name": "Hillman-Jackson J." }, { "name": "Kuster G.V." }, { "name": "Rasche E." }, { "name": "Soranzo N." }, { "name": "Turaga N." }, { "name": "Taylor J." }, { "name": "Nekrutenko A." }, { "name": "Goecks J." } ], "journal": "Nucleic Acids Research" } }, { "doi": "10.7490/f1000research.1114334.1", "pmid": null, "pmcid": null, "type": [ "Other" ], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Galaxy Support Team", "email": "galaxy@pasteur.fr", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "hmenager", "additionDate": "2016-12-19T14:27:26Z", "lastUpdate": "2025-08-27T10:47:14.412802Z", "editPermission": { "type": "private", "authors": [] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "ETENLNC", "description": "ETENLNC (End-To-End-Novel-NonCoding) is a lncRNA identification and analysis framework", "homepage": "https://github.com/EvolOMICS-TU/ETENLNC", "biotoolsID": "etenlnc", "biotoolsCURIE": "biotools:etenlnc", "version": [ "1.0" ], "otherID": [], "relation": [ { "biotoolsID": "hisat2", "type": "uses" }, { "biotoolsID": "salmon", "type": "uses" }, { "biotoolsID": "fastqc", "type": "uses" }, { "biotoolsID": "fastp", "type": "uses" }, { "biotoolsID": "stringtie", "type": "uses" }, { "biotoolsID": "gffcompare", "type": "uses" }, { "biotoolsID": "cpc2", "type": "uses" }, { "biotoolsID": "ncbi_blast_plus", "type": "uses" }, { "biotoolsID": "tximport", "type": "uses" }, { "biotoolsID": "deseq2", "type": "uses" }, { "biotoolsID": "lnctar", "type": "uses" }, { "biotoolsID": "capsule-lpi", "type": "uses" }, { "biotoolsID": "seekr", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_3219", "term": "Read pre-processing" }, { "uri": "http://edamontology.org/operation_3218", "term": "Sequencing quality control" }, { "uri": "http://edamontology.org/operation_3258", "term": "Transcriptome assembly" }, { "uri": "http://edamontology.org/operation_0415", "term": "Nucleic acid feature detection" }, { "uri": "http://edamontology.org/operation_3800", "term": "RNA-Seq quantification" }, { "uri": "http://edamontology.org/operation_3223", "term": "Differential gene expression profiling" }, { "uri": "http://edamontology.org/operation_0531", "term": "Heat map generation" }, { "uri": "http://edamontology.org/operation_0278", "term": "RNA secondary structure prediction" }, { "uri": "http://edamontology.org/operation_3472", "term": "k-mer counting" }, { "uri": "http://edamontology.org/operation_0389", "term": "Protein-nucleic acid interaction analysis" }, { "uri": "http://edamontology.org/operation_3901", "term": "RNA-binding protein prediction" }, { "uri": "http://edamontology.org/operation_2437", "term": "Gene regulatory network prediction" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2603", "term": "Expression data" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_1288", "term": "Genome map" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_3002", "term": "Annotation track" }, "format": [ { "uri": "http://edamontology.org/format_2306", "term": "GTF" }, { "uri": "http://edamontology.org/format_2305", "term": "GFF" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2887", "term": "Nucleic acid sequence record" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_3112", "term": "Gene expression matrix" }, "format": [ { "uri": "http://edamontology.org/format_3752", "term": "CSV" } ] }, { "data": { "uri": "http://edamontology.org/data_1636", "term": "Heat map" }, "format": [ { "uri": "http://edamontology.org/format_3508", "term": "PDF" } ] }, { "data": { "uri": "http://edamontology.org/data_0906", "term": "Protein interaction data" }, "format": [] } ], "note": "Run ETENLNC on paired-end raw RNA-Seq (.fastq) data", "cmd": "bash ETENLNC_docker.sh" } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0659", "term": "Functional, regulatory and non-coding RNA" } ], "operatingSystem": [ "Linux", "Mac", "Windows" ], "language": [], "license": "GPL-3.0", "collectionID": [], "maturity": "Emerging", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/EvolOMICS-TU/ETENLNC", "type": [ "Repository" ], "note": "GitHub Repo" } ], "download": [ { "url": "https://zenodo.org/records/14325721?token=eyJhbGciOiJIUzUxMiJ9.eyJpZCI6ImVmYTllNWJkLWE4ODUtNGM3OC05YTAxLWM4ZDk5YTljZDZjMCIsImRhdGEiOnt9LCJyYW5kb20iOiI4M2I1YjBlZDQ4MmUyZTIxNDg2YmI0YTFkMWE5MTI1OCJ9.HeB3WrsPduNzMyXjH4x5HfCgmIp4NzYv0P_11XU9lcXC_ZxEaVndP-kD0LDkxwufHVNlroeAhdK33PR51F6jnw", "type": "Biological data", "note": "Sample/demo data for ETENLNC. A detailed guide on running ETENLNC using the demo data can be found in the ETENLNC manual (supplementary to our publication).", "version": "1.0" } ], "documentation": [ { "url": "https://github.com/EvolOMICS-TU/ETENLNC", "type": [ "Command-line options" ], "note": "A detailed guide on running ETENLNC using the demo data can be found in the ETENLNC manual (supplementary to our publication)" } ], "publication": [ { "doi": "10.1016/j.compbiolchem.2024.108140", "pmid": "38996755", "pmcid": null, "type": [ "Primary" ], "version": ".0", "note": null, "metadata": { "title": "ETENLNC: An end to end lncRNA identification and analysis framework to facilitate construction of known and novel lncRNA regulatory networks", "abstract": "Long non-coding RNAs (lncRNAs) play crucial roles in the regulation of gene expression and maintenance of genomic integrity through various interactions with DNA, RNA, and proteins. The availability of large-scale sequence data from various high-throughput platforms has opened possibilities to identify, predict, and functionally annotate lncRNAs. As a result, there is a growing demand for an integrative computational framework capable of identifying known lncRNAs, predicting novel lncRNAs, and inferring the downstream regulatory interactions of lncRNAs at the genome-scale. We present ETENLNC (End-To-End-Novel-Long-NonCoding), a user-friendly, integrative, open-source, scalable, and modular computational framework for identifying and analyzing lncRNAs from raw RNA-Seq data. ETENLNC employs six stringent filtration steps to identify novel lncRNAs, performs differential expression analysis of mRNA and lncRNA transcripts, and predicts regulatory interactions between lncRNAs, mRNAs, miRNAs, and proteins. We benchmarked ETENLNC against six existing tools and optimized it for desktop workstations and high-performance computing environments using data from three different species. ETENLNC is freely available on GitHub: https://github.com/EvolOMICS-TU/ETENLNC.", "date": "2024-10-01T00:00:00Z", "citationCount": 2, "authors": [ { "name": "Nath P." }, { "name": "Bhuyan K." }, { "name": "Bhattacharyya D.K." }, { "name": "Barah P." } ], "journal": "Computational Biology and Chemistry" } } ], "credit": [ { "name": "Pankaj Barah", "email": "barah@tezu.ernet.in", "url": "https://www.tezu.ernet.in/dmbbt/profile/34", "orcidid": "https://orcid.org/0000-0001-7039-7996", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact", "Maintainer" ], "note": "Assistant Professor at Department of Molecular Biology and Biotechnology, Tezpur University." }, { "name": "Prangan Nath", "email": "prangannathofficial@gmai.com", "url": null, "orcidid": "https://orcid.org/0000-0002-9451-7822", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer", "Maintainer" ], "note": null } ], "owner": "prangannath", "additionDate": "2025-07-23T10:27:57.572501Z", "lastUpdate": "2025-07-23T10:27:57.574879Z", "editPermission": { "type": "private", "authors": [] }, "validated": 0, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "MirGeneDB", "description": "MirGeneDB is a database of manually curated microRNA genes that have been validated and annotated as initially described in Fromm et al. 2015 , Fromm et al. 2020 and Fromm et al 2022. MirGeneDB 3.0 (Clarke and Hoye et al. 2024 ) includes more than 21,000 microRNA gene entries representing more than 1,700 microRNA families from 114 metazoan species. All microRNAs can be browsed, searched and downloaded.", "homepage": "http://mirgenedb.org/", "biotoolsID": "mirgen", "biotoolsCURIE": "biotools:mirgen", "version": [ "3.0" ], "otherID": [ { "value": "doi:10.25504/FAIRsharing.QXSgvF", "type": "doi", "version": "2.0" } ], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_2422", "term": "Data retrieval" }, { "uri": "http://edamontology.org/operation_0564", "term": "Sequence visualisation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_1097", "term": "Sequence accession (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_1869", "term": "Organism identifier" }, "format": [] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3134", "term": "Gene transcript report" }, "format": [ { "uri": "http://edamontology.org/format_2331", "term": "HTML" } ] }, { "data": { "uri": "http://edamontology.org/data_0880", "term": "RNA secondary structure" }, "format": [ { "uri": "http://edamontology.org/format_2331", "term": "HTML" } ] } ], "note": "Data retrieval: curated miRNA. Organism identifier: a specific miRNA identifier or a species for all miRNAs for that species. Gene transcript report: with metadata and visualization. RNA secondary structure: the hairpin loop of the miRNA with bases.", "cmd": null }, { "operation": [ { "uri": "http://edamontology.org/operation_0224", "term": "Query and retrieval" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_1097", "term": "Sequence accession (nucleic acid)" }, "format": [] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_3495", "term": "RNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_2012", "term": "Sequence coordinates" }, "format": [ { "uri": "http://edamontology.org/format_2305", "term": "GFF" }, { "uri": "http://edamontology.org/format_3003", "term": "BED" } ] }, { "data": { "uri": "http://edamontology.org/data_3917", "term": "Count matrix" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Database portal" ], "topic": [ { "uri": "http://edamontology.org/topic_0659", "term": "Functional, regulatory and non-coding RNA" }, { "uri": "http://edamontology.org/topic_0204", "term": "Gene regulation" }, { "uri": "http://edamontology.org/topic_3299", "term": "Evolutionary biology" }, { "uri": "http://edamontology.org/topic_3500", "term": "Zoology" }, { "uri": "http://edamontology.org/topic_2815", "term": "Human biology" } ], "operatingSystem": [ "Linux", "Windows", "Mac" ], "language": [], "license": "CC0-1.0", "collectionID": [ "UiO tools", "ELIXIR-NO", "ELIXIR-Norway" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [ "Norway" ], "elixirCommunity": [], "link": [ { "url": "https://elixir.no/helpdesk", "type": [ "Helpdesk" ], "note": null } ], "download": [ { "url": "https://www.mirgenedb.org/download", "type": "Biological data", "note": "Sequence downloads for 75 species", "version": "3.0" } ], "documentation": [ { "url": "https://www.mirgenedb.org/information", "type": [ "General" ], "note": null } ], "publication": [ { "doi": "10.1093/nar/gkab1101", "pmid": "34850127", "pmcid": "PMC8728216", "type": [ "Primary" ], "version": "2.1", "note": null, "metadata": { "title": "MirGeneDB 2.1: Toward a complete sampling of all major animal phyla", "abstract": "We describe an update of MirGeneDB, the manually curated microRNA gene database. Adhering to uniform and consistent criteria for microRNA annotation and nomenclature, we substantially expanded MirGeneDB with 30 additional species representing previously missing metazoan phyla such as sponges, jellyfish, rotifers and flatworms. MirGeneDB 2.1 now consists of 75 species spanning over ∼800 million years of animal evolution, and contains a total number of 16 670 microRNAs from 1549 families. Over 6000 microRNAs were added in this update using ∼550 datasets with ∼7.5 billion sequencing reads. By adding new phylogenetically important species, especially those relevant for the study of whole genome duplication events, and through updating evolutionary nodes of origin for many families and genes, we were able to substantially refine our nomenclature system. All changes are traceable in the specifically developed MirGeneDB version tracker. The performance of read-pages is improved and microRNA expression matrices for all tissues and species are now also downloadable. Altogether, this update represents a significant step toward a complete sampling of all major metazoan phyla, and a widely needed foundation for comparative microRNA genomics and transcriptomics studies. MirGeneDB 2.1 is part of RNAcentral and Elixir Norway, publicly and freely available at http://www.mirgenedb.org/.", "date": "2022-01-07T00:00:00Z", "citationCount": 95, "authors": [ { "name": "Fromm B." }, { "name": "Hoye E." }, { "name": "Domanska D." }, { "name": "Zhong X." }, { "name": "Aparicio-Puerta E." }, { "name": "Ovchinnikov V." }, { "name": "Umu S.U." }, { "name": "Chabot P.J." }, { "name": "Kang W." }, { "name": "Aslanzadeh M." }, { "name": "Tarbier M." }, { "name": "Marmol-Sanchez E." }, { "name": "Urgese G." }, { "name": "Johansen M." }, { "name": "Hovig E." }, { "name": "Hackenberg M." }, { "name": "Friedlander M.R." }, { "name": "Peterson K.J." } ], "journal": "Nucleic Acids Research" } }, { "doi": "10.1093/nar/gkz885", "pmid": "31598695", "pmcid": "PMC6943042", "type": [ "Primary" ], "version": "2.0", "note": null, "metadata": { "title": "MirGeneDB 2.0: The metazoan microRNA complement", "abstract": "Small non-coding RNAs have gained substantial attention due to their roles in animal development and human disorders. Among them, microRNAs are special because individual gene sequences are conserved across the animal kingdom. In addition, unique and mechanistically well understood features can clearly distinguish bona fide miRNAs from the myriad other small RNAs generated by cells. However, making this distinction is not a common practice and, thus, not surprisingly, the heterogeneous quality of available miRNA complements has become a major concern in microRNA research. We addressed this by extensively expanding our curated microRNA gene database-MirGeneDB-to 45 organisms, encompassing a wide phylogenetic swath of animal evolution. By consistently annotating and naming 10,899 microRNA genes in these organisms, we show that previous microRNA annotations contained not only many false positives, but surprisingly lacked >2000 bona fide microRNAs. Indeed, curated microRNA complements of closely related organisms are very similar and can be used to reconstruct ancestral miRNA repertoires. MirGeneDB represents a robust platform for microRNA-based research, providing deeper and more significant insights into the biology and evolution of miRNAs as well as biomedical and biomarker research. MirGeneDB is publicly and freely available at http://mirgenedb.org/.", "date": "2020-01-01T00:00:00Z", "citationCount": 178, "authors": [ { "name": "Fromm B." }, { "name": "Domanska D." }, { "name": "Hoye E." }, { "name": "Ovchinnikov V." }, { "name": "Kang W." }, { "name": "Aparicio-Puerta E." }, { "name": "Johansen M." }, { "name": "Flatmark K." }, { "name": "Mathelier A." }, { "name": "Hovig E." }, { "name": "Hackenberg M." }, { "name": "Friedlander M.R." }, { "name": "Peterson K.J." } ], "journal": "Nucleic Acids Research" } }, { "doi": "10.1146/annurev-genet-120213-092023", "pmid": "26473382", "pmcid": "PMC4743252", "type": [ "Primary" ], "version": "1.0", "note": null, "metadata": { "title": "A Uniform System for the Annotation of Vertebrate microRNA Genes and the Evolution of the Human microRNAome", "abstract": "Although microRNAs (miRNAs) are among the most intensively studied molecules of the past 20 years, determining what is and what is not a miRNA has not been straightforward. Here, we present a uniform system for the annotation and nomenclature of miRNA genes. We show that less than a third of the 1,881 human miRBase entries, and only approximately 16% of the 7,095 metazoan miRBase entries, are robustly supported as miRNA genes. Furthermore, we show that the human repertoire of miRNAs has been shaped by periods of intense miRNA innovation and that mature gene products show a very different tempo and mode of sequence evolution than star products. We establish a new open access database-MirGeneDB (http://mirgenedb.org)-to catalog this set of miRNAs, which complements the efforts of miRBase but differs from it by annotating the mature versus star products and by imposing an evolutionary hierarchy upon this curated and consistently named repertoire.", "date": "2015-11-23T00:00:00Z", "citationCount": 435, "authors": [ { "name": "Fromm B." }, { "name": "Billipp T." }, { "name": "Peck L.E." }, { "name": "Johansen M." }, { "name": "Tarver J.E." }, { "name": "King B.L." }, { "name": "Newcomb J.M." }, { "name": "Sempere L.F." }, { "name": "Flatmark K." }, { "name": "Hovig E." }, { "name": "Peterson K.J." } ], "journal": "Annual Review of Genetics" } }, { "doi": "10.1093/nar/gkae1094", "pmid": "39673268", "pmcid": "PMC11701709", "type": [ "Primary" ], "version": "3.0", "note": null, "metadata": { "title": "MirGeneDB 3.0: Improved taxonomic sampling, uniform nomenclature of novel conserved microRNA families and updated covariance models", "abstract": "We present a major update of MirGeneDB (3.0), the manually curated animal microRNA gene database. Beyond moving to a new server and the creation of a computational mirror, we have expanded the database with the addition of 33 invertebrate species, including representatives of 5 previously unsampled phyla, and 6 mammal species. MirGeneDB now contains entries for 21 822 microRNA genes (5160 of these from the new species) belonging to 1743 microRNA families. The inclusion of these new species allowed us to refine both the evolutionary node of appearance of a number of microRNA genes/families, as well as MirGeneDB's phylogenetically informed nomenclature system. Updated covariance models of all microRNA families, along with all smallRNA read data are now downloadable. These enhanced annotations will allow researchers to analyze microRNA properties such as secondary structure and features of their biogenesis within a robust phylogenetic context and without the database plagued with numerous false positives and false negatives. In light of these improvements, MirGeneDB 3.0 will assume the responsibility for naming conserved novel metazoan microRNAs. MirGeneDB is part of RNAcentral and Elixir Norway and is publicly and freely available at mirgenedb.org.", "date": "2025-01-06T00:00:00Z", "citationCount": 6, "authors": [ { "name": "Clarke A.W." }, { "name": "Hoye E." }, { "name": "Hembrom A.A." }, { "name": "Paynter V.M." }, { "name": "Vinther J." }, { "name": "Wyrozemski L." }, { "name": "Biryukova I." }, { "name": "Formaggioni A." }, { "name": "Ovchinnikov V." }, { "name": "Herlyn H." }, { "name": "Pierce A." }, { "name": "Wu C." }, { "name": "Aslanzadeh M." }, { "name": "Cheneby J." }, { "name": "Martinez P." }, { "name": "Friedlander M.R." }, { "name": "Hovig E." }, { "name": "Hackenberg M." }, { "name": "Umu S.U." }, { "name": "Johansen M." }, { "name": "Peterson K.J." }, { "name": "Fromm B." } ], "journal": "Nucleic Acids Research" } } ], "credit": [ { "name": "Bastian Fromm", "email": "BastianFromm@gmail.com", "url": null, "orcidid": "https://orcid.org/0000-0003-0352-3037", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact", "Developer", "Maintainer", "Support" ], "note": null }, { "name": "Kevin J. Peterson", "email": "kevin.j.peterson@dartmouth.edu", "url": null, "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer", "Maintainer" ], "note": null }, { "name": "The Norwegian Bioinformatics Platform (ELIXIR-Norway) Helpdesk", "email": "support@elixir.no", "url": "https://elixir.no/helpdesk", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Consortium", "typeRole": [ "Support" ], "note": null }, { "name": "University of Oslo", "email": null, "url": "https://www.uio.no/english/index.html", "orcidid": null, "gridid": "grid.5510.1", "rorid": "01xtthb56", "fundrefid": "10.13039/501100005366", "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null } ], "owner": "UiO", "additionDate": "2016-02-09T13:19:44Z", "lastUpdate": "2025-07-05T22:33:30.082420Z", "editPermission": { "type": "group", "authors": [ "eca008" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "RepeatModeler2", "description": "RepeatModeler is a de novo transposable element (TE) family identification and modeling package. At the heart of RepeatModeler are three de-novo repeat finding programs ( RECON, RepeatScout and LtrHarvest/Ltr_retriever ) which employ complementary computational methods for identifying repeat element boundaries and family relationships from sequence data.", "homepage": "https://github.com/Dfam-consortium/RepeatModeler", "biotoolsID": "RepeatModeler2", "biotoolsCURIE": "biotools:RepeatModeler2", "version": [ "2.0.7" ], "otherID": [], "relation": [ { "biotoolsID": "repeatmodeler", "type": "isNewVersionOf" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0525", "term": "Genome assembly" }, { "uri": "http://edamontology.org/operation_3644", "term": "de Novo sequencing" }, { "uri": "http://edamontology.org/operation_0362", "term": "Genome annotation" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_3494", "term": "DNA sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [], "note": null, "cmd": null } ], "toolType": [ "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_0621", "term": "Model organisms" }, { "uri": "http://edamontology.org/topic_0157", "term": "Sequence composition, complexity and repeats" }, { "uri": "http://edamontology.org/topic_3673", "term": "Whole genome sequencing" }, { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" }, { "uri": "http://edamontology.org/topic_0798", "term": "Mobile genetic elements" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "Perl" ], "license": "OSL-2.0", "collectionID": [], "maturity": "Mature", "cost": "Free of charge", "accessibility": null, "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/Dfam-consortium/RepeatModeler/blob/master/LICENSE", "type": [ "Repository" ], "note": null } ], "download": [], "documentation": [], "publication": [ { "doi": "10.1101/856591", "pmid": null, "pmcid": null, "type": [], "version": null, "note": null, "metadata": null } ], "credit": [], "owner": "Pub2Tools", "additionDate": "2020-01-14T08:51:14Z", "lastUpdate": "2025-07-01T04:28:03.302129Z", "editPermission": { "type": "public", "authors": [] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "purge_dups", "description": "Identifying and removing haplotypic duplication in primary genome assemblies | haplotypic duplication identification tool | scripts/pd_config.py: script to generate a configuration file used by run_purge_dups.py | purge haplotigs and overlaps in an assembly based on read depth | Given a primary assembly pri_asm and an alternative assembly hap_asm (optional, if you have one), follow the steps shown below to build your own purge_dups pipeline, steps with same number can be run simultaneously. Among all the steps, although step 4 is optional, we highly recommend our users to do so, because assemblers may produce overrepresented seqeuences. In such a case, The final step 4 can be applied to remove those seqeuences", "homepage": "https://github.com/dfguan/purge_dups", "biotoolsID": "purge_dups", "biotoolsCURIE": "biotools:purge_dups", "version": [ "v.1.2.6" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0525", "term": "Genome assembly" }, { "uri": "http://edamontology.org/operation_3798", "term": "Read binning" }, { "uri": "http://edamontology.org/operation_3216", "term": "Scaffolding" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1930", "term": "FASTQ" } ] }, { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_1234", "term": "Sequence set (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "note": null, "cmd": null } ], "toolType": [], "topic": [ { "uri": "http://edamontology.org/topic_0196", "term": "Sequence assembly" } ], "operatingSystem": [ "Mac", "Linux" ], "language": [ "Python", "C" ], "license": "MIT", "collectionID": [ "ONTeater" ], "maturity": null, "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [], "elixirCommunity": [], "link": [ { "url": "https://github.com/dfguan/purge_dups", "type": [ "Repository" ], "note": null }, { "url": "https://github.com/dfguan/purge_dups/issues", "type": [ "Issue tracker" ], "note": null } ], "download": [], "documentation": [], "publication": [ { "doi": "10.1101/729962", "pmid": null, "pmcid": null, "type": [], "version": null, "note": null, "metadata": null } ], "credit": [ { "name": "Dengfeng Guan", "email": null, "url": "https://www.chatlink.com.cn", "orcidid": "https://orcid.org/0000-0002-6376-3940", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer" ], "note": null } ], "owner": "Pub2Tools", "additionDate": "2019-11-14T18:08:10Z", "lastUpdate": "2025-06-30T15:34:51.626796Z", "editPermission": { "type": "public", "authors": [] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" }, { "name": "SILVAngs", "description": "SILVAngs is a data analysis service for ribosomal RNA gene (rDNA) amplicon reads from high-throughput sequencing (next-generation sequencing (NGS)) approaches based on an automatic software pipeline. It uses the SILVA rDNA databases, taxonomies, and alignments as a reference. It facilitates the classification of rDNA reads and provides a wealth of results (tables, graphs and sequence files) for download.", "homepage": "https://ngs.arb-silva.de", "biotoolsID": "silvangs", "biotoolsCURIE": "biotools:silvangs", "version": [ "1.9.10" ], "otherID": [], "relation": [ { "biotoolsID": "silva", "type": "uses" } ], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0337", "term": "Visualisation" }, { "uri": "http://edamontology.org/operation_2238", "term": "Statistical calculation" }, { "uri": "http://edamontology.org/operation_2478", "term": "Nucleic acid sequence analysis" }, { "uri": "http://edamontology.org/operation_3460", "term": "Taxonomic classification" }, { "uri": "http://edamontology.org/operation_2428", "term": "Validation" }, { "uri": "http://edamontology.org/operation_0291", "term": "Sequence clustering" }, { "uri": "http://edamontology.org/operation_0292", "term": "Sequence alignment" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_2082", "term": "Matrix" }, "format": [ { "uri": "http://edamontology.org/format_3475", "term": "TSV" } ] }, { "data": { "uri": "http://edamontology.org/data_2884", "term": "Plot" }, "format": [] }, { "data": { "uri": "http://edamontology.org/data_2048", "term": "Report" }, "format": [ { "uri": "http://edamontology.org/format_3508", "term": "PDF" } ] }, { "data": { "uri": "http://edamontology.org/data_1246", "term": "Sequence cluster (nucleic acid)" }, "format": [ { "uri": "http://edamontology.org/format_1984", "term": "FASTA-aln" } ] }, { "data": { "uri": "http://edamontology.org/data_2977", "term": "Nucleic acid sequence" }, "format": [ { "uri": "http://edamontology.org/format_3830", "term": "ARB" }, { "uri": "http://edamontology.org/format_1984", "term": "FASTA-aln" } ] } ], "note": "The pipeline accepts input data in Multi-Fasta format with each input file representing one sample. Samples that belong to one project (a transect, timeseries etc.) should be uploaded as a single SILVAngs project.", "cmd": null } ], "toolType": [ "Web application" ], "topic": [ { "uri": "http://edamontology.org/topic_3174", "term": "Metagenomics" }, { "uri": "http://edamontology.org/topic_3050", "term": "Biodiversity" }, { "uri": "http://edamontology.org/topic_0637", "term": "Taxonomy" }, { "uri": "http://edamontology.org/topic_0659", "term": "Functional, regulatory and non-coding RNA" }, { "uri": "http://edamontology.org/topic_0080", "term": "Sequence analysis" }, { "uri": "http://edamontology.org/topic_3697", "term": "Microbial ecology" } ], "operatingSystem": [], "language": [], "license": null, "collectionID": [ "de.NBI", "de.NBI-biodata", "DSMZ Digital Diversity" ], "maturity": "Mature", "cost": "Free of charge (with restrictions)", "accessibility": null, "elixirPlatform": [ "Data" ], "elixirNode": [ "Germany" ], "elixirCommunity": [], "link": [], "download": [], "documentation": [ { "url": "https://www.arb-silva.de/fileadmin/silva_databases/sngs/SILVAngs_User_Guide.pdf", "type": [ "User manual" ], "note": null }, { "url": "https://www.arb-silva.de/documentation/silvangs/userfaq/", "type": [ "FAQ" ], "note": null }, { "url": "https://www.arb-silva.de/footer/sngs-termsofuse", "type": [ "Terms of use" ], "note": null } ], "publication": [ { "doi": "10.1093/nar/gks1219", "pmid": "23193283", "pmcid": "PMC3531112", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "The SILVA ribosomal RNA gene database project: Improved data processing and web-based tools", "abstract": "SILVA (from Latin silva, forest, http://www.arb-silva.de) is a comprehensive web resource for up to date, quality-controlled databases of aligned ribosomal RNA (rRNA) gene sequences from the Bacteria, Archaea and Eukaryota domains and supplementary online services. The referred database release 111 (July 2012) contains 3194 778 small subunit and 288717 large subunit rRNA gene sequences. Since the initial description of the project, substantial new features have been introduced, including advanced quality control procedures, an improved rRNA gene aligner, online tools for probe and primer evaluation and optimized browsing, searching and downloading on the website. Furthermore, the extensively curated SILVA taxonomy and the new non-redundant SILVA datasets provide an ideal reference for high-throughput classification of data from next-generation sequencing approaches. © The Author(s) 2012.", "date": "2013-01-01T00:00:00Z", "citationCount": 22633, "authors": [ { "name": "Quast C." }, { "name": "Pruesse E." }, { "name": "Yilmaz P." }, { "name": "Gerken J." }, { "name": "Schweer T." }, { "name": "Yarza P." }, { "name": "Peplies J." }, { "name": "Glockner F.O." } ], "journal": "Nucleic Acids Research" } }, { "doi": "10.1093/nar/gkt1209", "pmid": "24293649", "pmcid": "PMC3965112", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "The SILVA and \"all-species Living Tree Project (LTP)\" taxonomic frameworks", "abstract": "SILVA (from Latin silva, forest, http://www.arb-silva.de) is a comprehensive resource for up-to-date quality-controlled databases of aligned ribosomal RNA (rRNA) gene sequences from the Bacteria, Archaea and Eukaryota domains and supplementary online services. SILVA provides a manually curated taxonomy for all three domains of life, based on representative phylogenetic trees for the small- and large-subunit rRNA genes. This article describes the improvements the SILVA taxonomy has undergone in the last 3 years. Specifically we are focusing on the curation process, the various resources used for curation and the comparison of the SILVA taxonomy with Greengenes and RDP-II taxonomies. Our comparisons not only revealed a reasonable overlap between the taxa names, but also points to significant differences in both names and numbers of taxa between the three resources. © 2013 The Author(s). Published by Oxford University Press.", "date": "2014-01-01T00:00:00Z", "citationCount": 2590, "authors": [ { "name": "Yilmaz P." }, { "name": "Parfrey L.W." }, { "name": "Yarza P." }, { "name": "Gerken J." }, { "name": "Pruesse E." }, { "name": "Quast C." }, { "name": "Schweer T." }, { "name": "Peplies J." }, { "name": "Ludwig W." }, { "name": "Glockner F.O." } ], "journal": "Nucleic Acids Research" } }, { "doi": "10.1093/bioinformatics/bts252", "pmid": "22556368", "pmcid": "PMC3389763", "type": [ "Primary" ], "version": null, "note": null, "metadata": { "title": "SINA: Accurate high-throughput multiple sequence alignment of ribosomal RNA genes", "abstract": "Motivation: In the analysis of homologous sequences, computation of multiple sequence alignments (MSAs) has become a bottleneck. This is especially troublesome for marker genes like the ribosomal RNA (rRNA) where already millions of sequences are publicly available and individual studies can easily produce hundreds of thousands of new sequences. Methods have been developed to cope with such numbers, but further improvements are needed to meet accuracy requirements.Results: In this study, we present the SILVA Incremental Aligner (SINA) used to align the rRNA gene databases provided by the SILVA ribosomal RNA project. SINA uses a combination of k-mer searching and partial order alignment (POA) to maintain very high alignment accuracy while satisfying high throughput performance demands. SINA was evaluated in comparison with the commonly used high throughput MSA programs PyNAST and mothur. The three BRAliBase III benchmark MSAs could be reproduced with 99.3, 97.6 and 96.1 accuracy. A larger benchmark MSA comprising 38 772 sequences could be reproduced with 98.9 and 99.3% accuracy using reference MSAs comprising 1000 and 5000 sequences. SINA was able to achieve higher accuracy than PyNAST and mothur in all performed benchmarks. © The Author(s) 2012. Published by Oxford University Press.", "date": "2012-07-01T00:00:00Z", "citationCount": 2408, "authors": [ { "name": "Pruesse E." }, { "name": "Peplies J." }, { "name": "Glockner F.O." } ], "journal": "Bioinformatics" } } ], "credit": [ { "name": "SILVA Team", "email": "ngs-contact@arb-silva.de", "url": "https://www.arb-silva.de/contact/team/", "orcidid": null, "gridid": "grid.507782.f", "rorid": "027z9pz32", "fundrefid": null, "typeEntity": "Division", "typeRole": [ "Primary contact" ], "note": null }, { "name": "Leibniz Institute DSMZ-German Collection of Microorganisms and Cell Cultures", "email": "hub@dsmz.de", "url": "https://www.dsmz.de", "orcidid": null, "gridid": "grid.420081.f", "rorid": "02tyer376", "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null } ], "owner": "silva", "additionDate": "2016-09-30T07:30:11Z", "lastUpdate": "2025-06-30T13:26:39.251875Z", "editPermission": { "type": "group", "authors": [] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": null }, { "name": "DeepSig", "description": "Prediction of secretory signal peptides in protein sequences", "homepage": "https://busca.biocomp.unibo.it/deepsig/", "biotoolsID": "deepsig", "biotoolsCURIE": "biotools:deepsig", "version": [ "1.2.5" ], "otherID": [], "relation": [], "function": [ { "operation": [ { "uri": "http://edamontology.org/operation_0418", "term": "Protein signal peptide detection" } ], "input": [ { "data": { "uri": "http://edamontology.org/data_2974", "term": "Protein sequence (raw)" }, "format": [ { "uri": "http://edamontology.org/format_1929", "term": "FASTA" } ] }, { "data": { "uri": "http://edamontology.org/data_3028", "term": "Taxonomy" }, "format": [ { "uri": "http://edamontology.org/format_2330", "term": "Textual format" } ] } ], "output": [ { "data": { "uri": "http://edamontology.org/data_0896", "term": "Protein report" }, "format": [ { "uri": "http://edamontology.org/format_2331", "term": "HTML" } ] } ], "note": null, "cmd": null } ], "toolType": [ "Web application", "Command-line tool" ], "topic": [ { "uri": "http://edamontology.org/topic_3307", "term": "Computational biology" }, { "uri": "http://edamontology.org/topic_3510", "term": "Protein sites, features and motifs" }, { "uri": "http://edamontology.org/topic_0123", "term": "Protein properties" } ], "operatingSystem": [ "Linux", "Windows", "Mac" ], "language": [ "Python", "C++" ], "license": "GPL-3.0", "collectionID": [ "Bologna Biocomputing Group" ], "maturity": "Mature", "cost": "Free of charge", "accessibility": "Open access", "elixirPlatform": [], "elixirNode": [ "Italy" ], "elixirCommunity": [], "link": [], "download": [ { "url": "https://github.com/BolognaBiocomp/deepsig", "type": "Source code", "note": null, "version": "1.2.5" }, { "url": "https://hub.docker.com/r/bolognabiocomp/deepsig", "type": "Container file", "note": null, "version": "1.2.5" } ], "documentation": [ { "url": "https://github.com/BolognaBiocomp/deepsig", "type": [ "Command-line options" ], "note": null } ], "publication": [ { "doi": "10.1093/bioinformatics/btx818", "pmid": "29280997", "pmcid": "PMC5946842", "type": [ "Primary" ], "version": "1.0", "note": null, "metadata": { "title": "DeepSig: Deep learning improves signal peptide detection in proteins", "abstract": "Motivation The identification of signal peptides in protein sequences is an important step toward protein localization and function characterization. Results Here, we present DeepSig, an improved approach for signal peptide detection and cleavage-site prediction based on deep learning methods. Comparative benchmarks performed on an updated independent dataset of proteins show that DeepSig is the current best performing method, scoring better than other available state-of-the-art approaches on both signal peptide detection and precise cleavage-site identification. Availability and implementation DeepSig is available as both standalone program and web server at https://deepsig.biocomp.unibo.it. All datasets used in this study can be obtained from the same website.", "date": "2018-05-15T00:00:00Z", "citationCount": 96, "authors": [ { "name": "Savojardo C." }, { "name": "Martelli P.L." }, { "name": "Fariselli P." }, { "name": "Casadio R." } ], "journal": "Bioinformatics" } } ], "credit": [ { "name": "ELIXIR-ITA-BOLOGNA", "email": null, "url": "http://biocomp.unibo.it", "orcidid": null, "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Institute", "typeRole": [ "Provider" ], "note": null }, { "name": "Castrense Savojardo", "email": "castrense.savojardo2@unibo.it", "url": null, "orcidid": "https://orcid.org/0000-0002-7359-0633", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Developer", "Primary contact" ], "note": null }, { "name": "Pier Luigi Martelli", "email": "pierluigi.martelli@unibo.it", "url": "http://biocomp.unibo.it", "orcidid": "https://orcid.org/0000-0002-0274-5669", "gridid": null, "rorid": null, "fundrefid": null, "typeEntity": "Person", "typeRole": [ "Primary contact" ], "note": null } ], "owner": "ELIXIR-ITA-BOLOGNA", "additionDate": "2018-05-28T14:50:09Z", "lastUpdate": "2025-06-19T11:55:09.017105Z", "editPermission": { "type": "group", "authors": [ "savo", "ELIXIR-ITA-BOLOGNA" ] }, "validated": 1, "homepage_status": 0, "elixir_badge": 0, "confidence_flag": "tool" } ] }