diff --git a/citations.tsv b/citations.tsv index 7722ec1..8fa5dd6 100644 --- a/citations.tsv +++ b/citations.tsv @@ -12,8 +12,8 @@ https://www.wiwam.be https://www.wiwam.be url:https://www.wiwam.be r84WbX0P doi:10.1038/sdata.2016.18 doi:10.1038/sdata.2016.18 doi:10.1038/sdata.2016.18 6DjakjNS doi:10.1093/bioinformatics/btr330 doi:10.1093/bioinformatics/btr330 doi:10.1093/bioinformatics/btr330 PzHxvkzH https://github.com/ga4gh-metadata/SchemaBlocks https://github.com/ga4gh-metadata/SchemaBlocks url:https://github.com/ga4gh-metadata/SchemaBlocks 186zclKvK -doi:10.1093/bioinformatics/btq580 doi:10.1093/bioinformatics/btq580 doi:10.1093/bioinformatics/btq580 Wz8l0HlN doi:10.1093/gigascience/giad025 doi:10.1093/gigascience/giad025 doi:10.1093/gigascience/giad025 9fRbvOj2 +doi:10.1093/bioinformatics/btq580 doi:10.1093/bioinformatics/btq580 doi:10.1093/bioinformatics/btq580 Wz8l0HlN doi:10.1093/gigascience/giz051 doi:10.1093/gigascience/giz051 doi:10.1093/gigascience/giz051 AVjkjraw doi:10.1002/ppp3.10187 doi:10.1002/ppp3.10187 doi:10.1002/ppp3.10187 bvSFyrtt doi:10.1093/bioinformatics/btac410 doi:10.1093/bioinformatics/btac410 doi:10.1093/bioinformatics/btac410 VFIpO8nU @@ -24,22 +24,22 @@ doi:10.12688/f1000research.109080.2 doi:10.12688/f1000research.109080.2 doi:10.1 doi:10.5281/zenodo.12625360 doi:10.5281/zenodo.12625360 doi:10.5281/zenodo.12625360 QRzg4OSs doi:10.22004/AG.ECON.266624 doi:10.22004/AG.ECON.266624 doi:10.22004/ag.econ.266624 6VGwG9za doi:10.1093/nar/gkac852 doi:10.1093/nar/gkac852 doi:10.1093/nar/gkac852 pk5OwSG6 -doi:10.1093/database/bax046 doi:10.1093/database/bax046 doi:10.1093/database/bax046 84Yn3FWj -doi:10.1186/s43170-020-00015-6 doi:10.1186/s43170-020-00015-6 doi:10.1186/s43170-020-00015-6 JWi7AKhJ -doi:10.1093/database/baab054 doi:10.1093/database/baab054 doi:10.1093/database/baab054 ArPSsaJQ -doi:10.1093/aobpla/plq008 doi:10.1093/aobpla/plq008 doi:10.1093/aobpla/plq008 VndIxnl3 +doi:10.34133/2019/1671403 doi:10.34133/2019/1671403 doi:10.34133/2019/1671403 m7yuFGsd +doi:10.1007/978-1-4939-6658-5_5 doi:10.1007/978-1-4939-6658-5_5 doi:10.1007/978-1-4939-6658-5_5 15XwZ2Vb0 doi:10.1186/1471-2105-15-259 doi:10.1186/1471-2105-15-259 doi:10.1186/1471-2105-15-259 X22hwO1v doi:10.1111/j.1365-2052.2011.02183.x doi:10.1111/j.1365-2052.2011.02183.x doi:10.1111/j.1365-2052.2011.02183.x 1CKLIIaug doi:10.3389/fpls.2024.1268847 doi:10.3389/fpls.2024.1268847 doi:10.3389/fpls.2024.1268847 1HmEHgW8h doi:10.1007/s10592-024-01611-z doi:10.1007/s10592-024-01611-z doi:10.1007/s10592-024-01611-z x8DIc6zn -doi:10.34133/2019/1671403 doi:10.34133/2019/1671403 doi:10.34133/2019/1671403 m7yuFGsd -doi:10.1007/978-1-4939-6658-5_5 doi:10.1007/978-1-4939-6658-5_5 doi:10.1007/978-1-4939-6658-5_5 15XwZ2Vb0 +doi:10.1093/database/bax046 doi:10.1093/database/bax046 doi:10.1093/database/bax046 84Yn3FWj +doi:10.1186/s43170-020-00015-6 doi:10.1186/s43170-020-00015-6 doi:10.1186/s43170-020-00015-6 JWi7AKhJ +doi:10.1093/database/baab054 doi:10.1093/database/baab054 doi:10.1093/database/baab054 ArPSsaJQ +doi:10.1093/aobpla/plq008 doi:10.1093/aobpla/plq008 doi:10.1093/aobpla/plq008 VndIxnl3 +doi:10.1093/nar/gky1000 doi:10.1093/nar/gky1000 doi:10.1093/nar/gky1000 eaDrNpsp +doi:10.3390/plants10122805 doi:10.3390/plants10122805 doi:10.3390/plants10122805 dcg0274X doi:10.1093/g3journal/jkac078 doi:10.1093/g3journal/jkac078 doi:10.1093/g3journal/jkac078 al3Hd9Ml doi:10.1371/journal.pone.0240059 doi:10.1371/journal.pone.0240059 doi:10.1371/journal.pone.0240059 1FDf25dDD doi:10.1093/genetics/157.4.1819 doi:10.1093/genetics/157.4.1819 doi:10.1093/genetics/157.4.1819 zuq8ri4R doi:10.5281/zenodo.10791627 doi:10.5281/zenodo.10791627 doi:10.5281/zenodo.10791627 a9uPTJgO -doi:10.1093/nar/gky1000 doi:10.1093/nar/gky1000 doi:10.1093/nar/gky1000 eaDrNpsp -doi:10.3390/plants10122805 doi:10.3390/plants10122805 doi:10.3390/plants10122805 dcg0274X doi:10.1002/csc2.20248 doi:10.1002/csc2.20248 doi:10.1002/csc2.20248 sW9euzzP doi:10.2135/cropsci2016.09.0814 doi:10.2135/cropsci2016.09.0814 doi:10.2135/cropsci2016.09.0814 rPgDlCbt doi:10.3389/fpls.2023.1290078 doi:10.3389/fpls.2023.1290078 doi:10.3389/fpls.2023.1290078 7WXz7FUP diff --git a/manuscript.html b/manuscript.html index 8fd87fc..75fef1f 100644 --- a/manuscript.html +++ b/manuscript.html @@ -126,8 +126,8 @@ - - + + @@ -357,9 +357,9 @@ - - - + + + @@ -376,9 +376,9 @@

BrAPI Success Stories

This manuscript -(permalink) +(permalink) was automatically generated -from plantbreeding/BrAPI-Manuscript2@511faa4 +from plantbreeding/BrAPI-Manuscript2@d00841f on July 15, 2024.

Authors

@@ -1147,21 +1147,26 @@

Trait Selector BrAPP

Genotyping

Genotyping has become a cornerstone of most breeding processes, but managing the data can be challenging. Understanding different genotyping protocols for various crops is crucial due to the unique genetic structures of each species. Techniques such as SNP genotyping, Genotyping-by-Sequencing (GBS), SSRs, Whole Genome Sequencing (WGS), and array-based genotyping each offer specific advantages depending on the crop and research objectives. BrAPI supports genotypic data by utilizing existing standards such as VCF12 and the GA4GH Variants schema13. The BrAPI community has developed compatible tools for storing, searching, visualizing, and analyzing genotypic data, making it easier to integrate and utilize this information in breeding programs. Mastery of the various genotyping protocols ensures efficient and effective breeding, while BrAPI compliant tools streamline data management and analysis, enhancing the ability to make data-driven decisions in developing superior crop varieties.

-

Flapjack

-

Flapjack14 is a multi-platform desktop application for data visualization and breeding analysis (eg, pedigree verification, marker-assisted backcrossing and forward breeding) using high-throughput genotype data. Data can be easily imported into Flapjack from any BrAPI compatible data source with genotype data available. Flapjack Bytes is a smaller, lightweight and fully web-based counterpart to Flapjack, which can be easily embedded into a database website to provide similar visualizations online. Traditionally supporting its own text-based data formats, Flapjack’s use of BrAPI has streamlined the end-user experience for data import and work is underway to determine the best methods to exchange analysis results using future versions of the API.

+

DArT Sample Submission

+ +

The DArT genotyping lab is heavily used world wide when it comes to plant genotyping. With over 1200 available organisms and species, client base on every continent and already many million samples processed, DArT provides services for several generic and bespoke genotyping technologies and solutions. Processes of sample tracking and fast data delivery are at the core of the ordering system developed at DArT. The ordering system is tightly integrated with DArTdb - DArT’s custom LIMS operational system, which drives laboratory, quality, and analytical processes.

+

Diversity Arrays Technology was a part of BrAPI community since its inception. DArT developers have worked with the BrAPI community contributing to various aspects of the API specification. One key aspect was establishing a standard API for sending sample metadata to the lab for genotyping. This solution eliminates much of the human error involved with sending samples to an external lab and also allows for an automated process of sample batch transfers. Beyond sample submission, the current implementation also allows for an order status verification, automated data discovery, and data downloads. Data are delivered as standard data packages with self-describing metadata.

+

The current BrAPI implementation at DArT is in production and it is compatible with the newest BrAPI specification. Further details about DArT’s ordering system can be found at DArT Ordering System and also at DArT Help.

DArTView

DArTView is a desktop application for marker data curation via metadata filtering. DArTView enables genotype variant data visualization and users can easily identify trends or correlations within their data using the tool. Its primary goal is to overcome tedious manual calculation of marker data through common spreadsheet applications like Excel. Users are able to import marker data from csv files, but DArTView has been recently enhanced to be BrAPI compatible. Users can now use any BrAPI compatible server as an input data source. BrAPI provides a consistent data standard across databases and data resources. DArTView’s compatibility with BrAPI also ensures easy integration with other tools and pipelines that would use DArTView for marker filtering and exploration.

Initially developed by Diversity Arrays Technology (DArT), the tool is gaining popularity within the breeding community, especially in Africa. Future releases will focus on enhancing the BrAPI compatibility, making it accessible to more breeders and researchers in the region. A web enabled version of DArTView is in development. This new version will allow for further collaboration opportunities with other interested partners who would like to integrate it as part of their pipelines.

DivBrowse

-

DivBrowse15 is a web platform for exploratory data analysis of huge genotyping studies. The software can be run standalone or integrated as a plugin into existing data web portals. It provides a powerful interactive visualization of variant call matrices with hundreds of millions of variants and thousands of samples. It enables easy data import and export by using well established, standardized, bioinformatics file formats.

+

DivBrowse14 is a web platform for exploratory data analysis of huge genotyping studies. The software can be run standalone or integrated as a plugin into existing data web portals. It provides a powerful interactive visualization of variant call matrices with hundreds of millions of variants and thousands of samples. It enables easy data import and export by using well established, standardized, bioinformatics file formats.

At its core, DivBrowse combines the convenience of a genome browser with features tailored to the diversity analysis of germplasm. It is able to display genomic features such as nucleotide sequence, associated gene models, and short genomic variants. DivBrowse provides visual access to large VCF files obtained through genotyping experiments. In addition, DivBrowse also calculates and displays variant statistics such as minor allele frequencies, proportion of heterozygous calls, and proportion missing variant calls. Dynamic Principal Component Analyses (PCA) can be performed on a user specified genomic area to provide information on local genomic diversity.

Parts of the BrAPI Genotyping module are implemented in DivBrowse. There is a server-side component which provides genotypic data that the DivBrowse database can consume. There is also a client-side GUI component which can visualize genotypic data via any external BrAPI endpoint. In addition to BrAPI, DivBrowse has an internal API to control the tool from a hosting web portal. DivBrowse also has an interface to BLAST, which can be used to directly access genes or other genomic features. The modular structure of DivBrowse allows developers to configure and easily embed links to other external information systems.

+

Flapjack

+

Flapjack15 is a multi-platform desktop application for data visualization and breeding analysis (eg, pedigree verification, marker-assisted backcrossing and forward breeding) using high-throughput genotype data. Data can be easily imported into Flapjack from any BrAPI compatible data source with genotype data available. Flapjack Bytes is a smaller, lightweight and fully web-based counterpart to Flapjack, which can be easily embedded into a database website to provide similar visualizations online. Traditionally supporting its own text-based data formats, Flapjack’s use of BrAPI has streamlined the end-user experience for data import and work is underway to determine the best methods to exchange analysis results using future versions of the API.

Gigwa

Gigwa is a Java EE web application providing a means to centralize, share, finely filter, and visualize high-throughput genotyping data16. Built on top of MongoDB, it is scalable and can support working smoothly with datasets containing billions of genotypes. It is installable as a Docker image or as an all-in-one bundle archive. It is straightforward to deploy on servers or local computers and has thus been adopted by numerous research institutes from around the world. Notably, Gigwa serves as a collaborative management tool and a portal for exposing public data for genebanks and breeding programs at some CGIAR centers17. The total amount of data hosted and made widely accessible using this system has continued to grow over the last few years.

-

The Gigwa development team has been involved in the BrAPI community since 2016 and took part in designing the genotype-related section of the BrAPI standard. Gigwa’s first BrAPI-compliant features were designed for compatibility with the Flapjack visualization tool14. Over time, Gigwa has established itself as the first and most reliable implementation of the BrAPI-Genotyping endpoints. Local collaborators and external partners used it as a reference solution to design a number of tools taking advantage of the BrAPI-Genotyping features (e.g., BeegMac, SnpClust, QBMS).

+

The Gigwa development team has been involved in the BrAPI community since 2016 and took part in designing the genotype-related section of the BrAPI standard. Gigwa’s first BrAPI-compliant features were designed for compatibility with the Flapjack visualization tool15. Over time, Gigwa has established itself as the first and most reliable implementation of the BrAPI-Genotyping endpoints. Local collaborators and external partners used it as a reference solution to design a number of tools taking advantage of the BrAPI-Genotyping features (e.g., BeegMac, SnpClust, QBMS).

Additional use-cases required Gigwa to also consume data from other BrAPI servers. This led to the implementation of BrAPI client features within Gigwa. A close collaboration was established with the Integrated Breeding Platform team developing the widely used Breeding Management System (BMS). This collaboration means both applications are now frequently deployed together; Gigwa pulling germplasm or sample metadata from BMS, and BMS displaying Gigwa-hosted genotypes within its own UI.

@@ -1169,11 +1174,6 @@

PHG

The Practical Haplotype Graph (PHG) is a graph-based computational framework that represents large-scale genetic variation and is optimized for plant breeding and genetics18. Using a pangenome approach, each PHG stores haplotypes (the sequence of part of an individual chromosome) to represent the collected genes of a species. This allows for a simplified approach for dealing with large scale variation in plant genomes. The PHG pipeline provides support for a range of genomic analyses and allows for the use of graph data to impute complete genomes from low density sequence or variant data.

Users access the crop databases either with direct calls to the PHG embedded server or indirectly using the rPHG library from an R environment. The PHG server accepts BrAPI queries to return information on sample lists and the variants used to define the graph’s haplotypes. In addition, PHG users utilize the BrAPI Variant Sets endpoint query to return links to VCF files containing haplotype data. Work on the PHG is ongoing and it is expected to support additional BrAPI endpoints that allow for fine tuned slicing genotypic data in the near future.

-

DArT Sample Submission

- -

The DArT genotyping lab is heavily used world wide when it comes to plant genotyping. With over 1200 available organisms and species, client base on every continent and already many million samples processed, DArT provides services for several generic and bespoke genotyping technologies and solutions. Processes of sample tracking and fast data delivery are at the core of the ordering system developed at DArT. The ordering system is tightly integrated with DArTdb - DArT’s custom LIMS operational system, which drives laboratory, quality, and analytical processes.

-

Diversity Arrays Technology was a part of BrAPI community since its inception. DArT developers have worked with the BrAPI community contributing to various aspects of the API specification. One key aspect was establishing a standard API for sending sample metadata to the lab for genotyping. This solution eliminates much of the human error involved with sending samples to an external lab and also allows for an automated process of sample batch transfers. Beyond sample submission, the current implementation also allows for an order status verification, automated data discovery, and data downloads. Data are delivered as standard data packages with self-describing metadata.

-

The current BrAPI implementation at DArT is in production and it is compatible with the newest BrAPI specification. Further details about DArT’s ordering system can be found at DArT Ordering System and also at DArT Help.

Germplasm Management

Germplasm data management is crucial due to the vast quantity of new accessions, variants, and lines created yearly. Germplasm is the basis of variation on which plant breeders rely to upgrade and optimize their breeding programs. This is essential at any scale including individual breeding programs, national initiatives, and international collaborations. BrAPI supports the transmission of germplasm passport data, pedigree trees, and crossing metadata. The BrAPI community has developed compliant tools for storing, searching, and visualizing this metadata, facilitating efficient management. Additionally, there are plans to establish federated networks of genebank data connected via BrAPI, enhancing global accessibility and collaboration in germplasm management.

@@ -1182,36 +1182,33 @@

Germplasm Management

AGENT

In the global system for ex situ conservation of plant genetic resources (PGR)19, material is being conserved in about 1750 collections20 totalling ~5.8 million accessions. Unique and permanent identifiers in the form of DOIs are available for more than 1.7 million accessions via the Global Information System21 of the International Treaty on Plant Genetic Resources for Food and Agriculture. Each DOI is linked to some basic descriptive data that facilitates the use of these resources, mainly passport data. Many DOIs are also linked to additional data from different domains or will be in the future. However, a data space beyond the most basic information is needed that includes genotypic and phenotypic data. This space will help to answer questions about the global biological diversity of plant species, the detection of duplicates, the tracking of provenance for the identification of genetic integrity, the selection of the most suitable material for different purposes, and to support further applications in the field of data mining or AI. In this context, the aim of the AGENT project, funded by the European Commission, is to develop a concept for the digital exploitation and activation of this PGR via European ex situ genebanks according to the FAIR principles11 and to test it in practice using two important crops, barley and wheat. Thirteen European genebanks and five bioinformatics centers are working together and have agreed on standards and protocols for data flow and data formats22 for the collection, integration, and archiving of genotypic and phenotypic data.

-

The BrAPI specification is one of the agreed standards, that are detailed in the AGENT guidelines for dataflow23. The implemented BrAPI interface enables the analysis of current and historic genotypic and phenotypic information. This will drive the discovery of genes, traits, and knowledge for future missions, complement existing information for wheat and barley, and use the new data standards and infrastructure to promote better access and use of PGR for other crops in European genebanks. The AGENT database backend aggregates curated passport data, phenotypic data, and genotypic data on wheat and barley accessions of 18 project partners. This data is accessible via BrAPI endpoints and explorable in a web portal. Genotyping data uses the DivBrowse15 storage engine and its BrAPI interface. Soon, the BrAPI implementation will be expanded to enable the integration of analysis pipelines in the AGENT portal, such as the FIGS+ pipeline developed by ICARDA24. There is also a plan to integrate the data collected by the AGENT project into the European Search Catalogue for Plant Genetic Resources (EURISCO)25. +

The BrAPI specification is one of the agreed standards, that are detailed in the AGENT guidelines for dataflow23. The implemented BrAPI interface enables the analysis of current and historic genotypic and phenotypic information. This will drive the discovery of genes, traits, and knowledge for future missions, complement existing information for wheat and barley, and use the new data standards and infrastructure to promote better access and use of PGR for other crops in European genebanks. The AGENT database backend aggregates curated passport data, phenotypic data, and genotypic data on wheat and barley accessions of 18 project partners. This data is accessible via BrAPI endpoints and explorable in a web portal. Genotyping data uses the DivBrowse14 storage engine and its BrAPI interface. Soon, the BrAPI implementation will be expanded to enable the integration of analysis pipelines in the AGENT portal, such as the FIGS+ pipeline developed by ICARDA24. There is also a plan to integrate the data collected by the AGENT project into the European Search Catalogue for Plant Genetic Resources (EURISCO)25.

-

MGIS

- -

The Musa Germplasm Information System (MGIS) serves as a comprehensive community portal dedicated to banana diversity, a crop critical to global food security26. MGIS offers detailed information on banana germplasm, focusing on the collections held by the CGIAR International Banana Genebank (ITC)27. It is built on the Drupal/Tripal technology, like BIMS28 and Florilège.

-

Since its inception, MGIS developers have actively participated in the BrAPI community. The MGIS team pushed for the integration of the Multi-Crop Passport Data (MCPD) standard into the Germplasm module of the API. MCPD support was added in BrAPI v1.3, and MGIS now provides passport data information on ITC banana genebank accessions (with GLIS DOI), synchronized with Genesys. MGIS also enriches the passport data by incorporating additional information from other germplasm collections worldwide. All the germplasm data is available through the BrAPI Germplasm module implementation. For genotyping data, MGIS integrates with Gigwa16, which provides a tailored implementation of the BrAPI genotyping module. Furthermore, MGIS supports a set of BrAPI phenotyping endpoints, facilitating the exposure of morphological descriptors and trait information supported by ontologies like the Crop Ontology29. MGIS has integrated the Trait Selector BrAPP, and there are use cases implemented to interlink genebank and breeding data between MGIS and the breeding database MusaBase.

-

Helium

- -

Helium30 is a plant pedigree visualization platform designed to account for the specific problems that are unique to plant pedigrees. A pedigree is a representation of how genetically discrete individuals are related to one another and is therefore a representation of the genetic relationship between individual plant lines, their parents and progeny. Plant pedigrees are often used to check for potential genotyping or phenotyping errors, since these errors, by the very nature of Mendelian inheritance, are constrained by the pedigree structure in which they exist31. The accurate representation of pedigrees, and the ability to pull pedigree data from different data sources is important in plant breeding and genetics. Therefore, ways to visualize and interact this complex data in meaningful ways is critical.

-

From its original desktop interface, Helium has developed into a web-based visualization platform implementing BrAPI calls to allow users to import data from other BrAPI compliant databases. The ability to pull data from BrAPI compliant data sources has significantly expanded Helium’s capability and utility within the community. Helium is used in projects ranging in size from tens to tens of thousands of lines and across a wide variety of crops and species. While originally designed for plant data32 it has also found utility in other non-plant projects33 highlighting its broad utility. BrAPI also allows Helium to provide direct dataset links to collaborators, allowing the original data to be held with the data provider and utilizing Helium for its visualization functionality. Our current Helium deployment includes example BrAPI calls to a barley dataset at the James Hutton Institute to allow users to test the system and features it offers.

+

Florilège

+ +

Florilège is a web portal designed primarily for the general public to access public plant genetic resources held by Biological Resource Centers across France. Through this portal, users can browse accessions from over 50 plant genera, spread across 19 genebanks. It allows users to view available seeds and plant material, including options for ordering material. Florilège provides a centralized access to the various French collections of plant genetic resources available to the public.

+

Florilège retrieves accession information from several BrAPI compliant systems. Key among these are OLGA, a genebank accessions management system, and GnpIS, an INRAE data repository for plant genetic resources, phenomics, and genetics26,27. Using BrAPI to gather data from these systems reduced development efforts and enabled standardized data retrieval. As a result, BrAPI has become the de facto standard within the French plant genetic resources community for exchanging information. During development, the Florilège team also proposed several enhancements to the BrAPI specifications themselves, such as additional support for Collection objects or improved reference linking, to better accommodate their specific use case.

+

GLIS

The Global Information System (GLIS) on Plant Genetic Resources for Food and Agriculture (PGRFA) of the International Treaty on Plant Genetic Resources for Food and Agriculture (ITPGRFA) is a web-based global entry point for PGRFA data21. It allows users and third-party systems to access information and knowledge on scientific, technical, and environmental matters to strengthen PGRFA conservation, management, and utilization activities. The system and its portal also enable recipients of PGRFA to make available all non-confidential information on germplasm according to the provisions of the Treaty and facilitates access to the results of their research and development.

Thanks to the adoption of Digital Object Identifiers (DOIs) for Multi-Crop Passport Descriptors (MCPD) of PGRFA accessions, the GLIS Portal provides access to 1.7 million PGRFA in collections conserved worldwide. Of these, over 1.5 million are accessible for research, training and plant breeding in the food and agriculture domain.

The Scientific Advisory Committee of the ITPGRFA have repeatedly welcomed efforts on interoperability among germplasm information systems. In this context, the GLIS Portal adopted the BrAPI v1 in 2022. Integrating BrAPI among the GLIS content negotiators facilitates queries and the exchange of content for data management in plant breeding. The Portal also offers other protocols (XML, DarwinCore, JSON and JSON-LD) to increase data and metadata connectivity. In the near future, depending on the availability of resources, upgrading to BrAPI v2 is planned.

-

Florilège

- -

Florilège is a web portal designed primarily for the general public to access public plant genetic resources held by Biological Resource Centers across France. Through this portal, users can browse accessions from over 50 plant genera, spread across 19 genebanks. It allows users to view available seeds and plant material, including options for ordering material. Florilège provides a centralized access to the various French collections of plant genetic resources available to the public.

-

Florilège retrieves accession information from several BrAPI compliant systems. Key among these are OLGA, a genebank accessions management system, and GnpIS, an INRAE data repository for plant genetic resources, phenomics, and genetics34,35. Using BrAPI to gather data from these systems reduced development efforts and enabled standardized data retrieval. As a result, BrAPI has become the de facto standard within the French plant genetic resources community for exchanging information. During development, the Florilège team also proposed several enhancements to the BrAPI specifications themselves, such as additional support for Collection objects or improved reference linking, to better accommodate their specific use case.

- +

Helium

+ +

Helium28 is a plant pedigree visualization platform designed to account for the specific problems that are unique to plant pedigrees. A pedigree is a representation of how genetically discrete individuals are related to one another and is therefore a representation of the genetic relationship between individual plant lines, their parents and progeny. Plant pedigrees are often used to check for potential genotyping or phenotyping errors, since these errors, by the very nature of Mendelian inheritance, are constrained by the pedigree structure in which they exist29. The accurate representation of pedigrees, and the ability to pull pedigree data from different data sources is important in plant breeding and genetics. Therefore, ways to visualize and interact this complex data in meaningful ways is critical.

+

From its original desktop interface, Helium has developed into a web-based visualization platform implementing BrAPI calls to allow users to import data from other BrAPI compliant databases. The ability to pull data from BrAPI compliant data sources has significantly expanded Helium’s capability and utility within the community. Helium is used in projects ranging in size from tens to tens of thousands of lines and across a wide variety of crops and species. While originally designed for plant data30 it has also found utility in other non-plant projects31 highlighting its broad utility. BrAPI also allows Helium to provide direct dataset links to collaborators, allowing the original data to be held with the data provider and utilizing Helium for its visualization functionality. Our current Helium deployment includes example BrAPI calls to a barley dataset at the James Hutton Institute to allow users to test the system and features it offers.

+

MGIS

+ +

The Musa Germplasm Information System (MGIS) serves as a comprehensive community portal dedicated to banana diversity, a crop critical to global food security32. MGIS offers detailed information on banana germplasm, focusing on the collections held by the CGIAR International Banana Genebank (ITC)33. It is built on the Drupal/Tripal technology, like BIMS34 and Florilège.

+

Since its inception, MGIS developers have actively participated in the BrAPI community. The MGIS team pushed for the integration of the Multi-Crop Passport Data (MCPD) standard into the Germplasm module of the API. MCPD support was added in BrAPI v1.3, and MGIS now provides passport data information on ITC banana genebank accessions (with GLIS DOI), synchronized with Genesys. MGIS also enriches the passport data by incorporating additional information from other germplasm collections worldwide. All the germplasm data is available through the BrAPI Germplasm module implementation. For genotyping data, MGIS integrates with Gigwa16, which provides a tailored implementation of the BrAPI genotyping module. Furthermore, MGIS supports a set of BrAPI phenotyping endpoints, facilitating the exposure of morphological descriptors and trait information supported by ontologies like the Crop Ontology35. MGIS has integrated the Trait Selector BrAPP, and there are use cases implemented to interlink genebank and breeding data between MGIS and the breeding database MusaBase.

Breeding and Genetics Data Management

While specialty data management is important for some use cases, often breeders want a central repository or access point of critical data. General breeding and genetics data management systems and web portals support some level of phenotypic, genotypic, and germplasm data, as well as trial, equipment, and people management. By enabling BrAPI support, these larger systems can connect with smaller tools and specialty systems to provide more functionality under the same user interface. There are several breeding data management systems developed in the BrAPI community, each with their own strengths.

-

DeltaBreed

- -

DeltaBreed is an open-source breeding data management system designed and developed by Breeding Insight to support USDA-ARS specialty crop and animal breeders. DeltaBreed differs from other related systems in that is customizable to small breeding teams and generalized enough to support the workflows of diverse niche species. DeltaBreed is a unified system that connects a variety of BrAPI applications (see list below). BrAPI integration allows the complexity underlying interoperability to be hidden, shielding users from multifactorial differences between various applications. DeltaBreed, adhering to the BrAPI model, establishes data standards and validations for users and provides a singular framework for data management and user training.

-

DeltaBreed users need not be aware of BrAPI or the specifics of underlying applications but will notice that BrAPI interoperability reduces the need for human-mediated file transfers and data manipulation. Field Book users, for example, can connect to their DeltaBreed program, authenticate, and pull studies and traits directly from DeltaBreed to Field Book on their data collection device. The subsequent step of pushing observations from Field Book to DeltaBreed is straightforward via BrAPI, but is pending implementation until observation transaction handling is improved, intentional and inadvertent repeated measures are differentiated, and a data staging area is implemented for quality control.

-

Breeding Insight integrated several BrAPI applications to support 2021 phenotypic data collection by USDA-ARS blueberry breeders. DeltaBreed was used to create traits in Breedbase, and Field Book was used to pull studies and traits from Breedbase. The workflow also permitted users to push Field Book observations back to Breedbase via BrAPI. This effort served as a successful proof of concept for multi-application BrAPI integration, but highlighted limitations to the process of accepting BrAPI observations from Field Book. The Breeding Insight team is actively working with the rest of the BrAPI community to correct these limitations in future versions of the specification.

- -

DeltaBreed is integrated with many other BrAPI community projects and tools. There is a BrAPI enabled connection, either in development or production, with all of the following tools: BrAPI Java Test Server, BreedBase, Field Book, Gigwa, QBMS, Mr Bean, Helium and the Pedigree Viewer BrAPP.

+

BIMS

+ +

BIMS (Breeding Information Management System)34 is a free, secure, and online breeding management system which allows breeders to store, manage, archive, and analyze their private breeding program data. BIMS enables individual breeders to have complete control of their own breeding data along with access to tools such as data import/export, data analysis, and data archiving for their germplasm, phenotype, genotype, and image data. BIMS is currently implemented in five community databases, the Genome Database for Rosaceae36, CottonGEN37, the Citrus Genome Database, the Pulse Crop Database, and the Genome Database for Vaccinium. BIMS in these five community databases enables individual breeders to import publicly available data so that they can utilize public data in their breeding program. BIMS is also implemented in the public database breedwithbims.org that any crop breeder can use.

+

Right now, BIMS primarily utilizes BrAPI to connect with the Field Book Android App2, enabling seamless data transfer between BIMS and the app. Data transfer through BrAPI between BIMS and other resources such as BreedBase38, GIGWA16, and Breeder Genomics Hub is on the way. Hopefully, the BIMS development team can easily reuse some of the solved use cases and workflows created by others in the BrAPI community.

BMS

The Breeding Management System (BMS), developed by the Integrated Breeding Platform (IBP), is a suite of tools designed to enhance the efficiency and effectiveness of plant breeding. BMS covers all stages of the breeding process, with the emphasis on germplasm management and ontology-harmonized phenotyping. It also features analytics and decision-support tools. With its focus on interoperability, BMS integrates smoothly with BrAPI, facilitating easy connections with a broad array of complementary tools and databases. Notably, the BMS is often deployed together with Gigwa to fulfill the genotyping data management needs of BMS users.

@@ -1219,59 +1216,59 @@

BMS

Additionally, brapi-sync improves data management by maintaining links to the original source of each entity it transmits. This retains the original context of the data and establishes a traceability mechanism for accurate data source attribution and verification. Such practices are crucial for maintaining data integrity and fostering trust among collaborative partners, ensuring access to accurate, reliable, and current information.

Breedbase

-

Breedbase is a comprehensive breeding data management system36,37 that implements a digital ecosystem for all breeding data, including trial data, phenotypic data, and genotypic data. Data acquisition is supported through data collection apps such as Fieldbook2, Coordinate, and InterCross, as well as through drone imagery, Near Infra-Red Spectroscopy (NIRS), and other technologies. Search functions, such as the Search Wizard interface, provide powerful query capabilities. Various breeding-centric analysis tools are available, including mixed models, heritability, stability, PCA, and various clustering algorithms. The original impetus for creating Breedbase was the advent of new breeding paradigms based on genomic information such as genomic prediction algorithms38 and the accompanying data management challenges. Thus, complete genomic prediction workflow is integrated in the system.

-

The BrAPI interface is crucial for Breedbase. Breedbase uses BrAPI to connect with the data collection apps, other projects such as CLIMMOB4, and native BrAPPs built into the Breedbase webpage. Users also appreciate the ability to connect to Breedbase instances using packages such as QBMS39 for data import into R for custom analyses. The Breedbase team has been part of the BrAPI community since its inception, and has continuously adopted and contributed to the BrAPI standard.

-

BIMS

- -

BIMS (Breeding Information Management System)28 is a free, secure, and online breeding management system which allows breeders to store, manage, archive, and analyze their private breeding program data. BIMS enables individual breeders to have complete control of their own breeding data along with access to tools such as data import/export, data analysis, and data archiving for their germplasm, phenotype, genotype, and image data. BIMS is currently implemented in five community databases, the Genome Database for Rosaceae40, CottonGEN41, the Citrus Genome Database, the Pulse Crop Database, and the Genome Database for Vaccinium. BIMS in these five community databases enables individual breeders to import publicly available data so that they can utilize public data in their breeding program. BIMS is also implemented in the public database breedwithbims.org that any crop breeder can use.

-

Right now, BIMS primarily utilizes BrAPI to connect with the Field Book Android App2, enabling seamless data transfer between BIMS and the app. Data transfer through BrAPI between BIMS and other resources such as BreedBase36, GIGWA16, and Breeder Genomics Hub is on the way. Hopefully, the BIMS development team can easily reuse some of the solved use cases and workflows created by others in the BrAPI community.

-

Germinate

- -

Germinate42,43 is an open-source plant genetic resources database that combines and integrates various kinds of plant breeding data including genotypic data, phenotypic trials data, passport data, images, geographic information and climate data into a single repository. Germinate is tightly linked to the BrAPI specification and supports a majority of BrAPI endpoints for querying, filtering, and submission.

-

Germinate integrates and connects with other BrAPI-enabled tools such as GridScore for phenotypic data collection, Flapjack for genotypic data visualization, and Helium for pedigree visualization. Additionally, due to the nature of BrAPI, Germinate can act as a data repository for any BrAPI-compatible tool. Thanks to the interoperability provided by BrAPI, the need for manual data handling becomes a rarity with the direct benefit of faster data processing, fewer to no human errors, data security, and data integrity.

+

Breedbase is a comprehensive breeding data management system38,39 that implements a digital ecosystem for all breeding data, including trial data, phenotypic data, and genotypic data. Data acquisition is supported through data collection apps such as Fieldbook2, Coordinate, and InterCross, as well as through drone imagery, Near Infra-Red Spectroscopy (NIRS), and other technologies. Search functions, such as the Search Wizard interface, provide powerful query capabilities. Various breeding-centric analysis tools are available, including mixed models, heritability, stability, PCA, and various clustering algorithms. The original impetus for creating Breedbase was the advent of new breeding paradigms based on genomic information such as genomic prediction algorithms40 and the accompanying data management challenges. Thus, complete genomic prediction workflow is integrated in the system.

+

The BrAPI interface is crucial for Breedbase. Breedbase uses BrAPI to connect with the data collection apps, other projects such as CLIMMOB4, and native BrAPPs built into the Breedbase webpage. Users also appreciate the ability to connect to Breedbase instances using packages such as QBMS41 for data import into R for custom analyses. The Breedbase team has been part of the BrAPI community since its inception, and has continuously adopted and contributed to the BrAPI standard.

+

DeltaBreed

+ +

DeltaBreed is an open-source breeding data management system designed and developed by Breeding Insight to support USDA-ARS specialty crop and animal breeders. DeltaBreed differs from other related systems in that is customizable to small breeding teams and generalized enough to support the workflows of diverse niche species. DeltaBreed is a unified system that connects a variety of BrAPI applications (see list below). BrAPI integration allows the complexity underlying interoperability to be hidden, shielding users from multifactorial differences between various applications. DeltaBreed, adhering to the BrAPI model, establishes data standards and validations for users and provides a singular framework for data management and user training.

+

DeltaBreed users need not be aware of BrAPI or the specifics of underlying applications but will notice that BrAPI interoperability reduces the need for human-mediated file transfers and data manipulation. Field Book users, for example, can connect to their DeltaBreed program, authenticate, and pull studies and traits directly from DeltaBreed to Field Book on their data collection device. The subsequent step of pushing observations from Field Book to DeltaBreed is straightforward via BrAPI, but is pending implementation until observation transaction handling is improved, intentional and inadvertent repeated measures are differentiated, and a data staging area is implemented for quality control.

+

Breeding Insight integrated several BrAPI applications to support 2021 phenotypic data collection by USDA-ARS blueberry breeders. DeltaBreed was used to create traits in Breedbase, and Field Book was used to pull studies and traits from Breedbase. The workflow also permitted users to push Field Book observations back to Breedbase via BrAPI. This effort served as a successful proof of concept for multi-application BrAPI integration, but highlighted limitations to the process of accepting BrAPI observations from Field Book. The Breeding Insight team is actively working with the rest of the BrAPI community to correct these limitations in future versions of the specification.

+ +

DeltaBreed is integrated with many other BrAPI community projects and tools. There is a BrAPI enabled connection, either in development or production, with all of the following tools: BrAPI Java Test Server, BreedBase, Field Book, Gigwa, QBMS, Mr Bean, Helium and the Pedigree Viewer BrAPP.

FAIDARE

FAIDARE8 is a data discovery portal providing a biologist friendly search system over a global federation of 40 plant research databases at the time of writing. It allows users to identify data resources using a full text search approach combined with domain specific filters. Each search result contains a link back to the original database for visualization, analysis, and download. The indexed data types are very broad and include genomic features, selected bibliography, QTL, markers, genetic variation studies, phenomic studies, and plant genetic resources. This inclusiveness is achieved thanks to a two stage indexation data model. The first index, more generic, provides basic search functionalities and relies on five fields: name, link back URL, data type, species, and exhaustive description. To provide more advanced filtering, the second stage indexation mechanism takes advantage of BrAPI endpoints to get more detailed metadata on germplasm, genotyping studies and phenotyping studies.

The indexation mechanism relies on a public software package that allows data resource managers to request the indexation of their database. This BrAPI client is able to extract data from any BrAPI 1.3 and 1.2 endpoint. The development of BrAPI 2.x indexation will be initiated in 2025. Since not all databases are willing to implement BrAPI endpoints, it is possible to generate metadata as static BrAPI compliant JSON files, using the BrAPI standard as a file exchange format.

-

The FAIDARE architecture has been designed by elaborating on the BrAPI data model mixed with the GnpIS Software Architecture34. It uses an Elasticsearch NoSQL engine that searches and serves enriched versions of the BrAPI JSON data model. FAIDARE also includes a BrAPI endpoint using all indexed metadata. It has been adopted by several communities including the ELIXIR and EMPHASIS European infrastructures, and the WheatIS of the Wheat-Initiative. Several databases are added each year to the FAIDARE global federation, allowing to increase both the portal and the BrAPI adoption.

+

The FAIDARE architecture has been designed by elaborating on the BrAPI data model mixed with the GnpIS Software Architecture26. It uses an Elasticsearch NoSQL engine that searches and serves enriched versions of the BrAPI JSON data model. FAIDARE also includes a BrAPI endpoint using all indexed metadata. It has been adopted by several communities including the ELIXIR and EMPHASIS European infrastructures, and the WheatIS of the Wheat-Initiative. Several databases are added each year to the FAIDARE global federation, allowing to increase both the portal and the BrAPI adoption.

+

Germinate

+ +

Germinate42,43 is an open-source plant genetic resources database that combines and integrates various kinds of plant breeding data including genotypic data, phenotypic trials data, passport data, images, geographic information and climate data into a single repository. Germinate is tightly linked to the BrAPI specification and supports a majority of BrAPI endpoints for querying, filtering, and submission.

+

Germinate integrates and connects with other BrAPI-enabled tools such as GridScore for phenotypic data collection, Flapjack for genotypic data visualization, and Helium for pedigree visualization. Additionally, due to the nature of BrAPI, Germinate can act as a data repository for any BrAPI-compatible tool. Thanks to the interoperability provided by BrAPI, the need for manual data handling becomes a rarity with the direct benefit of faster data processing, fewer to no human errors, data security, and data integrity.

Analytics

-

While other tools listed above have the capability to do specialized analytics on certain types of data, general analytics tools can cover a wide range of data types and analytical models. The tools developed by the BrAPI community can pull in data from multiple BrAPI compatible data sources and provide enhanced analytical functionality. In many cases, there is no longer a need to import and export large data files to a local computational environment just to run standard analytical models. These tools are able to extract the data they need from a data source without much human intervention or human error.

+

Modern breeding programs can utilize data management systems to maintain both phenotypic and genotypic data. Numerous systems are available for adoption. To fully leverage the benefits of digitalization in this ecosystem, breeders need to utilize data from different sources to make efficient data-driven decisions. With increased computational power at their disposal, scientists can construct more advanced analysis pipelines by combining various data sources.

+

The tools developed by the BrAPI community can pull in data from multiple BrAPI compatible data sources and provide enhanced analytical functionality. In many cases, there is no longer a need to import and export large data files to a local computational environment just to run standard analytical models. These tools are able to extract the data they need from a data source without much human intervention or human error.

+

G-Crunch

+ +

G-Crunch is an upcoming user-facing analysis tool that attempts to fill the space of simple, user driven analytics requests, with a generic user interface and the ability to swap out data sources and analysis tools. G-Crunch hopes to streamline repeatable, debuggable, simple analytic requests and results.

+

G-Crunch, as a tool, couldn’t feasibly exist without BrAPI. The support of BrAPI interfaces allows G-Crunch to use one unified request method, and adapt to the user’s (BrAPI-compliant) existing network of tools. This lowers the barrier to entry for adoption, and makes analysis pipelines easily repeatable.

QBMS

-

Modern breeding programs can utilize data management systems to maintain both phenotypic and genotypic data. Numerous systems are available for adoption. To fully leverage the benefits of digitalization in this ecosystem, breeders need to utilize data from different sources to make efficient data-driven decisions. With increased computational power at their disposal, scientists can construct more advanced analysis pipelines by combining various data sources.

-

The QBMS39 R package eliminates technical barriers scientists experience when using the BrAPI specification in their analysis scripts and pipelines. This barrier arises from the complexity of managing API backend processes, such as authentication, tokens, TCP/IP protocol, JSON format, pagination, stateless calls, asynchronous communication, database IDs, and more. To bridge this gap, the QBMS package abstracts the technical complexities, providing breeders with stateful functions familiar to them when navigating their GUI systems. It enables them to query and extract data into a standard data frame structure, consistent with their use of the R language, one of the most common statistical tools in the breeding community.

+

The QBMS41 R package eliminates technical barriers scientists experience when using the BrAPI specification in their analysis scripts and pipelines. This barrier arises from the complexity of managing API backend processes, such as authentication, tokens, TCP/IP protocol, JSON format, pagination, stateless calls, asynchronous communication, database IDs, and more. To bridge this gap, the QBMS package abstracts the technical complexities, providing breeders with stateful functions familiar to them when navigating their GUI systems. It enables them to query and extract data into a standard data frame structure, consistent with their use of the R language, one of the most common statistical tools in the breeding community.

Since its release on the official CRAN repository in October 2021, the QBMS R package has garnered over 9400 downloads. Several tools, such as MrBean, rely on the QBMS package as their source data adapter. Moreover, the community has started building extended solutions on top of it. QBMS can serve as a cornerstone in the breeding modernization revolution by providing access to actionable data and by enabling the creation of dashboards to reduce the time between harvest and decision-making for the next breeding cycle.

Mr.Bean

Mr.Bean44 is a graphical user interface designed to assist breeders, statisticians, and individuals involved in plant breeding programs with the analysis of field trials. By utilizing innovative methodologies such as SpATS for modeling spatial trends, and autocorrelation models to address spatial variability, Mr.Bean proves highly practical and powerful in facilitating faster and more effective decision-making. Modeling Genotype-by-environment interaction poses its challenges, but Mr.Bean offers the capability to explore various variance-covariance matrices, including Factor Analytic, compound symmetry, and heterogeneous variances. This aids in the assessment of genotype performance across diverse environments.

Mr.Bean boasts flexibility in importing different file types, yet for users managing their data within data management systems (DMS), the process of downloading from their DMS and importing it into Mr.Bean can be cumbersome. To address this issue, QBMS was integrated into the back-end. This feature prompts users to input the URL of a BrAPI compatible server, enter their credentials (if necessary), and select the specific trial they wish to analyze. Subsequently, users can seamlessly access their dataset through BrAPI and utilize it across the entire Mr.Bean interface.

-

G-Crunch

- -

G-Crunch is an upcoming user-facing analysis tool that attempts to fill the space of simple, user driven analytics requests, with a generic user interface and the ability to swap out data sources and analysis tools. G-Crunch hopes to streamline repeatable, debuggable, simple analytic requests and results.

-

G-Crunch, as a tool, couldn’t feasibly exist without BrAPI. The support of BrAPI interfaces allows G-Crunch to use one unified request method, and adapt to the user’s (BrAPI-compliant) existing network of tools. This lowers the barrier to entry for adoption, and makes analysis pipelines easily repeatable.

-

ShinyBrAPPs

-

Data management systems are generic and robust centralized applications, with a large community of users, long term development cycles and release plans. BrAPI compliance offers these systems the opportunity to add functionalities in a modular way through the development of external plugin applications that can quickly fulfill specific needs of a group of users. R-Shiny is a R-package that opens the possibility to develop rich and productive interactive web applications to R users and developers. As such it allows user communities to quickly prototype and produce applications that are finely tailored to their needs, thus improving adoption and daily use of data management systems. The Breeding Management System (BMS) of the IBP and Gigwa are BrAPI compliant and are being widely used by breeding programs, including national breeding programs in Africa. CIRAD and the IBP teams have been working together as part of the IAVAO breeders community to develop the Shiny-BrAPPs, a set of R-Shiny applications using BrAPI as a core technology for data exchange. These applications are connected to BMS and/or Gigwa and provide tools for specific use cases. So far, four applications have been developed covering the fields of trial data quality control, single trial statistical analysis, breeding decision support, and raw genotyping data visual inspection.

-

The “BMS trial data explorer” retrieves data from a single multi-location trial and displays data counts and summary boxplot for all variables measured in different studies. It also provides an interactive distribution plot to easily select observations that require curation and a report of candidate issues that needs to be addressed by the breeder. The “STABrAPP” tool is an application for single trial mixed model analysis. It basically provides a GUI to the StatGen-STA R package. The “DSBrAPP” tool is a decision support tool helping breeders to select germplasm according to their various characteristics and save this germplasm list into BMS. These first three apps are grouped into a single repository (ShinyBrAPPs) with modular code shared across applications and make use of the brapir-v1 and brapir-v2 R packages. Finally, the “snpclust” tool enables a user to check and manually correct the clustering of fluorescence based SNP genotyping data.

SCT

-

The Sugarcane Crossing Tool (SCT) is a lightweight RShiny dashboard application designed to receive, process, and visualize data from a linked BreedBase36 instance. This application is being developed collaboratively with members of the Sugarcane Integrated Breeding System, who have advocated for an application that assists them in designing crosses based on queried information from a list of available accessions. By leveraging existing community resources, the team has been able to develop a simple, BrAPI-enabled, application without possessing extensive programming knowledge or experience. The SCT is presented as an inspiration for similarly positioned scientists to consider developing custom applications for specific tasks.

+

The Sugarcane Crossing Tool (SCT) is a lightweight RShiny dashboard application designed to receive, process, and visualize data from a linked BreedBase38 instance. This application is being developed collaboratively with members of the Sugarcane Integrated Breeding System, who have advocated for an application that assists them in designing crosses based on queried information from a list of available accessions. By leveraging existing community resources, the team has been able to develop a simple, BrAPI-enabled, application without possessing extensive programming knowledge or experience. The SCT is presented as an inspiration for similarly positioned scientists to consider developing custom applications for specific tasks.

The crossing tool utilizes a modified version of the BrAPI-R library to access a compliant database, and it employs standard R/JavaScript packages to aggregate and visualize data. Modules within the application allow breeders to query the database (through BrAPI) for information relevant to their decision-making process. This includes the number and sex of flowering accessions, deep pedigree and relatedness information, summarized trial data, and the prior frequency and success of potential cross combinations. Future versions of this tool will provide additional decision support (e.g. ranked potential crosses) to enhance the accuracy and efficiency of crossing.

+

ShinyBrAPPs

+

Data management systems are generic and robust centralized applications, with a large community of users, long term development cycles and release plans. BrAPI compliance offers these systems the opportunity to add functionalities in a modular way through the development of external plugin applications that can quickly fulfill specific needs of a group of users. R-Shiny is a R-package that opens the possibility to develop rich and productive interactive web applications to R users and developers. As such it allows user communities to quickly prototype and produce applications that are finely tailored to their needs, thus improving adoption and daily use of data management systems. The Breeding Management System (BMS) of the IBP and Gigwa are BrAPI compliant and are being widely used by breeding programs, including national breeding programs in Africa. CIRAD and the IBP teams have been working together as part of the IAVAO breeders community to develop the Shiny-BrAPPs, a set of R-Shiny applications using BrAPI as a core technology for data exchange. These applications are connected to BMS and/or Gigwa and provide tools for specific use cases. So far, four applications have been developed covering the fields of trial data quality control, single trial statistical analysis, breeding decision support, and raw genotyping data visual inspection.

+

The “BMS trial data explorer” retrieves data from a single multi-location trial and displays data counts and summary boxplot for all variables measured in different studies. It also provides an interactive distribution plot to easily select observations that require curation and a report of candidate issues that needs to be addressed by the breeder. The “STABrAPP” tool is an application for single trial mixed model analysis. It basically provides a GUI to the StatGen-STA R package. The “DSBrAPP” tool is a decision support tool helping breeders to select germplasm according to their various characteristics and save this germplasm list into BMS. These first three apps are grouped into a single repository (ShinyBrAPPs) with modular code shared across applications and make use of the brapir-v1 and brapir-v2 R packages. Finally, the “snpclust” tool enables a user to check and manually correct the clustering of fluorescence based SNP genotyping data.

General Infrastructure

Adopting BrAPI compatibility into an existing system can be difficult sometimes. The BrAPI Community has developed several tools to make adoption easier. This includes things like pre built code libraries, connectors to other technology standards, and mappers to alternate data types or data files. The goal is to lower the barrier to entry for the BrAPI community, making it easier for other groups to get started and connect their existing data to the standard.

-

MIRA

- -

In the plant phenotyping community, MIAPPE (Minimal Information About a Plant Phenotyping Experiment)7 is an established standard for phenotyping experiments. It is commonly serialized into the ISA-Tab file type.45 Although ISA-Tab is easy to read for non-technical experts due to its file-based approach, it lacks programmatic accessibility, particularly for web applications. BrAPI, which is aligned with MIAPPE, can help solve this problem.

-

MIRA is a tool that enables the automatic deployment of a BrAPI server on a MIAPPE-compliant dataset in ISA-Tab format. It can be deployed from a Docker image with the dataset mounted. By utilizing the mapping between MIAPPE, ISA-Tab, and BrAPI, there is no need for parsing or manual mapping of datasets that are already compliant with (meta-)data standards. By gaining programmatic access through BrAPI to these datasets, it facilitates the integration of phenotyping datasets into web applications.

-

BrAPI2ISA

- -

Since the release of BrAPI 1.3, efforts have been made to incorporate support for the MIAPPE standard into the specification7. This integration was finalized in BrAPI 2.0, resulting in full compatibility between the two standards. Consequently, BrAPI now encompasses all attributes necessary for MIAPPE compliance, adhering to standardized descriptions in accordance with MIAPPE guidelines.

-

In some communities and projects, phenotyping data and metadata is archived and published as structured ISA-Tab files, and validated using the MIAPPE ISA configuration. The BrAPI2ISA service functions as a converter between a BrAPI compatible server and the ISA-Tab format. This simplifies, automates, and facilitates the archiving of data, thereby enhancing data preservation and accessibility. The BrAPI2ISA tool is designed to be compatible with BrAPI 1.3, and is open to contributions from the community to extend support for the latest versions of BrAPI.

BrAPIMapper

BrAPIMapper is a full BrAPI implementation designed to be a convenient wrapper for any breeding related data source. BrAPIMapper is provided as a Docker application that can connect to a variety of external data sources including mySQL or PostgreSQL databases, generic REST services, flat files (XML, JSON, CSV/TSV/GFF3/VCF, YAML), or any combination of these. It provides an administration user interface to map BrAPI data models to external data sources. The interface allows administrators to select the BrAPI specification versions to use and which endpoints to enable. Data mapping configuration import and export features simplify upgrades to future BrAPI versions; administrators only have to map missing fields or make minor adjustments. BrAPIMapper supports the primary BrAPI features including paging, deferred search results, user lists, and authentication. Access restrictions to specific endpoints can be managed through the administration interface as well. This tool aims to accelerate BrAPI services deployment while ensuring specification compliance.

+

BrAPI2ISA

+ +

Since the release of BrAPI 1.3, efforts have been made to incorporate support for the MIAPPE (Minimal Information About a Plant Phenotyping Experiment)7 standard into the specification, achieving full compatibility in BrAPI 2.0. Consequently, BrAPI now includes all attributes necessary for MIAPPE compliance, adhering to standardized descriptions in accordance with MIAPPE guidelines. In some communities and projects, phenotyping data and metadata are archived and published as structured ISA-Tab files, validated using the MIAPPE ISA configuration45. Although ISA-Tab is easy to read for non-technical experts due to its file-based approach, it lacks programmatic accessibility, particularly for web applications.

+

MIRA enables the automatic deployment of a BrAPI server on a MIAPPE-compliant dataset in ISA-Tab format, facilitating programmatic access to these datasets. It is deployable from a Docker image with the dataset mounted. The tool leverages the mapping between MIAPPE, ISA-Tab, and BrAPI, eliminating the need for parsing or manual mapping of datasets compliant with (meta-)data standards. By providing programmatic access through BrAPI, MIRA facilitates the integration of phenotyping datasets into web applications.

+

The BrAPI2ISA service functions as a converter between a BrAPI-compatible server and the ISA-Tab format. The tool simplifies, automates, and facilitates the archiving of data, thereby enhancing data preservation and accessibility. The BrAPI2ISA tool is compatible with BrAPI 1.3 and welcomes community contributions to support the latest versions of BrAPI.

GraphQL Data-warehouse

Using the Zendro set of automatic software code generators, a fully functional, efficient, and cloud-capable BrAPI data-warehouse has been created for the current version of the BrAPI data models. Unlike most BrAPI compliant data sources, this data-warehouse supports a GraphQL API rather than a RESTful API. This API provides secure access to data read and write functions for all BrAPI data models. It provides create, read, update, and delete (CRUD) functions that are standardized and accept the same parameters for all data models.

@@ -1442,11 +1439,11 @@

References

13.
ga4gh-metadata/SchemaBlocks. GA4GH Metadata Schema Development Team (2023).
-
-
14.
Milne, I. et al. Flapjack—graphical genotype visualization. Bioinformatics 26, 3133–3134 (2010).
-
-
15.
König, P. et al. DivBrowse—interactive visualization and exploratory data analysis of variant call matrices. GigaScience 12, (2022).
+
14.
König, P. et al. DivBrowse—interactive visualization and exploratory data analysis of variant call matrices. GigaScience 12, (2022).
+
+
+
15.
Milne, I. et al. Flapjack—graphical genotype visualization. Bioinformatics 26, 3133–3134 (2010).
16.
Sempéré, G. et al. Gigwa v2—Extended and improved genotype investigator. GigaScience 8, (2019).
@@ -1478,53 +1475,53 @@

References

25.
Kotni, P., van Hintum, T., Maggioni, L., Oppermann, M. & Weise, S. EURISCO update 2023: the European Search Catalogue for Plant Genetic Resources, a pillar for documentation of genebank material. Nucleic Acids Research 51, D1465–D1469 (2022).
-
-
26.
-
-
-
27.
Van den houwe, I. et al. Safeguarding and using global banana diversity: a holistic approach. CABI Agric Biosci 1, (2020).
-
-
-
28.
+
+
26.
Pommier, C. et al. Applying FAIR Principles to Plant Phenotypic Data Management in GnpIS. Plant Phenomics 2019, (2019).
-
-
29.
+
+
27.
Adam-Blondon, A.-F. et al. Mining Plant Genomic and Genetic Data Using the GnpIS Information System. in Methods in Molecular Biology 103–117 (Springer New York, 2016). doi:10.1007/978-1-4939-6658-5_5.
-
30.
Shaw, P. D., Graham, M., Kennedy, J., Milne, I. & Marshall, D. F. Helium: visualization of large scale plant pedigrees. BMC Bioinformatics 15, (2014).
+
28.
Shaw, P. D., Graham, M., Kennedy, J., Milne, I. & Marshall, D. F. Helium: visualization of large scale plant pedigrees. BMC Bioinformatics 15, (2014).
-
31.
+
29.
-
32.
+
30.
-
33.
+
31.
-
-
34.
Pommier, C. et al. Applying FAIR Principles to Plant Phenotypic Data Management in GnpIS. Plant Phenomics 2019, (2019).
+
+
32.
-
-
35.
Adam-Blondon, A.-F. et al. Mining Plant Genomic and Genetic Data Using the GnpIS Information System. in Methods in Molecular Biology 103–117 (Springer New York, 2016). doi:10.1007/978-1-4939-6658-5_5.
+
+
33.
Van den houwe, I. et al. Safeguarding and using global banana diversity: a holistic approach. CABI Agric Biosci 1, (2020).
+
+
+
34.
+
+
+
35.
+
+
+
36.
Jung, S. et al. 15 years of GDR: New data and functionality in the Genome Database for Rosaceae. Nucleic Acids Research 47, D1137–D1145 (2018).
+
+
+
37.
-
36.
Morales, N. et al. Breedbase: a digital ecosystem for modern plant breeding. G3 Genes|Genomes|Genetics 12, (2022).
+
38.
Morales, N. et al. Breedbase: a digital ecosystem for modern plant breeding. G3 Genes|Genomes|Genetics 12, (2022).
-
37.
+
39.
-
38.
Meuwissen, T. H. E., Hayes, B. J. & Goddard, M. E. Prediction of Total Genetic Value Using Genome-Wide Dense Marker Maps. Genetics 157, 1819–1829 (2001).
+
40.
Meuwissen, T. H. E., Hayes, B. J. & Goddard, M. E. Prediction of Total Genetic Value Using Genome-Wide Dense Marker Maps. Genetics 157, 1819–1829 (2001).
-
39.
Khaled Al-Shamaa, Johan Steven Aparicio, Nick & icarda-git. Icarda-Git/QBMS: QBMS Version 1.0.0. (Zenodo, 2024). doi:10.5281/zenodo.10791627.
-
-
-
40.
Jung, S. et al. 15 years of GDR: New data and functionality in the Genome Database for Rosaceae. Nucleic Acids Research 47, D1137–D1145 (2018).
-
-
-
41.
+
41.
Khaled Al-Shamaa, Johan Steven Aparicio, Nick & icarda-git. Icarda-Git/QBMS: QBMS Version 1.0.0. (Zenodo, 2024). doi:10.5281/zenodo.10791627.
42.
diff --git a/manuscript.md b/manuscript.md index 7b0b9c5..5f21e0e 100644 --- a/manuscript.md +++ b/manuscript.md @@ -97,8 +97,8 @@ header-includes: | - - + + @@ -328,9 +328,9 @@ header-includes: | - - - + + + @@ -352,9 +352,9 @@ manubot-clear-requests-cache: false This manuscript -([permalink](https://plantbreeding.github.io/BrAPI-Manuscript2/v/511faa4c28e126a274c0f733c9fcaab35c0dfe49/)) +([permalink](https://plantbreeding.github.io/BrAPI-Manuscript2/v/d00841fc47e8764c25a9c65e15c4d72427b78a96/)) was automatically generated -from [plantbreeding/BrAPI-Manuscript2@511faa4](https://github.com/plantbreeding/BrAPI-Manuscript2/tree/511faa4c28e126a274c0f733c9fcaab35c0dfe49) +from [plantbreeding/BrAPI-Manuscript2@d00841f](https://github.com/plantbreeding/BrAPI-Manuscript2/tree/d00841fc47e8764c25a9c65e15c4d72427b78a96) on July 15, 2024. @@ -1194,6 +1194,7 @@ This effectively improves data collection speed, reduces errors, and enables lar Field Book has added support for BrAPI to streamline data transfer to and from BrAPI-compatible servers. Removing the need to manually transfer data files simplifies data exchange between these systems and reduces the opportunities for human error and data loss. + #### GridScore @@ -1260,9 +1261,14 @@ The Trait Selector can be integrated into any website or system, assuming there Genotyping has become a cornerstone of most breeding processes, but managing the data can be challenging. Understanding different genotyping protocols for various crops is crucial due to the unique genetic structures of each species. Techniques such as SNP genotyping, Genotyping-by-Sequencing (GBS), SSRs, Whole Genome Sequencing (WGS), and array-based genotyping each offer specific advantages depending on the crop and research objectives. BrAPI supports genotypic data by utilizing existing standards such as VCF [@doi:10.1093/bioinformatics/btr330] and the GA4GH Variants schema [@https://github.com/ga4gh-metadata/SchemaBlocks]. The BrAPI community has developed compatible tools for storing, searching, visualizing, and analyzing genotypic data, making it easier to integrate and utilize this information in breeding programs. Mastery of the various genotyping protocols ensures efficient and effective breeding, while BrAPI compliant tools streamline data management and analysis, enhancing the ability to make data-driven decisions in developing superior crop varieties. -#### Flapjack +#### DArT Sample Submission -[Flapjack](https://ics.hutton.ac.uk/flapjack) [@doi:10.1093/bioinformatics/btq580] is a multi-platform desktop application for data visualization and breeding analysis (eg, pedigree verification, marker-assisted backcrossing and forward breeding) using high-throughput genotype data. Data can be easily imported into Flapjack from any BrAPI compatible data source with genotype data available. [Flapjack Bytes](https://github.com/cropgeeks/flapjack-bytes) is a smaller, lightweight and fully web-based counterpart to Flapjack, which can be easily embedded into a database website to provide similar visualizations online. Traditionally supporting its own text-based data formats, Flapjack's use of BrAPI has streamlined the end-user experience for data import and work is underway to determine the best methods to exchange analysis results using future versions of the API. + +The DArT genotyping lab is heavily used world wide when it comes to plant genotyping. With over 1200 available organisms and species, client base on every continent and already many million samples processed, DArT provides services for several generic and bespoke genotyping technologies and solutions. Processes of sample tracking and fast data delivery are at the core of the ordering system developed at DArT. The ordering system is tightly integrated with DArTdb - DArT's custom LIMS operational system, which drives laboratory, quality, and analytical processes. + +Diversity Arrays Technology was a part of BrAPI community since its inception. DArT developers have worked with the BrAPI community contributing to various aspects of the API specification. One key aspect was establishing a standard API for sending sample metadata to the lab for genotyping. This solution eliminates much of the human error involved with sending samples to an external lab and also allows for an automated process of sample batch transfers. Beyond sample submission, the current implementation also allows for an order status verification, automated data discovery, and data downloads. Data are delivered as standard data packages with self-describing metadata. + +The current BrAPI implementation at DArT is in production and it is compatible with the newest BrAPI specification. Further details about DArT's ordering system can be found at [DArT Ordering System](https://ordering.diversityarrays.com) and also at [DArT Help](https://help.diversityarrays.com/docs/ordering). #### DArTView @@ -1283,6 +1289,11 @@ At its core, DivBrowse combines the convenience of a genome browser with feature Parts of the BrAPI Genotyping module are implemented in DivBrowse. There is a server-side component which provides genotypic data that the DivBrowse database can consume. There is also a client-side GUI component which can visualize genotypic data via any external BrAPI endpoint. In addition to BrAPI, DivBrowse has an internal API to control the tool from a hosting web portal. DivBrowse also has an interface to BLAST, which can be used to directly access genes or other genomic features. The modular structure of DivBrowse allows developers to configure and easily embed links to other external information systems. +#### Flapjack + +[Flapjack](https://ics.hutton.ac.uk/flapjack) [@doi:10.1093/bioinformatics/btq580] is a multi-platform desktop application for data visualization and breeding analysis (eg, pedigree verification, marker-assisted backcrossing and forward breeding) using high-throughput genotype data. Data can be easily imported into Flapjack from any BrAPI compatible data source with genotype data available. [Flapjack Bytes](https://github.com/cropgeeks/flapjack-bytes) is a smaller, lightweight and fully web-based counterpart to Flapjack, which can be easily embedded into a database website to provide similar visualizations online. Traditionally supporting its own text-based data formats, Flapjack's use of BrAPI has streamlined the end-user experience for data import and work is underway to determine the best methods to exchange analysis results using future versions of the API. + + #### Gigwa @@ -1303,16 +1314,6 @@ The [Practical Haplotype Graph](https://www.maizegenetics.net/phg) (PHG) is a gr Users access the crop databases either with direct calls to the PHG embedded server or indirectly using the rPHG library from an R environment. The PHG server accepts BrAPI queries to return information on sample lists and the variants used to define the graph's haplotypes. In addition, PHG users utilize the BrAPI Variant Sets endpoint query to return links to VCF files containing haplotype data. Work on the PHG is ongoing and it is expected to support additional BrAPI endpoints that allow for fine tuned slicing genotypic data in the near future. -#### DArT Sample Submission - - -The DArT genotyping lab is heavily used world wide when it comes to plant genotyping. With over 1200 available organisms and species, client base on every continent and already many million samples processed, DArT provides services for several generic and bespoke genotyping technologies and solutions. Processes of sample tracking and fast data delivery are at the core of the ordering system developed at DArT. The ordering system is tightly integrated with DArTdb - DArT's custom LIMS operational system, which drives laboratory, quality, and analytical processes. - -Diversity Arrays Technology was a part of BrAPI community since its inception. DArT developers have worked with the BrAPI community contributing to various aspects of the API specification. One key aspect was establishing a standard API for sending sample metadata to the lab for genotyping. This solution eliminates much of the human error involved with sending samples to an external lab and also allows for an automated process of sample batch transfers. Beyond sample submission, the current implementation also allows for an order status verification, automated data discovery, and data downloads. Data are delivered as standard data packages with self-describing metadata. - -The current BrAPI implementation at DArT is in production and it is compatible with the newest BrAPI specification. Further details about DArT's ordering system can be found at [DArT Ordering System](https://ordering.diversityarrays.com) and also at [DArT Help](https://help.diversityarrays.com/docs/ordering). - - ### Germplasm Management @@ -1330,20 +1331,14 @@ The BrAPI specification is one of the agreed standards, that are detailed in the -#### MGIS - - -The Musa Germplasm Information System ([MGIS](https://www.crop-diversity.org/mgis/)) serves as a comprehensive community portal dedicated to banana diversity, a crop critical to global food security [@doi:10.1093/database/bax046]. MGIS offers detailed information on banana germplasm, focusing on the collections held by the CGIAR International Banana Genebank (ITC) [@doi:10.1186/s43170-020-00015-6]. It is built on the Drupal/Tripal technology, like BIMS [@doi:10.1093/database/baab054] and Florilège. - -Since its inception, MGIS developers have actively participated in the BrAPI community. The MGIS team pushed for the integration of the Multi-Crop Passport Data (MCPD) standard into the Germplasm module of the API. MCPD support was added in BrAPI v1.3, and MGIS now provides passport data information on ITC banana genebank accessions (with GLIS DOI), synchronized with [Genesys](https://www.genesys-pgr.org/a/overview/v2YdWZGrZjD). MGIS also enriches the passport data by incorporating additional information from other germplasm collections worldwide. All the germplasm data is available through the BrAPI Germplasm module implementation. For genotyping data, MGIS integrates with Gigwa [@doi:10.1093/gigascience/giz051], which provides a tailored implementation of the BrAPI genotyping module. Furthermore, MGIS supports a set of BrAPI phenotyping endpoints, facilitating the exposure of morphological descriptors and trait information supported by ontologies like the Crop Ontology [@doi:10.1093/aobpla/plq008]. MGIS has integrated the Trait Selector BrAPP, and there are use cases implemented to interlink genebank and breeding data between MGIS and the breeding database MusaBase. - +#### Florilège -#### Helium + +[Florilège](https://florilege.arcad-project.org/) is a web portal designed primarily for the general public to access public plant genetic resources held by Biological Resource Centers across France. Through this portal, users can browse accessions from over 50 plant genera, spread across 19 genebanks. It allows users to view available seeds and plant material, including options for ordering material. Florilège provides a centralized access to the various French collections of plant genetic resources available to the public. - -[Helium](https://helium.hutton.ac.uk) [@doi:10.1186/1471-2105-15-259] is a plant pedigree visualization platform designed to account for the specific problems that are unique to plant pedigrees. A pedigree is a representation of how genetically discrete individuals are related to one another and is therefore a representation of the genetic relationship between individual plant lines, their parents and progeny. Plant pedigrees are often used to check for potential genotyping or phenotyping errors, since these errors, by the very nature of Mendelian inheritance, are constrained by the pedigree structure in which they exist [@doi:10.1111/j.1365-2052.2011.02183.x]. The accurate representation of pedigrees, and the ability to pull pedigree data from different data sources is important in plant breeding and genetics. Therefore, ways to visualize and interact this complex data in meaningful ways is critical. +Florilège retrieves accession information from several BrAPI compliant systems. Key among these are OLGA, a genebank accessions management system, and GnpIS, an INRAE data repository for plant genetic resources, phenomics, and genetics [@doi:10.34133/2019/1671403;@doi:10.1007/978-1-4939-6658-5_5]. Using BrAPI to gather data from these systems reduced development efforts and enabled standardized data retrieval. As a result, BrAPI has become the de facto standard within the French plant genetic resources community for exchanging information. During development, the Florilège team also proposed several enhancements to the BrAPI specifications themselves, such as additional support for Collection objects or improved reference linking, to better accommodate their specific use case. -From its [original desktop interface](https://github.com/cardinalb/helium-docs/wiki), Helium has developed into a web-based visualization platform implementing BrAPI calls to allow users to import data from other BrAPI compliant databases. The ability to pull data from BrAPI compliant data sources has significantly expanded Helium’s capability and utility within the community. Helium is used in projects ranging in size from tens to tens of thousands of lines and across a wide variety of crops and species. While originally designed for plant data [@doi:10.3389/fpls.2024.1268847] it has also found utility in other non-plant projects [@doi:10.1007/s10592-024-01611-z] highlighting its broad utility. BrAPI also allows Helium to provide direct dataset links to collaborators, allowing the original data to be held with the data provider and utilizing Helium for its visualization functionality. Our current Helium deployment includes example BrAPI calls to a barley dataset at the James Hutton Institute to allow users to test the system and features it offers. + #### GLIS @@ -1356,32 +1351,33 @@ Thanks to the adoption of Digital Object Identifiers (DOIs) for Multi-Crop Passp The Scientific Advisory Committee of the ITPGRFA have repeatedly welcomed efforts on interoperability among germplasm information systems. In this context, the GLIS Portal adopted the BrAPI v1 in 2022. Integrating BrAPI among the GLIS content negotiators facilitates queries and the exchange of content for data management in plant breeding. The Portal also offers other protocols (XML, DarwinCore, JSON and JSON-LD) to increase data and metadata connectivity. In the near future, depending on the availability of resources, upgrading to BrAPI v2 is planned. -#### Florilège +#### Helium - -[Florilège](https://florilege.arcad-project.org/) is a web portal designed primarily for the general public to access public plant genetic resources held by Biological Resource Centers across France. Through this portal, users can browse accessions from over 50 plant genera, spread across 19 genebanks. It allows users to view available seeds and plant material, including options for ordering material. Florilège provides a centralized access to the various French collections of plant genetic resources available to the public. + +[Helium](https://helium.hutton.ac.uk) [@doi:10.1186/1471-2105-15-259] is a plant pedigree visualization platform designed to account for the specific problems that are unique to plant pedigrees. A pedigree is a representation of how genetically discrete individuals are related to one another and is therefore a representation of the genetic relationship between individual plant lines, their parents and progeny. Plant pedigrees are often used to check for potential genotyping or phenotyping errors, since these errors, by the very nature of Mendelian inheritance, are constrained by the pedigree structure in which they exist [@doi:10.1111/j.1365-2052.2011.02183.x]. The accurate representation of pedigrees, and the ability to pull pedigree data from different data sources is important in plant breeding and genetics. Therefore, ways to visualize and interact this complex data in meaningful ways is critical. -Florilège retrieves accession information from several BrAPI compliant systems. Key among these are OLGA, a genebank accessions management system, and GnpIS, an INRAE data repository for plant genetic resources, phenomics, and genetics [@doi:10.34133/2019/1671403;@doi:10.1007/978-1-4939-6658-5_5]. Using BrAPI to gather data from these systems reduced development efforts and enabled standardized data retrieval. As a result, BrAPI has become the de facto standard within the French plant genetic resources community for exchanging information. During development, the Florilège team also proposed several enhancements to the BrAPI specifications themselves, such as additional support for Collection objects or improved reference linking, to better accommodate their specific use case. +From its [original desktop interface](https://github.com/cardinalb/helium-docs/wiki), Helium has developed into a web-based visualization platform implementing BrAPI calls to allow users to import data from other BrAPI compliant databases. The ability to pull data from BrAPI compliant data sources has significantly expanded Helium’s capability and utility within the community. Helium is used in projects ranging in size from tens to tens of thousands of lines and across a wide variety of crops and species. While originally designed for plant data [@doi:10.3389/fpls.2024.1268847] it has also found utility in other non-plant projects [@doi:10.1007/s10592-024-01611-z] highlighting its broad utility. BrAPI also allows Helium to provide direct dataset links to collaborators, allowing the original data to be held with the data provider and utilizing Helium for its visualization functionality. Our current Helium deployment includes example BrAPI calls to a barley dataset at the James Hutton Institute to allow users to test the system and features it offers. - +#### MGIS -### Breeding and Genetics Data Management + +The [Musa Germplasm Information System (MGIS)](https://www.crop-diversity.org/mgis/) serves as a comprehensive community portal dedicated to banana diversity, a crop critical to global food security [@doi:10.1093/database/bax046]. MGIS offers detailed information on banana germplasm, focusing on the collections held by the CGIAR International Banana Genebank (ITC) [@doi:10.1186/s43170-020-00015-6]. It is built on the Drupal/Tripal technology, like BIMS [@doi:10.1093/database/baab054] and Florilège. -While specialty data management is important for some use cases, often breeders want a central repository or access point of critical data. General breeding and genetics data management systems and web portals support some level of phenotypic, genotypic, and germplasm data, as well as trial, equipment, and people management. By enabling BrAPI support, these larger systems can connect with smaller tools and specialty systems to provide more functionality under the same user interface. There are several breeding data management systems developed in the BrAPI community, each with their own strengths. +Since its inception, MGIS developers have actively participated in the BrAPI community. The MGIS team pushed for the integration of the Multi-Crop Passport Data (MCPD) standard into the Germplasm module of the API. MCPD support was added in BrAPI v1.3, and MGIS now provides passport data information on ITC banana genebank accessions (with GLIS DOI), synchronized with [Genesys](https://www.genesys-pgr.org/a/overview/v2YdWZGrZjD). MGIS also enriches the passport data by incorporating additional information from other germplasm collections worldwide. All the germplasm data is available through the BrAPI Germplasm module implementation. For genotyping data, MGIS integrates with Gigwa [@doi:10.1093/gigascience/giz051], which provides a tailored implementation of the BrAPI genotyping module. Furthermore, MGIS supports a set of BrAPI phenotyping endpoints, facilitating the exposure of morphological descriptors and trait information supported by ontologies like the Crop Ontology [@doi:10.1093/aobpla/plq008]. MGIS has integrated the Trait Selector BrAPP, and there are use cases implemented to interlink genebank and breeding data between MGIS and the breeding database MusaBase. -#### DeltaBreed +### Breeding and Genetics Data Management - -[DeltaBreed](https://app.breedinginsight.net/) is an open-source breeding data management system designed and developed by Breeding Insight to support USDA-ARS specialty crop and animal breeders. DeltaBreed differs from other related systems in that is customizable to small breeding teams and generalized enough to support the workflows of diverse niche species. DeltaBreed is a unified system that connects a variety of BrAPI applications (see list below). BrAPI integration allows the complexity underlying interoperability to be hidden, shielding users from multifactorial differences between various applications. DeltaBreed, adhering to the BrAPI model, establishes data standards and validations for users and provides a singular framework for data management and user training. +While specialty data management is important for some use cases, often breeders want a central repository or access point of critical data. General breeding and genetics data management systems and web portals support some level of phenotypic, genotypic, and germplasm data, as well as trial, equipment, and people management. By enabling BrAPI support, these larger systems can connect with smaller tools and specialty systems to provide more functionality under the same user interface. There are several breeding data management systems developed in the BrAPI community, each with their own strengths. -DeltaBreed users need not be aware of BrAPI or the specifics of underlying applications but will notice that BrAPI interoperability reduces the need for human-mediated file transfers and data manipulation. Field Book users, for example, can connect to their DeltaBreed program, authenticate, and pull studies and traits directly from DeltaBreed to Field Book on their data collection device. The subsequent step of pushing observations from Field Book to DeltaBreed is straightforward via BrAPI, but is pending implementation until observation transaction handling is improved, intentional and inadvertent repeated measures are differentiated, and a data staging area is implemented for quality control. -Breeding Insight integrated several BrAPI applications to support 2021 phenotypic data collection by USDA-ARS blueberry breeders. DeltaBreed was used to create traits in Breedbase, and Field Book was used to pull studies and traits from Breedbase. The workflow also permitted users to push Field Book observations back to Breedbase via BrAPI. This effort served as a successful proof of concept for multi-application BrAPI integration, but highlighted limitations to the process of accepting BrAPI observations from Field Book. The Breeding Insight team is actively working with the rest of the BrAPI community to correct these limitations in future versions of the specification. +#### BIMS - -DeltaBreed is integrated with many other BrAPI community projects and tools. There is a BrAPI enabled connection, either in development or production, with all of the following tools: [BrAPI Java Test Server](https://test-server.brapi.org/brapi/v2/), [BreedBase](https://breedbase.org/), [Field Book](https://play.google.com/store/apps/details?id=com.fieldbook.tracker), [Gigwa](https://gigwa.southgreen.fr/gigwa/), [QBMS](https://icarda-git.github.io/QBMS), [Mr Bean](https://github.com/AparicioJohan/MrBeanApp), [Helium](https://helium.hutton.ac.uk/#/) and the [Pedigree Viewer](https://github.com/solgenomics/BrAPI-Pedigree-Viewer) BrAPP. + +[BIMS](https://wwww.breedwithbims.org) (Breeding Information Management System) [@doi:10.1093/database/baab054] is a free, secure, and online breeding management system which allows breeders to store, manage, archive, and analyze their private breeding program data. BIMS enables individual breeders to have complete control of their own breeding data along with access to tools such as data import/export, data analysis, and data archiving for their germplasm, phenotype, genotype, and image data. BIMS is currently implemented in five community databases, the Genome Database for Rosaceae [@doi:10.1093/nar/gky1000], CottonGEN [@doi:10.3390/plants10122805], the Citrus Genome Database, the Pulse Crop Database, and the Genome Database for Vaccinium. BIMS in these five community databases enables individual breeders to import publicly available data so that they can utilize public data in their breeding program. BIMS is also implemented in the public database [breedwithbims.org](https://wwww.breedwithbims.org) that any crop breeder can use. + +Right now, BIMS primarily utilizes BrAPI to connect with the Field Book Android App [@doi:10.2135/cropsci2013.08.0579], enabling seamless data transfer between BIMS and the app. Data transfer through BrAPI between BIMS and other resources such as BreedBase[@doi:10.1093/g3journal/jkac078], GIGWA[@doi:10.1093/gigascience/giz051], and Breeder Genomics Hub is on the way. Hopefully, the BIMS development team can easily reuse some of the solved use cases and workflows created by others in the BrAPI community. #### BMS @@ -1402,20 +1398,17 @@ Additionally, brapi-sync improves data management by maintaining links to the or The BrAPI interface is crucial for Breedbase. Breedbase uses BrAPI to connect with the data collection apps, other projects such as CLIMMOB [@doi:10.1016/j.compag.2023.108539], and native BrAPPs built into the Breedbase webpage. Users also appreciate the ability to connect to Breedbase instances using packages such as [QBMS](https://icarda-git.github.io/QBMS) [@doi:10.5281/zenodo.10791627] for data import into R for custom analyses. The Breedbase team has been part of the BrAPI community since its inception, and has continuously adopted and contributed to the BrAPI standard. -#### BIMS - - -[BIMS](https://wwww.breedwithbims.org) (Breeding Information Management System) [@doi:10.1093/database/baab054] is a free, secure, and online breeding management system which allows breeders to store, manage, archive, and analyze their private breeding program data. BIMS enables individual breeders to have complete control of their own breeding data along with access to tools such as data import/export, data analysis, and data archiving for their germplasm, phenotype, genotype, and image data. BIMS is currently implemented in five community databases, the Genome Database for Rosaceae [@doi:10.1093/nar/gky1000], CottonGEN [@doi:10.3390/plants10122805], the Citrus Genome Database, the Pulse Crop Database, and the Genome Database for Vaccinium. BIMS in these five community databases enables individual breeders to import publicly available data so that they can utilize public data in their breeding program. BIMS is also implemented in the public database [breedwithbims.org](https://wwww.breedwithbims.org) that any crop breeder can use. - -Right now, BIMS primarily utilizes BrAPI to connect with the Field Book Android App [@doi:10.2135/cropsci2013.08.0579], enabling seamless data transfer between BIMS and the app. Data transfer through BrAPI between BIMS and other resources such as BreedBase[@doi:10.1093/g3journal/jkac078], GIGWA[@doi:10.1093/gigascience/giz051], and Breeder Genomics Hub is on the way. Hopefully, the BIMS development team can easily reuse some of the solved use cases and workflows created by others in the BrAPI community. +#### DeltaBreed + +[DeltaBreed](https://app.breedinginsight.net/) is an open-source breeding data management system designed and developed by Breeding Insight to support USDA-ARS specialty crop and animal breeders. DeltaBreed differs from other related systems in that is customizable to small breeding teams and generalized enough to support the workflows of diverse niche species. DeltaBreed is a unified system that connects a variety of BrAPI applications (see list below). BrAPI integration allows the complexity underlying interoperability to be hidden, shielding users from multifactorial differences between various applications. DeltaBreed, adhering to the BrAPI model, establishes data standards and validations for users and provides a singular framework for data management and user training. -#### Germinate +DeltaBreed users need not be aware of BrAPI or the specifics of underlying applications but will notice that BrAPI interoperability reduces the need for human-mediated file transfers and data manipulation. Field Book users, for example, can connect to their DeltaBreed program, authenticate, and pull studies and traits directly from DeltaBreed to Field Book on their data collection device. The subsequent step of pushing observations from Field Book to DeltaBreed is straightforward via BrAPI, but is pending implementation until observation transaction handling is improved, intentional and inadvertent repeated measures are differentiated, and a data staging area is implemented for quality control. - -[Germinate](https://ics.hutton.ac.uk/get-germinate/) [@doi:10.1002/csc2.20248;@doi:10.2135/cropsci2016.09.0814] is an open-source plant genetic resources database that combines and integrates various kinds of plant breeding data including genotypic data, phenotypic trials data, passport data, images, geographic information and climate data into a single repository. Germinate is tightly linked to the BrAPI specification and supports a majority of BrAPI endpoints for querying, filtering, and submission. +Breeding Insight integrated several BrAPI applications to support 2021 phenotypic data collection by USDA-ARS blueberry breeders. DeltaBreed was used to create traits in Breedbase, and Field Book was used to pull studies and traits from Breedbase. The workflow also permitted users to push Field Book observations back to Breedbase via BrAPI. This effort served as a successful proof of concept for multi-application BrAPI integration, but highlighted limitations to the process of accepting BrAPI observations from Field Book. The Breeding Insight team is actively working with the rest of the BrAPI community to correct these limitations in future versions of the specification. -Germinate integrates and connects with other BrAPI-enabled tools such as GridScore for phenotypic data collection, Flapjack for genotypic data visualization, and Helium for pedigree visualization. Additionally, due to the nature of BrAPI, Germinate can act as a data repository for any BrAPI-compatible tool. Thanks to the interoperability provided by BrAPI, the need for manual data handling becomes a rarity with the direct benefit of faster data processing, fewer to no human errors, data security, and data integrity. + +DeltaBreed is integrated with many other BrAPI community projects and tools. There is a BrAPI enabled connection, either in development or production, with all of the following tools: [BrAPI Java Test Server](https://test-server.brapi.org/brapi/v2/), [BreedBase](https://breedbase.org/), [Field Book](https://play.google.com/store/apps/details?id=com.fieldbook.tracker), [Gigwa](https://gigwa.southgreen.fr/gigwa/), [QBMS](https://icarda-git.github.io/QBMS), [Mr Bean](https://github.com/AparicioJohan/MrBeanApp), [Helium](https://helium.hutton.ac.uk/#/) and the [Pedigree Viewer](https://github.com/solgenomics/BrAPI-Pedigree-Viewer) BrAPP. #### FAIDARE @@ -1430,42 +1423,44 @@ The FAIDARE architecture has been designed by elaborating on the BrAPI data mode -### Analytics +#### Germinate -While other tools listed above have the capability to do specialized analytics on certain types of data, general analytics tools can cover a wide range of data types and analytical models. The tools developed by the BrAPI community can pull in data from multiple BrAPI compatible data sources and provide enhanced analytical functionality. In many cases, there is no longer a need to import and export large data files to a local computational environment just to run standard analytical models. These tools are able to extract the data they need from a data source without much human intervention or human error. + +[Germinate](https://ics.hutton.ac.uk/get-germinate/) [@doi:10.1002/csc2.20248;@doi:10.2135/cropsci2016.09.0814] is an open-source plant genetic resources database that combines and integrates various kinds of plant breeding data including genotypic data, phenotypic trials data, passport data, images, geographic information and climate data into a single repository. Germinate is tightly linked to the BrAPI specification and supports a majority of BrAPI endpoints for querying, filtering, and submission. +Germinate integrates and connects with other BrAPI-enabled tools such as GridScore for phenotypic data collection, Flapjack for genotypic data visualization, and Helium for pedigree visualization. Additionally, due to the nature of BrAPI, Germinate can act as a data repository for any BrAPI-compatible tool. Thanks to the interoperability provided by BrAPI, the need for manual data handling becomes a rarity with the direct benefit of faster data processing, fewer to no human errors, data security, and data integrity. -#### QBMS - +### Analytics + Modern breeding programs can utilize data management systems to maintain both phenotypic and genotypic data. Numerous systems are available for adoption. To fully leverage the benefits of digitalization in this ecosystem, breeders need to utilize data from different sources to make efficient data-driven decisions. With increased computational power at their disposal, scientists can construct more advanced analysis pipelines by combining various data sources. -The [QBMS](https://icarda-git.github.io/QBMS) [@doi:10.5281/zenodo.10791627] R package eliminates technical barriers scientists experience when using the BrAPI specification in their analysis scripts and pipelines. This barrier arises from the complexity of managing API backend processes, such as authentication, tokens, TCP/IP protocol, JSON format, pagination, stateless calls, asynchronous communication, database IDs, and more. To bridge this gap, the QBMS package abstracts the technical complexities, providing breeders with stateful functions familiar to them when navigating their GUI systems. It enables them to query and extract data into a standard data frame structure, consistent with their use of the R language, one of the most common statistical tools in the breeding community. +The tools developed by the BrAPI community can pull in data from multiple BrAPI compatible data sources and provide enhanced analytical functionality. In many cases, there is no longer a need to import and export large data files to a local computational environment just to run standard analytical models. These tools are able to extract the data they need from a data source without much human intervention or human error. -Since its release on the official CRAN repository in October 2021, the QBMS R package has garnered over 9400 downloads. Several tools, such as MrBean, rely on the QBMS package as their source data adapter. Moreover, the community has started building extended solutions on top of it. QBMS can serve as a cornerstone in the breeding modernization revolution by providing access to actionable data and by enabling the creation of dashboards to reduce the time between harvest and decision-making for the next breeding cycle. +#### G-Crunch -#### Mr.Bean + +G-Crunch is an upcoming user-facing analysis tool that attempts to fill the space of simple, user driven analytics requests, with a generic user interface and the ability to swap out data sources and analysis tools. G-Crunch hopes to streamline repeatable, debuggable, simple analytic requests and results. - -[Mr.Bean](https://apariciojohan.github.io/MrBeanApp/) [@doi:10.3389/fpls.2023.1290078] is a graphical user interface designed to assist breeders, statisticians, and individuals involved in plant breeding programs with the analysis of field trials. By utilizing innovative methodologies such as SpATS for modeling spatial trends, and autocorrelation models to address spatial variability, Mr.Bean proves highly practical and powerful in facilitating faster and more effective decision-making. Modeling Genotype-by-environment interaction poses its challenges, but Mr.Bean offers the capability to explore various variance-covariance matrices, including Factor Analytic, compound symmetry, and heterogeneous variances. This aids in the assessment of genotype performance across diverse environments. +G-Crunch, as a tool, couldn't feasibly exist without BrAPI. The support of BrAPI interfaces allows G-Crunch to use one unified request method, and adapt to the user's (BrAPI-compliant) existing network of tools. This lowers the barrier to entry for adoption, and makes analysis pipelines easily repeatable. -Mr.Bean boasts flexibility in importing different file types, yet for users managing their data within data management systems (DMS), the process of downloading from their DMS and importing it into Mr.Bean can be cumbersome. To address this issue, QBMS was integrated into the back-end. This feature prompts users to input the URL of a BrAPI compatible server, enter their credentials (if necessary), and select the specific trial they wish to analyze. Subsequently, users can seamlessly access their dataset through BrAPI and utilize it across the entire Mr.Bean interface. +#### QBMS -#### G-Crunch + - -G-Crunch is an upcoming user-facing analysis tool that attempts to fill the space of simple, user driven analytics requests, with a generic user interface and the ability to swap out data sources and analysis tools. G-Crunch hopes to streamline repeatable, debuggable, simple analytic requests and results. +The [QBMS](https://icarda-git.github.io/QBMS) [@doi:10.5281/zenodo.10791627] R package eliminates technical barriers scientists experience when using the BrAPI specification in their analysis scripts and pipelines. This barrier arises from the complexity of managing API backend processes, such as authentication, tokens, TCP/IP protocol, JSON format, pagination, stateless calls, asynchronous communication, database IDs, and more. To bridge this gap, the QBMS package abstracts the technical complexities, providing breeders with stateful functions familiar to them when navigating their GUI systems. It enables them to query and extract data into a standard data frame structure, consistent with their use of the R language, one of the most common statistical tools in the breeding community. -G-Crunch, as a tool, couldn't feasibly exist without BrAPI. The support of BrAPI interfaces allows G-Crunch to use one unified request method, and adapt to the user's (BrAPI-compliant) existing network of tools. This lowers the barrier to entry for adoption, and makes analysis pipelines easily repeatable. +Since its release on the official CRAN repository in October 2021, the QBMS R package has garnered over 9400 downloads. Several tools, such as MrBean, rely on the QBMS package as their source data adapter. Moreover, the community has started building extended solutions on top of it. QBMS can serve as a cornerstone in the breeding modernization revolution by providing access to actionable data and by enabling the creation of dashboards to reduce the time between harvest and decision-making for the next breeding cycle. -#### ShinyBrAPPs +#### Mr.Bean -Data management systems are generic and robust centralized applications, with a large community of users, long term development cycles and release plans. BrAPI compliance offers these systems the opportunity to add functionalities in a modular way through the development of external plugin applications that can quickly fulfill specific needs of a group of users. [R-Shiny](https://shiny.posit.co/) is a R-package that opens the possibility to develop rich and productive interactive web applications to R users and developers. As such it allows user communities to quickly prototype and produce applications that are finely tailored to their needs, thus improving adoption and daily use of data management systems. The Breeding Management System (BMS) of the IBP and Gigwa are BrAPI compliant and are being widely used by breeding programs, including national breeding programs in Africa. CIRAD and the IBP teams have been working together as part of the [IAVAO](https://www.iavao.org/) breeders community to develop the Shiny-BrAPPs, a set of R-Shiny applications using BrAPI as a core technology for data exchange. These applications are connected to BMS and/or Gigwa and provide tools for specific use cases. So far, four applications have been developed covering the fields of trial data quality control, single trial statistical analysis, breeding decision support, and raw genotyping data visual inspection. + +[Mr.Bean](https://apariciojohan.github.io/MrBeanApp/) [@doi:10.3389/fpls.2023.1290078] is a graphical user interface designed to assist breeders, statisticians, and individuals involved in plant breeding programs with the analysis of field trials. By utilizing innovative methodologies such as SpATS for modeling spatial trends, and autocorrelation models to address spatial variability, Mr.Bean proves highly practical and powerful in facilitating faster and more effective decision-making. Modeling Genotype-by-environment interaction poses its challenges, but Mr.Bean offers the capability to explore various variance-covariance matrices, including Factor Analytic, compound symmetry, and heterogeneous variances. This aids in the assessment of genotype performance across diverse environments. -The "BMS trial data explorer" retrieves data from a single multi-location trial and displays data counts and summary boxplot for all variables measured in different studies. It also provides an interactive distribution plot to easily select observations that require curation and a report of candidate issues that needs to be addressed by the breeder. The "STABrAPP" tool is an application for single trial mixed model analysis. It basically provides a GUI to the [StatGen-STA](https://biometris.github.io/statgenSTA/) R package. The "DSBrAPP" tool is a decision support tool helping breeders to select germplasm according to their various characteristics and save this germplasm list into BMS. These first three apps are grouped into a single repository ([ShinyBrAPPs](https://github.com/IntegratedBreedingPlatform/ShinyBrAPPs/)) with modular code shared across applications and make use of the [brapir-v1](https://github.com/mverouden/brapir-v1) and [brapir-v2](https://github.com/mverouden/brapir-v2) R packages. Finally, the "[snpclust](https://github.com/jframi/snpclust)" tool enables a user to check and manually correct the clustering of fluorescence based SNP genotyping data. +Mr.Bean boasts flexibility in importing different file types, yet for users managing their data within data management systems (DMS), the process of downloading from their DMS and importing it into Mr.Bean can be cumbersome. To address this issue, QBMS was integrated into the back-end. This feature prompts users to input the URL of a BrAPI compatible server, enter their credentials (if necessary), and select the specific trial they wish to analyze. Subsequently, users can seamlessly access their dataset through BrAPI and utilize it across the entire Mr.Bean interface. #### SCT @@ -1479,31 +1474,32 @@ The [Sugarcane Crossing Tool](https://github.com/USDA-ARS-GBRU/SugarcaneCrossing The crossing tool utilizes a modified version of the [BrAPI-R](https://github.com/CIP-RIU/brapi) library to access a compliant database, and it employs standard R/JavaScript packages to aggregate and visualize data. Modules within the application allow breeders to query the database (through BrAPI) for information relevant to their decision-making process. This includes the number and sex of flowering accessions, deep pedigree and relatedness information, summarized trial data, and the prior frequency and success of potential cross combinations. Future versions of this tool will provide additional decision support (e.g. ranked potential crosses) to enhance the accuracy and efficiency of crossing. -### General Infrastructure +#### ShinyBrAPPs -Adopting BrAPI compatibility into an existing system can be difficult sometimes. The BrAPI Community has developed several tools to make adoption easier. This includes things like pre built code libraries, connectors to other technology standards, and mappers to alternate data types or data files. The goal is to lower the barrier to entry for the BrAPI community, making it easier for other groups to get started and connect their existing data to the standard. +Data management systems are generic and robust centralized applications, with a large community of users, long term development cycles and release plans. BrAPI compliance offers these systems the opportunity to add functionalities in a modular way through the development of external plugin applications that can quickly fulfill specific needs of a group of users. [R-Shiny](https://shiny.posit.co/) is a R-package that opens the possibility to develop rich and productive interactive web applications to R users and developers. As such it allows user communities to quickly prototype and produce applications that are finely tailored to their needs, thus improving adoption and daily use of data management systems. The Breeding Management System (BMS) of the IBP and Gigwa are BrAPI compliant and are being widely used by breeding programs, including national breeding programs in Africa. CIRAD and the IBP teams have been working together as part of the [IAVAO](https://www.iavao.org/) breeders community to develop the Shiny-BrAPPs, a set of R-Shiny applications using BrAPI as a core technology for data exchange. These applications are connected to BMS and/or Gigwa and provide tools for specific use cases. So far, four applications have been developed covering the fields of trial data quality control, single trial statistical analysis, breeding decision support, and raw genotyping data visual inspection. +The "BMS trial data explorer" retrieves data from a single multi-location trial and displays data counts and summary boxplot for all variables measured in different studies. It also provides an interactive distribution plot to easily select observations that require curation and a report of candidate issues that needs to be addressed by the breeder. The "STABrAPP" tool is an application for single trial mixed model analysis. It basically provides a GUI to the [StatGen-STA](https://biometris.github.io/statgenSTA/) R package. The "DSBrAPP" tool is a decision support tool helping breeders to select germplasm according to their various characteristics and save this germplasm list into BMS. These first three apps are grouped into a single repository ([ShinyBrAPPs](https://github.com/IntegratedBreedingPlatform/ShinyBrAPPs/)) with modular code shared across applications and make use of the [brapir-v1](https://github.com/mverouden/brapir-v1) and [brapir-v2](https://github.com/mverouden/brapir-v2) R packages. Finally, the "[snpclust](https://github.com/jframi/snpclust)" tool enables a user to check and manually correct the clustering of fluorescence based SNP genotyping data. -#### MIRA - -In the plant phenotyping community, [MIAPPE](https://www.miappe.org/) (Minimal Information About a Plant Phenotyping Experiment) [@doi:10.1111/nph.16544] is an established standard for phenotyping experiments. It is commonly serialized into the ISA-Tab file type. [@doi:10.1038/ng.1054] Although ISA-Tab is easy to read for non-technical experts due to its file-based approach, it lacks programmatic accessibility, particularly for web applications. BrAPI, which is aligned with MIAPPE, can help solve this problem. +### General Infrastructure -[MIRA](https://github.com/USDA-ARS-GBRU/SugarcaneCrossingTool) is a tool that enables the automatic deployment of a BrAPI server on a MIAPPE-compliant dataset in ISA-Tab format. It can be deployed from a Docker image with the dataset mounted. By utilizing the mapping between MIAPPE, ISA-Tab, and BrAPI, there is no need for parsing or manual mapping of datasets that are already compliant with (meta-)data standards. By gaining programmatic access through BrAPI to these datasets, it facilitates the integration of phenotyping datasets into web applications. +Adopting BrAPI compatibility into an existing system can be difficult sometimes. The BrAPI Community has developed several tools to make adoption easier. This includes things like pre built code libraries, connectors to other technology standards, and mappers to alternate data types or data files. The goal is to lower the barrier to entry for the BrAPI community, making it easier for other groups to get started and connect their existing data to the standard. -#### BrAPI2ISA +#### BrAPIMapper + + +[BrAPIMapper](https://github.com/plantbreeding/BrAPIMapper) is a full BrAPI implementation designed to be a convenient wrapper for any breeding related data source. BrAPIMapper is provided as a Docker application that can connect to a variety of external data sources including mySQL or PostgreSQL databases, generic REST services, flat files (XML, JSON, CSV/TSV/GFF3/VCF, YAML), or any combination of these. It provides an administration user interface to map BrAPI data models to external data sources. The interface allows administrators to select the BrAPI specification versions to use and which endpoints to enable. Data mapping configuration import and export features simplify upgrades to future BrAPI versions; administrators only have to map missing fields or make minor adjustments. BrAPIMapper supports the primary BrAPI features including paging, deferred search results, user lists, and authentication. Access restrictions to specific endpoints can be managed through the administration interface as well. This tool aims to accelerate BrAPI services deployment while ensuring specification compliance. - -Since the release of BrAPI 1.3, efforts have been made to incorporate support for the MIAPPE standard into the specification [@doi:10.1111/nph.16544]. This integration was finalized in BrAPI 2.0, resulting in full compatibility between the two standards. Consequently, BrAPI now encompasses all attributes necessary for MIAPPE compliance, adhering to standardized descriptions in accordance with MIAPPE guidelines. -In some communities and projects, phenotyping data and metadata is archived and published as structured ISA-Tab files, and validated using the [MIAPPE ISA configuration](https://github.com/ELIXIR-Belgium/isatab-validation). The [BrAPI2ISA](https://github.com/elixir-europe/plant-brapi-to-isa) service functions as a converter between a BrAPI compatible server and the ISA-Tab format. This simplifies, automates, and facilitates the archiving of data, thereby enhancing data preservation and accessibility. The BrAPI2ISA tool is designed to be compatible with BrAPI 1.3, and is open to contributions from the community to extend support for the latest versions of BrAPI. +#### BrAPI2ISA + +Since the release of BrAPI 1.3, efforts have been made to incorporate support for the [MIAPPE](https://www.miappe.org/) (Minimal Information About a Plant Phenotyping Experiment) [@doi:10.1111/nph.16544] standard into the specification, achieving full compatibility in BrAPI 2.0. Consequently, BrAPI now includes all attributes necessary for MIAPPE compliance, adhering to standardized descriptions in accordance with MIAPPE guidelines. In some communities and projects, phenotyping data and metadata are archived and published as structured ISA-Tab files, validated using the [MIAPPE ISA configuration](https://github.com/ELIXIR-Belgium/isatab-validation) [@doi:10.1038/ng.1054]. Although ISA-Tab is easy to read for non-technical experts due to its file-based approach, it lacks programmatic accessibility, particularly for web applications. -#### BrAPIMapper +[MIRA](https://github.com/USDA-ARS-GBRU/SugarcaneCrossingTool) enables the automatic deployment of a BrAPI server on a MIAPPE-compliant dataset in ISA-Tab format, facilitating programmatic access to these datasets. It is deployable from a Docker image with the dataset mounted. The tool leverages the mapping between MIAPPE, ISA-Tab, and BrAPI, eliminating the need for parsing or manual mapping of datasets compliant with (meta-)data standards. By providing programmatic access through BrAPI, MIRA facilitates the integration of phenotyping datasets into web applications. - -[BrAPIMapper](https://github.com/plantbreeding/BrAPIMapper) is a full BrAPI implementation designed to be a convenient wrapper for any breeding related data source. BrAPIMapper is provided as a Docker application that can connect to a variety of external data sources including mySQL or PostgreSQL databases, generic REST services, flat files (XML, JSON, CSV/TSV/GFF3/VCF, YAML), or any combination of these. It provides an administration user interface to map BrAPI data models to external data sources. The interface allows administrators to select the BrAPI specification versions to use and which endpoints to enable. Data mapping configuration import and export features simplify upgrades to future BrAPI versions; administrators only have to map missing fields or make minor adjustments. BrAPIMapper supports the primary BrAPI features including paging, deferred search results, user lists, and authentication. Access restrictions to specific endpoints can be managed through the administration interface as well. This tool aims to accelerate BrAPI services deployment while ensuring specification compliance. +The [BrAPI2ISA](https://github.com/elixir-europe/plant-brapi-to-isa) service functions as a converter between a BrAPI-compatible server and the ISA-Tab format. The tool simplifies, automates, and facilitates the archiving of data, thereby enhancing data preservation and accessibility. The BrAPI2ISA tool is compatible with BrAPI 1.3 and welcomes community contributions to support the latest versions of BrAPI. #### GraphQL Data-warehouse diff --git a/manuscript.pdf b/manuscript.pdf index 53d72dd..8121cc5 100644 Binary files a/manuscript.pdf and b/manuscript.pdf differ diff --git a/spelling-error-locations.txt b/spelling-error-locations.txt index ebffb58..7b67e1f 100644 --- a/spelling-error-locations.txt +++ b/spelling-error-locations.txt @@ -4,17 +4,17 @@ content/03.01.02.GridScore.md:7:barcodes content/03.01.02.GridScore.md:7:georeferencing content/03.01.--.HEADER.Phenotyping.md:3:Ajay content/03.01.--.HEADER.Phenotyping.md:8:curation +content/03.02.01.DArT.md:3:Grzegorz +content/03.02.01.DArT.md:3:Hok +content/03.02.01.DArT.md:3:Puthick +content/03.02.01.DArT.md:3:Uszynski +content/03.02.01.DArT.md:4:DArTdb +content/03.02.01.DArT.md:4:LIMS content/03.02.02.DArTView.md:4:curation content/03.02.02.DArTView.md:4:DArTView's -content/03.02.04.GIGWA.md:4:EE -content/03.02.04.GIGWA.md:6:Gigwa's -content/03.02.04.GIGWA.md:6:jframi -content/03.02.06.DArT.md:3:Grzegorz -content/03.02.06.DArT.md:3:Hok -content/03.02.06.DArT.md:3:Puthick -content/03.02.06.DArT.md:3:Uszynski -content/03.02.06.DArT.md:4:DArTdb -content/03.02.06.DArT.md:4:LIMS +content/03.02.05.GIGWA.md:4:EE +content/03.02.05.GIGWA.md:6:Gigwa's +content/03.02.05.GIGWA.md:6:jframi content/03.02.--.HEADER.Genotyping.md:3:Ajay content/03.02.--.HEADER.Genotyping.md:4:GBS content/03.02.--.HEADER.Genotyping.md:4:SNP @@ -24,40 +24,41 @@ content/03.03.01.AGENT.md:2:König content/03.03.01.AGENT.md:6:situ content/03.03.01.AGENT.md:6:situ content/03.03.01.AGENT.md:8:dataflow -content/03.03.02.MGIS.md:4:Florilège -content/03.03.05.FLORILEGE.md:1:Florilège -content/03.03.05.FLORILEGE.md:4:Florilège -content/03.03.05.FLORILEGE.md:4:Florilège -content/03.03.05.FLORILEGE.md:6:Florilège -content/03.03.05.FLORILEGE.md:6:Florilège +content/03.03.02.FLORILEGE.md:1:Florilège +content/03.03.02.FLORILEGE.md:4:Florilège +content/03.03.02.FLORILEGE.md:4:Florilège +content/03.03.02.FLORILEGE.md:6:Florilège +content/03.03.02.FLORILEGE.md:6:Florilège +content/03.03.05.MGIS.md:4:Florilège content/03.03.--.HEADER.Germplasm_Management.md:3:Ajay -content/03.04.01.DeltaBreed.md:4:customizable +content/03.04.01.BIMS.md:4:breedwithbims +content/03.04.01.BIMS.md:4:breedwithbims +content/03.04.01.BIMS.md:4:breedwithbims content/03.04.03.Breedbase.md:3:Lukas content/03.04.03.Breedbase.md:4:NIRS content/03.04.03.Breedbase.md:6:webpage -content/03.04.04.BIMS.md:4:breedwithbims -content/03.04.04.BIMS.md:4:breedwithbims -content/03.04.04.BIMS.md:4:breedwithbims -content/03.05.02.Mr_Bean.md:3:Johan -content/03.05.04.ShinyBrAPPs.md:1:ShinyBrAPPs -content/03.05.04.ShinyBrAPPs.md:5:boxplot -content/03.05.04.ShinyBrAPPs.md:5:brapir -content/03.05.04.ShinyBrAPPs.md:5:brapir -content/03.05.04.ShinyBrAPPs.md:5:brapir -content/03.05.04.ShinyBrAPPs.md:5:brapir -content/03.05.04.ShinyBrAPPs.md:5:curation -content/03.05.04.ShinyBrAPPs.md:5:DSBrAPP -content/03.05.04.ShinyBrAPPs.md:5:jframi -content/03.05.04.ShinyBrAPPs.md:5:ShinyBrAPPs -content/03.05.04.ShinyBrAPPs.md:5:ShinyBrAPPs -content/03.05.04.ShinyBrAPPs.md:5:SNP -content/03.05.04.ShinyBrAPPs.md:5:STABrAPP -content/03.05.04.ShinyBrAPPs.md:5:StatGen -content/03.05.05.SCT.md:1:SCT -content/03.05.05.SCT.md:3:Keo -content/03.05.05.SCT.md:4:RShiny -content/03.05.05.SCT.md:4:SCT -content/03.05.05.SCT.md:4:SCT +content/03.04.04.DeltaBreed.md:4:customizable +content/03.05.03.Mr_Bean.md:3:Johan +content/03.05.04.SCT.md:1:SCT +content/03.05.04.SCT.md:3:Keo +content/03.05.04.SCT.md:4:RShiny +content/03.05.04.SCT.md:4:SCT +content/03.05.04.SCT.md:4:SCT +content/03.05.05.ShinyBrAPPs.md:1:ShinyBrAPPs +content/03.05.05.ShinyBrAPPs.md:5:boxplot +content/03.05.05.ShinyBrAPPs.md:5:brapir +content/03.05.05.ShinyBrAPPs.md:5:brapir +content/03.05.05.ShinyBrAPPs.md:5:brapir +content/03.05.05.ShinyBrAPPs.md:5:brapir +content/03.05.05.ShinyBrAPPs.md:5:curation +content/03.05.05.ShinyBrAPPs.md:5:DSBrAPP +content/03.05.05.ShinyBrAPPs.md:5:jframi +content/03.05.05.ShinyBrAPPs.md:5:ShinyBrAPPs +content/03.05.05.ShinyBrAPPs.md:5:ShinyBrAPPs +content/03.05.05.ShinyBrAPPs.md:5:SNP +content/03.05.05.ShinyBrAPPs.md:5:STABrAPP +content/03.05.05.ShinyBrAPPs.md:5:StatGen +content/03.06.02.MIAPPE.md:6:deployable content/04.discussion.md:21:CDO content/04.discussion.md:21:GeoTIFF content/04.discussion.md:21:NOAA diff --git a/spelling-errors.txt b/spelling-errors.txt index d93134c..e718dc7 100644 --- a/spelling-errors.txt +++ b/spelling-errors.txt @@ -34,6 +34,7 @@ customizable DArTdb DArTView’s dataflow +deployable Dhondt Dhungana Dorrie @@ -49,7 +50,7 @@ georeferencing GeoTIFF GH Gigwa’s -Grzegorz +grzegorz Hok IFB Institut @@ -88,7 +89,7 @@ OpenAPI Palladino pascalneveu Pérez -puthick +Puthick Rami Rica Romil diff --git a/variables.json b/variables.json index 3b2c28e..2af7d38 100644 --- a/variables.json +++ b/variables.json @@ -86,7 +86,7 @@ "Stephan Weise", "Shawn C. Yarnes" ], - "header-includes": "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n", + "header-includes": "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n", "bibliography": [ "content/manual-references.json" ], @@ -98,7 +98,7 @@ "manubot": { "date": "2024-07-15", "date_long": "July 15, 2024", - "generated": "2024-07-15T16:32:22+00:00", + "generated": "2024-07-15T18:31:39+00:00", "generated_date_long": "July 15, 2024", "randomize_author_order": false, "authors": [ @@ -1274,19 +1274,19 @@ "repo_slug": "plantbreeding/BrAPI-Manuscript2", "repo_owner": "plantbreeding", "repo_name": "BrAPI-Manuscript2", - "commit": "511faa4c28e126a274c0f733c9fcaab35c0dfe49", - "triggering_commit": "511faa4c28e126a274c0f733c9fcaab35c0dfe49", - "build_url": "https://github.com/plantbreeding/BrAPI-Manuscript2/commit/511faa4c28e126a274c0f733c9fcaab35c0dfe49/checks", - "job_url": "https://github.com/plantbreeding/BrAPI-Manuscript2/actions/runs/9943117162" + "commit": "d00841fc47e8764c25a9c65e15c4d72427b78a96", + "triggering_commit": "d00841fc47e8764c25a9c65e15c4d72427b78a96", + "build_url": "https://github.com/plantbreeding/BrAPI-Manuscript2/commit/d00841fc47e8764c25a9c65e15c4d72427b78a96/checks", + "job_url": "https://github.com/plantbreeding/BrAPI-Manuscript2/actions/runs/9944693356" }, "html_url": "https://plantbreeding.github.io/BrAPI-Manuscript2/", "pdf_url": "https://plantbreeding.github.io/BrAPI-Manuscript2/manuscript.pdf", - "html_url_versioned": "https://plantbreeding.github.io/BrAPI-Manuscript2/v/511faa4c28e126a274c0f733c9fcaab35c0dfe49/", - "pdf_url_versioned": "https://plantbreeding.github.io/BrAPI-Manuscript2/v/511faa4c28e126a274c0f733c9fcaab35c0dfe49/manuscript.pdf", + "html_url_versioned": "https://plantbreeding.github.io/BrAPI-Manuscript2/v/d00841fc47e8764c25a9c65e15c4d72427b78a96/", + "pdf_url_versioned": "https://plantbreeding.github.io/BrAPI-Manuscript2/v/d00841fc47e8764c25a9c65e15c4d72427b78a96/manuscript.pdf", "manubot_version": "0.5.6", "rootstock_commit": "f92ea1b72211d2543bac7276995d1b69947c6949", "manuscript_stats": { - "word_count": 13160 + "word_count": 13068 } } }