+ Statement of need
+ In the field of materials informatics, where materials science
+ intersects with machine learning, benchmarks play a crucial role in
+ assessing model performance and enabling fair comparisons among
+ various tools and models. Typically, these benchmarks focus on
+ evaluating the accuracy of predictive models for materials properties,
+ utilizing well-established metrics such as mean absolute error and
+ root-mean-square error to measure performance against actual
+ measurements. A standard practice involves splitting the data into two
+ parts, with one serving as training data for model development and the
+ other as test data for assessing performance
+ (Dunn
+ et al., 2020).
+ However, benchmarking generative models, which aim to create
+ entirely new data rather than focusing solely on predictive accuracy,
+ presents unique challenges. While significant progress has been made
+ in standardizing benchmarks for tasks like image generation and
+ molecule synthesis, the field of crystal structure generative modeling
+ lacks this level of standardization (this is separate from machine
+ learning interatomic potentials, which have the robust and
+ comprehensive
+ matbench-discovery
+ (Riebesell
+ et al., 2024) and
+ JARVIS
+ Leaderboard benchmarking frameworks
+ (Choudhary
+ et al., 2023)). Molecular generative modeling benefits from
+ widely adopted benchmark platforms such as Guacamol
+ (Brown
+ et al., 2019) and Moses
+ (Polykovskiy
+ et al., 2020), which offer easy installation, usage guidelines,
+ and leaderboards for tracking progress. In contrast, existing
+ evaluations in crystal structure generative modeling, as seen in CDVAE
+ (Xie
+ et al., 2022), FTCP
+ (Ren
+ et al., 2022), PGCGM
+ (Zhao
+ et al., 2023), CubicGAN
+ (Zhao
+ et al., 2021), and CrysTens
+ (Alverson
+ et al., 2022), are not standardized, can be difficult to install and
+ apply to new models and datasets, and lack publicly accessible
+ leaderboards. While these evaluations are valuable
+ within their respective scopes, there is a clear need for a dedicated
+ benchmarking platform to promote standardization and facilitate robust
+ comparisons.
+ In this work, we introduce
+ matbench-genmetrics, a materials benchmarking
+ platform for crystal structure generative models. We use concepts from
+ molecular generative modeling benchmarking to create a set of
+ evaluation metrics—validity, coverage, novelty, and uniqueness—which
+ are broadly defined as follows:
+
+ - Validity: a measure of how well the generated materials match the
+   distribution of the training dataset
+ - Coverage: the ability to successfully predict known materials which
+   have been held out
+ - Novelty: generated structures which closely match examples in the
+   training set are penalized
+ - Uniqueness: the number of repeat structures within the generated set
+
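+ Both the novelty and uniqueness metrics reduce to structure matching.
+ As a rough illustration (a minimal sketch using pymatgen's
+ StructureMatcher with illustrative tolerance settings, not the exact
+ matbench-genmetrics implementation), they can be framed as follows:
+
+ ```python
+ from itertools import combinations
+
+ from pymatgen.analysis.structure_matcher import StructureMatcher
+
+ # Illustrative tolerances; the package's defaults may differ.
+ matcher = StructureMatcher(ltol=0.3, stol=0.5, angle_tol=10.0)
+
+
+ def uniqueness(generated):
+     """Fraction of generated-structure pairs that are not duplicates."""
+     pairs = list(combinations(generated, 2))
+     if not pairs:
+         return 1.0
+     n_duplicate = sum(matcher.fit(a, b) for a, b in pairs)
+     return 1.0 - n_duplicate / len(pairs)
+
+
+ def novelty(generated, training):
+     """Fraction of generated structures with no match in the training set."""
+     n_matched = sum(
+         any(matcher.fit(gen, ref) for ref in training) for gen in generated
+     )
+     return 1.0 - n_matched / len(generated)
+ ```
+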
+ matbench-genmetrics comprises two
+ namespace packages. The first namespace package is
+ matbench_genmetrics.core, which provides the
+ following features:
+
+ - GenMatcher: A class for calculating matches between two sets of
+   structures
+ - GenMetrics: A class for calculating validity, coverage, novelty, and
+   uniqueness metrics
+ - MPTSMetrics: A class for loading mp_time_split data, calculating
+   time-series cross-validation metrics, and saving results
+ - Fixed benchmark classes for 10, 100, 1000, and 10000 generated
+   structures
+
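+ A typical benchmark run loops over the predefined cross-validation
+ folds, generates structures for each fold, and records the four
+ metrics. The sketch below is based on the package's documented
+ interface; exact import paths and method names may differ between
+ versions, and the stand-in "generator" simply reuses training
+ structures, which a real model would of course replace:
+
+ ```python
+ from matbench_genmetrics.core.metrics import MPTSMetrics10
+
+ # Benchmark against 10 generated structures per fold; dummy=True loads a
+ # small subset of the data for quick experimentation.
+ mptm = MPTSMetrics10(dummy=True)
+
+ for fold in mptm.folds:
+     train_val_inputs = mptm.get_train_and_val_data(fold)
+
+     # Stand-in for a generative model: reuse 10 training structures.
+     # Copying training data like this would score zero on novelty.
+     gen_structures = list(train_val_inputs)[:10]
+
+     mptm.evaluate_and_record(fold, gen_structures)
+
+ print(mptm.recorded_metrics)
+ ```
+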
+ Additionally, we introduce the
+ matbench_genmetrics.mp_time_split namespace
+ package as a complement to
+ matbench_genmetrics.core. It provides a
+ standardized dataset and cross-validation splits for evaluating the
+ four metrics described above. Time-based splits have been used in
+ materials informatics model validation, such as predicting future
+ thermoelectric materials via word embeddings
+ (Tshitoyan
+ et al., 2019), searching for efficient solar photoabsorption
+ materials through multi-fidelity optimization
+ (Palizhati
+ et al., 2022), and predicting future materials stability trends
+ via network models
+ (Aykol
+ et al., 2019). Recently, Hu et al.
+ (Zhao
+ et al., 2023) used what they call a rediscovery metric,
+ referred to here as a coverage metric in line with molecular
+ benchmarking terminology, to evaluate crystal structure generative
+ models. While time-series splitting wasn’t used, they showed that
+ after generating millions of structures, only a small percentage of
+ held-out structures had matches. These results highlight the
+ difficulty (and robustness) of coverage tasks. By leveraging timeline
+ metadata from the Materials Project database
+ (Jain
+ et al., 2013) and creating a standard time-series splitting of
+ data, matbench_genmetrics.mp_time_split enables
+ rigorous evaluation of future discovery performance.
+ The matbench_genmetrics.mp_time_split
+ namespace package provides the following features:
+
+ - downloading and storing snapshots of Materials Project crystal
+   structures via pymatgen (Ong et al., 2013)
+ - modification of pymatgen search criteria to fetch custom datasets
+ - utilities for post-processing Materials Project entries
+ - convenience methods to access the snapshot dataset
+ - predefined scikit-learn TimeSeriesSplit cross-validation splits
+   (Pedregosa et al., 2011)
+
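+ A minimal sketch of loading the snapshot dataset and iterating over
+ the predefined time-series folds is shown below; the module path,
+ keyword names, and the "energy_above_hull" target follow the package
+ documentation at the time of writing and may differ between versions:
+
+ ```python
+ from matbench_genmetrics.mp_time_split.splitter import MPTimeSplit
+
+ # Load the snapshot of Materials Project structures and expose
+ # predefined TimeSeriesSplit folds ordered chronologically.
+ mpt = MPTimeSplit(target="energy_above_hull")
+ mpt.load(dummy=True)  # dummy=True loads a small subset for quick testing
+
+ for fold in mpt.folds:
+     train_inputs, val_inputs, train_outputs, val_outputs = (
+         mpt.get_train_and_val_data(fold)
+     )
+     print(f"fold {fold}: {len(train_inputs)} train, {len(val_inputs)} val")
+ ```
+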
+ In future work, metrics will serve as multi-criteria filters to
+ prevent manipulation. Standalone metrics can be “hacked” by generating
+ nonsensical structures for novelty or including training structures to
+ inflate validity scores. To address this, multiple criteria will be
+ considered simultaneously for each generated structure, such as
+ novelty, uniqueness, and filtering rules like non-overlapping atoms,
+ stoichiometry, or checkCIF criteria
+ (Spek,
+ 2020). Additional filters based on machine learning models can
+ be applied for properties like negative formation energy, energy above
+ hull, ICSD classification, and coordination number. Applying
+ machine-learning-based structural relaxation using M3GNet
+ (Chen
+ & Ong, 2022) (e.g., as in CrysTens
+ (Alverson
+ et al., 2022)) before filtering is also of interest.
+ Contributions related to multi-criteria filtering, enhanced validity
+ filters, and implementing a benchmark submission system and public
+ leaderboard are welcome.
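+
+ As a hypothetical illustration of such multi-criteria filtering (not
+ part of the current package), a generated structure could be required
+ to pass a simple overlapping-atom check and a novelty check before
+ being counted, with the distance threshold chosen for illustration
+ only:
+
+ ```python
+ import numpy as np
+ from pymatgen.analysis.structure_matcher import StructureMatcher
+
+ matcher = StructureMatcher()
+
+
+ def has_no_overlapping_atoms(structure, min_dist=0.5):
+     """Reject structures with any two sites closer than min_dist angstroms."""
+     dists = structure.distance_matrix
+     # Ignore the zero self-distances on the diagonal.
+     off_diagonal = dists[~np.eye(len(structure), dtype=bool)]
+     return off_diagonal.size == 0 or off_diagonal.min() >= min_dist
+
+
+ def passes_filters(structure, training_structures):
+     """Require the structure to be both physically sensible and novel."""
+     is_novel = not any(matcher.fit(structure, ref) for ref in training_structures)
+     return has_no_overlapping_atoms(structure) and is_novel
+ ```
+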
+ We believe that the matbench-genmetrics
+ ecosystem is a robust and easy-to-use benchmarking platform that will
+ help propel novel materials discovery and targeted crystal structure
+ inverse design. We hope that practitioners of crystal structure
+ generative modeling will adopt
+ matbench-genmetrics, contribute improvements
+ and ideas, and submit their results to the planned public
+ leaderboard.
+
+