<?xml version="1.0" encoding="UTF-8"?>
<!--
  DDI Codebook 2.5 metadata record for the dataset
  "KSC - Observational Data Clustering Preprocessor"
  (doi:10.26165/JUELICH-DATA/GLTKXZ), distributed by Jülich DATA.

  Layout:
    docDscr  : citation of this metadata document itself
    stdyDscr : citation, subject/abstract, access terms and related
               publications of the described dataset

  Whitespace note: indentation is used between elements only. The text of
  the abstract (its line breaks and carriage-return character references)
  is content, so it is deliberately left unindented.
-->
<codeBook xmlns="ddi:codebook:2_5"
          xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xsi:schemaLocation="ddi:codebook:2_5 https://ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd"
          version="2.5">
  <!-- Description of the metadata document. -->
  <docDscr>
    <citation>
      <titlStmt>
        <titl>KSC - Observational Data Clustering Preprocessor</titl>
        <IDNo agency="DOI">doi:10.26165/JUELICH-DATA/GLTKXZ</IDNo>
      </titlStmt>
      <distStmt>
        <distrbtr source="archive">Jülich DATA</distrbtr>
        <distDate>2025-12-04</distDate>
      </distStmt>
      <verStmt source="DVN">
        <version date="2025-12-04" type="RELEASED">1</version>
      </verStmt>
      <!-- Author list uses "Family, Given" separated by semicolons; keep it in sync with the AuthEnty entries below. -->
      <biblCit>Hermanns, Alexander; Lange, Anne Caroline; Fuchs, Hendrik; Kowalski, Julia; Franke, Philipp, 2025, "KSC - Observational Data Clustering Preprocessor", https://doi.org/10.26165/JUELICH-DATA/GLTKXZ, Jülich DATA, V1</biblCit>
    </citation>
  </docDscr>
  <!-- Description of the dataset ("study"). -->
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl>KSC - Observational Data Clustering Preprocessor</titl>
        <IDNo agency="DOI">doi:10.26165/JUELICH-DATA/GLTKXZ</IDNo>
      </titlStmt>
      <rspStmt>
        <AuthEnty affiliation="Forschungszentrum Jülich">Hermanns, Alexander</AuthEnty>
        <AuthEnty affiliation="Forschungszentrum Jülich">Lange, Anne Caroline</AuthEnty>
        <AuthEnty affiliation="Forschungszentrum Jülich">Fuchs, Hendrik</AuthEnty>
        <AuthEnty affiliation="RWTH Aachen University">Kowalski, Julia</AuthEnty>
        <!-- Same person as the contact/depositor below; spelled identically ("Franke, Philipp"). -->
        <AuthEnty affiliation="Forschungszentrum Jülich">Franke, Philipp</AuthEnty>
      </rspStmt>
      <prodStmt/>
      <distStmt>
        <distrbtr source="archive">Jülich DATA</distrbtr>
        <contact affiliation="Forschungszentrum Jülich" email="p.franke@fz-juelich.de">Franke, Philipp</contact>
        <depositr>Franke, Philipp</depositr>
        <depDate>2025-12-03</depDate>
      </distStmt>
    </citation>
    <stdyInfo>
      <subject>
        <keyword>Earth and Environmental Sciences</keyword>
        <keyword>K-Mean</keyword>
        <keyword>air quality</keyword>
        <keyword>clustering</keyword>
        <keyword>Data assimilation</keyword>
      </subject>
      <!-- Abstract text is content: do not re-indent or reflow the lines between the tags. -->
      <abstract date="2025-12-03">Preprocessing routine for ground-based atmospheric monitoring network data. 
Utilizing a k-means soft constrained clustering algorithm to derive a representative sub-sampling of the available data into an assimilation and validation set. &#xd;
&#xd;
This work was partially performed as part of the Helmholtz School for Data Science in Life, Earth and Energy (HDS-LEE) and received funding from the Helmholtz Association of German Research Centres.</abstract>
      <sumDscr/>
    </stdyInfo>
    <method>
      <dataColl>
        <sources/>
      </dataColl>
      <anlyInfo/>
    </method>
    <dataAccs>
      <!-- Terms of use attached to the dataset. -->
      <notes type="DVN:TOU" level="dv">CC0 Waiver</notes>
      <setAvail/>
      <useStmt/>
    </dataAccs>
    <!-- Related publications: the archived code release and the accompanying journal article. -->
    <othrStdyMat>
      <relPubl>
        <citation>
          <titlStmt>
            <IDNo agency="doi">https://doi.org/10.5281/zenodo.14711881</IDNo>
          </titlStmt>
          <biblCit>Hermanns, A.: KSC – Observational Data Clustering Preprocessor, Zenodo [code], https://doi.org/10.5281/zenodo.14711881, 2025.</biblCit>
        </citation>
        <ExtLink URI="https://doi.org/10.5281/zenodo.14711881"/>
      </relPubl>
      <relPubl>
        <citation>
          <titlStmt>
            <IDNo agency="doi">https://doi.org/10.5194/gmd-18-9417-2025</IDNo>
          </titlStmt>
          <biblCit>Hermanns, A., Lange, A. C., Kowalski, J., Fuchs, H., and Franke, P.: Data clustering to optimise the representativity of observational data in air quality data assimilation: a case study with EURAD-IM (version 5.9.1 DA), Geosci. Model Dev., 18, 9417–9432, https://doi.org/10.5194/gmd-18-9417-2025, 2025.</biblCit>
        </citation>
        <ExtLink URI="https://doi.org/10.5194/gmd-18-9417-2025"/>
      </relPubl>
    </othrStdyMat>
  </stdyDscr>
</codeBook>