<?xml version="1.0" encoding="UTF-8"?>
<!--
  DataCite (kernel-4) metadata record for DOI 10.26165/JUELICH-DATA/GLTKXZ,
  "KSC - Observational Data Clustering Preprocessor".

  Attribute names are case-sensitive: the DataCite schema defines "schemeURI"
  (lower-case "s") on nameIdentifier and relatedIdentifier.
-->
<resource xmlns="http://datacite.org/schema/kernel-4"
          xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.1/metadata.xsd">
  <identifier identifierType="DOI">10.26165/JUELICH-DATA/GLTKXZ</identifier>
  <!-- Each creator follows the same layout: "Family, Given" display name,
       split name parts, ORCID iD, affiliation. -->
  <creators>
    <creator>
      <creatorName nameType="Personal">Hermanns, Alexander</creatorName>
      <givenName>Alexander</givenName>
      <familyName>Hermanns</familyName>
      <nameIdentifier schemeURI="https://orcid.org/" nameIdentifierScheme="ORCID">0009-0007-9974-4307</nameIdentifier>
      <affiliation>Forschungszentrum Jülich</affiliation>
    </creator>
    <creator>
      <creatorName nameType="Personal">Lange, Anne Caroline</creatorName>
      <givenName>Anne Caroline</givenName>
      <familyName>Lange</familyName>
      <nameIdentifier schemeURI="https://orcid.org/" nameIdentifierScheme="ORCID">0000-0001-8027-5933</nameIdentifier>
      <affiliation>Forschungszentrum Jülich</affiliation>
    </creator>
    <creator>
      <creatorName nameType="Personal">Fuchs, Hendrik</creatorName>
      <givenName>Hendrik</givenName>
      <familyName>Fuchs</familyName>
      <nameIdentifier schemeURI="https://orcid.org/" nameIdentifierScheme="ORCID">0000-0003-1263-0061</nameIdentifier>
      <affiliation>Forschungszentrum Jülich</affiliation>
    </creator>
    <creator>
      <creatorName nameType="Personal">Kowalski, Julia</creatorName>
      <givenName>Julia</givenName>
      <familyName>Kowalski</familyName>
      <nameIdentifier schemeURI="https://orcid.org/" nameIdentifierScheme="ORCID">0000-0003-4123-5896</nameIdentifier>
      <affiliation>RWTH Aachen University</affiliation>
    </creator>
    <creator>
      <!-- Name parts match the ContactPerson contributor entry below. -->
      <creatorName nameType="Personal">Franke, Philipp</creatorName>
      <givenName>Philipp</givenName>
      <familyName>Franke</familyName>
      <nameIdentifier schemeURI="https://orcid.org/" nameIdentifierScheme="ORCID">0000-0001-6298-164X</nameIdentifier>
      <affiliation>Forschungszentrum Jülich</affiliation>
    </creator>
  </creators>
  <titles>
    <title>KSC - Observational Data Clustering Preprocessor</title>
  </titles>
  <publisher>Jülich DATA</publisher>
  <publicationYear>2025</publicationYear>
  <subjects>
    <subject>Earth and Environmental Sciences</subject>
    <subject>K-Mean</subject>
    <subject>air quality</subject>
    <subject>clustering</subject>
    <subject>Data assimilation</subject>
  </subjects>
  <contributors>
    <contributor contributorType="ContactPerson">
      <contributorName nameType="Personal">Franke, Philipp</contributorName>
      <givenName>Philipp</givenName>
      <familyName>Franke</familyName>
      <affiliation>Forschungszentrum Jülich</affiliation>
    </contributor>
  </contributors>
  <dates>
    <date dateType="Submitted">2025-12-03</date>
    <date dateType="Updated">2025-12-04</date>
  </dates>
  <resourceType resourceTypeGeneral="Dataset"/>
  <relatedIdentifiers>
    <relatedIdentifier relationType="IsCitedBy" schemeURI="https://doi.org/" relatedIdentifierType="DOI">10.5281/zenodo.14711881</relatedIdentifier>
    <relatedIdentifier relationType="IsCitedBy" schemeURI="https://doi.org/" relatedIdentifierType="DOI">10.5194/gmd-18-9417-2025</relatedIdentifier>
  </relatedIdentifiers>
  <version>1.0</version>
  <rightsList>
    <rights rightsURI="info:eu-repo/semantics/openAccess"/>
    <rights rightsURI="https://creativecommons.org/publicdomain/zero/1.0/">CC0 Waiver</rights>
  </rightsList>
  <descriptions>
    <!-- Whitespace inside the description is part of the text: do not
         re-indent its continuation lines. The blank line separates the
         abstract from the funding acknowledgement. -->
    <description descriptionType="Abstract">Preprocessing routine for ground-based atmospheric monitoring network data. Utilizing a k-means soft constrained clustering algorithm to derive a representative sub-sampling of the available data into an assimilation and validation set. &#xd;
&#xd;
This work was partially performed as part of the Helmholtz School for Data Science in Life, Earth and Energy (HDS-LEE) and received funding from the Helmholtz Association of German Research Centres.</description>
  </descriptions>
  <geoLocations/>
</resource>