<?xml version="1.0" encoding="UTF-8"?><resource xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.3/metadata.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://datacite.org/schema/kernel-4"><identifier identifierType="URL">https://doi.pangaea.de/10.1594/PANGAEA.980505</identifier><creators><creator><creatorName>Kruse, Stefan</creatorName><givenName>Stefan</givenName><familyName>Kruse</familyName><nameIdentifier schemeURI="http://orcid.org/" nameIdentifierScheme="ORCID">0000-0003-1107-1958</nameIdentifier><affiliation affiliationIdentifierScheme="ROR" affiliationIdentifier="https://ror.org/032e6b942">Alfred Wegener Institute, Helmholtz Centre for Polar and Marine Research, Potsdam</affiliation></creator><creator><creatorName>Schladebach, Jacob</creatorName><givenName>Jacob</givenName><familyName>Schladebach</familyName><affiliation affiliationIdentifierScheme="ROR" affiliationIdentifier="https://ror.org/032e6b942">Alfred Wegener Institute, Helmholtz Centre for Polar and Marine Research, Potsdam</affiliation></creator><creator><creatorName>Broers, Jakob</creatorName><givenName>Jakob</givenName><familyName>Broers</familyName><affiliation affiliationIdentifierScheme="ROR" affiliationIdentifier="https://ror.org/032e6b942">Alfred Wegener Institute, Helmholtz Centre for Polar and Marine Research, Potsdam</affiliation></creator><creator><creatorName>Hao, Kunyan</creatorName><givenName>Kunyan</givenName><familyName>Hao</familyName><affiliation affiliationIdentifierScheme="ROR" affiliationIdentifier="https://ror.org/032e6b942">Alfred Wegener Institute, Helmholtz Centre for Polar and Marine Research, Potsdam</affiliation></creator><creator><creatorName>Tretton, James</creatorName><givenName>James</givenName><familyName>Tretton</familyName></creator><creator><creatorName>Gorshunova, Anna</creatorName><givenName>Anna</givenName><familyName>Gorshunova</familyName></creator></creators><titles><title>Reference 
dataset of individual trees from the Tundra-Taiga-Ecotone and Northern boreal forests BorFIT</title></titles><publisher>PANGAEA</publisher><publicationYear>2026</publicationYear><subjects><subject>boreal forest</subject><subject>Forest Transect</subject><subject>lidar remote sensing</subject><subject>Reference</subject><subject>Tree segmentation</subject><subject subjectScheme="Parameter">Event label</subject><subject subjectScheme="Parameter">Other event</subject><subject subjectScheme="Parameter">Sample code/label</subject><subject subjectScheme="Parameter">Plot</subject><subject subjectScheme="Parameter">Color description</subject><subject subjectScheme="Parameter">Vegetation type</subject><subject subjectScheme="Parameter">Major vegetation</subject><subject subjectScheme="Parameter">Tree height</subject><subject subjectScheme="Parameter">Model</subject><subject subjectScheme="Parameter">LATITUDE</subject><subject subjectScheme="Parameter">LONGITUDE</subject><subject subjectScheme="Parameter">Binary Object</subject><subject subjectScheme="Parameter">Landform</subject><subject subjectScheme="Parameter">Biome</subject><subject subjectScheme="Parameter">Location</subject><subject subjectScheme="Parameter">Area/locality</subject><subject subjectScheme="Parameter">Proposed International Geo Sample Number</subject><subject subjectScheme="Parameter">International Generic Sample Number</subject><subject subjectScheme="Method">Unmanned Aerial Vehicle (UAV), DJI Technology Co, Matrice 300 RTK; coupled with Light detection and ranging scanner (LiDAR), YellowScan, Mapper</subject><subject subjectScheme="Method">see documentation</subject><subject subjectScheme="Method">Light detection and ranging scanner (LiDAR), YellowScan, Mapper</subject><subject subjectScheme="Campaign">RU-Land_2021_Yakutia</subject><subject subjectScheme="Campaign">CA-Land_2022_NWCanada_Forests</subject><subject subjectScheme="Campaign">AK-Land_2023_Alaska_Forests</subject><subject 
subjectScheme="Campaign">AK-Land_2024_WAlaska_Forests</subject><subject subjectScheme="Basis">AWI Arctic Land Expedition</subject><subject subjectScheme="Project">Polar Terrestrial Environmental Systems @ AWI (AWI_Envi)</subject></subjects><dates><date dateType="Collected">2021-08-06T00:00:00/2024-07-06T00:00:00</date></dates><resourceType resourceTypeGeneral="Dataset">Dataset</resourceType><relatedIdentifiers><relatedIdentifier relatedIdentifierType="DOI" relationType="IsSupplementTo">10.5194/essd-2025-340</relatedIdentifier><relatedIdentifier relatedIdentifierType="DOI" relationType="IsDerivedFrom">10.1594/PANGAEA.980757</relatedIdentifier><relatedIdentifier relatedIdentifierType="DOI" relationType="IsDerivedFrom">10.1594/PANGAEA.980485</relatedIdentifier><relatedIdentifier relatedIdentifierType="DOI" relationType="IsDerivedFrom">10.1594/PANGAEA.977771</relatedIdentifier><relatedIdentifier relatedIdentifierType="DOI" relationType="IsDerivedFrom">10.1594/PANGAEA.980735</relatedIdentifier><relatedIdentifier relatedIdentifierType="URL" relationType="IsDocumentedBy">https://store.pangaea.de/Publications/Kruse_et_al_2025_BorFIT-training-data.zip</relatedIdentifier></relatedIdentifiers><sizes><size>5072 data points</size></sizes><formats><format>text/tab-separated-values</format></formats><rightsList><rights rightsURI="https://creativecommons.org/licenses/by/4.0/" schemeURI="https://spdx.org/licenses/" rightsIdentifierScheme="SPDX" rightsIdentifier="CC-BY-4.0">Creative Commons Attribution 4.0 International</rights></rightsList><descriptions><description descriptionType="Abstract">BorFIT is a comprehensive training dataset that aims at enhancing the segmentation of individual trees and species detection from LiDAR point clouds, specifically in boreal forests. This dataset comprises 385 LiDAR point clouds, each covering an area of 20×20 m² and containing up to 200 manually segmented trees. 
The data was collected from 145 sites across Yakutia, Canada, and Alaska between 2021 and 2024, strategically chosen to represent a bioclimatic gradient across the circumboreal region. The LiDAR surveys utilized a YellowScan LiDAR Mapper+ mounted on a UAV, which surveyed the areas at an altitude of 70 m, achieving an average point density of 1200 points/m² over an area of approximately 50×500 m². Up to 4 reference plots (depending on data quality and performed forest inventories) per point cloud were extracted, based on present tree heights, to generate a representative subset of the original point cloud. Manual segmentation of trees was performed using the software CloudCompare. Based on these, a training data set for a randomForest classifier was prepared by assigning the species determination for a subset of individual trees per present species. The classifiers were then trained based on structural parameters from the point cloud and, if available, spectral information based on RGB imagery (CA, AK). Four classifiers were then utilized to predict the species of all segmented trees within the data set. The number-coded species prediction was added to a new scalar field in the point clouds, including a probability value as an indicator for prediction accuracy. The dataset encompasses various, mostly northern, boreal tree species, including Picea glauca, Picea mariana, Betula spp., and Larix laricina, among others. This diversity supports the analysis of species distribution and stand structure, crucial for understanding vegetation dynamics in response to climate change. 
The dataset's design not only addresses the limitations of existing AI-supported detection methods but also serves as a foundational resource for future research into boreal forest dynamics under global warming scenarios.</description><description descriptionType="TechnicalInfo">Funding: The project was supported  through DataHub Information Infrastructure funds, project BorFIT<br/><br/>Data: The *.laz files  contain points with the following attributes: a. Tree; b. Species; c. Classification; d. Intensity; e. Return Number; f. Number of Returns; g. User Data; h. Synthetic Flag; i. Point Source ID; j. GPS Time</description></descriptions><geoLocations><geoLocation><geoLocationBox><westBoundLongitude>130.1122653</westBoundLongitude><eastBoundLongitude>-121.8371161</eastBoundLongitude><southBoundLatitude>58.74853844</southBoundLatitude><northBoundLatitude>68.72589969</northBoundLatitude></geoLocationBox></geoLocation><geoLocation><geoLocationPlace>Yukon, Canada</geoLocationPlace></geoLocation><geoLocation><geoLocationPlace>Northwest Territories, Canada</geoLocationPlace></geoLocation><geoLocation><geoLocationPlace>British Columbia, Canada</geoLocationPlace></geoLocation><geoLocation><geoLocationPlace>Alaska Interior, USA</geoLocationPlace></geoLocation><geoLocation><geoLocationPlace>Southcentral Alaska, USA</geoLocationPlace></geoLocation></geoLocations><fundingReferences><fundingReference><funderName>Ministerium für Wissenschaft, Forschung und Kultur</funderName><funderIdentifier funderIdentifierType="Crossref Funder ID">https://doi.org/10.13039/501100004581</funderIdentifier><awardNumber>F221-08-AWI/001/002</awardNumber></fundingReference></fundingReferences></resource>