<?xml version="1.0" encoding="UTF-8"?><!--*** Generated from internal PANGAEA metadata schema by dif.xslt ***--><DIF xsi:schemaLocation="http://gcmd.gsfc.nasa.gov/Aboutus/xml/dif/ http://gcmd.gsfc.nasa.gov/Aboutus/xml/dif/dif_v9.4.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://gcmd.gsfc.nasa.gov/Aboutus/xml/dif/">
<Entry_ID>PANGAEA_980505</Entry_ID>
<Entry_Title>Reference dataset of individual trees from the Tundra-Taiga-Ecotone and Northern boreal forests BorFIT</Entry_Title>
<Data_Set_Citation>
<Dataset_Creator>Kruse, Stefan; Schladebach, Jacob; Broers, Jakob; Hao, Kunyan; Tretton, James; Gorshunova, Anna</Dataset_Creator>
<Dataset_Title>Reference dataset of individual trees from the Tundra-Taiga-Ecotone and Northern boreal forests BorFIT</Dataset_Title>
<Dataset_Release_Date>2026-06-03</Dataset_Release_Date>
<Dataset_Publisher>PANGAEA</Dataset_Publisher>
<Data_Presentation_Form>Dataset</Data_Presentation_Form>
<Online_Resource>https://doi.pangaea.de/10.1594/PANGAEA.980505</Online_Resource>
</Data_Set_Citation>
<Personnel>
<Role>Investigator</Role>
<First_Name>Jacob</First_Name>
<Last_Name>Schladebach</Last_Name>
<Email>jacob.schladebach@awi.de</Email>
</Personnel>
<Discipline>
<Discipline_Name>Earth Science</Discipline_Name>
</Discipline>
<Parameters>
<Detailed_Variable>Event label</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Other event</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Sample code/label</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Plot</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Color description</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Vegetation type</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Major vegetation</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Tree height</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Model</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>LATITUDE</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>LONGITUDE</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Binary Object</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Landform</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Biome</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Location</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Area/locality</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>Proposed International Geo Sample Number</Detailed_Variable>
</Parameters>
<Parameters>
<Detailed_Variable>International Generic Sample Number</Detailed_Variable>
</Parameters>
<ISO_Topic_Category>geoscientificInformation</ISO_Topic_Category>
<Keyword>AK-Land_2023_Alaska_Forests</Keyword>
<Keyword>AK-Land_2024_WAlaska_Forests</Keyword>
<Keyword>boreal forest</Keyword>
<Keyword>CA-Land_2022_NWCanada_Forests</Keyword>
<Keyword>EN21201</Keyword>
<Keyword>EN21201_Lidar</Keyword>
<Keyword>EN21202_Lidar</Keyword>
<Keyword>EN21203_Lidar</Keyword>
<Keyword>EN21204</Keyword>
<Keyword>EN21204_Lidar</Keyword>
<Keyword>EN21205</Keyword>
<Keyword>EN21205_Lidar</Keyword>
<Keyword>EN21207</Keyword>
<Keyword>EN21207_Lidar</Keyword>
<Keyword>EN21209</Keyword>
<Keyword>EN21209_Lidar</Keyword>
<Keyword>EN21210</Keyword>
<Keyword>EN21210_Lidar</Keyword>
<Keyword>EN21211</Keyword>
<Keyword>EN21211_Lidar</Keyword>
<Keyword>EN21212</Keyword>
<Keyword>EN21212_Lidar</Keyword>
<Keyword>EN21213_Lidar</Keyword>
<Keyword>EN21215</Keyword>
<Keyword>EN21215_Lidar</Keyword>
<Keyword>EN21217_Lidar</Keyword>
<Keyword>EN21218</Keyword>
<Keyword>EN21218_Lidar</Keyword>
<Keyword>EN21220</Keyword>
<Keyword>EN21220_Lidar</Keyword>
<Keyword>EN21221</Keyword>
<Keyword>EN21221_Lidar</Keyword>
<Keyword>EN21224</Keyword>
<Keyword>EN21224_Lidar</Keyword>
<Keyword>EN21225</Keyword>
<Keyword>EN21225_Lidar</Keyword>
<Keyword>EN21228</Keyword>
<Keyword>EN21228_Lidar</Keyword>
<Keyword>EN21230</Keyword>
<Keyword>EN21230_Lidar</Keyword>
<Keyword>EN21232_Lidar</Keyword>
<Keyword>EN21233_Lidar</Keyword>
<Keyword>EN21234</Keyword>
<Keyword>EN21234_Lidar</Keyword>
<Keyword>EN21235</Keyword>
<Keyword>EN21235_Lidar</Keyword>
<Keyword>EN21236</Keyword>
<Keyword>EN21236_Lidar</Keyword>
<Keyword>EN21237</Keyword>
<Keyword>EN21237_Lidar</Keyword>
<Keyword>EN21238</Keyword>
<Keyword>EN21238_Lidar</Keyword>
<Keyword>EN21239</Keyword>
<Keyword>EN21239_Lidar</Keyword>
<Keyword>EN21240</Keyword>
<Keyword>EN21240_Lidar</Keyword>
<Keyword>EN21241</Keyword>
<Keyword>EN21241_Lidar</Keyword>
<Keyword>EN21244</Keyword>
<Keyword>EN21244_Lidar</Keyword>
<Keyword>EN21245</Keyword>
<Keyword>EN21245_Lidar</Keyword>
<Keyword>EN21247</Keyword>
<Keyword>EN21247_Lidar</Keyword>
<Keyword>EN21248</Keyword>
<Keyword>EN21248_Lidar</Keyword>
<Keyword>EN21249</Keyword>
<Keyword>EN21249_Lidar</Keyword>
<Keyword>EN21251</Keyword>
<Keyword>EN21251_Lidar</Keyword>
<Keyword>EN21252_Lidar</Keyword>
<Keyword>EN21253_Lidar</Keyword>
<Keyword>EN21255_Lidar</Keyword>
<Keyword>EN21257</Keyword>
<Keyword>EN21257_Lidar</Keyword>
<Keyword>EN21258</Keyword>
<Keyword>EN21258_Lidar</Keyword>
<Keyword>EN21260_Lidar</Keyword>
<Keyword>EN21261</Keyword>
<Keyword>EN21261_Lidar</Keyword>
<Keyword>EN21262</Keyword>
<Keyword>EN21262_Lidar</Keyword>
<Keyword>EN22002</Keyword>
<Keyword>EN22002_Lidar</Keyword>
<Keyword>EN22003</Keyword>
<Keyword>EN22003_Lidar</Keyword>
<Keyword>EN22005</Keyword>
<Keyword>EN22005_Lidar</Keyword>
<Keyword>EN22006</Keyword>
<Keyword>EN22006_Lidar</Keyword>
<Keyword>EN22009</Keyword>
<Keyword>EN22009_Lidar</Keyword>
<Keyword>EN22011</Keyword>
<Keyword>EN22011_Lidar</Keyword>
<Keyword>EN22012</Keyword>
<Keyword>EN22012_Lidar</Keyword>
<Keyword>EN22018</Keyword>
<Keyword>EN22018_Lidar</Keyword>
<Keyword>EN22019</Keyword>
<Keyword>EN22019_Lidar</Keyword>
<Keyword>EN22021</Keyword>
<Keyword>EN22021_Lidar</Keyword>
<Keyword>EN22032</Keyword>
<Keyword>EN22032_Lidar</Keyword>
<Keyword>EN22033</Keyword>
<Keyword>EN22033_Lidar</Keyword>
<Keyword>EN22037</Keyword>
<Keyword>EN22037_Lidar</Keyword>
<Keyword>EN22039</Keyword>
<Keyword>EN22039_Lidar</Keyword>
<Keyword>EN22047</Keyword>
<Keyword>EN22047_Lidar</Keyword>
<Keyword>EN22049</Keyword>
<Keyword>EN22049_Lidar</Keyword>
<Keyword>EN22052</Keyword>
<Keyword>EN22052_Lidar</Keyword>
<Keyword>EN22055</Keyword>
<Keyword>EN22055_Lidar</Keyword>
<Keyword>EN22058</Keyword>
<Keyword>EN22058_Lidar</Keyword>
<Keyword>EN22060</Keyword>
<Keyword>EN22060_Lidar</Keyword>
<Keyword>EN22062</Keyword>
<Keyword>EN22062_Lidar</Keyword>
<Keyword>EN22063</Keyword>
<Keyword>EN22063_Lidar</Keyword>
<Keyword>EN22065</Keyword>
<Keyword>EN22065_Lidar</Keyword>
<Keyword>EN22069</Keyword>
<Keyword>EN22069_Lidar</Keyword>
<Keyword>EN22071</Keyword>
<Keyword>EN22071_Lidar</Keyword>
<Keyword>EN23604_Lidar</Keyword>
<Keyword>EN23608_Lidar</Keyword>
<Keyword>EN23611_Lidar</Keyword>
<Keyword>EN23612_Lidar</Keyword>
<Keyword>EN23614_Lidar</Keyword>
<Keyword>EN23619_Lidar</Keyword>
<Keyword>EN23620</Keyword>
<Keyword>EN23620_Lidar</Keyword>
<Keyword>EN23621_Lidar</Keyword>
<Keyword>EN23622</Keyword>
<Keyword>EN23622_Lidar</Keyword>
<Keyword>EN23634_Lidar</Keyword>
<Keyword>EN23636_Lidar</Keyword>
<Keyword>EN23639_Lidar</Keyword>
<Keyword>EN23644_Lidar</Keyword>
<Keyword>EN23650_Lidar</Keyword>
<Keyword>EN23651_Lidar</Keyword>
<Keyword>EN23661_Lidar</Keyword>
<Keyword>EN23662</Keyword>
<Keyword>EN23662_Lidar</Keyword>
<Keyword>EN23666_Lidar</Keyword>
<Keyword>EN23668_Lidar</Keyword>
<Keyword>EN23675_Lidar</Keyword>
<Keyword>EN23676</Keyword>
<Keyword>EN23676_Lidar</Keyword>
<Keyword>EN23677_Lidar</Keyword>
<Keyword>EN23688</Keyword>
<Keyword>EN23688_Lidar</Keyword>
<Keyword>EN23699_Lidar</Keyword>
<Keyword>EN23700_Lidar</Keyword>
<Keyword>EN24110_Lidar</Keyword>
<Keyword>EN24112</Keyword>
<Keyword>EN24112_Lidar</Keyword>
<Keyword>EN24118_Lidar</Keyword>
<Keyword>EN24124_Lidar</Keyword>
<Keyword>Forest Transect</Keyword>
<Keyword>lidar remote sensing</Keyword>
<Keyword>Reference</Keyword>
<Keyword>RU-Land_2021_Yakutia</Keyword>
<Keyword>Tree segmentation</Keyword>
<Keyword>Unmanned Aerial Vehicle (UAV), DJI Technology Co, Matrice 300 RTK; coupled with Light detection and ranging scanner (LiDAR), YellowScan, Mapper</Keyword>
<Sensor_Name>
<Long_Name>see documentation</Long_Name>
</Sensor_Name>
<Sensor_Name>
<Long_Name>Light detection and ranging scanner (LiDAR), YellowScan, Mapper</Long_Name>
</Sensor_Name>
<Source_Name>
<Long_Name>AWI Arctic Land Expedition</Long_Name>
</Source_Name>
<Temporal_Coverage>
<Start_Date>2021-08-06</Start_Date>
<Stop_Date>2024-07-06</Stop_Date>
</Temporal_Coverage>
<Data_Set_Progress>Complete</Data_Set_Progress>
<Spatial_Coverage>
<Southernmost_Latitude>58.74853844</Southernmost_Latitude>
<Northernmost_Latitude>68.72589969</Northernmost_Latitude>
<Westernmost_Longitude>130.1122653</Westernmost_Longitude>
<Easternmost_Longitude>-121.8371161</Easternmost_Longitude>
</Spatial_Coverage>
<Project>
<Short_Name>AWI_Envi</Short_Name>
<Long_Name>Polar Terrestrial Environmental Systems @ AWI</Long_Name>
</Project>
<Access_Constraints>unrestricted</Access_Constraints>
<Use_Constraints>CC-BY-4.0: Creative Commons Attribution 4.0 International</Use_Constraints>
<Data_Set_Language>English</Data_Set_Language>
<Data_Center>
<Data_Center_Name>
<Short_Name>PANGAEA</Short_Name>
<Long_Name>Data Publisher for Earth &amp; Environmental Science</Long_Name>
</Data_Center_Name>
<Data_Center_URL>https://www.pangaea.de/</Data_Center_URL>
<Personnel>
<Role>Data Center Contact</Role>
<First_Name>Michael</First_Name>
<Last_Name>Diepenbroek</Last_Name>
<Email>info@pangaea.de</Email>
<Contact_Address>
<Address>Leobener Str.</Address>
<City>Bremen</City>
<Province_or_State>Bremen</Province_or_State>
<Postal_Code>28359</Postal_Code>
<Country>Germany</Country>
</Contact_Address>
</Personnel>
</Data_Center>
<Distribution>
<Distribution_Media>online</Distribution_Media>
<Distribution_Size>5072 data points</Distribution_Size>
<Distribution_Format>text/tab-separated-values</Distribution_Format>
</Distribution>
<Reference>Schladebach, Jacob; Heim, Birgit; Enguehard, Léa; Wieczorek, Mareike; Broers, Jakob; Jackisch, Robert; Gloy, Josias; Hao, Kunyan; Tretton, James; Gorshunova, Anna; Kruse, Stefan (preprint): BorFIT: A Novel LiDAR-Based Training Dataset for Individual Tree Segmentation and Species Detection in northern boreal Forests. https://doi.org/10.5194/essd-2025-340</Reference>
<Reference>Kruse, Stefan; Enguehard, Léa; Juday, Glenn; Santosh, Panda; Badola, Anushree; Broers, Jakob; Farkas, Luca; Schladebach, Jacob; Hao, Kunyan; Jackisch, Robert; Döpper, Veronika; Heim, Birgit (2025): Point clouds with ground point classification and individual tree segmentation of 28 northern boreal forest and tundra sites from UAV-based lidar surveys in western and central parts of Alaska in 2024 [dataset]. PANGAEA, https://doi.org/10.1594/PANGAEA.980757</Reference>
<Reference>Kruse, Stefan; Enguehard, Léa; Juday, Glenn; Santosh, Panda; Badola, Anushree; Broers, Jakob; Farkas, Luca; Schladebach, Jacob; Hao, Kunyan; Jackisch, Robert; Döpper, Veronika; Heim, Birgit (2025): Point clouds with ground point classification and individual tree segmentation of 47 northern boreal forest and tundra sites from UAV-based lidar surveys in the eastern part of Alaska in 2023 [dataset]. PANGAEA, https://doi.org/10.1594/PANGAEA.980485</Reference>
<Reference>Kruse, Stefan; Gloy, Josias; Farkas, Luca; Schladebach, Jacob; Hao, Kunyan; Döpper, Veronika; Heim, Birgit (2025): Point clouds with ground point classification and individual tree segmentation of 25 northern boreal forest and tundra sites from UAV-based lidar surveys in northwestern Canada in 2022 [dataset]. PANGAEA, https://doi.org/10.1594/PANGAEA.977771</Reference>
<Reference>Kruse, Stefan; Jackisch, Robert; Gloy, Josias; Farkas, Luca; Schladebach, Jacob; Hao, Kunyan; Heim, Birgit; Kolmogorov, Alexei; Zakharov, Evgenii S; Pestryakova, Luidmila A; Förster, Michael; Kleinschmit, Birgit; Herzschuh, Ulrike (2025): Point clouds with ground point classification and individual tree segmentation of 89 northern boreal forest and tundra sites from UAV-based lidar surveys in Yakutia, Russia in 2021 [dataset]. PANGAEA, https://doi.org/10.1594/PANGAEA.980735</Reference>
<Reference>Schladebach, Jacob; Kruse, Stefan (2025): Product Guide -  BorFIT: A Novel LiDAR-Based Training Dataset for Individual Tree Segmentation and Species Detection in northern boreal Forests. https://download.pangaea.de/reference/133868/attachments/Product%20Guide.pdf</Reference>
<Reference>Kruse, Stefan (2025): Manually assigned training data las files [dataset]. https://store.pangaea.de/Publications/Kruse_et_al_2025_BorFIT-training-data.zip</Reference>
<Summary>BorFIT is a comprehensive training dataset that aims at enhancing the segmentation of individual trees and species detection from LiDAR point clouds, specifically in boreal forests. This dataset comprises 385 LiDAR point clouds, each covering an area of 20×20 m² and containing up to 200 manually segmented trees. The data was collected from 145 sites across Yakutia, Canada, and Alaska between 2021 and 2024, strategically chosen to represent a bioclimatic gradient across the circumboreal region. The LiDAR surveys utilized a YellowScan LiDAR Mapper+ mounted on a UAV which surveyed the areas at an altitude of 70 m achieving an average point density of 1200 points/m² over an area of approximately 50×500 m². Up to 4 reference plots (depending on data quality and performed forest inventories) per point cloud were extracted, based on present tree heights to generate a representative subset of the original point cloud. Manual segmentation of trees was performed using the software CloudCompare. Based on these, a training data set for a randomForest classifier was prepared by assigning the species determination for a subset of individual trees per present species. The classifiers were then trained based on structural parameters from the point cloud, and if available, spectral information based on RGB imagery (CA, AK). Four classifiers were then utilized to predict the species of all segmented trees within the data set. The number-coded species prediction was added to a new scalar field in the point clouds including a probability value as an indicator for prediction accuracy. The dataset encompasses various mostly northern boreal tree species, including Picea glauca, Picea mariana, Betula spp., and Larix laricina, among others. This diversity supports the analysis of species distribution and stand structure, crucial for understanding vegetation dynamics in response to climate change. 
The dataset's design not only addresses the limitations of existing AI-supported detection methods but also serves as a foundational resource for future research into boreal forest dynamics under global warming scenarios. ** For all details see the full metadata description at "https://doi.pangaea.de/10.1594/PANGAEA.980505"! ** Funding: The project was supported through DataHub Information Infrastructure funds, project BorFIT

Data: The *.laz files contain points with the following attributes: a. Tree; b. Species; c. Classification; d. Intensity; e. Return Number; f. Number of Returns; g. User Data; h. Synthetic Flag; i. Point Source ID; j. GPS Time</Summary>
<Related_URL>
<URL>http://en.wikipedia.org/wiki/ISO_6709</URL>
<Description>LATITUDE</Description>
</Related_URL>
<Related_URL>
<URL>http://en.wikipedia.org/wiki/ISO_6709</URL>
<Description>LONGITUDE</Description>
</Related_URL>
<Related_URL>
<URL>http://www.igsn.org/</URL>
<Description>International Generic Sample Number</Description>
</Related_URL>
<Related_URL>
<URL>https://doi.org/10.5194/essd-2025-340</URL>
<Description>BorFIT: A Novel LiDAR-Based Training Dataset for Individual Tree Segmentation and Species Detection in northern boreal Forests</Description>
</Related_URL>
<Related_URL>
<URL>https://doi.pangaea.de/10.1594/PANGAEA.977771</URL>
<Description>Point clouds with ground point classification and individual tree segmentation of 25 northern boreal forest and tundra sites from UAV-based lidar surveys in northwestern Canada in 2022</Description>
</Related_URL>
<Related_URL>
<URL>https://doi.pangaea.de/10.1594/PANGAEA.980485</URL>
<Description>Point clouds with ground point classification and individual tree segmentation of 47 northern boreal forest and tundra sites from UAV-based lidar surveys in the eastern part of Alaska in 2023</Description>
</Related_URL>
<Related_URL>
<URL>https://doi.pangaea.de/10.1594/PANGAEA.980735</URL>
<Description>Point clouds with ground point classification and individual tree segmentation of 89 northern boreal forest and tundra sites from UAV-based lidar surveys in Yakutia, Russia in 2021</Description>
</Related_URL>
<Related_URL>
<URL>https://doi.pangaea.de/10.1594/PANGAEA.980757</URL>
<Description>Point clouds with ground point classification and individual tree segmentation of 28 northern boreal forest and tundra sites from UAV-based lidar surveys in western and central parts of Alaska in 2024</Description>
</Related_URL>
<Related_URL>
<URL>https://en.wikipedia.org/wiki/Biome</URL>
<Description>Biome</Description>
</Related_URL>
<Related_URL>
<URL>https://store.pangaea.de/Publications/Kruse_et_al_2025_BorFIT-training-data.zip</URL>
<Description>Manually assigned training data las files</Description>
</Related_URL>
<Related_URL>
<URL>https://www.awi.de/en/science/geosciences/polar-terrestrial-environmental-systems.html</URL>
<Description>AWI_Envi</Description>
</Related_URL>
<Metadata_Name>DIF</Metadata_Name>
<Metadata_Version>9.4</Metadata_Version>
<DIF_Creation_Date>2026-06-03</DIF_Creation_Date>
<Last_DIF_Revision_Date>2026-06-03</Last_DIF_Revision_Date>
</DIF>
