% IMPORTANT: The following is UTF-8 encoded.  This means that in the presence
% of non-ASCII characters, it will not work with BibTeX 0.99 or older.
% Instead, you should use an up-to-date BibTeX implementation like “bibtex8” or
% “biber”.

% Conference contribution (inproceedings entry) for the DataLad / CRC 1451
% presentation at the INCF Neuroinformatics Assembly 2023.
%
% Notes for maintainers:
%   - booktitle carries the conference name (required for this entry type);
%     venue and eventdate are biblatex fields and are silently ignored by
%     classic BibTeX styles.
%   - year and month give the publication date in the form both bibtex8 and
%     biber accept; month uses the bare predefined macro so styles can
%     abbreviate or localise it.
%   - reportid, subtyp, cin, cid, pnm, pid and typ are non-standard fields
%     (presumably identifiers from the repository named in url -- confirm
%     before relying on them); standard styles ignore unknown fields.
%   - Values contain UTF-8 characters; see the encoding note at the top of
%     this file.
@inproceedings{Szczepanik:1019189,
      author       = {Szczepanik, Michał and Heunis, Stephan and Mönch,
                      Christian and Wagner, Adina and Waite, Alexander Q. and
                      Waite, Laura and Hanke, Michael},
      title        = {Distributed data management for large collaborative
                      projects: {DataLad} ecosystem in {Collaborative}
                      {Research} {Center} 1451},
      booktitle    = {{INCF} Neuroinformatics Assembly 2023},
      venue        = {online (Sweden)},
      eventdate    = {2023-09-18/2023-09-20},
      year         = {2023},
      month        = sep,
      reportid     = {FZJ-2023-05235},
      abstract     = {Multi-site research projects offer a unique opportunity for
                      scientific insight based on data collected across different
                      modalities, paradigms, and species. Yet, they also pose
                      unique research data management challenges. Here, we present
                      software developments and lessons learned from the
                      information management project of CRC1451. Given the large
                      variability of RDM demands across over 20 CRC member
                      projects, we opted for a decentralized approach: Projects
                      retain full control over key data management decisions
                      (standards, storage, sharing), and the findability,
                      accessibility, interoperability, and reusability of their
                      data is achieved with DataLad as an overlay structure for
                      all distributed datasets. We use DataLad Catalog to generate
                      an online data portal based on metadata. Metadata extraction
                      is done using MetaLad, based on the 'capture immediately,
                      curate perpetually' iterative approach. To mitigate
                      DataLad’s limited adoption outside central projects, we
                      are developing two solutions. First, DataLad Gooey is a
                      graphical user interface for basic data management
                      operations. Second, DataLad Tabby is a format specification
                      and a collection of tools for dataset descriptions which can
                      be created and provided as a spreadsheet, using well-defined
                      terms, translatable to catalog records and linked data
                      objects.},
      subtyp       = {After Call},
      cin          = {INM-7},
      cid          = {I:(DE-Juel1)INM-7-20090406},
      pnm          = {5254 - Neuroscientific Data Analytics and AI (POF4-525) /
                      SFB 1451 INF - Datenmanagement für computergestützte
                      Modellierung (INF) (458705875)},
      pid          = {G:(DE-HGF)POF4-5254 / G:(GEPRIS)458705875},
      typ          = {PUB:(DE-HGF)24},
      doi          = {10.5281/ZENODO.8355962},
      url          = {https://juser.fz-juelich.de/record/1019189},
}