@inproceedings{KorfmannBeyersdorfferM{\"u}nchetal.2024, author = {Korfmann, Robin and Beyersdorffer, Patrick and M{\"u}nch, J{\"u}rgen and Kuhrmann, Marco}, title = {Using data augmentation to support AI-based requirements evaluation in large-scale projects}, booktitle = {Systems, Software and Services Process Improvement : 31st European Conference, EuroSPI 2024, Munich, Germany, September 4-6, 2024, Proceedings, Part I}, editor = {Yilmaz, Murat and Clarke, Paul and Riel, Andreas and Messnarz, Richard and Greiner, Christian and Peisl, Thomas}, isbn = {978-3-031-71138-1}, issn = {1865-0929}, doi = {10.1007/978-3-031-71139-8_7}, institution = {Informatik}, pages = {97 -- 111}, year = {2024}, abstract = {Natural language processing (NLP) offers the potential to automate quality assurance of software requirement specifications. Especially large-scale projects involving numerous suppliers can benefit from this improvement. However, due to privacy restrictions and domain- and project-specific vocabulary, as such in the aerospace domain, the availability of SRS documents for training NLP tools is severely limited. To provide a sufficient amount of data, we studied algorithms for the augmentation of textual data. Four algorithms have been studied by expanding a given set of requirements from European Space projects generating correct and incorrect requirements. The study yielded data of poor quality due to insufficient accuracy caused by the domain-specific vocabulary, yet, laid the foundation for the algorithms improvement, which, eventually, resulted in an increased set of requirements, which is 20 times the size of the seed set. Finally, an explorative experiment demonstrated the usability of augmented requirements to support AI-based quality assurance.}, language = {en} }