@article{BornheimGriegerBlanecketal.2024, author = {Bornheim, Tobias and Grieger, Niklas and Blaneck, Patrick Gustav and Bialonski, Stephan}, title = {Speaker Attribution in German Parliamentary Debates with QLoRA-adapted Large Language Models}, series = {Journal for language technology and computational linguistics : JLCL}, volume = {37}, journal = {Journal for language technology and computational linguistics : JLCL}, number = {1}, publisher = {Gesellschaft f{\"u}r Sprachtechnologie und Computerlinguistik}, address = {Regensburg}, issn = {2190-6858}, doi = {10.21248/jlcl.37.2024.244}, pages = {13 Seiten}, year = {2024}, abstract = {The growing body of political texts opens up new opportunities for rich insights into political dynamics and ideologies but also increases the workload for manual analysis. Automated speaker attribution, which detects who said what to whom in a speech event and is closely related to semantic role labeling, is an important processing step for computational text analysis. We study the potential of the large language model family Llama 2 to automate speaker attribution in German parliamentary debates from 2017-2021. We fine-tune Llama 2 with QLoRA, an efficient training strategy, and observe our approach to achieve competitive performance in the GermEval 2023 Shared Task On Speaker Attribution in German News Articles and Parliamentary Debates. Our results shed light on the capabilities of large language models in automating speaker attribution, revealing a promising avenue for computational analysis of political discourse and the development of semantic role labeling systems.}, language = {en} } @article{HaegerJolmesOyenetal.2024, author = {Haeger, Gerrit and Jolmes, Tristan and Oyen, Sven and Jaeger, Karl-Erich and Bongaerts, Johannes and Sch{\"o}rken, Ulrich and Siegert, Petra}, title = {Novel recombinant aminoacylase from Paraburkholderia monticola capable of N-acyl-amino acid synthesis}, series = {Applied Microbiology and Biotechnology}, journal = {Applied Microbiology and Biotechnology}, number = {108}, publisher = {Springer}, address = {Berlin}, issn = {1432-0614}, doi = {10.1007/s00253-023-12868-8}, pages = {14 Seiten}, year = {2024}, abstract = {N-Acyl-amino acids can act as mild biobased surfactants, which are used, e.g., in baby shampoos. However, their chemical synthesis needs acyl chlorides and does not meet sustainability criteria. Thus, the identification of biocatalysts to develop greener synthesis routes is desirable. We describe a novel aminoacylase from Paraburkholderia monticola DSM 100849 (PmAcy) which was identified, cloned, and evaluated for its N-acyl-amino acid synthesis potential. Soluble protein was obtained by expression in lactose autoinduction medium and co-expression of molecular chaperones GroEL/S. Strep-tag affinity purification enriched the enzyme 16-fold and yielded 15 mg pure enzyme from 100 mL of culture. Biochemical characterization revealed that PmAcy possesses beneficial traits for industrial application like high temperature and pH-stability. A heat activation of PmAcy was observed upon incubation at temperatures up to 80 °C. Hydrolytic activity of PmAcy was detected with several N-acyl-amino acids as substrates and exhibited the highest conversion rate of 773 U/mg with N-lauroyl-L-alanine at 75 °C. The enzyme preferred long-chain acyl-amino-acids and displayed hardly any activity with acetyl-amino acids. PmAcy was also capable of N-acyl-amino acid synthesis with good conversion rates. The best synthesis results were obtained with the cationic L-amino acids L-arginine and L-lysine as well as with L-leucine and L-phenylalanine. Exemplarily, L-phenylalanine was acylated with fatty acids of chain lengths from C8 to C18 with conversion rates of up to 75\%. N-lauroyl-L-phenylalanine was purified by precipitation, and the structure of the reaction product was verified by LC-MS and NMR.}, language = {en} }