import re
# Matches a chain of two or more mass amounts separated by "/", e.g.
# "5 mg/10 mg" or "120 mg /-20 g /-12mg".
#   * each amount is digits, optionally followed by "."/"," separated digit
#     groups, then optional whitespace and the unit "g" or "mg";
#   * each amount may be preceded by a "-";
#   * a lone amount with no "/" continuation (e.g. "10mg") does NOT match,
#     because the "/ amount" group is required at least once.
# All groups are non-capturing so that findall() yields the full match text.
pattern = r"-?\b\d+(?:[.,]\d+)*\s*m?g(?:\s*/\s*-?\d+(?:[.,]\d+)*\s*m?g)+\b"

# Compiled once so the loop below does not repeat the pattern lookup.
_DOSE_CHAIN_RE = re.compile(pattern)
# Runs of whitespace and/or hyphens that are removed from every match.
_NOISE_RE = re.compile(r"[\s-]+")


def extract_dose_chains(text: str) -> list:
    """Return every "/"-separated dose chain found in *text*, normalised.

    Normalisation deletes all whitespace and all hyphens from each match,
    so "120 mg /-20 g /-12mg" becomes "120mg/20g/12mg".  Note that this also
    drops a "-" directly in front of a number, i.e. any sign is lost.

    Args:
        text: Free text to scan.

    Returns:
        The normalised matches in order of appearance; an empty list when
        the text contains no dose chain.
    """
    return [_NOISE_RE.sub("", found) for found in _DOSE_CHAIN_RE.findall(text)]


# Sample inputs used to demonstrate the pattern.
strings = [
    "Dexamethasonacetat 5 mg/10 mg, Lidocain-HCl 1H2O 30 mg/60 mg",
    "Anakinra 120 mg /-20 g /-12mg gentechnologisch hergestellt aus E. coli. 10mg pack",
]

# Print the normalised dose chains of each sample, one list per line.
for s in strings:
    print(extract_dose_chains(s))
aW1wb3J0IHJlCgpwYXR0ZXJuID0gciItP1xiXGQrKD86Wy4sXVxkKykqXHMqbT9nKD86XHMqL1xzKi0/XGQrKD86Wy4sXVxkKykqXHMqbT9nKStcYiIKCnN0cmluZ3MgPSBbCiAgICAiRGV4YW1ldGhhc29uYWNldGF0IDUgbWcvMTAgbWcsIExpZG9jYWluLUhDbCAxSDJPIDMwIG1nLzYwIG1nIiwKICAgICJBbmFraW5yYSAxMjAgbWcgLy0yMCBnIC8tMTJtZyBnZW50ZWNobm9sb2dpc2NoIGhlcmdlc3RlbGx0IGF1cyBFLiBjb2xpLiAxMG1nIHBhY2siCl0KCmZvciBzIGluIHN0cmluZ3M6CiAgICBwcmludChbcmUuc3ViKHIiW1xzLV0rIiwgIiIsIG0pIGZvciBtIGluIHJlLmZpbmRhbGwocGF0dGVybiwgcyldKQ==