fork download
  1. import re
  2. pattern = re.compile( r'^((?=.*,)[^,]+|\S+)[\s,]+(.*)' )
  3. texts = [">Keratyna 5, egzon 2, Homo sapiens", ">101m_A mol:protein length:154 MYOGLOBIN"]
  4. for text in texts:
  5. m = pattern.search(text)
  6. if m:
  7. id, description = m.groups()
  8. print(f"ID: '{id}', DESCRIPTION: '{description}'")
  9.  
Success #stdin #stdout 0.02s 9500KB
stdin
Standard input is empty
stdout
ID: '>Keratyna 5', DESCRIPTION: 'egzon 2, Homo sapiens'
ID: '>101m_A', DESCRIPTION: 'mol:protein length:154  MYOGLOBIN'