fork download
  1. import re
  2. p = re.compile(r'^Sequence:[^|]*\|(?P<hitsid>[^|]*)\|\S*\s*(?P<protein>[^][]*?)\s*\[(?P<organism>[^][]*)][\s\S]*?\nE-value:\s*(?P<evalue>.*)', re.MULTILINE)
  3. s = "****ALIGNMENT****\nSequence: gi|86755972|gb|ABD15130.1| cold acclimation protein COR413-PM1 [Chimonanthus praecox]\nLength: 201\nE-value: 2.66576e-82\nKYLAMKTDQLAVANMIDSDINELKMATMRLINDASMLGHYGFGTHFLKWLACLAAIYLLILDRTNWRTNMLTSLL...\n+YLAMKTD+ + +I +D+ E+ A +L+ DA+ LG G GT LKW+A AAIYLLILDRTNW+TNMLT+LL...\nEYLAMKTDEWSAQQLIQTDLKEMGKAAKKLVYDATKLGSLGVGTSILKWVASFAAIYLLILDRTNWKTNMLTALL..."
  4. res = [m.groupdict() for m in p.finditer(s)]
  5. for x in res:
  6. print(x['hitsid'])
  7. print(x['protein'])
  8. print(x['organism'])
  9. print(x['evalue'])
Success #stdin #stdout 0.01s 9016KB
stdin
Standard input is empty
stdout
86755972
cold acclimation protein COR413-PM1
Chimonanthus praecox
2.66576e-82