fork download
  1. from urllib.parse import urlparse
  2. import re
  3.  
  4. pattern = r"_([^.]+)\.([^.]+)\.\d+"
  5.  
  6. o = urlparse('https://f...content-available-to-author-only...s.com/compare._plant1.green.402992_plant2.yellow.402228_plant3.red.403010_plant4.orange.399987.html')
  7. print(re.findall(pattern, o.path))
Success #stdin #stdout 0.02s 9700KB
stdin
Standard input is empty
stdout
[('plant1', 'green'), ('plant2', 'yellow'), ('plant3', 'red'), ('plant4', 'orange')]