fork download
  1. import re
  2. test_str = [
  3. "bla bla google.com bla bla", #0
  4. "bla bla www.google.com bla bla", #1
  5. "bla bla api.google.com bla bla", #2
  6. "google.com", #3
  7. "www.google.com", #4
  8. "api.google.com", #5
  9. "http://google.com", #6
  10. "http://www.google.com", #7
  11. "http://api.google.com", #8
  12. "bla bla http://www.google.com bla bla", #9
  13. "bla bla https://www.api.google.com bla bla", #10
  14. "bla bla https://www.map.google.com bla bla" #11
  15. ]
  16. r = re.compile(r"(?<!\S)(?:https?://)?(?:www\.)?google\.\S*")
  17. for i,s in enumerate(test_str):
  18. m = r.search(s)
  19. if m:
  20. print("{}\t#{}".format(m.group(0), i))
Success #stdin #stdout 0s 23304KB
stdin
Standard input is empty
stdout
google.com	#0
www.google.com	#1
google.com	#3
www.google.com	#4
http://google.com	#6
http://www.google.com	#7
http://www.google.com	#9