"""Extract US-style street addresses from free text with a regular expression."""
import re

# Sample input; replace with the text you actually want to scan.
txt = "Please ship the parcel to 44 West 22nd Street, New York, NY 12345 by Friday."

# Pattern layout: "<1-3 digit house number> <street>, <city>, <STATE> <ZIP5>".
# The street and city parts are non-greedy (`.+?`) so that two addresses on the
# same line are returned as two matches instead of being merged into one, while
# still allowing extra comma-separated parts (e.g. "Apt 3") inside an address.
# A raw string keeps any future backslash escapes from being interpreted by
# Python before the regex engine sees them.
regexp = r"[0-9]{1,3} .+?, .+?, [A-Z]{2} [0-9]{5}"

# List of every non-overlapping address found in `txt`, in order of appearance.
address = re.findall(regexp, txt)
# Output: address = ['44 West 22nd Street, New York, NY 12345']