# When prompted by raw_input, paste this link: http://edition.cnn.com/
import urllib
import re
# Step 1: fetch the page the user pasted and pull the technology link out of
# its navigation menu.
#
# The pasted link used to be read and then ignored in favour of a hard-coded
# URL; it is now the page that gets scanned. An empty answer falls back to
# the CNN front page, which is what the script always fetched before.
CNN_Technology = raw_input('Paste your link here: ').strip()
urls = [CNN_Technology or "http://edition.cnn.com/"]

# Captures the text that follows `href="//` on the nav-menu anchor placed
# directly after the "Entertainment" entry, up to that anchor's
# `data-analytics-header="main-menu_tech` attribute.
pattern = 'Entertainment</a><a class="nav-menu-links__link" href="//(.+?)data-analytics-header="main-menu_tech'
result = re.compile(pattern)

for url in urls:
    htmlsource = urllib.urlopen(url)
    try:
        htmltext = htmlsource.read()
    finally:
        # Release the connection even if reading the body fails.
        htmlsource.close()

    # List of captured groups; empty when the menu markup is not found.
    cnntech = re.findall(result, htmltext)

    # Single-argument print with parentheses prints the same text on
    # Python 2 as the bare print statement did.
    print("")
    print("CNN Link:")
    print(cnntech)
    print("")
# Goal: take the newly found link (money.cnn.com/technology/) stored in
# cnntech, fetch that page, and scan it as well.
# Step 2: fetch every link found in step 1 and scan those pages with the
# same pattern.
#
# `cnntech` is the list returned by re.findall above. Writing it as the quoted
# text "cnntech" handed urlopen a literal name instead of the links, so the
# variable itself is used here. The captured text starts after the `//` of a
# scheme-relative href, so a scheme is prepended to make it fetchable.
# The lazy group runs up to the next attribute, so it presumably still carries
# the href's closing quote and the following space; strip them if present.
urls = ["http://" + link.strip('" \t\r\n') for link in cnntech]

pattern = 'Entertainment</a><a class="nav-menu-links__link" href="//(.+?)data-analytics-header="main-menu_tech'
result = re.compile(pattern)

# Defined up front so the name exists even when step 1 found no link and the
# loop below never runs.
cnntech2 = []
for url in urls:
    htmlsource = urllib.urlopen(url)
    try:
        htmltext = htmlsource.read()
    finally:
        # Release the connection even if reading the body fails.
        htmlsource.close()

    # List of captured groups from the second page; empty when nothing matches.
    cnntech2 = re.findall(result, htmltext)
    print("CNN Link:")
    print(cnntech2)
<code>