# Step-by-step exploration of a saved product page (notebook style: the bare
# expressions below are there so an interactive session displays their value).

# Read the whole HTML file; the with-block closes the file handle as soon as
# the contents have been read instead of leaving it open.
with open('class1_files/gooselamp.html') as page_file:
    s = page_file.read()
s[0:1000]  # peek at the first 1000 characters of the page

# Split the page on the opening tag of the price span (up to and including
# the '$'), so the price is the first thing in the piece after the marker.
l1 = s.split('<span id="priceblock_ourprice" class="a-size-medium a-color-price">$')
len(l1)  # number of pieces; more than 1 means the marker was found
l1[0][:1000]  # start of the text preceding the marker

# Everything up to the closing tag is the price, still as a string.
price = l1[1].split('</span>')[0]
price

# Same extraction, converted to a number.
price = float(l1[1].split('</span>')[0])
price
# In summary: read the saved page, split on the price-span marker, and
# convert the text before the closing tag to a float.
# The with-block closes the file handle once the contents have been read.
with open('class1_files/gooselamp.html') as page_file:
    s = page_file.read()
l1 = s.split('<span id="priceblock_ourprice" class="a-size-medium a-color-price">$')
price = float(l1[1].split('</span>')[0])
price
import requests
# Fetch the live product page and check that it contains the expected price.
url = 'https://www.amazon.com/Union-61100-Outdoor-Garden-Statue/dp/B0027YPQEC'
s = requests.get(url)
'19.59' in s.text
# If this evaluates to True, the page was fetched successfully and its HTML
# does in fact contain the string '19.59'.

# A second site, fetched with the default headers.
url = 'http://math.buffalo.edu'
s = requests.get(url)
# print(s.text)

url = 'http://www.buffalo.edu/cas/math.html'
# First attempt: send an arbitrary, made-up User-Agent header.
s = requests.get(url,headers={'User-Agent':'Fake out!'})
# Second attempt: send a browser-style User-Agent. The original code defined
# `ua` but then sent 'Fake out!' again, so `ua` was never used.
ua = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/56.0.2924.76 Safari/537.36'
s = requests.get(url, headers={'User-Agent': ua})
s.text[1:100]
import requests
def getprice(pid, timeout=None):
    """Return the listed price of an Amazon item as a float.

    Requests ``https://www.amazon.com/dp/<pid>`` with a browser-style
    User-Agent header and parses the number that follows the
    ``priceblock_ourprice`` span in the returned HTML.

    Args:
        pid: Item id string appended to the ``/dp/`` URL,
            e.g. ``'B0027YPQEC'``.
        timeout: Optional timeout in seconds forwarded to ``requests.get``.
            The default ``None`` keeps the previous behaviour (no timeout).

    Returns:
        The price as a float.

    Raises:
        ValueError: If the price marker is not present in the page, or the
            text inside the span is not a number.
    """
    ua = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/56.0.2924.76 Safari/537.36'
    url = 'https://www.amazon.com/dp/' + pid
    response = requests.get(url, headers={'User-Agent': ua}, timeout=timeout)

    pattern = '<span id="priceblock_ourprice" class="a-size-medium a-color-price">$'
    # rpartition keeps the text after the LAST occurrence of the marker,
    # matching the previous split(pattern)[-1]; an empty `marker` means the
    # page does not contain the price span at all.
    _, marker, tail = response.text.rpartition(pattern)
    if not marker:
        raise ValueError('price marker not found in page ' + url)

    price_text = tail.partition('</span>')[0]
    # Drop thousands separators so prices such as "1,299.00" parse too.
    return float(price_text.replace(',', ''))
# Look up the price of the first item by its id and show it.
first_item_price = getprice('B0027YPQEC')
price = first_item_price
print(price)

# Another item: a kite. Build its URL only for the message below;
# getprice constructs the same URL internally from the id.
pid = 'B00BB581NQ'
url = 'https://www.amazon.com/dp/' + pid
price = getprice(pid)
message_parts = ['the price of item ', url, ' is ', str(price)]
print(''.join(message_parts))