mediaczar · November 9, 2018 10:47
diff --git a/interbrandrankscraper.py b/interbrandrankscraper.py
 #!/usr/bin/env python

 import requests
 from bs4 import BeautifulSoup

 def collect(year, timeout=30):
    """Download and parse the Interbrand ranking page for one year.

    Args:
        year: Ranking year; interpolated into the URL path.
        timeout: Seconds ``requests`` waits on the server before giving up.
            Defaults to 30.

    Returns:
        The response body parsed into a ``BeautifulSoup`` tree using the
        ``html5lib`` parser.

    Raises:
        requests.exceptions.RequestException: if the connection fails or
            the timeout expires.
    """
    url = "https://www.interbrand.com/best-brands/best-global-brands/%s/ranking" % (year,)
    # Without a timeout, requests.get() can block forever on a stalled server.
    response = requests.get(url, timeout=timeout)
    # The HTTP status is not checked here; whatever body comes back is parsed.
    return BeautifulSoup(response.text, features="html5lib")

 def scrape(year, page, attributes):
    """Print one tab-separated line per brand entry found in *page*.

    Every ``li`` element with class ``brand-item`` produces one output line.
    For each name in *attributes* the stripped text of the first ``div``
    carrying that class is emitted; a missing ``div`` yields an empty field.

    Args:
        year: Not used by this function and not part of the output.
        page: Parsed document exposing ``find_all`` (a BeautifulSoup tree).
        attributes: Class names of the ``div`` fields to extract, in
            output-column order.
    """
    for item in page.find_all("li", class_="brand-item"):
        fields = []
        # Walk `attributes` itself rather than a dict's values so the columns
        # always appear in the requested order, whatever the interpreter's
        # dict ordering is.
        for attr in attributes:
            node = item.find("div", class_=attr)
            # find() returns None when nothing matches; emit an empty field.
            fields.append(node.text.strip() if node is not None else "")

        line = u"\t".join(fields)
        if not isinstance(line, str):
            # Python 2 only: `line` is unicode there, so encode it to UTF-8
            # bytes before printing, as the original code did.
            line = line.encode("utf-8")
        print(line)

 # Class names of the per-brand <div> fields to extract, in the order they
 # are handed to scrape().
 attributes = (
    "brand-rank",
    "brand-name",
    "brand-region",
    "brand-country",
    "brand-sector",
    "brand-value",
    "brand-value-change",
 )

 # Fetch and print the ranking for every year from 2000 through 2018.
 for y in range(2000, 2019):
    p = collect(y)
    scrape(y, p, attributes)
	#!/usr/bin/env python

	import requests
	from bs4 import BeautifulSoup

	def collect(year, timeout=30):
	    """Download and parse the Interbrand ranking page for one year.

	    Args:
	        year: Ranking year; interpolated into the URL path.
	        timeout: Seconds ``requests`` waits on the server before giving
	            up. Defaults to 30.

	    Returns:
	        The response body parsed into a ``BeautifulSoup`` tree using the
	        ``html5lib`` parser.

	    Raises:
	        requests.exceptions.RequestException: if the connection fails or
	            the timeout expires.
	    """
	    url = "https://www.interbrand.com/best-brands/best-global-brands/%s/ranking" % (year,)
	    # Without a timeout, requests.get() can block forever on a stalled server.
	    response = requests.get(url, timeout=timeout)
	    # The HTTP status is not checked here; whatever body comes back is parsed.
	    return BeautifulSoup(response.text, features="html5lib")

	def scrape(year, page, attributes):
	    """Print one tab-separated line per brand entry found in *page*.

	    Every ``li`` element with class ``brand-item`` produces one output
	    line. For each name in *attributes* the stripped text of the first
	    ``div`` carrying that class is emitted; a missing ``div`` yields an
	    empty field.

	    Args:
	        year: Not used by this function and not part of the output.
	        page: Parsed document exposing ``find_all`` (a BeautifulSoup tree).
	        attributes: Class names of the ``div`` fields to extract, in
	            output-column order.
	    """
	    for item in page.find_all("li", class_="brand-item"):
	        fields = []
	        # Walk `attributes` itself rather than a dict's values so the
	        # columns always appear in the requested order, whatever the
	        # interpreter's dict ordering is.
	        for attr in attributes:
	            node = item.find("div", class_=attr)
	            # find() returns None when nothing matches; emit an empty field.
	            fields.append(node.text.strip() if node is not None else "")

	        line = u"\t".join(fields)
	        if not isinstance(line, str):
	            # Python 2 only: `line` is unicode there, so encode it to
	            # UTF-8 bytes before printing, as the original code did.
	            line = line.encode("utf-8")
	        print(line)

	# Class names of the per-brand <div> fields to extract, in the order they
	# are handed to scrape().
	attributes = ("brand-rank", "brand-name", "brand-region", "brand-country", "brand-sector", "brand-value", "brand-value-change")

	# Fetch and print the ranking for every year from 2000 through 2018.
	# The loop body must be indented under the `for` to be valid Python.
	for y in range(2000, 2019):
	    p = collect(y)
	    scrape(y, p, attributes)
No results found