Cynthia Alice Andrews
2015-10-22 23:01:21 UTC
At this point I feel like I am wasting my time by not asking for help. I
can't figure out why the file keeps coming back empty. There are no error
message, just an empy file. Very frustrating.
from BeautifulSoup import BeautifulSoup
import urllib2
import csv
wiki = "https://en.wikipedia.org/wiki/List_of_Golden_Globe_winners"
header = {'User-Agent': 'Mozilla/5.0'}
req = urllib2.Request(wiki,headers=header)
page = urllib2.urlopen(req)
soup = BeautifulSoup(page)
drama = ""
musical_comedy = ""
drama_actor = ""
musical_comedy_actor = ""
drama_actress = ""
musical_comedy_actress = ""
director = ""
table = soup.find("table", {"class": "wikitable"})
f = open('output.csv','w')
for row in table.findAll("tr"):
cells = row.findAll("td")
if len(cells) == 7:
drama = cells[0].find(text=True)
musical_comedy = cells[1].find(text = True)
drama_actor = cells[2].find(text=True)
musical_comedy_actor = cells[3].find(text=True)
drama_actress = cells[4].find(text=True)
musical_comedy_actress = cells[5].find(text=True)
director = cells[6].find(text=True)
for x in range(len(drama_actor)):
drama_actor_list = drama_actor[x].split("/")
for i in range(len(drama_actor_list)):
if (len(drama_actor_list[i]) > 2) and (len(drama_actor_list[i]) <=5):
data = drama + "," + musical_comedy + "," +
drama_actor_list[i].lstrip('\n').strip() + "," + musical_comedy_actor + ","
+ drama_actress + "," + musical_comedy_actress + "," + director + "," + "\n"
print write_to_file
f.write(write_to_file)
f.close()
*cynthia*andrews
MCDM Candidate, Communication Leadership
University of Washington
<http://www.linkedin.com/in/cynthiaaliceandrews>
_______________________________________________
Tutor maillist - ***@python.org
To unsubscribe or change subscription options:
https://mail.python.org/mailman/listinfo/tutor
can't figure out why the file keeps coming back empty. There are no error
message, just an empy file. Very frustrating.
from BeautifulSoup import BeautifulSoup
import urllib2
import csv
wiki = "https://en.wikipedia.org/wiki/List_of_Golden_Globe_winners"
header = {'User-Agent': 'Mozilla/5.0'}
req = urllib2.Request(wiki,headers=header)
page = urllib2.urlopen(req)
soup = BeautifulSoup(page)
drama = ""
musical_comedy = ""
drama_actor = ""
musical_comedy_actor = ""
drama_actress = ""
musical_comedy_actress = ""
director = ""
table = soup.find("table", {"class": "wikitable"})
f = open('output.csv','w')
for row in table.findAll("tr"):
cells = row.findAll("td")
if len(cells) == 7:
drama = cells[0].find(text=True)
musical_comedy = cells[1].find(text = True)
drama_actor = cells[2].find(text=True)
musical_comedy_actor = cells[3].find(text=True)
drama_actress = cells[4].find(text=True)
musical_comedy_actress = cells[5].find(text=True)
director = cells[6].find(text=True)
for x in range(len(drama_actor)):
drama_actor_list = drama_actor[x].split("/")
for i in range(len(drama_actor_list)):
if (len(drama_actor_list[i]) > 2) and (len(drama_actor_list[i]) <=5):
data = drama + "," + musical_comedy + "," +
drama_actor_list[i].lstrip('\n').strip() + "," + musical_comedy_actor + ","
+ drama_actress + "," + musical_comedy_actress + "," + director + "," + "\n"
print write_to_file
f.write(write_to_file)
f.close()
*cynthia*andrews
MCDM Candidate, Communication Leadership
University of Washington
<http://www.linkedin.com/in/cynthiaaliceandrews>
_______________________________________________
Tutor maillist - ***@python.org
To unsubscribe or change subscription options:
https://mail.python.org/mailman/listinfo/tutor