print("and we begin")
import requests
from bs4.diagnose import diagnose
from bs4 import BeautifulSoup

# Purpose: download the 25live events feed (XML), parse it with Beautiful Soup
# using the lxml parser, print the first <entry> for inspection, and collect
# the title of every entry into the list `titles`.
#
# The print calls use the single-argument parenthesised form so the script
# behaves the same under Python 2 and Python 3.

# Grab the XML from 25live.
# NOTE(review): the URL is empty in this copy of the script; requests cannot
# fetch an empty URL, so fill in the real feed address before running.
# To work offline instead, parse the local sample (events.xml is a shortened
# version of the larger events document):
#     with open("events.xml", "r") as sample:
#         soup = BeautifulSoup(sample.read(), "lxml")
response = requests.get("")
# Fail loudly on an HTTP error rather than parsing an error page as a feed.
response.raise_for_status()

# Build the soup from the response body and list every <entry> tag in it.
soup = BeautifulSoup(response.text, "lxml")
entries = soup.find_all('entry')

# Debug output: show the first entry, but only if the feed has one, so an
# empty feed does not crash with IndexError.
if entries:
    first_entry = entries[0]
    print("%s \n" % type(first_entry))
    print(first_entry.prettify() + "\n")
    first_content = first_entry.find('content')
    if first_content is not None:
        print(first_content.prettify() + "\n")

# Iterate through the entries and put each event's title into a list.
# The title is looked up directly inside each entry: `entry.string` is None
# whenever the entry has more than one child, so re-parsing it finds nothing.
titles = []
for item in entries:
    title_tag = item.find('title')
    if title_tag is not None:
        titles.append(title_tag.get_text())
print(titles)
......@@ -8,3 +8,14 @@ python-dateutil==2.6.1
The packages currently installed are:
Beautiful Soup (beautifulsoup4)
lxml parser for Beautiful Soup
requests
run the following install commands:
$ pip install beautifulsoup4
$ pip install lxml
$ pip install requests
