Webspace Scheduler in Python


#! /usr/bin/python
# Requires Python 2 with the third-party packages mechanize and
# BeautifulSoup (version 3) installed.

# Download the timetable of one intake from the APIIT webspace site and save
# it to "schedule<date>.html" in the current directory.
#
# Flow:
#   1. Ask the user for an intake code.
#   2. Fetch the timetable landing page and take the first "<date>.xml"
#      file name found in it as the week to query.
#   3. POST the week and intake code to the result page.
#   4. Extract the timetable <table> element(s) from the response and write
#      them to disk.
import cookielib
import re
import sys
import urllib
import urllib2

import mechanize
from BeautifulSoup import BeautifulSoup

TIMETABLE_URL = 'http://webspace.apiit.edu.my/intake-timetable/'
RESULT_URL = TIMETABLE_URL + 'intake-result.php'
USER_AGENT = ('Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.0.1) '
              'Gecko/2008071615 Fedora/3.0.1-1.fc9 Firefox/3.0.1')

# Imports come first so a missing dependency is reported before the user is
# asked to type anything.
intake_code = raw_input("Enter Your Intake Code: ").strip()
if not intake_code:
    sys.exit("No intake code entered.")

# --- Step 2: find the week file name on the landing page -------------------
br = mechanize.Browser()
landing_html = br.open(TIMETABLE_URL).read()
landing_soup = BeautifulSoup(landing_html)

# The dot is escaped so that only a literal ".xml" suffix matches.
week_pattern = re.compile(r'[0-9-]+\.xml')
week_files = week_pattern.findall(str(landing_soup))
if not week_files:
    # Fail with a readable message instead of an IndexError on [0].
    sys.exit("Could not find a week (*.xml) entry on %s" % TIMETABLE_URL)

week = week_files[0]
date = week.replace(".xml", "")

# --- Step 3: request the timetable for the intake --------------------------
cj = cookielib.CookieJar()
opener = urllib2.build_opener(urllib2.HTTPCookieProcessor(cj))
opener.addheaders = [('User-agent', USER_AGENT)]

# The landing page is opened through the cookie-aware opener before posting;
# presumably the result page expects the cookies set here -- TODO confirm.
opener.open(TIMETABLE_URL).close()

post_data = urllib.urlencode({
    'week': week,
    'intake_Search_Week': '',
    'selectIntakeAll': intake_code,
})
response = opener.open(RESULT_URL, post_data)
try:
    result_html = response.read()
finally:
    response.close()

# --- Step 4: extract the timetable table(s) and save them ------------------
result_soup = BeautifulSoup(result_html)

# NOTE: the character class is kept exactly as it was. "A-z" and ",-:" are
# ASCII ranges, not lists of literals: ",-:" spans , - . / 0-9 : and is what
# lets the "/" of closing tags match, so do not "simplify" it without
# re-testing against the real page.
table_pattern = re.compile(
    r'<table class="timetable-display">\s*[A-z 0-9 \<\>,-:]+</table>')
tables = table_pattern.findall(str(result_soup))
if not tables:
    sys.exit("No timetable found for intake code %r (week %s)."
             % (intake_code, date))

# Write the matched HTML itself. Formatting the list with '%s' would write
# its Python repr (brackets, quotes, escape sequences) instead of markup.
# The with-block guarantees the file is flushed and closed.
with open('schedule%s.html' % date, 'w') as f:
    f.write('\n'.join(tables))

Powered by Blogger.