︠fe11e309-e703-4d65-b17c-997b81a3ed39︠
import re
import urllib2

site = urllib2.urlopen("http://www.internetautoguide.com/cost-of-ownership/09-int/2007/honda/civic/index.html")

site_text = site.read()

rows = re.findall('<td class="bgrnd17.*td>', site_text)

for row in rows:
	row_data = re.findall('>([^<]*)<',row)[0::2]
	
htc = re.findall('<td .*Hybrid Tax Credit</td>.*>([^<]*)</td>', site_text )
print htc, row_data
︡8938572b-d79c-4e45-8c37-29f686755e26︡{"stdout": "['N/A'] ['Cost Per Year', '$4,914', '$4,405', '$4,304', '$4,930', '$4,635', '$23,188']"}︡


Collaborative Calculation and Data Science

colby

sagemath

cornellcollege

facebook

github

google

twitter

depaul

All published worksheets from http://sagenb.org

Product

Resources

Company