for row in tree.findall('.//*[@id="div1"]//tr'): cells = row.findall('td') if len(cells) >= 3: yield { 'candidate': cells[0].text.strip(), 'party': cells[1].text.strip(), 'votes': cells[2].text.strip(), } dataset = [] for place in constituencies('http://eciresults.nic.in/ConstituencywiseS2653.htm'): url = 'http://eciresults.nic.in/Constituencywise{:s}{:s}.htm?ac={:s}'.format( place['statecode'], place['constituencycode'], place['constituencycode']) # print 'Debug: scraping', place['state'], place['constituency'] for result in results(url): result.update(place) dataset.append(result) # Let's save this as tab-delimited UTF-8 file. (Sadly, csv doesn't do UTF-8) with open('2013-result.txt', 'wb') as out: fields = ['state', 'constituency', 'votes', 'candidate', 'party'] out.write('\t'.join(fields) + '\n') for row in dataset: out.write('\t'.join(row[f] for f in fields).encode('utf-8') + '\n')