crawlers

dbdb00c3 · Renán Sosa Guillen · 7d116982 · dbdb00c3 · dbdb00c3
Commit dbdb00c3 authored Dec 03, 2017 by Renán Sosa Guillen
Show whitespace changes
Inline Side-by-side

Showing with 3 additions and 3 deletions

noticias.py descarga_por_dia/unoMasUno/unoMasUno/spiders/noticias.py +3 -3

noticias.pyc descarga_por_dia/unoMasUno/unoMasUno/spiders/noticias.pyc +0 -0

No files found.
--- a/descarga_por_dia/unoMasUno/unoMasUno/spiders/noticias.py
+++ b/descarga_por_dia/unoMasUno/unoMasUno/spiders/noticias.py
@@ -43,9 +43,9 @@ class QuotesSpider(scrapy.Spider):
 		day = getattr(self, 'day', None)
 		self.date_parser = {'enero': 1,      'febrero': 2,  'marzo': 3,     'abril': 4,
 												'mayo': 5,       'junio': 6,    'julio': 7,     'agosto': 8,
-												'septiembre': 9, 'octubre': 10, 'noviembre': 9, 'diciembre': 12}
+												'septiembre': 9, 'octubre': 10, 'noviembre': 11, 'diciembre': 12}
-		self.baseURL='http://www.unomasuno.com.mx/index.php/'+year+'/'+month+'/'+day
+		self.baseURL='http://www.unomasuno.com.mx/'+year+'/'+month+'/'+day
 		yield scrapy.Request(url=self.baseURL, callback=self.parse)
@@ -91,7 +91,7 @@ class QuotesSpider(scrapy.Spider):
 		d = response.xpath('//p[@class="post-meta"]/span/text()').extract_first()
 		d = d.replace(',','').split(' ')
-		item['date'] = datetime(int(d[2]), self.date_parser[d[0].lower()], int(d[1]), tzinfo=self.tz).isoformat('T')
+		item['date'] = datetime(int(d[2]), self.date_parser[d[1].lower()], int(d[0]), tzinfo=self.tz).isoformat('T')
 		item['topic'] = response.xpath('//span[@typeof="v:Breadcrumb"]/a/text()').extract()[1]
 		item['title'] = response.xpath('//*[@class="post-inner"]/h1/span/text()').extract_first()

--- a/descarga_por_dia/unoMasUno/unoMasUno/spiders/noticias.pyc
+++ b/descarga_por_dia/unoMasUno/unoMasUno/spiders/noticias.pyc