Commit 5b15cb53 authored by Renán Sosa Guillen

crawl rss

parent 3cd0913c
...@@ -24,13 +24,20 @@ with open(sys.argv[1]) as data_file: ...@@ -24,13 +24,20 @@ with open(sys.argv[1]) as data_file:
except: except:
print "ok" print "ok"
os.chdir(media) os.chdir(media)
CORRECT_YEAR = False
while not CORRECT_YEAR:
lstYears = os.listdir(".") lstYears = os.listdir(".")
lstYears.sort() lstYears.sort()
year = desde.year year = desde.year
if len(lstYears) > 0: if len(lstYears) > 0:
year = int(lstYears[len(lstYears) - 1]) element = lstYears[len(lstYears) - 1]
if element[-4:] == 'json':
os.system('rm ' + element)
else:
CORRECT_YEAR = True
year = int(element)
for y in range(year, today.year + 1): for y in range(year, today.year + 1):
print y print y
try: try:
...@@ -59,6 +66,7 @@ with open(sys.argv[1]) as data_file: ...@@ -59,6 +66,7 @@ with open(sys.argv[1]) as data_file:
day = 1 day = 1
for d in range(day, ((datetime.date(y, 12, 31) - datetime.date(y, 1, 1)).days + 1 if today.year != y else today.timetuple().tm_yday) + 1): for d in range(day, ((datetime.date(y, 12, 31) - datetime.date(y, 1, 1)).days + 1 if today.year != y else today.timetuple().tm_yday) + 1):
YESTERDAY = False
filename = currentDate.strftime('%Y-%m-%d') + ".json" filename = currentDate.strftime('%Y-%m-%d') + ".json"
scrapycommand = "scrapy crawl noticias -t json --nolog -o " + filename scrapycommand = "scrapy crawl noticias -t json --nolog -o " + filename
mydir = os.getcwd() mydir = os.getcwd()
...@@ -71,8 +79,6 @@ with open(sys.argv[1]) as data_file: ...@@ -71,8 +79,6 @@ with open(sys.argv[1]) as data_file:
if fileSize <= 3: if fileSize <= 3:
os.system('rm ' + filename) os.system('rm ' + filename)
else: else:
YESTERDAY = False
f1 = mydir + '/' + filename f1 = mydir + '/' + filename
f2 = filename f2 = filename
f3 = baseDir + media + '/' + filename f3 = baseDir + media + '/' + filename
......
Markdown is supported
0% Try again or attach a new file
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment