mirror of
https://github.com/taroved/pol
synced 2025-05-16 06:10:09 -07:00
duplicates
This commit is contained in:
parent
79c0bc467e
commit
f5465442f2
11
pol/feed.py
11
pol/feed.py
@ -70,13 +70,18 @@ class Feed(object):
|
|||||||
fetched_dates[md5hash] = created
|
fetched_dates[md5hash] = created
|
||||||
|
|
||||||
cur_time = datetime.datetime.utcnow()
|
cur_time = datetime.datetime.utcnow()
|
||||||
|
saved_times = {}
|
||||||
for item in items:
|
for item in items:
|
||||||
if item['md5'] in fetched_dates:
|
if item['md5'] in fetched_dates:
|
||||||
item['time'] = fetched_dates[item['md5']]
|
item['time'] = fetched_dates[item['md5']]
|
||||||
else:
|
else:
|
||||||
item['time'] = cur_time
|
if item['md5'] in saved_times:
|
||||||
self.save_post(conn, cur_time, feed_id, item)
|
item['time'] = saved_times[item['md5']]
|
||||||
new_post_cnt += 1
|
else:
|
||||||
|
self.save_post(conn, cur_time, feed_id, item)
|
||||||
|
saved_times[item['md5']] = cur_time
|
||||||
|
item['time'] = cur_time
|
||||||
|
new_post_cnt += 1
|
||||||
cur_time -= datetime.timedelta(minutes=self.POST_TIME_DISTANCE)
|
cur_time -= datetime.timedelta(minutes=self.POST_TIME_DISTANCE)
|
||||||
return new_post_cnt
|
return new_post_cnt
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user