Here are examples of the Python API scrapi.util.timestamp, taken from open source projects. By voting up you can indicate which examples are most useful and appropriate.
5 Examples
3
Example 1
Project: scrapi Source File: tasks.py
@app.task
@events.creates_task(events.HARVESTER_RUN)
def run_harvester(harvester_name, start_date=None, end_date=None):
    """Build and dispatch the harvest -> normalization chain for one harvester.

    A falsy ``start_date`` falls back to today minus
    ``settings.DAYS_BACK`` days; a falsy ``end_date`` falls back to today.
    The chain is started with ``apply_async()``; this function itself
    returns nothing.
    """
    logger.info('Running harvester "{}"'.format(harvester_name))

    # Resolve the harvesting window, defaulting either end when not supplied.
    if not start_date:
        start_date = date.today() - timedelta(settings.DAYS_BACK)
    if not end_date:
        end_date = date.today()
    window = {'start_date': start_date, 'end_date': end_date}

    normalization = begin_normalization.s(harvester_name)
    # The second positional argument is the creation timestamp of this job.
    start_harvest = harvest.si(harvester_name, timestamp(), **window)

    # Pipe the harvest signature into normalization and start the celery chain.
    workflow = start_harvest | normalization
    workflow.apply_async()
3
Example 2
Project: scrapi Source File: tasks.py
@app.task
@events.logged(events.HARVESTER_RUN)
def harvest(harvester_name, job_created, start_date=None, end_date=None):
    """Run the registered harvester and return its output with timing data.

    A falsy ``start_date`` falls back to today minus
    ``settings.DAYS_BACK`` days; a falsy ``end_date`` falls back to today.

    Returns a 2-tuple ``(result, timestamps)`` where ``timestamps`` holds
    the keys ``harvestFinished``, ``harvestTaskCreated`` (the ``job_created``
    argument, passed through unchanged) and ``harvestStarted``.
    """
    # Record the start time before any other work is done.
    harvest_started = timestamp()
    harvester = registry[harvester_name]

    if not start_date:
        start_date = date.today() - timedelta(settings.DAYS_BACK)
    if not end_date:
        end_date = date.today()

    logger.info('Harvester "{}" has begun harvesting'.format(harvester_name))
    # documents is a list of all of the RawDocuments harvested
    documents = harvester.harvest(start_date=start_date, end_date=end_date)

    timestamps = {
        'harvestFinished': timestamp(),
        'harvestTaskCreated': job_created,
        'harvestStarted': harvest_started,
    }
    return documents, timestamps
3
Example 3
Project: scrapi Source File: tasks.py
@events.creates_task(events.PROCESSING)
@events.creates_task(events.NORMALIZATION)
def spawn_tasks(raw, timestamps, harvester_name):
    """Stamp one raw document and queue its normalization and processing.

    ``timestamps`` is stored under ``raw['timestamps']`` and then gains a
    ``normalizeTaskCreated`` entry. A normalize -> process_normalized chain
    is started with ``apply_async()``, and ``process_raw`` is queued for the
    same document with ``delay()``.
    """
    # Attach first, then stamp through the document, so the write goes to
    # whatever raw['timestamps'] hands back.
    raw['timestamps'] = timestamps
    raw['timestamps']['normalizeTaskCreated'] = timestamp()

    normalize_step = normalize.si(raw, harvester_name)
    process_step = process_normalized.s(raw)
    pipeline = normalize_step | process_step
    pipeline.apply_async()

    process_raw.delay(raw)
3
Example 4
Project: scrapi Source File: tasks.py
@task_autoretry(default_retry_delay=settings.CELERY_RETRY_DELAY, max_retries=settings.CELERY_MAX_RETRIES, throws=events.Skip)
@events.logged(events.NORMALIZATION)
def normalize(raw_doc, harvester_name):
    """Normalize one raw document with the harvester registered under its name.

    Returns the single normalized document, with its ``timestamps`` entry
    set from ``util.stamp_from_raw``. Raises ``events.Skip`` when the
    wrapped normalizer yields a falsy result.
    """
    normalized_started = timestamp()
    harvester = registry[harvester_name]

    # Wrap the harvester's normalizer with null_on_error before calling it.
    guarded_normalize = null_on_error(harvester.normalize)
    normalized = guarded_normalize(raw_doc)

    if normalized:
        normalized['timestamps'] = util.stamp_from_raw(raw_doc, normalizeStarted=normalized_started)
        return normalized  # a single normalized document

    raise events.Skip('Did not normalize docuement with id {}'.format(raw_doc['docID']))
0
Example 5
def test_timestamp(self):
    """The string from util.timestamp() parses into a datetime.datetime."""
    stamp = util.timestamp()
    assert isinstance(parse(stamp), datetime.datetime)