本文整理汇总了Python中singer.metrics.record_counter方法的典型用法代码示例。如果您正苦于以下问题:Python metrics.record_counter方法的具体用法?Python metrics.record_counter怎么用?Python metrics.record_counter使用的例子?那么恭喜您, 这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类singer.metrics
的用法示例。
在下文中一共展示了metrics.record_counter方法的15个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: _sync_contacts_by_company
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def _sync_contacts_by_company(STATE, ctx, company_id):
schema = load_schema(CONTACTS_BY_COMPANY)
catalog = ctx.get_catalog_from_id(singer.get_currently_syncing(STATE))
mdata = metadata.to_map(catalog.get('metadata'))
url = get_url("contacts_by_company", company_id=company_id)
path = 'vids'
with Transformer(UNIX_MILLISECONDS_INTEGER_DATETIME_PARSING) as bumble_bee:
with metrics.record_counter(CONTACTS_BY_COMPANY) as counter:
data = request(url, default_contacts_by_company_params).json()
for row in data[path]:
counter.increment()
record = {'company-id' : company_id,
'contact-id' : row}
record = bumble_bee.transform(lift_properties_and_versions(record), schema, mdata)
singer.write_record("contacts_by_company", record, time_extracted=utils.now())
return STATE
示例2: get_all_team_members
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_team_members(team_slug, schemas, repo_path, state, mdata):
org = repo_path.split('/')[0]
with metrics.record_counter('team_members') as counter:
for response in authed_get_all_pages(
'team_members',
'https://api.github.com/orgs/{}/teams/{}/members?sort=created_at&direction=desc'.format(org, team_slug)
):
team_members = response.json()
for r in team_members:
r['_sdc_repository'] = repo_path
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
counter.increment()
yield rec
return state
示例3: get_all_team_memberships
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_team_memberships(team_slug, schemas, repo_path, state, mdata):
org = repo_path.split('/')[0]
for response in authed_get_all_pages(
'team_members',
'https://api.github.com/orgs/{}/teams/{}/members?sort=created_at&direction=desc'.format(org, team_slug)
):
team_members = response.json()
with metrics.record_counter('team_memberships') as counter:
for r in team_members:
username = r['login']
for res in authed_get_all_pages(
'memberships',
'https://api.github.com/orgs/{}/teams/{}/memberships/{}'.format(org, team_slug, username)
):
team_membership = res.json()
team_membership['_sdc_repository'] = repo_path
with singer.Transformer() as transformer:
rec = transformer.transform(team_membership, schemas, metadata=metadata.to_map(mdata))
counter.increment()
yield rec
return state
示例4: get_all_releases
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_releases(schemas, repo_path, state, mdata):
# Releases doesn't seem to have an `updated_at` property, yet can be edited.
# For this reason and since the volume of release can safely be considered low,
# bookmarks were ignored for releases.
with metrics.record_counter('releases') as counter:
for response in authed_get_all_pages(
'releases',
'https://api.github.com/repos/{}/releases?sort=created_at&direction=desc'.format(repo_path)
):
releases = response.json()
extraction_time = singer.utils.now()
for r in releases:
r['_sdc_repository'] = repo_path
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
singer.write_record('releases', rec, time_extracted=extraction_time)
singer.write_bookmark(state, repo_path, 'releases', {'since': singer.utils.strftime(extraction_time)})
counter.increment()
return state
示例5: get_all_collaborators
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_collaborators(schema, repo_path, state, mdata):
'''
https://developer.github.com/v3/repos/collaborators/#list-collaborators
'''
with metrics.record_counter('collaborators') as counter:
for response in authed_get_all_pages(
'collaborators',
'https://api.github.com/repos/{}/collaborators'.format(repo_path)
):
collaborators = response.json()
extraction_time = singer.utils.now()
for collaborator in collaborators:
collaborator['_sdc_repository'] = repo_path
with singer.Transformer() as transformer:
rec = transformer.transform(collaborator, schema, metadata=metadata.to_map(mdata))
singer.write_record('collaborators', rec, time_extracted=extraction_time)
singer.write_bookmark(state, repo_path, 'collaborator', {'since': singer.utils.strftime(extraction_time)})
counter.increment()
return state
示例6: sync_stream
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def sync_stream(sf, catalog_entry, state):
stream = catalog_entry['stream']
with metrics.record_counter(stream) as counter:
try:
sync_records(sf, catalog_entry, state, counter)
singer.write_state(state)
except RequestException as ex:
raise Exception("Error syncing {}: {} Response: {}".format(
stream, ex, ex.response.text))
except Exception as ex:
raise Exception("Error syncing {}: {}".format(
stream, ex)) from ex
return counter
示例7: write_page
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def write_page(self, page):
stream = Context.get_catalog_entry(self.tap_stream_id)
stream_metadata = metadata.to_map(stream.metadata)
extraction_time = singer.utils.now()
for rec in page:
with Transformer() as transformer:
rec = transformer.transform(rec, stream.schema.to_dict(), stream_metadata)
singer.write_record(self.tap_stream_id, rec, time_extracted=extraction_time)
with metrics.record_counter(self.tap_stream_id) as counter:
counter.increment(len(page))
示例8: gen_request
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def gen_request(STATE, tap_stream_id, url, params, path, more_key, offset_keys, offset_targets):
if len(offset_keys) != len(offset_targets):
raise ValueError("Number of offset_keys must match number of offset_targets")
if singer.get_offset(STATE, tap_stream_id):
params.update(singer.get_offset(STATE, tap_stream_id))
with metrics.record_counter(tap_stream_id) as counter:
while True:
data = request(url, params).json()
for row in data[path]:
counter.increment()
yield row
if not data.get(more_key, False):
break
STATE = singer.clear_offset(STATE, tap_stream_id)
for key, target in zip(offset_keys, offset_targets):
if key in data:
params[target] = data[key]
STATE = singer.set_offset(STATE, tap_stream_id, target, data[key])
singer.write_state(STATE)
STATE = singer.clear_offset(STATE, tap_stream_id)
singer.write_state(STATE)
示例9: do_sync
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def do_sync(account, catalog, state):
streams_to_sync = get_streams_to_sync(account, catalog, state)
refs = load_shared_schema_refs()
for stream in streams_to_sync:
LOGGER.info('Syncing %s, fields %s', stream.name, stream.fields())
schema = singer.resolve_schema_references(load_schema(stream), refs)
metadata_map = metadata.to_map(stream.catalog_entry.metadata)
bookmark_key = BOOKMARK_KEYS.get(stream.name)
singer.write_schema(stream.name, schema, stream.key_properties, bookmark_key, stream.stream_alias)
# NB: The AdCreative stream is not an iterator
if stream.name == 'adcreative':
stream.sync()
continue
with Transformer(pre_hook=transform_date_hook) as transformer:
with metrics.record_counter(stream.name) as counter:
for message in stream:
if 'record' in message:
counter.increment()
time_extracted = utils.now()
record = transformer.transform(message['record'], schema, metadata=metadata_map)
singer.write_record(stream.name, record, stream.stream_alias, time_extracted)
elif 'state' in message:
singer.write_state(message['state'])
else:
raise TapFacebookException('Unrecognized message {}'.format(message))
示例10: get_all_teams
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_teams(schemas, repo_path, state, mdata):
org = repo_path.split('/')[0]
with metrics.record_counter('teams') as counter:
for response in authed_get_all_pages(
'teams',
'https://api.github.com/orgs/{}/teams?sort=created_at&direction=desc'.format(org)
):
teams = response.json()
extraction_time = singer.utils.now()
for r in teams:
r['_sdc_repository'] = repo_path
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
singer.write_record('teams', rec, time_extracted=extraction_time)
singer.write_bookmark(state, repo_path, 'teams', {'since': singer.utils.strftime(extraction_time)})
counter.increment()
if schemas.get('team_members'):
team_slug = r['slug']
for team_members_rec in get_all_team_members(team_slug, schemas['team_members'], repo_path, state, mdata):
singer.write_record('team_members', team_members_rec, time_extracted=extraction_time)
singer.write_bookmark(state, repo_path, 'team_members', {'since': singer.utils.strftime(extraction_time)})
if schemas.get('team_memberships'):
team_slug = r['slug']
for team_memberships_rec in get_all_team_memberships(team_slug, schemas['team_memberships'], repo_path, state, mdata):
singer.write_record('team_memberships', team_memberships_rec, time_extracted=extraction_time)
return state
示例11: get_all_events
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_events(schemas, repo_path, state, mdata):
# Incremental sync off `created_at`
# https://developer.github.com/v3/issues/events/#list-events-for-a-repository
# 'https://api.github.com/repos/{}/issues/events?sort=created_at&direction=desc'.format(repo_path)
bookmark_value = get_bookmark(state, repo_path, "events", "since")
if bookmark_value:
bookmark_time = singer.utils.strptime_to_utc(bookmark_value)
else:
bookmark_time = 0
with metrics.record_counter('events') as counter:
for response in authed_get_all_pages(
'events',
'https://api.github.com/repos/{}/events?sort=created_at&direction=desc'.format(repo_path)
):
events = response.json()
extraction_time = singer.utils.now()
for r in events:
r['_sdc_repository'] = repo_path
# skip records that haven't been updated since the last run
# the GitHub API doesn't currently allow a ?since param for pulls
# once we find the first piece of old data we can return, thanks to
# the sorting
updated_at = r.get('created_at') if r.get('updated_at') is None else r.get('updated_at')
if bookmark_time and singer.utils.strptime_to_utc(updated_at) < bookmark_time:
return state
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
singer.write_record('events', rec, time_extracted=extraction_time)
singer.write_bookmark(state, repo_path, 'events', {'since': singer.utils.strftime(extraction_time)})
counter.increment()
return state
示例12: get_all_issue_milestones
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_issue_milestones(schemas, repo_path, state, mdata):
# Incremental sync off `due on` ??? confirm.
# https://developer.github.com/v3/issues/milestones/#list-milestones-for-a-repository
# 'https://api.github.com/repos/{}/milestones?sort=created_at&direction=desc'.format(repo_path)
bookmark_value = get_bookmark(state, repo_path, "issue_milestones", "since")
if bookmark_value:
bookmark_time = singer.utils.strptime_to_utc(bookmark_value)
else:
bookmark_time = 0
with metrics.record_counter('issue_milestones') as counter:
for response in authed_get_all_pages(
'milestones',
'https://api.github.com/repos/{}/milestones?direction=desc'.format(repo_path)
):
milestones = response.json()
extraction_time = singer.utils.now()
for r in milestones:
r['_sdc_repository'] = repo_path
# skip records that haven't been updated since the last run
# the GitHub API doesn't currently allow a ?since param for pulls
# once we find the first piece of old data we can return, thanks to
# the sorting
if bookmark_time and singer.utils.strptime_to_utc(r.get('due_on')) < bookmark_time:
return state
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
singer.write_record('issue_milestones', rec, time_extracted=extraction_time)
singer.write_bookmark(state, repo_path, 'issue_milestones', {'since': singer.utils.strftime(extraction_time)})
counter.increment()
return state
示例13: get_all_commit_comments
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_commit_comments(schemas, repo_path, state, mdata):
# https://developer.github.com/v3/repos/comments/
# updated_at? incremental
# 'https://api.github.com/repos/{}/comments?sort=created_at&direction=desc'.format(repo_path)
bookmark_value = get_bookmark(state, repo_path, "commit_comments", "since")
if bookmark_value:
bookmark_time = singer.utils.strptime_to_utc(bookmark_value)
else:
bookmark_time = 0
with metrics.record_counter('commit_comments') as counter:
for response in authed_get_all_pages(
'commit_comments',
'https://api.github.com/repos/{}/comments?sort=created_at&direction=desc'.format(repo_path)
):
commit_comments = response.json()
extraction_time = singer.utils.now()
for r in commit_comments:
r['_sdc_repository'] = repo_path
# skip records that haven't been updated since the last run
# the GitHub API doesn't currently allow a ?since param for pulls
# once we find the first piece of old data we can return, thanks to
# the sorting
if bookmark_time and singer.utils.strptime_to_utc(r.get('updated_at')) < bookmark_time:
return state
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
singer.write_record('commit_comments', rec, time_extracted=extraction_time)
singer.write_bookmark(state, repo_path, 'commit_comments', {'since': singer.utils.strftime(extraction_time)})
counter.increment()
return state
示例14: get_all_project_cards
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_project_cards(project_id, schemas, repo_path, state, mdata):
bookmark_value = get_bookmark(state, repo_path, "project_cards", "since")
if bookmark_value:
bookmark_time = singer.utils.strptime_to_utc(bookmark_value)
else:
bookmark_time = 0
with metrics.record_counter('project_cards') as counter:
for response in authed_get_all_pages(
'project_cards',
'https://api.github.com/projects/{}/columns?sort=created_at&direction=desc'.format(project_id)
):
project_cards = response.json()
for r in project_cards:
r['_sdc_repository'] = repo_path
# skip records that haven't been updated since the last run
# the GitHub API doesn't currently allow a ?since param for pulls
# once we find the first piece of old data we can return, thanks to
# the sorting
if bookmark_time and singer.utils.strptime_to_utc(r.get('updated_at')) < bookmark_time:
return state
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
# counter.increment()
yield rec
return state
示例15: get_all_project_columns
# 需要导入模块: from singer import metrics [as 别名]
# 或者: from singer.metrics import record_counter [as 别名]
def get_all_project_columns(project_id, schemas, repo_path, state, mdata):
bookmark_value = get_bookmark(state, repo_path, "project_columns", "since")
if bookmark_value:
bookmark_time = singer.utils.strptime_to_utc(bookmark_value)
else:
bookmark_time = 0
with metrics.record_counter('project_columns') as counter:
for response in authed_get_all_pages(
'project_columns',
'https://api.github.com/projects/{}/columns?sort=created_at&direction=desc'.format(project_id)
):
project_columns = response.json()
for r in project_columns:
r['_sdc_repository'] = repo_path
# skip records that haven't been updated since the last run
# the GitHub API doesn't currently allow a ?since param for pulls
# once we find the first piece of old data we can return, thanks to
# the sorting
if bookmark_time and singer.utils.strptime_to_utc(r.get('updated_at')) < bookmark_time:
return state
# transform and write release record
with singer.Transformer() as transformer:
rec = transformer.transform(r, schemas, metadata=metadata.to_map(mdata))
# counter.increment()
yield rec
return state