本文整理汇总了Python中pupa.scrape.Person.add_term方法的典型用法代码示例。如果您正苦于以下问题：Python Person.add_term方法的具体用法？Python Person.add_term怎么用？Python Person.add_term使用的例子？那么恭喜您，这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类pupa.scrape.Person的用法示例。
在下文中一共展示了Person.add_term方法的5个代码示例，这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞，您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: test_person_add_term
# 需要导入模块: from pupa.scrape import Person [as 别名]
# 或者: from pupa.scrape.Person import add_term [as 别名]
def test_person_add_term():
    """Check that ``Person.add_term`` records a valid related object.

    After one ``add_term`` call the first entry of ``p._related`` must
    validate, reference an organization pseudo-id with classification
    'council', and carry the start and end dates that were passed in.
    """
    person = Person('Eternal')
    person.add_term('eternal', 'council', start_date='0001', end_date='9999')

    # add_term appends to the person's related objects; inspect the first one.
    term = person._related[0]
    term.validate()

    expected_org = {'classification': 'council'}
    assert get_pseudo_id(term.organization_id) == expected_org
    assert term.start_date == '0001'
    assert term.end_date == '9999'
示例2: scrape
# 需要导入模块: from pupa.scrape import Person [as 别名]
# 或者: from pupa.scrape.Person import add_term [as 别名]
def scrape(self):
    """Yield Chicago aldermen (current and former) and council committees.

    Walks the rows produced by ``self.councilMembers()``, builds a
    ``Person`` for every ward row (photo, contact details, link, source)
    and registers that person as a member of each committee listed for the
    row. Then yields the people described by ``FORMER_ALDERMEN``, the
    committees collected along the way, and one ``Organization`` for each
    name in ``FORMER_COMMITTEES`` and ``JOINT_COMMITTEES``.

    Yields:
        ``Person`` objects first, followed by ``Organization`` objects.
    """
    committee_d = {}
    non_committees = {'City Council', 'Office of the Mayor',
                      'Office of the City Clerk'}

    # Member-row key -> (contact detail type, note). Loop-invariant, so it
    # is built once instead of once per row.
    contact_types = {
        "City Hall Office": ("address", "City Hall Office"),
        "City Hall Phone": ("voice", "City Hall Phone"),
        "Ward Office Phone": ("voice", "Ward Office Phone"),
        "Ward Office Address": ("address", "Ward Office Address"),
        "Fax": ("fax", "Fax"),
    }

    for councilman, committees in self.councilMembers():
        ward = councilman['Ward/Office']
        if ward == "":
            continue
        if ward in {"Mayor", "Clerk"}:
            # Only ward rows get a Person here. Previously a Mayor/Clerk row
            # fell through with `p` still bound to the previous row's person
            # (or unbound on the first row), so that person was modified and
            # yielded a second time.
            # NOTE(review): the nesting of the original was reconstructed
            # from flattened source -- confirm skipping these rows is the
            # intended behavior.
            continue

        ward = "Ward {}".format(int(ward))
        p = Person(councilman['Person Name']['label'],
                   district=ward,
                   primary_org="legislature",
                   role="Alderman")

        if councilman['Photo']:
            p.image = councilman['Photo']

        for contact_type, (type_, _note) in contact_types.items():
            if councilman[contact_type]:
                p.add_contact_detail(type=type_,
                                     value=councilman[contact_type],
                                     note=_note)

        if councilman["E-mail"]:
            p.add_contact_detail(type="email",
                                 value=councilman['E-mail']['label'],
                                 note='E-mail')

        if councilman['Website']:
            p.add_link(councilman['Website']['url'])
        p.add_source(councilman['Person Name']['url'], note='web')

        for committee, _, _ in committees:
            committee_name = committee['Legislative Body']['label']
            if committee_name and committee_name not in non_committees:
                # Create each committee once and reuse it for later members.
                o = committee_d.get(committee_name)
                if o is None:
                    o = Organization(committee_name,
                                     classification='committee',
                                     parent_id={'name': 'Chicago City Council'})
                    o.add_source(committee['Legislative Body']['url'],
                                 note='web')
                    committee_d[committee_name] = o
                o.add_member(p, role=committee["Title"])

        yield p

    for name, term in FORMER_ALDERMEN.items():
        p = Person(name=name,
                   primary_org="legislature",
                   start_date=term['term'][0],
                   end_date=term['term'][1],
                   district="Ward {}".format(term['ward']),
                   role='Alderman')
        if name == 'Chandler, Michael D.':
            # This one person gets an additional, hard-coded term on top of
            # the one taken from FORMER_ALDERMEN.
            p.add_term('Alderman',
                       "legislature",
                       district="Ward {}".format(term['ward']),
                       start_date=datetime.date(2011, 5, 16),
                       end_date=datetime.date(2015, 5, 18))
        p.add_source(term['source'], note='web')
        yield p

    for o in committee_d.values():
        yield o

    for committee_name in FORMER_COMMITTEES:
        o = Organization(committee_name,
                         classification='committee',
                         parent_id={'name': 'Chicago City Council'})
        o.add_source("https://chicago.legistar.com/Departments.aspx",
                     note='web')
        yield o

    for joint_committee in JOINT_COMMITTEES:
        o = Organization(joint_committee,
                         classification='committee',
                         parent_id={'name': 'Chicago City Council'})
        o.add_source("https://chicago.legistar.com/Departments.aspx",
                     note='web')
        yield o
示例3: scrape
# 需要导入模块: from pupa.scrape import Person [as 别名]
# 或者: from pupa.scrape.Person import add_term [as 别名]
def scrape(self):
    """Build a ``Person`` for every name holding a City Council office record.

    Two sources are combined by (stripped) name:

    * rows from a ``LegistarPersonScraper`` pointed at the NYC member list,
      read here for district, party, photo, contact details and web site;
    * the office records returned by ``self.body_offices`` for the body
      named 'City Council'; each record becomes one term on the person.

    Names that have office records but no web row get an empty stand-in
    whose every lookup returns ``None``.

    The remainder of this method is omitted in the visible source.
    """
    web_scraper = LegistarPersonScraper(requests_per_minute=self.requests_per_minute)
    web_scraper.MEMBERLIST = 'http://legistar.council.nyc.gov/DepartmentDetail.aspx?ID=6897&GUID=CDC6E691-8A8C-4F25-97CB-86F31EDAB081&Mode=MainBody'

    if self.cache_storage:
        web_scraper.cache_storage = self.cache_storage

    if self.requests_per_minute == 0:
        web_scraper.cache_write_only = False

    web_info = {}
    for member, _ in web_scraper.councilMembers():
        name = member['Person Name']['label'].strip()
        web_info[name] = member

    # Unpacking into a 1-tuple fails unless exactly one body matches.
    city_council, = [body for body in self.bodies()
                     if body['BodyName'] == 'City Council']

    terms = collections.defaultdict(list)

    public_advocates = {  # Match casing to Bill De Blasio as council member
        'The Public Advocate (Mr. de Blasio)': 'Bill De Blasio',
        'The Public Advocate (Ms. James)': 'Letitia James',
    }

    for office in self.body_offices(city_council):
        name = office['OfficeRecordFullName']
        name = public_advocates.get(name, name).strip()
        terms[name].append(office)

        # Add past members (and public advocates)
        if name not in web_info:
            web_info[name] = collections.defaultdict(lambda: None)

    # Check that we have everyone we expect, formatted consistently, in
    # both information arrays. For instance, this will fail if we forget to
    # strip trailing spaces from names on one side or the other (which has
    # the effect of omitting information, such as post, from the scrape).
    assert set(web_info.keys()) == set(terms.keys())

    # Web-row key -> (contact detail type, note). Loop-invariant, so it is
    # built once instead of once per member.
    contact_types = {
        "City Hall Office": ("address", "City Hall Office"),
        "City Hall Phone": ("voice", "City Hall Phone"),
        "Ward Office Phone": ("voice", "Ward Office Phone"),
        "Ward Office Address": ("address", "Ward Office Address"),
        "Fax": ("fax", "Fax"),
    }

    members = {}

    for member, offices in terms.items():
        p = Person(member)
        web = web_info[member]

        # The district comes from the web row, not from the office record,
        # so it is the same for every term of this person.
        district = web.get('District', '').replace(' 0', ' ')

        for term in offices:
            if term['OfficeRecordTitle'] == 'Public Advocate':
                role = 'Non-Voting Council Member'
            else:
                role = 'Council Member'

            p.add_term(role,
                       'legislature',
                       district=district,
                       start_date=self.toDate(term['OfficeRecordStartDate']),
                       end_date=self.toDate(term['OfficeRecordEndDate']))

        party = web.get('Political Party')
        if party == 'Democrat':
            party = 'Democratic'

        if party:
            p.add_party(party)

        if web.get('Photo'):
            p.image = web['Photo']

        for contact_type, (type_, _note) in contact_types.items():
            # Fixed: the original called ``web(contact_type)``, which tries
            # to invoke the mapping and raises TypeError as soon as any
            # contact value is present.
            value = web.get(contact_type)
            if value and value != 'N/A':
                p.add_contact_detail(type=type_,
                                     value=value,
                                     note=_note)

        if web.get('E-mail'):
            p.add_contact_detail(type="email",
                                 value=web['E-mail']['url'],
                                 note='E-mail')

        if web.get('Web site'):
            p.add_link(web['Web site']['url'], note='web site')

    # ......... part of the code is omitted here .........
示例4: scrape
# 需要导入模块: from pupa.scrape import Person [as 别名]
# 或者: from pupa.scrape.Person import add_term [as 别名]
def scrape(self):
    """Yield one ``Person`` per council-member URL, with merged terms.

    Rows from ``self.councilMembers()`` are grouped by the URL under
    'Person Name'; rows without a URL are ignored. For each group the
    (start, end, district) spans are sorted and back-to-back spans in the
    same district (next start exactly one day after the previous end) are
    merged, and each merged span becomes one 'Council Member' term.
    Personal details are taken from the last row of the group, and the
    person is added to every committee listed for the group.

    The remainder of this method is omitted in the visible source.
    """
    noncommittees = {'Committee of the Whole'}
    committee_d = {}

    # url -> ([rows for this person], committees of the first row seen)
    people_d = {}

    for councilman, committees in self.councilMembers():
        if 'url' in councilman['Person Name']:
            councilman_url = councilman['Person Name']['url']
            if councilman_url in people_d:
                people_d[councilman_url][0].append(councilman)
            else:
                people_d[councilman_url] = [councilman], committees

    for person_entries, committees in people_d.values():
        councilman = person_entries[-1]

        p = Person(councilman['Person Name']['label'])
        if p.name == 'Letitia James':
            p.name = 'Letitia Ms. James'
            p.add_name('Letitia James')

        spans = [(self.toTime(entry['Start Date']).date(),
                  self.toTime(entry['End Date']).date(),
                  entry['District'])
                 for entry in person_entries]

        merged_spans = []
        last_end_date = None
        last_district = None
        for start_date, end_date, district in sorted(spans):
            if last_end_date is None:
                span = [start_date, end_date, district]
            elif (start_date - last_end_date) == datetime.timedelta(1) and district == last_district:
                # Contiguous continuation in the same district: extend.
                span[1] = end_date
            else:
                merged_spans.append(span)
                span = [start_date, end_date, district]
            last_end_date = end_date
            last_district = district
        # person_entries always holds at least one row, so `span` is bound.
        merged_spans.append(span)

        # Every term is filed under the district of the latest row, as in
        # the original, which overwrote the span's own district inside the
        # loop.
        # NOTE(review): the per-span district is therefore only used for
        # merging -- confirm this is intended.
        district = councilman['District'].replace(' 0', ' ')

        for start_date, end_date, _span_district in merged_spans:
            # NOTE(review): 2017-12-31 is treated as "no end date";
            # presumably the end of the then-current term -- confirm.
            if end_date == datetime.date(2017, 12, 31):
                end_date = ''
            else:
                end_date = end_date.isoformat()
            # The leftover debug print of the span dates was removed here.
            p.add_term('Council Member', 'legislature',
                       district=district,
                       start_date=start_date.isoformat(),
                       end_date=end_date)

        party = councilman['Political Party']
        if party == 'Democrat':
            party = 'Democratic'

        if party:
            p.add_party(party)

        if councilman['Photo']:
            p.image = councilman['Photo']

        if councilman["E-mail"]:
            p.add_contact_detail(type="email",
                                 value=councilman['E-mail']['url'],
                                 note='E-mail')

        if councilman['Web site']:
            p.add_link(councilman['Web site']['url'], note='web site')

        p.extras = {'Notes': councilman['Notes']}

        p.add_source(councilman['Person Name']['url'], note='web')

        for committee, _, _ in committees:
            committee_name = committee['Department Name']['label']
            if committee_name not in noncommittees and 'committee' in committee_name.lower():
                # Create each committee once and reuse it for later members.
                o = committee_d.get(committee_name)
                if o is None:
                    parent_id = PARENT_ORGS.get(committee_name,
                                                'New York City Council')
                    o = Organization(committee_name,
                                     classification='committee',
                                     parent_id={'name': parent_id})
                    o.add_source(committee['Department Name']['url'])
                    committee_d[committee_name] = o

                membership = o.add_member(p, role=committee["Title"])
                membership.start_date = self.mdY2Ymd(committee["Start Date"])

        yield p

    # ......... part of the code is omitted here .........
示例5: get_organizations
# 需要导入模块: from pupa.scrape import Person [as 别名]
# 或者: from pupa.scrape.Person import add_term [as 别名]
def get_organizations(self):
    """Yield Chicago's organizations and its hard-coded executive officials.

    Yields, in order:

    1. the 'Chicago City Council' legislature with an 'Alderman' post for
       each of wards 1 through 50;
    2. the 'City of Chicago' executive with 'Mayor' and 'City Clerk' posts;
    3. one ``Person`` per entry in the table below, each with a single
       'executive' term and the Legistar people page as its source.
    """
    council = Organization(name="Chicago City Council", classification="legislature")
    for ward_number in range(1, 51):
        council.add_post(
            "Ward {}".format(ward_number),
            "Alderman",
            division_id='ocd-division/country:us/state:il/place:chicago/ward:{}'.format(ward_number))
    yield council

    city_division = 'ocd-division/country:us/state:il/place:chicago'
    city = Organization('City of Chicago', classification='executive')
    for office in ('Mayor', 'City Clerk'):
        # Post label and role are the same string for both offices.
        city.add_post(office, office, division_id=city_division)
    yield city

    # (name, role, start date, end date); an end date of None means the
    # term is added without an end_date argument.
    officials = (
        ("Daley, Richard M.", 'Mayor',
         datetime.date(1989, 4, 24), datetime.date(2011, 5, 16)),
        ("Emanuel, Rahm", 'Mayor',
         datetime.date(2011, 5, 16), None),
        ('Mendoza, Susana A.', 'City Clerk',
         datetime.date(2011, 5, 16), datetime.date(2016, 12, 4)),
        ('Del Valle, Miguel', 'City Clerk',
         datetime.date(2006, 12, 1), datetime.date(2011, 5, 16)),
        ('Valencia, Anna M.', 'City Clerk',
         datetime.date(2017, 1, 25), datetime.date(2019, 5, 20)),
    )

    for name, role, start, end in officials:
        term_kwargs = {'start_date': start, 'appointment': True}
        if end is not None:
            term_kwargs['end_date'] = end

        official = Person(name=name)
        official.add_term(role, 'executive', **term_kwargs)
        official.add_source('https://chicago.legistar.com/People.aspx')
        yield official