in osci/preprocess/match_company/process.py [0:0]
def process_github_daily_push_events(day: datetime.datetime):
    """Split one day's push-event commits by company and save each group to staging.

    Loads the push-event commits for ``day`` from the data lake landing area,
    passes them to ``process_push_commits`` together with the relevant schema
    field names, and saves every ``(company, commits)`` pair it produces through
    the staging area's ``save_raw_push_events_commits``.

    Nothing is processed or saved when the landing area returns ``None`` or an
    object whose ``empty`` attribute is truthy.

    :param day: day whose push-event commits are loaded and saved
    """
    daily_commits = DataLake().landing.get_daily_push_events_commits(date=day)

    # Guard clause: no data for this day means there is nothing to split or save.
    if daily_commits is None or daily_commits.empty:
        return

    # Field names are resolved in the same order the original call evaluated them.
    author_email_field = DataLake().landing.schemas.push_commits.author_email
    company_name_field = DataLake().staging.schemas.push_commits.company
    created_at_field = DataLake().landing.schemas.push_commits.event_created_at

    commits_by_company = process_push_commits(
        daily_commits,
        email_field=author_email_field,
        company_field=company_name_field,
        datetime_field=created_at_field,
    )

    for company, company_commits in commits_by_company:
        log.debug(f'Save company {company}')
        DataLake().staging.save_raw_push_events_commits(
            push_event_commits=company_commits,
            date=day,
            company_name=company,
        )