@@ -420,7 +420,7 @@ def get_rich_pull_reviews(self, comments, eitem):
420
420
# Copy data from the raw comment
421
421
ecomment ['body' ] = comment ['body' ][:self .KEYWORD_MAX_LENGTH ]
422
422
ecomment ['body_analyzed' ] = comment ['body' ]
423
- ecomment ['url' ] = comment ['html_url' ]
423
+ # ecomment['url'] = comment['html_url']
424
424
425
425
# extract reactions and add it to enriched item
426
426
ecomment .update (self .__get_reactions (comment ))
@@ -524,6 +524,11 @@ def __get_rich_pull(self, item):
524
524
self .copy_raw_fields (self .RAW_FIELDS_COPY , item , rich_pr )
525
525
# The real data
526
526
pull_request = item ['data' ]
527
+
528
+ if pull_request ['closed_at' ] == '' :
529
+ pull_request ['closed_at' ] = None
530
+ if pull_request ['merged_at' ] == '' :
531
+ pull_request ['merged_at' ] = None
527
532
528
533
rich_pr ['time_to_close_days' ] = \
529
534
get_time_diff_days (pull_request ['created_at' ], pull_request ['closed_at' ])
@@ -541,26 +546,26 @@ def __get_rich_pull(self, item):
541
546
rich_pr ['user_name' ] = user ['name' ]
542
547
rich_pr ['author_name' ] = user ['name' ]
543
548
rich_pr ['user_email' ] = user .get ('email' , None )
544
- rich_pr ["user_domain" ] = self .get_email_domain (user ['email' ]) if user [ 'email' ] else None
545
- rich_pr ['user_org' ] = user [ 'company' ]
546
- # rich_pr['user_location'] = user[ 'location']
549
+ rich_pr ["user_domain" ] = self .get_email_domain (user ['email' ]) if user . get ( 'email' , None ) else None
550
+ rich_pr ['user_org' ] = user . get ( 'company' , None )
551
+ rich_pr ['user_location' ] = user . get ( 'location' , None )
547
552
rich_pr ['user_geolocation' ] = None
548
553
else :
549
554
rich_pr ['user_name' ] = None
555
+ rich_pr ['user_email' ] = None
550
556
rich_pr ["user_domain" ] = None
551
557
rich_pr ['user_org' ] = None
552
558
rich_pr ['user_location' ] = None
553
559
rich_pr ['user_geolocation' ] = None
554
560
rich_pr ['author_name' ] = None
555
- rich_pr ['user_email' ] = None
556
561
557
562
merged_by = pull_request .get ('merged_by_data' , None )
558
563
if merged_by and merged_by != USER_NOT_AVAILABLE :
559
564
rich_pr ['merge_author_login' ] = merged_by ['login' ]
560
565
rich_pr ['merge_author_name' ] = merged_by ['name' ]
561
- rich_pr ["merge_author_domain" ] = self .get_email_domain (merged_by ['email' ]) if merged_by [ 'email' ] else None
562
- rich_pr ['merge_author_org' ] = merged_by [ 'company' ]
563
- # rich_pr['merge_author_location'] = merged_by[ 'location']
566
+ rich_pr ["merge_author_domain" ] = self .get_email_domain (merged_by ['email' ]) if merged_by . get ( 'email' , None ) else None
567
+ rich_pr ['merge_author_org' ] = merged_by . get ( 'company' , None )
568
+ rich_pr ['merge_author_location' ] = merged_by . get ( 'location' , None )
564
569
rich_pr ['merge_author_geolocation' ] = None
565
570
else :
566
571
rich_pr ['merge_author_name' ] = None
@@ -635,12 +640,15 @@ def __get_rich_issue(self, item):
635
640
self .copy_raw_fields (self .RAW_FIELDS_COPY , item , rich_issue )
636
641
# The real data
637
642
issue = item ['data' ]
643
+
644
+ if issue ['finished_at' ] == '' :
645
+ issue ['finished_at' ] = None
638
646
639
647
rich_issue ['time_to_close_days' ] = \
640
648
get_time_diff_days (issue ['created_at' ], issue ['finished_at' ])
641
649
642
- #issue have four status: open,progressing, closed, rejected .
643
- if issue ['state' ] == 'open' or issue [ 'state' ] == 'progressing' :
650
+ # Issues have two statuses: open and closed.
651
+ if issue ['state' ] == 'open' :
644
652
rich_issue ['time_open_days' ] = \
645
653
get_time_diff_days (issue ['created_at' ], datetime_utcnow ().replace (tzinfo = None ))
646
654
else :
@@ -653,26 +661,26 @@ def __get_rich_issue(self, item):
653
661
rich_issue ['user_name' ] = user ['name' ]
654
662
rich_issue ['author_name' ] = user ['name' ]
655
663
rich_issue ['user_email' ] = user .get ('email' , None )
656
- rich_issue ["user_domain" ] = self .get_email_domain (user ['email' ]) if user [ 'email' ] else None
657
- rich_issue ['user_org' ] = user [ 'company' ]
658
- # rich_issue['user_location'] = user[ 'location']
664
+ rich_issue ["user_domain" ] = self .get_email_domain (user ['email' ]) if user . get ( 'email' , None ) else None
665
+ rich_issue ['user_org' ] = user . get ( 'company' , None )
666
+ rich_issue ['user_location' ] = user . get ( 'location' , None )
659
667
rich_issue ['user_geolocation' ] = None
660
668
else :
661
669
rich_issue ['user_name' ] = None
670
+ rich_issue ['user_email' ] = None
662
671
rich_issue ["user_domain" ] = None
663
672
rich_issue ['user_org' ] = None
664
673
rich_issue ['user_location' ] = None
665
674
rich_issue ['user_geolocation' ] = None
666
675
rich_issue ['author_name' ] = None
667
- rich_issue ['user_email' ] = None
668
676
669
677
assignee = issue .get ('assignee_data' , None )
670
678
if assignee and assignee != USER_NOT_AVAILABLE :
671
679
rich_issue ['assignee_login' ] = assignee ['login' ]
672
680
rich_issue ['assignee_name' ] = assignee ['name' ]
673
- rich_issue ["assignee_domain" ] = self .get_email_domain (assignee ['email' ]) if assignee [ 'email' ] else None
674
- rich_issue ['assignee_org' ] = assignee [ 'company' ]
675
- # rich_issue['assignee_location'] = assignee[ 'location']
681
+ rich_issue ["assignee_domain" ] = self .get_email_domain (assignee ['email' ]) if assignee . get ( 'email' , None ) else None
682
+ rich_issue ['assignee_org' ] = assignee . get ( 'company' , None )
683
+ rich_issue ['assignee_location' ] = assignee . get ( 'location' , None )
676
684
rich_issue ['assignee_geolocation' ] = None
677
685
else :
678
686
rich_issue ['assignee_name' ] = None
@@ -703,9 +711,7 @@ def __get_rich_issue(self, item):
703
711
rich_issue ['issue_labels' ] = labels
704
712
705
713
rich_issue ['item_type' ] = ISSUE_TYPE
706
- rich_issue ['issue_pull_request' ] = True
707
- if 'head' not in issue .keys () and 'pull_request' not in issue .keys ():
708
- rich_issue ['issue_pull_request' ] = False
714
+ rich_issue ['issue_pull_request' ] = False
709
715
710
716
rich_issue ['gitcode_repo' ] = rich_issue ['repository' ].replace (GITCODE , '' )
711
717
rich_issue ['gitcode_repo' ] = re .sub ('.git$' , '' , rich_issue ['gitcode_repo' ])
0 commit comments