File tree 1 file changed +10
-2
lines changed
sb125_analyses/sb125_fund_split_analysis
1 file changed +10
-2
lines changed Original file line number Diff line number Diff line change @@ -619,11 +619,12 @@ def fund_request_melt(df):
619
619
620
620
621
621
if __name__ == "__main__" :
622
-
622
+ print ( "running fund_request_checker_v3()" )
623
623
good_list , review_list = fund_request_checker_v3 (file_list )
624
624
625
625
cleaned_fund_request = cleaner_loop (good_list )
626
626
627
+ print ("running individual cleaning scripts" )
627
628
#these functions clean specific values (DFs) in the cleaned_fund_request dict
628
629
clean_humboldt ()
629
630
@@ -658,13 +659,20 @@ def fund_request_melt(df):
658
659
659
660
# concat all values (DFs) from cleaned_fund_request dict to be a single DF and concat the rest of the DFs
660
661
662
+ print ("running concat_everything" )
661
663
all_fund_requests = concat_everything ()
662
664
665
+ print ("saving data as .parquet and .csv to GCS" )
663
666
# SAVING TO GCS!
664
667
all_fund_requests .to_parquet (f"{ GCS_PATH } all_fund_requests_concat.parquet" )
665
668
666
669
#melt all fund requests
667
670
all_melt = fund_request_melt (all_fund_requests )
668
671
669
672
#saving to gcs
670
- all_melt .to_parquet (f"{ GCS_PATH } all_fund_requests_melt.parquet" )
673
+ all_melt .to_parquet (f"{ GCS_PATH } all_fund_requests_melt.parquet" )
674
+
675
+ # saving all_melt to csv
676
+ all_melt .to_csv (f"{ GCS_PATH } all_fund_requests_melt.csv" , index = False )
677
+
678
+ print ("end of script" )
You can’t perform that action at this time.
0 commit comments