import pandas as pd
# Load the contract sub-award export and list its column names.
df = pd.read_csv('/content/Dataset_Contract_Sub-Awards.csv')
cols = list(df.columns)
cols
['prime_award_unique_key', 'prime_award_piid', 'prime_award_parent_piid', 'prime_award_amount', 'prime_award_disaster_emergency_fund_codes', 'prime_award_outlayed_amount_funded_by_COVID-19_supplementals', 'prime_award_obligated_amount_funded_by_COVID-19_supplementals', 'prime_award_base_action_date', 'prime_award_base_action_date_fiscal_year', 'prime_award_latest_action_date', 'prime_award_latest_action_date_fiscal_year', 'prime_award_period_of_performance_start_date', 'prime_award_period_of_performance_current_end_date', 'prime_award_period_of_performance_potential_end_date', 'prime_award_awarding_agency_code', 'prime_award_awarding_agency_name', 'prime_award_awarding_sub_agency_code', 'prime_award_awarding_sub_agency_name', 'prime_award_awarding_office_code', 'prime_award_awarding_office_name', 'prime_award_funding_agency_code', 'prime_award_funding_agency_name', 'prime_award_funding_sub_agency_code', 'prime_award_funding_sub_agency_name', 'prime_award_funding_office_code', 'prime_award_funding_office_name', 'prime_award_treasury_accounts_funding_this_award', 'prime_award_federal_accounts_funding_this_award', 'prime_award_object_classes_funding_this_award', 'prime_award_program_activities_funding_this_award', 'prime_awardee_duns', 'prime_awardee_uei', 'prime_awardee_name', 'prime_awardee_dba_name', 'prime_awardee_parent_duns', 'prime_awardee_parent_uei', 'prime_awardee_parent_name', 'prime_awardee_country_code', 'prime_awardee_country_name', 'prime_awardee_address_line_1', 'prime_awardee_city_name', 'prime_awardee_county_name', 'prime_awardee_state_code', 'prime_awardee_state_name', 'prime_awardee_zip_code', 'prime_awardee_congressional_district', 'prime_awardee_foreign_postal_code', 'prime_awardee_business_types', 'prime_award_primary_place_of_performance_city_name', 'prime_award_primary_place_of_performance_state_code', 'prime_award_primary_place_of_performance_state_name', 'prime_award_primary_place_of_performance_address_zip_code', 
'prime_award_primary_place_of_performance_congressional_district', 'prime_award_primary_place_of_performance_country_code', 'prime_award_primary_place_of_performance_country_name', 'prime_award_description', 'prime_award_project_title', 'prime_award_naics_code', 'prime_award_naics_description', 'prime_award_national_interest_action_code', 'prime_award_national_interest_action', 'subaward_type', 'subaward_fsrs_report_id', 'subaward_fsrs_report_year', 'subaward_fsrs_report_month', 'subaward_number', 'subaward_amount', 'subaward_action_date', 'subaward_action_date_fiscal_year', 'subawardee_duns', 'subawardee_name', 'subawardee_dba_name', 'subawardee_parent_duns', 'subawardee_parent_name', 'subawardee_country_code', 'subawardee_country_name', 'subawardee_address_line_1', 'subawardee_city_name', 'subawardee_state_code', 'subawardee_state_name', 'subawardee_zip_code', 'subawardee_congressional_district', 'subawardee_foreign_postal_code', 'subawardee_business_types', 'subaward_primary_place_of_performance_address_line_1', 'subaward_primary_place_of_performance_city_name', 'subaward_primary_place_of_performance_state_code', 'subaward_primary_place_of_performance_state_name', 'subaward_primary_place_of_performance_address_zip_code', 'subaward_primary_place_of_performance_congressional_district', 'subaward_primary_place_of_performance_country_code', 'subaward_primary_place_of_performance_country_name', 'subaward_description', 'subawardee_highly_compensated_officer_1_name', 'subawardee_highly_compensated_officer_1_amount', 'subawardee_highly_compensated_officer_2_name', 'subawardee_highly_compensated_officer_2_amount', 'subawardee_highly_compensated_officer_3_name', 'subawardee_highly_compensated_officer_3_amount', 'subawardee_highly_compensated_officer_4_name', 'subawardee_highly_compensated_officer_4_amount', 'subawardee_highly_compensated_officer_5_name', 'subawardee_highly_compensated_officer_5_amount', 'usaspending_permalink', 'subaward_fsrs_report_last_modified_date']
# Preview the first five rows of the raw data.
df.head()
prime_award_unique_key | prime_award_piid | prime_award_parent_piid | prime_award_amount | prime_award_disaster_emergency_fund_codes | prime_award_outlayed_amount_funded_by_COVID-19_supplementals | prime_award_obligated_amount_funded_by_COVID-19_supplementals | prime_award_base_action_date | prime_award_base_action_date_fiscal_year | prime_award_latest_action_date | ... | subawardee_highly_compensated_officer_2_name | subawardee_highly_compensated_officer_2_amount | subawardee_highly_compensated_officer_3_name | subawardee_highly_compensated_officer_3_amount | subawardee_highly_compensated_officer_4_name | subawardee_highly_compensated_officer_4_amount | subawardee_highly_compensated_officer_5_name | subawardee_highly_compensated_officer_5_amount | usaspending_permalink | subaward_fsrs_report_last_modified_date | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2021-11-16 13:35:00+00 |
1 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2020-11-17 10:56:12+00 |
2 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2018-07-09 19:26:13+00 |
3 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2018-02-15 14:22:36+00 |
4 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2018-03-26 19:23:55+00 |
5 rows × 105 columns
# Remove rows that are exact duplicates across all columns, then preview the result.
df=df.drop_duplicates()
df.head()
prime_award_unique_key | prime_award_piid | prime_award_parent_piid | prime_award_amount | prime_award_disaster_emergency_fund_codes | prime_award_outlayed_amount_funded_by_COVID-19_supplementals | prime_award_obligated_amount_funded_by_COVID-19_supplementals | prime_award_base_action_date | prime_award_base_action_date_fiscal_year | prime_award_latest_action_date | ... | subawardee_highly_compensated_officer_2_name | subawardee_highly_compensated_officer_2_amount | subawardee_highly_compensated_officer_3_name | subawardee_highly_compensated_officer_3_amount | subawardee_highly_compensated_officer_4_name | subawardee_highly_compensated_officer_4_amount | subawardee_highly_compensated_officer_5_name | subawardee_highly_compensated_officer_5_amount | usaspending_permalink | subaward_fsrs_report_last_modified_date | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2021-11-16 13:35:00+00 |
1 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2020-11-17 10:56:12+00 |
2 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2018-07-09 19:26:13+00 |
3 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2018-02-15 14:22:36+00 |
4 | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | NaN | 174746702.0 | NaN | NaN | NaN | 2016-10-31 | 2017 | 2021-09-15 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2018-03-26 19:23:55+00 |
5 rows × 105 columns
def describe_nan(df):
    """Summarize missing values per column of *df*.

    Args:
        df: The DataFrame to inspect.

    Returns:
        A DataFrame with one row per column of *df* (in column order) and
        three columns: ``column`` (the column label), ``nan_counts`` (number
        of missing cells) and ``nan_rate`` (``nan_counts`` divided by the
        number of rows). For a frame with zero rows ``nan_rate`` is 0.0
        rather than raising ``ZeroDivisionError``.
    """
    # One vectorized pass instead of filtering the whole frame twice per column.
    nan_counts = df.isna().sum()
    n_rows = len(df)
    # With no rows every count is 0, so the rate is defined as 0.0.
    nan_rate = nan_counts / n_rows if n_rows else nan_counts.astype(float)
    return pd.DataFrame({
        'column': list(df.columns),
        'nan_counts': nan_counts.to_numpy(),
        'nan_rate': nan_rate.to_numpy(),
    })
# Build the per-column missing-value summary and display it.
missing_value_count= describe_nan(df)
missing_value_count
column | nan_counts | nan_rate | |
---|---|---|---|
0 | prime_award_unique_key | 0 | 0.000000 |
1 | prime_award_piid | 0 | 0.000000 |
2 | prime_award_parent_piid | 347 | 1.000000 |
3 | prime_award_amount | 0 | 0.000000 |
4 | prime_award_disaster_emergency_fund_codes | 329 | 0.948127 |
... | ... | ... | ... |
100 | subawardee_highly_compensated_officer_4_amount | 329 | 0.948127 |
101 | subawardee_highly_compensated_officer_5_name | 326 | 0.939481 |
102 | subawardee_highly_compensated_officer_5_amount | 329 | 0.948127 |
103 | usaspending_permalink | 0 | 0.000000 |
104 | subaward_fsrs_report_last_modified_date | 0 | 0.000000 |
105 rows × 3 columns
### Removing columns with more than 90% missing data
# Names of the columns whose missing-value rate is above 90%.
major_data_missing_cols = missing_value_count.loc[
    missing_value_count['nan_rate'] > 0.9, 'column'
].tolist()
major_data_missing_cols
['prime_award_parent_piid', 'prime_award_disaster_emergency_fund_codes', 'prime_award_outlayed_amount_funded_by_COVID-19_supplementals', 'prime_award_obligated_amount_funded_by_COVID-19_supplementals', 'prime_awardee_foreign_postal_code', 'subawardee_foreign_postal_code', 'subaward_primary_place_of_performance_address_line_1', 'subawardee_highly_compensated_officer_1_name', 'subawardee_highly_compensated_officer_1_amount', 'subawardee_highly_compensated_officer_2_name', 'subawardee_highly_compensated_officer_2_amount', 'subawardee_highly_compensated_officer_3_name', 'subawardee_highly_compensated_officer_3_amount', 'subawardee_highly_compensated_officer_4_name', 'subawardee_highly_compensated_officer_4_amount', 'subawardee_highly_compensated_officer_5_name', 'subawardee_highly_compensated_officer_5_amount']
# Drop the mostly-empty columns and refresh the list of remaining column names.
df = df.drop(columns=major_data_missing_cols)
cols = list(df.columns)
cols
['prime_award_unique_key', 'prime_award_piid', 'prime_award_amount', 'prime_award_base_action_date', 'prime_award_base_action_date_fiscal_year', 'prime_award_latest_action_date', 'prime_award_latest_action_date_fiscal_year', 'prime_award_period_of_performance_start_date', 'prime_award_period_of_performance_current_end_date', 'prime_award_period_of_performance_potential_end_date', 'prime_award_awarding_agency_code', 'prime_award_awarding_agency_name', 'prime_award_awarding_sub_agency_code', 'prime_award_awarding_sub_agency_name', 'prime_award_awarding_office_code', 'prime_award_awarding_office_name', 'prime_award_funding_agency_code', 'prime_award_funding_agency_name', 'prime_award_funding_sub_agency_code', 'prime_award_funding_sub_agency_name', 'prime_award_funding_office_code', 'prime_award_funding_office_name', 'prime_award_treasury_accounts_funding_this_award', 'prime_award_federal_accounts_funding_this_award', 'prime_award_object_classes_funding_this_award', 'prime_award_program_activities_funding_this_award', 'prime_awardee_duns', 'prime_awardee_uei', 'prime_awardee_name', 'prime_awardee_dba_name', 'prime_awardee_parent_duns', 'prime_awardee_parent_uei', 'prime_awardee_parent_name', 'prime_awardee_country_code', 'prime_awardee_country_name', 'prime_awardee_address_line_1', 'prime_awardee_city_name', 'prime_awardee_county_name', 'prime_awardee_state_code', 'prime_awardee_state_name', 'prime_awardee_zip_code', 'prime_awardee_congressional_district', 'prime_awardee_business_types', 'prime_award_primary_place_of_performance_city_name', 'prime_award_primary_place_of_performance_state_code', 'prime_award_primary_place_of_performance_state_name', 'prime_award_primary_place_of_performance_address_zip_code', 'prime_award_primary_place_of_performance_congressional_district', 'prime_award_primary_place_of_performance_country_code', 'prime_award_primary_place_of_performance_country_name', 'prime_award_description', 'prime_award_project_title', 'prime_award_naics_code', 
'prime_award_naics_description', 'prime_award_national_interest_action_code', 'prime_award_national_interest_action', 'subaward_type', 'subaward_fsrs_report_id', 'subaward_fsrs_report_year', 'subaward_fsrs_report_month', 'subaward_number', 'subaward_amount', 'subaward_action_date', 'subaward_action_date_fiscal_year', 'subawardee_duns', 'subawardee_name', 'subawardee_dba_name', 'subawardee_parent_duns', 'subawardee_parent_name', 'subawardee_country_code', 'subawardee_country_name', 'subawardee_address_line_1', 'subawardee_city_name', 'subawardee_state_code', 'subawardee_state_name', 'subawardee_zip_code', 'subawardee_congressional_district', 'subawardee_business_types', 'subaward_primary_place_of_performance_city_name', 'subaward_primary_place_of_performance_state_code', 'subaward_primary_place_of_performance_state_name', 'subaward_primary_place_of_performance_address_zip_code', 'subaward_primary_place_of_performance_congressional_district', 'subaward_primary_place_of_performance_country_code', 'subaward_primary_place_of_performance_country_name', 'subaward_description', 'usaspending_permalink', 'subaward_fsrs_report_last_modified_date']
# NOTE: this binds a second name to the same DataFrame object (no copy is made),
# so in-place changes made through either name are visible through both.
clean_df= df
# Number of rows per funding office.
clean_df['prime_award_funding_office_name'].value_counts()
DEF ADVANCED RESEARCH PROJECTS AGCY 257 AFRL RWP 54 AFRL RQH HIGH SPEED SYS DIV 29 AFRL RW 6 OFFICE OF NAVAL RESEARCH 1 Name: prime_award_funding_office_name, dtype: int64
# Count rows per prime-award project title.
# The output columns are named explicitly: a bare `reset_index()` yields
# ['index', <series name>] on pandas < 2.0 but [<column name>, 'count'] on
# pandas >= 2.0, which would break lookups of `projects['index']` and
# `projects['prime_award_project_title']` as a numeric column.
projects = (
    clean_df['prime_award_project_title']
    .value_counts()
    .rename_axis('index')
    .reset_index(name='prime_award_project_title')
)
projects
index | prime_award_project_title | |
---|---|---|
0 | HYPERSONIC AIR BREAT | 207 |
1 | AMS: ADV PROGRAMS | 126 |
2 | AMS: ADV PROGRAMS; AMS:AAWS | 6 |
3 | AMS: ADV PROGRAMS/RMS: NBI | 5 |
4 | AMS:HYPERSONICS | 2 |
5 | AMS:AAWS | 1 |
# Convert the per-title counts into a percentage of all rows.
# The denominator is read from the frame instead of being hard-coded as 347,
# so the figures stay correct if the input data or the cleaning steps change.
projects['prime_award_project_title'] = (
    projects['prime_award_project_title'] / len(clean_df)
) * 100
projects
index | prime_award_project_title | |
---|---|---|
0 | HYPERSONIC AIR BREAT | 59.654179 |
1 | AMS: ADV PROGRAMS | 36.311239 |
2 | AMS: ADV PROGRAMS; AMS:AAWS | 1.729107 |
3 | AMS: ADV PROGRAMS/RMS: NBI | 1.440922 |
4 | AMS:HYPERSONICS | 0.576369 |
5 | AMS:AAWS | 0.288184 |
# Project titles, in the same order as the rows of `projects`.
projects['index'].tolist()
['HYPERSONIC AIR BREAT', 'AMS: ADV PROGRAMS', 'AMS: ADV PROGRAMS; AMS:AAWS', 'AMS: ADV PROGRAMS/RMS: NBI', 'AMS:HYPERSONICS', 'AMS:AAWS']
# Show the parent name and the name of the sub-awardee(s) on the 'AMS:AAWS' project.
print(clean_df.loc[clean_df['prime_award_project_title'] == 'AMS:AAWS', 'subawardee_parent_name'])
print(clean_df.loc[clean_df['prime_award_project_title'] == 'AMS:AAWS', 'subawardee_name'])
61 ORBITAL ATK, INC. Name: subawardee_parent_name, dtype: object 61 ALLIANT TECHSYSTEMS OPERATIONS LLC Name: subawardee_name, dtype: object
# Number of rows per NAICS description of the prime award.
clean_df['prime_award_naics_description'].value_counts()
RESEARCH AND DEVELOPMENT IN THE PHYSICAL, ENGINEERING, AND LIFE SCIENCES (EXCEPT BIOTECHNOLOGY) 347 Name: prime_award_naics_description, dtype: int64
We can see that every award falls into a single R&D category. This makes the finding all the more important: there is zero margin for losing such data to a cyberattack.
# Count rows per sub-awardee name.
# The output columns are named explicitly: a bare `reset_index()` yields
# ['index', <series name>] on pandas < 2.0 but [<column name>, 'count'] on
# pandas >= 2.0, which would break lookups of `sub['index']` and of
# `sub['subawardee_name']` as the count column.
# NOTE(review): names that differ only in punctuation or suffix (e.g.
# 'MORGAN ADVANCED CERAMICS, INC' vs 'MORGAN ADVANCED CERAMICS, INC.') are
# counted as separate sub-awardees.
sub = (
    clean_df['subawardee_name']
    .value_counts()
    .rename_axis('index')
    .reset_index(name='subawardee_name')
)
sub
index | subawardee_name | |
---|---|---|
0 | ALLIANT TECHSYSTEMS OPERATIONS LLC | 25 |
1 | DUCOMMUN LABARGE TECHNOLOGIES, INC. | 22 |
2 | PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY... | 16 |
3 | DYNETICS TECHNICAL SOLUTIONS, INC. | 13 |
4 | A. P. I. INCORPORATED | 12 |
... | ... | ... |
74 | CARLETON TECHNOLOGIES INC | 1 |
75 | MORGAN ADVANCED CERAMICS, INC. | 1 |
76 | GRAY'S ENGINEERING & CONSULTING, INC. | 1 |
77 | PORT ELECTRONICS CORP. | 1 |
78 | ROCKWELL COLLINS, INC. | 1 |
79 rows × 2 columns
# Sub-awardee names, in the same order as the rows of `sub`.
sub['index'].tolist()
['ALLIANT TECHSYSTEMS OPERATIONS LLC', 'DUCOMMUN LABARGE TECHNOLOGIES, INC.', 'PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC', 'DYNETICS TECHNICAL SOLUTIONS, INC.', 'A. P. I. INCORPORATED', 'STANLEY MACHINING & TOOL CORP.', 'TRI MODELS, INC.', 'UNI-CAST, INC.', 'MEASUREMENT SPECIALTIES, INC.', 'L3 TECHNOLOGIES, INC.', 'EAGLEPICHER TECHNOLOGIES, LLC', 'ALLCOMP INC.', 'MARVIN ENGINEERING CO., INC.', 'ENSIGN-BICKFORD AEROSPACE & DEFENSE COMPANY', 'MICRO CRAFT, INC.', 'KEYSIGHT TECHNOLOGIES, INC.', 'VENTURA AEROSPACE, INC.', 'INOVAR, INC.', 'PRAXIS RESOURCES INC.', 'PARKER-HANNIFIN CORPORATION', 'HI-TECH MACHINING & ENGINEERING, L.L.C.', 'TELETRONICS TECHNOLOGY CORPORATION', "JANSEN'S AIRCRAFT SYSTEMS CONTROLS, INC.", 'AZMARK AERO SYSTEMS, LLC', 'ORBITAL SCIENCES CORPORATION', 'RADIUS AEROSPACE, INC.', 'HERLEY INDUSTRIES, INC.', 'PCC STRUCTURALS, INC.', 'SPARTRONICS LOGAN, LLC', 'PORT ELECTRONICS CORPORATION', 'MORGAN ADVANCED CERAMICS, INC', 'ATK SPACE SYSTEMS INC.', 'AMRO FABRICATING CORPORATION', 'PARALLEL VENTURES, INC.', 'QUASONIX, LLC', 'BADGER METER, INC.', 'CONCURRENT TECHNOLOGIES CORPORATION', 'PROMAT INC', 'HONEYWELL INTERNATIONAL INC.', 'GLENAIR, INC.', 'KLUNE INDUSTRIES, INC.', 'PCB PIEZOTRONICS, INC.', 'SOUTHERN GEAR & MACHINE, INC.', 'KIRSH MANUFACTURING, INC.', 'AEROJET ROCKETDYNE, INC.', 'ADVANCED THERMAL BATTERIES INC.', 'DYTRAN INSTRUMENTS INC.', 'CAID INDUSTRIES, INC', 'SPACE VECTOR CORPORATION', 'CAMI RESEARCH, INC.', 'TEVET, LLC', 'CICOIL, LLC', 'DIVERSIFIED TECHNICAL SYSTEMS, INC.', 'BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS INTEGRATION INC.', 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.', 'EMOTEQ CORPORATION', 'DESIGNLINX HARDWARE SOLUTIONS, INC.', 'COBHAM MISSION SYSTEMS ORCHARD PARK INC.', 'ARCH GLOBAL PRECISION - HUNTINGDON VALLEY, LLC', 'NICOMATIC, L.P.', 'MICRO SYSTEMS, INC.', 'LABARGE ACQUISITION COMPANY, INC.', 'AEROSPEC, INC.', 'CORVID TECHNOLOGIES LLC', 'ORBITAL SCIENCES LLC', 'ADVANCED MATERIALS TECHNOLOGIES, 
LLC', 'COORSTEK, INC.', 'SHELLI INDUSTRIES LLC', "GRAY'S ENGINEERING & CONSULTING, LLC", 'UNI-CAST, LLC', 'TRIUMPH ENGINEERED SOLUTIONS, INC.', 'GLOBE MOTORS, INC.', 'DYNETICS, INC.', 'DESIGNLINX HARDWARE SOLUTIONS, LLC', 'CARLETON TECHNOLOGIES INC', 'MORGAN ADVANCED CERAMICS, INC.', "GRAY'S ENGINEERING & CONSULTING, INC.", 'PORT ELECTRONICS CORP.', 'ROCKWELL COLLINS, INC.']
# Row counts per sub-awardee, in the same order as the rows of `sub`.
sub['subawardee_name'].tolist()
[25, 22, 16, 13, 12, 11, 10, 8, 8, 8, 8, 7, 7, 7, 6, 6, 6, 6, 5, 5, 5, 5, 5, 5, 4, 4, 4, 4, 4, 4, 4, 4, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]
# Count rows per sub-awardee parent company and preview the most frequent ones.
# The output columns are named explicitly: a bare `reset_index()` yields
# ['index', <series name>] on pandas < 2.0 but [<column name>, 'count'] on
# pandas >= 2.0, which would break lookups of `imp_sub['index']` and of
# `imp_sub['subawardee_parent_name']` as the count column.
# NOTE(review): names that differ only by letter case (e.g.
# 'Ensign-Bickford Industries, Inc.' vs 'ENSIGN-BICKFORD INDUSTRIES, INC.')
# are counted as separate parents.
imp_sub = (
    df['subawardee_parent_name']
    .value_counts()
    .rename_axis('index')
    .reset_index(name='subawardee_parent_name')
)
imp_sub.head()
index | subawardee_parent_name | |
---|---|---|
0 | Ducommun Incorporated | 24 |
1 | NORTHROP GRUMMAN CORPORATION | 18 |
2 | ORBITAL ATK, INC. | 16 |
3 | Fortive Corporation | 16 |
4 | STANLEY MACHINING & TOOL CORP. | 11 |
# Parent company names, in the same order as the rows of `imp_sub`.
imp_sub['index'].tolist()
['Ducommun Incorporated', 'NORTHROP GRUMMAN CORPORATION', 'ORBITAL ATK, INC.', 'Fortive Corporation', 'STANLEY MACHINING & TOOL CORP.', 'LEIDOS HOLDINGS, INC.', 'TE Connectivity Ltd.', 'EAGLEPICHER TECHNOLOGIES, LLC', 'MARVIN ENGINEERING CO., INC.', 'BERKSHIRE HATHAWAY INC.', 'DYNETICS, INC.', 'L3HARRIS TECHNOLOGIES, INC.', 'KEYSIGHT TECHNOLOGIES, INC.', 'CURTISS-WRIGHT CORPORATION', 'PARKER-HANNIFIN CORPORATION', 'MORGAN ADVANCED MATERIALS PLC', 'Imaginetics Holdings LLC', 'ULTRA ELECTRONICS HOLDINGS PLC', 'Ensign-Bickford Industries, Inc.', 'Ems Holdco, Inc.', 'AMRO FABRICATING CORPORATION', 'GLENAIR, INC.', 'ASB AEROSPATIALE BATTERIES', 'HONEYWELL INTERNATIONAL INC.', 'ALLIED MOTION TECHNOLOGIES INC.', 'BADGER METER, INC.', 'Samuel, Son & Co., Limited', 'QUASONIX, LLC', 'Etex', 'ENSIGN-BICKFORD INDUSTRIES, INC.', 'AEROJET ROCKETDYNE HOLDINGS, INC.', 'CONCURRENT TECHNOLOGIES CORPORATION', 'MTS SYSTEMS CORPORATION', 'BAE SYSTEMS PLC', 'TEVET, LLC', 'KRATOS DEFENSE & SECURITY SOLUTIONS, INC.', 'Keystone Holdings Group, LLC', 'NICOMATIC', 'ARLINGTON CAPITAL PARTNERS IV, L.P.', 'L3 TECHNOLOGIES, INC.', 'CORVID TECHNOLOGIES LLC', 'The Jordan Company L P', 'Radius Aerospace, Inc.', 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.', 'DIVERSIFIED TECHNICAL SYSTEMS, INC.', 'VISHAY PRECISION GROUP, INC.', 'AMPHENOL CORPORATION', 'TRIUMPH GROUP, INC.', 'ELEMENT MATERIALS TECHNOLOGY GROUP LIMITED', 'CREATION TECHNOLOGIES INC', 'AI Convoy & Cy S.C.A.', 'AI CONVOY HOLDCO LIMITED', 'APPLIED TECHNICAL SERVICES, LLC', 'ROCKWELL COLLINS, INC.', 'Vectra Co.']
# Row counts per parent company, in the same order as the rows of `imp_sub`.
imp_sub['subawardee_parent_name'].tolist()
[24, 18, 16, 16, 11, 8, 8, 7, 7, 7, 6, 6, 6, 5, 5, 5, 5, 4, 4, 4, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]
# Number of rows per distinct (comma-separated) business-type string.
clean_df['subawardee_business_types'].value_counts()
For-Profit Organization,Manufacturer of Goods 140 For-Profit Organization,Limited Liability Company,Manufacturer of Goods 28 For-Profit Organization,S Corporation 25 For-Profit Organization 24 For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods 21 For-Profit Organization,Manufacturer of Goods,S Corporation 18 For-Profit Organization,Manufacturer of Goods,Woman-Owned Business 13 For-Profit Organization,S Corporation,Veteran Owned Business 12 For-Profit Organization,Limited Liability Company 11 Contracts and Grants,For-Profit Organization,Manufacturer of Goods 9 For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business 5 Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business 5 Contracts,For-Profit Organization,Manufacturer of Goods 4 Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business 4 For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm 4 For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm 3 Nonprofit Organization 3 For-Profit Organization,Foreign Owned and Located 2 For-Profit Organization,Limited Liability Company,SBA Certified Hub Zone Firm,Service Disabled Veteran Owned,Veteran Owned Business 2 For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business 2 For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods,Self-Certified Small Disadvantaged Business 2 For-Profit Organization,Veteran Owned Business 2 For-Profit Organization,Manufacturer of Goods,Service Disabled Veteran Owned,Veteran Owned Business 2 Contracts and Grants,For-Profit Organization,Limited Liability Company 1 
For-Profit Organization,Manufacturer of Goods,Veteran Owned Business 1 Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business 1 Contracts and Grants,For-Profit Organization,Limited Liability Company,Veteran Owned Business 1 For-Profit Organization,Limited Liability Company,Woman-Owned Business 1 Contracts,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Other than one of the preceding,S Corporation 1 Name: subawardee_business_types, dtype: int64
# Concatenate every row's business-type string into one space-separated blob.
# Missing values are dropped first: str.join raises TypeError on the float NaN
# that pandas uses for empty cells.
subawardee_biz_desc = ' '.join(clean_df['subawardee_business_types'].dropna())
subawardee_biz_desc
'For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods 
For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Limited Liability Company,Veteran Owned Business For-Profit Organization,S Corporation 
For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation Contracts and Grants,For-Profit Organization,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and 
Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned 
business,Native American Owned,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods Contracts,For-Profit 
Organization,Manufacturer of Goods,Minority-Owned business,Other than one of the preceding,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,Service Disabled Veteran Owned,Veteran Owned Business For-Profit Organization,Manufacturer of Goods,Service Disabled Veteran Owned,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Veteran Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods 
For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Veteran Owned Business For-Profit Organization,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization Contracts and Grants,For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer 
of Goods Contracts,For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation Nonprofit Organization For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Nonprofit Organization Nonprofit Organization For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,S Corporation Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company,SBA Certified Hub Zone Firm,Service Disabled Veteran Owned,Veteran Owned Business For-Profit Organization,Limited Liability Company,SBA Certified Hub Zone Firm,Service Disabled Veteran Owned,Veteran Owned Business 
For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located For-Profit Organization,Foreign Owned and Located For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit 
Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Limited Liability 
Company,Woman-Owned Business For-Profit Organization,Limited Liability Company,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods,Self-Certified Small Disadvantaged Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods,Self-Certified Small Disadvantaged Business'
# Display every sub-award description as a plain Python list (cell output).
clean_df['subaward_description'].to_list()
['Detonator&Initiator, Fuselage, Gen Structural Assys, Molded Rubber&O Ring, Non-complex Machined, NRE - Other, Seals, Tech/Eng Services, Wire Cable.', 'Detonator&Initiator, Fuselage, Gen Structural Assys, Molded Rubber&O Ring, Non-complex Machined, NRE - Other, Seals, Tech/Eng Services, Wire Cable.', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'NRE - Other.', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'Cost Plus Fixed Fee', 'NRE - Other.', 'Cost Plus Fixed Fee', 'Detonator&Initiator, NRE - Engineering, NRE - Other, NRE - Qualification, S&A Devices.', 'Detonator&Initiator, NRE - Engineering, NRE - Other, NRE - Qualification, S&A Devices.', 'Firm Fixed Price', 'NRE - Other.', 'NRE - Other.', 'Cost Plus Fixed Fee', 'Firm Fixed Price', 'FinsWings&Boattails, NRE - Other, Pyrotechnic Fuses, Rocket Motors.', 'FinsWings&Boattails, NRE - Other, Pyrotechnic Fuses, Rocket Motors.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Explosive Cut Device, NRE - Engineering, NRE - Other.', 'Explosive Cut Device, NRE - Engineering, NRE - Other.', 'Couplers, Gen Structural Assys, NRE - Other, Nuts.', 'Couplers, Gen Structural Assys, NRE - Other, Nuts.', 'Firm Fixed Price', 'EnvTestEq(Shock/etc), NRE - Engineering, Tech/Eng Services.', 'EnvTestEq(Shock/etc), NRE - Engineering, Tech/Eng Services.', 'Firm Fixed Price', 'Firm Fixed Price', 'Encoders, NRE - Other.', 'Encoders, NRE - Other.', 'Firm Fixed Price', 'Firm Fixed Price', 'Fuselage, Gen Structural Assys, NRE - Other.', 'Fuselage, Gen Structural Assys, NRE - Other.', 'Firm Fixed Price', 'Cost Plus Fixed Fee', 'Multi-Function Assys.', 'Multi-Function Assys.', 'Testing (Non-Prod).', 'Testing (Non-Prod).', 'Firm Fixed Price', 'NRE - Data Items, NRE - Engineering, NRE 
- Qualification, Pumps, Tech/Eng Services.', 'Firm Fixed Price', 'Firm Fixed Price', 'Gen Structural Assys, NRE - Other, Valves.', 'Gen Structural Assys, NRE - Other, Valves.', 'Cable Assemblies RF, CableAssy&HarnMulti, NRE - Other.', 'Cost Plus Fixed Fee', 'Time & Material', 'Cable Assemblies RF, CableAssy&HarnMulti, NRE - Other.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Alum Invest Casting, NRE - Engineering, NRE - Other.', 'Alum Invest Casting, NRE - Engineering, NRE - Other.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Time & Material', 'Tech/Eng Services.', 'Tech/Eng Services.', 'NRE - Data Items, NRE - Engineering, NRE - Qualification, Pumps, Tech/Eng Services.', 'NRE - Engineering, Titanium Invest Cast.', 'NRE - Engineering, Titanium Invest Cast.', 'Firm Fixed Price', 'Cost Plus Fixed Fee', 'Firm Fixed Price', 'NRE - Other.', 'NRE - Other.', 'Firm Fixed Price', 'Tech/Eng Services.', 'Tech/Eng Services.', 'Firm Fixed Price', 'Firm Fixed Price', 'Time & Material', 'FinsWings&Boattails.', 'FinsWings&Boattails.', 'Firm Fixed Price', 'Gen Structural Assys, NRE - Engineering.', 'Gen Structural Assys, NRE - Engineering.', 'Firm Fixed Price', 'Time & Material', 'Firm Fixed Price', 'Explosive Cut Device.', 'Explosive Cut Device.', 'Firm Fixed Price', 'Firm Fixed Price', 'Cost Plus Fixed Fee', 'NRE - Engineering, Receivers.', 'NRE - Engineering, Receivers.', 'Firm Fixed Price', 'Firm Fixed Price', 'NRE - Other.', "Metal Shp'g Containr.", "Metal Shp'g Containr.", 'NRE - Other.', 'NRE - Other.', 'Firm Fixed Price', 'Missile Antenna &Ped.', 'Missile Antenna &Ped.', 'AlarmBuzzerSensor, EnvTestEq(Shock/etc).', 'AlarmBuzzerSensor, EnvTestEq(Shock/etc).', 'Missile Antenna &Ped, NRE - Engineering, NRE - Other.', 'Missile Antenna &Ped, NRE - Engineering, NRE - Other.', 'Firm Fixed Price', 'Iron Batteries.', 'Iron Batteries.', 'Firm Fixed Price', 'Time & Material', "Custom CCA's, NRE - Other.", 'Firm 
Fixed Price', "Custom CCA's, NRE - Other.", 'Gen Structural Assys.', 'Gen Structural Assys.', 'Test Equipment.', 'Test Equipment.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Transducers.', 'Firm Fixed Price', 'Chargers, Lithium Batteries, NRE - Other.', 'Chargers, Lithium Batteries, NRE - Other.', 'NRE - Other.', 'Transducers.', 'NRE - Other.', 'NRE - Other.', 'Iron Batteries, NRE - Other.', 'Firm Fixed Price', 'Iron Batteries, NRE - Other.', 'Firm Fixed Price', 'Accelerometers, Amplifiers, Cable/CableAssyHV, Non-complex Machined.', 'Accelerometers, Amplifiers, Cable/CableAssyHV, Non-complex Machined.', 'Firm Fixed Price', 'Cost Plus Fixed Fee', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'NRE - Other.', 'Iron Batteries.', 'Iron Batteries.', 'Firm Fixed Price', 'Test Equipment.', 'Test Equipment.', 'Firm Fixed Price', 'Services: Nonproduct.', 'Services: Nonproduct.', 'Firm Fixed Price', 'Measuring Devices.', 'Measuring Devices.', 'Firm Fixed Price', 'Gen Structural Assys, NRE - Other.', 'Gen Structural Assys, NRE - Other.', 'Measuring Devices.', 'Measuring Devices.', 'Firm Fixed Price', 'Firm Fixed Price', 'Launchers&Cannisters.', 'Firm Fixed Price', 'Launchers&Cannisters.', 'Machine Shop Work.', 'Machine Shop Work.', 'Firm Fixed Price', 'NRE - Other, T/E Rental/Lease.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Gen Structural Assys, Non-complex Machined.', 'Gen Structural Assys, Non-complex Machined.', 'NRE - Other, Titanium Plate.', 'NRE - Other, Titanium Plate.', 'Gears, Precision Machined.', 'Gears, Precision Machined.', 'NRE - Other.', 'Firm Fixed Price', 'NRE - Other.', 'Firm Fixed Price', 'Firm Fixed Price', 'NRE - Other.', 'Bolts, Launchers&Cannisters.', 'Bolts, Launchers&Cannisters.', 'FinsWings&Boattails.', 'FinsWings&Boattails.', 'Firm Fixed Price', "Custom CCA's, 
NRE - Other.", "Custom CCA's, NRE - Other.", 'Missile Antenna &Ped, NRE - Other.', 'Missile Antenna &Ped, NRE - Other.', 'Firm Fixed Price', 'Gen Structural Assys, Non-complex Machined.', 'Gen Structural Assys, Non-complex Machined.', 'Firm Fixed Price', 'Iron Batteries.', 'Firm Fixed Price', 'CableAssy&HarnMulti, NRE - Other.', 'CableAssy&HarnMulti, NRE - Other.', 'Firm Fixed Price', 'NRE - Other, T/E Rental/Lease.', 'Firm Fixed Price', 'Gen Structural Assys, NRE - Engineering.', 'Gen Structural Assys, NRE - Engineering.', 'Firm Fixed Price', 'Firm Fixed Price', 'Time & Material', 'Gen Structural Assys.', 'Gen Structural Assys.', 'Gen Structural Assys, NRE - Engineering.', 'Gen Structural Assys, NRE - Engineering.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Time & Material', 'Firm Fixed Price', 'Firm Fixed Price', "Custom CCA's.", "Custom CCA's.", "Custom CCA's.", "Custom CCA's.", 'CableAssy&HarnMulti, NRE - Other.', 'CableAssy&HarnMulti, NRE - Other.', 'NRE - Other.', 'NRE - Other.', 'Major Assemblies.', 'Major Assemblies.', "Custom CCA's, NRE - Other.", "Custom CCA's, NRE - Other.", 'Transmitters.', 'Transmitters.', 'Firm Fixed Price', 'Missile Antenna &Ped.', 'Missile Antenna &Ped.', 'Non-complex Machined, Precision Machined.', 'Non-complex Machined, Precision Machined.', 'Firm Fixed Price', 'T/E Rental/Lease.', 'T/E Rental/Lease.', 'IMUs IRUs.', 'IMUs IRUs.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Test Equipment.', 'Test Equipment.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price', 'Test Equipment.', 'Firm Fixed Price', 'Test Equipment.', 'Firm Fixed Price', 'NRE - Engineering.', 'NRE - Engineering.', 'Non-complex ShtMetal.', 'Non-complex ShtMetal.', 'Test Equipment.', 'Test Equipment.', 'Firm Fixed Price', 'Gen Structural Assys.', 'Gen Structural Assys.', 'NRE - Other, Protect&Dust Covers, Rectanglar Connector, S&A Devices.', 'NRE - Other, Protect&Dust Covers, Rectanglar Connector, S&A 
Devices.', 'Firm Fixed Price', 'Tech/Eng Services.', 'Time & Material', 'Tech/Eng Services.', 'NRE - Other.', 'NRE - Other.', 'Firm Fixed Price', 'CableAssy&HarnMulti, NRE - Other.', 'Fasteners & Hardware.', 'Fasteners & Hardware.', 'Firm Fixed Price', 'Measuring Devices, NRE - Other.', 'Measuring Devices, NRE - Other.', 'Firm Fixed Price', 'Shafts.', 'Firm Fixed Price', 'Testing (Non-Prod).', 'Testing (Non-Prod).', 'CableAssy&HarnMulti.', 'GPS Receivers.', 'GPS Receivers.', 'Major Assemblies.', 'Major Assemblies.', 'Integrtd Electr Assy, NRE - Data Items.', 'Firm Fixed Price', 'Firm Fixed Price', 'Encoders.', 'Encoders.', 'Clamps, Washers.', 'Clamps, Washers.', 'Accelerometers, CableMulticonductor.', 'CableAssy&HarnMulti.', 'Machine Shop Work.', 'Firm Fixed Price', 'Composites.', 'Composites.', 'Accelerometers, CableMulticonductor.', 'Wire Cable.', 'Wire Cable.', 'Firm Fixed Price', 'Firm Fixed Price', 'Encoders.', 'Encoders.', 'Clamps, Non-complex Machined, Protect&Dust Covers.', 'Clamps, Non-complex Machined, Protect&Dust Covers.', 'Non-complex Machined.', 'Non-complex Machined.', 'AC-DC Power Supplies, Adaptors, Backshells, CableAssy&HarnMulti, Chargers, Custom - Computer SW, Filter Pin Connector, Flex Assy(w/Connect), Lithium Batteries, Microprocessors.', 'AC-DC Power Supplies, Adaptors, Backshells, CableAssy&HarnMulti, Chargers, Custom - Computer SW, Filter Pin Connector, Flex Assy(w/Connect), Lithium Batteries, Microprocessors.', 'Amplifiers.', 'CableAssy&HarnMulti, NRE - Other.', 'CableAssy&HarnMulti, NRE - Other.', 'Major Assemblies.', 'Major Assemblies.', 'Firm Fixed Price', 'Test Equipment.', 'Test Equipment.', 'Firm Fixed Price', 'Lithium Batteries.', 'Firm Fixed Price', 'Firm Fixed Price', 'Firm Fixed Price']
# Critical-technology sub-awards: rows whose description mentions batteries,
# sensors, explosive/missile components, or RF equipment.
# Spelling matters: the descriptions use 'Detonator&Initiator', so the keyword
# must be spelled exactly that way or those rows are silently missed.
# case=False replaces hand-written upper/lower-case variants of each keyword,
# and na=False treats a missing description as "no match".
ctech_keywords = [
    'batteries', 'sensor',
    'detonator&initiator', 'explosive', 'missile', 'launchers&cannisters',
    'transmitter', 'receiver', 'encoder',
]
ctech_mask = clean_df['subaward_description'].str.contains(
    '|'.join(ctech_keywords), case=False, na=False)
ctech = clean_df[ctech_mask]
# Number of matching sub-award rows per place-of-performance state.
ctech['subaward_primary_place_of_performance_state_name'].value_counts()
California 16 Arizona 6 Missouri 6 Pennsylvania 4 Massachusetts 2 Virginia 2 Maryland 2 Ohio 2 Iowa 2 Name: subaward_primary_place_of_performance_state_name, dtype: int64
# Sub-awards whose description mentions batteries or sensors.
battery_sensor_pattern = 'Batteries|batteries|Sensors|sensors|sensor|Sensor'
is_battery_or_sensor = clean_df['subaward_description'].str.contains(
    battery_sensor_pattern, na=False)
batteries_sensors = clean_df[is_battery_or_sensor]
# Unique (sub-awardee, city, state) combinations among those rows.
# NOTE: de-duplication is case-sensitive, so city spellings such as
# 'JOPLIN' and 'Joplin' show up as separate rows.
battery_sensor_location_columns = [
    'subawardee_name',
    'subaward_primary_place_of_performance_city_name',
    'subaward_primary_place_of_performance_state_name',
]
batteries_sensors[battery_sensor_location_columns].drop_duplicates()
subawardee_name | subaward_primary_place_of_performance_city_name | subaward_primary_place_of_performance_state_name | |
---|---|---|---|
116 | MEASUREMENT SPECIALTIES, INC. | HAMPTON | Virginia |
121 | EAGLEPICHER TECHNOLOGIES, LLC | JOPLIN | Missouri |
122 | EAGLEPICHER TECHNOLOGIES, LLC | Joplin | Missouri |
140 | SPACE VECTOR CORPORATION | CHATSWORTH | California |
159 | ADVANCED THERMAL BATTERIES INC. | WESTMINSTER | Maryland |
333 | DIVERSIFIED TECHNICAL SYSTEMS, INC. | SEAL BEACH | California |
# Count the battery/sensor sub-award rows per sub-awardee.
batteries_sensors['subawardee_name'].value_counts()
EAGLEPICHER TECHNOLOGIES, LLC 6 MEASUREMENT SPECIALTIES, INC. 2 SPACE VECTOR CORPORATION 2 ADVANCED THERMAL BATTERIES INC. 2 DIVERSIFIED TECHNICAL SYSTEMS, INC. 2 Name: subawardee_name, dtype: int64
# Sub-awards whose description mentions explosive or missile components.
# Spelling matters: the descriptions use 'Detonator&Initiator', so the keyword
# must be spelled exactly that way or those rows are silently missed.
# case=False replaces hand-written upper/lower-case variants of each keyword,
# and na=False treats a missing description as "no match".
explosive_keywords = [
    'detonator&initiator', 'explosive', 'missile', 'launchers&cannisters',
]
explosives_mask = clean_df['subaward_description'].str.contains(
    '|'.join(explosive_keywords), case=False, na=False)
explosives = clean_df[explosives_mask]
# Unique (sub-awardee, city, state) combinations among those rows.
explosives[['subawardee_name',
            'subaward_primary_place_of_performance_city_name',
            'subaward_primary_place_of_performance_state_name']].drop_duplicates()
subawardee_name | subaward_primary_place_of_performance_city_name | subaward_primary_place_of_performance_state_name | |
---|---|---|---|
33 | PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY... | CHANDLER | Arizona |
114 | PORT ELECTRONICS CORPORATION | LAWRENCE | Massachusetts |
118 | MORGAN ADVANCED CERAMICS, INC | HAYWARD | California |
177 | MARVIN ENGINEERING CO., INC. | INGLEWOOD | California |
202 | HI-TECH MACHINING & ENGINEERING, L.L.C. | TUCSON | Arizona |
209 | ATK SPACE SYSTEMS INC. | SAN DIEGO | California |
252 | ALLCOMP INC. | CITY OF INDUSTRY | California |
# Count the explosive/missile sub-award rows per sub-awardee.
explosives['subawardee_name'].value_counts()
PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC 4 PORT ELECTRONICS CORPORATION 2 MORGAN ADVANCED CERAMICS, INC 2 MARVIN ENGINEERING CO., INC. 2 HI-TECH MACHINING & ENGINEERING, L.L.C. 2 ATK SPACE SYSTEMS INC. 2 ALLCOMP INC. 2 Name: subawardee_name, dtype: int64
# Sub-awards whose description mentions transmitters, receivers or encoders.
rf_pattern = 'transmitters|Transmitters|Transmitter|Receivers|Receiver|receiver|Encoders|Encoder'
is_rf = clean_df['subaward_description'].str.contains(rf_pattern, na=False)
rf = clean_df[is_rf]
# Unique (sub-awardee, city, state) combinations among those rows.
rf_location_columns = [
    'subawardee_name',
    'subaward_primary_place_of_performance_city_name',
    'subaward_primary_place_of_performance_state_name',
]
rf[rf_location_columns].drop_duplicates()
subawardee_name | subaward_primary_place_of_performance_city_name | subaward_primary_place_of_performance_state_name | |
---|---|---|---|
42 | L3 TECHNOLOGIES, INC. | SAN DIEGO | California |
104 | HERLEY INDUSTRIES, INC. | LANCASTER | Pennsylvania |
249 | QUASONIX, LLC | WEST CHESTER | Ohio |
304 | BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS... | CEDAR RAPIDS | Iowa |
311 | L3 TECHNOLOGIES, INC. | BRISTOL | Pennsylvania |
# Count the transmitter/receiver/encoder sub-award rows per sub-awardee.
rf['subawardee_name'].value_counts()
L3 TECHNOLOGIES, INC. 6 HERLEY INDUSTRIES, INC. 2 QUASONIX, LLC 2 BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS INTEGRATION INC. 2 Name: subawardee_name, dtype: int64
# Columns needed to study how long each prime contract runs.
# .copy() makes this an independent frame: columns are assigned into it later,
# and assigning into a bare selection of `df` raises SettingWithCopyWarning.
contract_duration = df[['prime_award_period_of_performance_start_date',
                        'prime_award_period_of_performance_potential_end_date',
                        'prime_award_funding_office_name', 'prime_award_project_title',
                        'subawardee_name', 'subawardee_parent_name',
                        'prime_award_primary_place_of_performance_state_name']].copy()
# Show dtypes and non-null counts for the selected columns.
contract_duration.info()
<class 'pandas.core.frame.DataFrame'> Int64Index: 347 entries, 0 to 347 Data columns (total 7 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 prime_award_period_of_performance_start_date 347 non-null object 1 prime_award_period_of_performance_potential_end_date 347 non-null object 2 prime_award_funding_office_name 347 non-null object 3 prime_award_project_title 347 non-null object 4 subawardee_name 347 non-null object 5 subawardee_parent_name 242 non-null object 6 prime_award_primary_place_of_performance_state_name 347 non-null object dtypes: object(7) memory usage: 21.7+ KB
Convert Dates to appropriate column types
# Parse both period-of-performance columns from 'YYYY-MM-DD' text into datetimes.
for date_column in ('prime_award_period_of_performance_start_date',
                    'prime_award_period_of_performance_potential_end_date'):
    contract_duration[date_column] = pd.to_datetime(
        contract_duration[date_column], format='%Y-%m-%d')
contract_duration.head()
/usr/local/lib/python3.7/dist-packages/ipykernel_launcher.py:2: SettingWithCopyWarning: A value is trying to be set on a copy of a slice from a DataFrame. Try using .loc[row_indexer,col_indexer] = value instead See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy /usr/local/lib/python3.7/dist-packages/ipykernel_launcher.py:5: SettingWithCopyWarning: A value is trying to be set on a copy of a slice from a DataFrame. Try using .loc[row_indexer,col_indexer] = value instead See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy """
prime_award_period_of_performance_start_date | prime_award_period_of_performance_potential_end_date | prime_award_funding_office_name | prime_award_project_title | subawardee_name | subawardee_parent_name | prime_award_primary_place_of_performance_state_name | |
---|---|---|---|---|---|---|---|
0 | 2016-10-31 | 2022-03-31 | DEF ADVANCED RESEARCH PROJECTS AGCY | HYPERSONIC AIR BREAT | ALLIANT TECHSYSTEMS OPERATIONS LLC | NORTHROP GRUMMAN CORPORATION | Arizona |
1 | 2016-10-31 | 2022-03-31 | DEF ADVANCED RESEARCH PROJECTS AGCY | HYPERSONIC AIR BREAT | ALLIANT TECHSYSTEMS OPERATIONS LLC | NORTHROP GRUMMAN CORPORATION | Arizona |
2 | 2016-10-31 | 2022-03-31 | AFRL RWP | AMS: ADV PROGRAMS | ALLIANT TECHSYSTEMS OPERATIONS LLC | ORBITAL ATK, INC. | Arizona |
3 | 2016-10-31 | 2022-03-31 | AFRL RQH HIGH SPEED SYS DIV | AMS: ADV PROGRAMS | ALLIANT TECHSYSTEMS OPERATIONS LLC | ORBITAL ATK, INC. | Arizona |
4 | 2016-10-31 | 2022-03-31 | DEF ADVANCED RESEARCH PROJECTS AGCY | AMS: ADV PROGRAMS | ALLIANT TECHSYSTEMS OPERATIONS LLC | ORBITAL ATK, INC. | Arizona |
Calculate the number of days that it takes for each contract to be completed
# Contract length = potential end date minus start date.
period_start = contract_duration['prime_award_period_of_performance_start_date']
period_end = contract_duration['prime_award_period_of_performance_potential_end_date']
contract_duration['duration'] = period_end - period_start
contract_duration.head()
prime_award_period_of_performance_start_date | prime_award_period_of_performance_potential_end_date | prime_award_funding_office_name | prime_award_project_title | subawardee_name | subawardee_parent_name | prime_award_primary_place_of_performance_state_name | duration | |
---|---|---|---|---|---|---|---|---|
0 | 2016-10-31 | 2022-03-31 | DEF ADVANCED RESEARCH PROJECTS AGCY | HYPERSONIC AIR BREAT | ALLIANT TECHSYSTEMS OPERATIONS LLC | NORTHROP GRUMMAN CORPORATION | Arizona | 1977 days |
2 | 2016-10-31 | 2022-03-31 | AFRL RWP | AMS: ADV PROGRAMS | ALLIANT TECHSYSTEMS OPERATIONS LLC | ORBITAL ATK, INC. | Arizona | 1977 days |
3 | 2016-10-31 | 2022-03-31 | AFRL RQH HIGH SPEED SYS DIV | AMS: ADV PROGRAMS | ALLIANT TECHSYSTEMS OPERATIONS LLC | ORBITAL ATK, INC. | Arizona | 1977 days |
4 | 2016-10-31 | 2022-03-31 | DEF ADVANCED RESEARCH PROJECTS AGCY | AMS: ADV PROGRAMS | ALLIANT TECHSYSTEMS OPERATIONS LLC | ORBITAL ATK, INC. | Arizona | 1977 days |
6 | 2016-10-31 | 2022-03-31 | AFRL RWP | AMS: ADV PROGRAMS | ALLIANT TECHSYSTEMS OPERATIONS LLC | NORTHROP GRUMMAN CORPORATION | Arizona | 1977 days |
# Summary statistics (count, mean, std, min, quartiles, max) of the durations.
contract_duration['duration'].describe()
count 171 mean 1977 days 00:00:00 std 0 days 00:00:00 min 1977 days 00:00:00 25% 1977 days 00:00:00 50% 1977 days 00:00:00 75% 1977 days 00:00:00 max 1977 days 00:00:00 Name: duration, dtype: object
It seems that all the contracts last about 5.4 years, which is again a significantly long time for hackers to learn about the companies and hack into their systems.
# Number of sub-award rows per funding sub-agency, as a two-column table.
sub_agency_counts = clean_df['prime_award_funding_sub_agency_name'].value_counts()
contract_count_agency = pd.DataFrame(sub_agency_counts.reset_index())
contract_count_agency
index | prime_award_funding_sub_agency_name | |
---|---|---|
0 | DEFENSE ADVANCED RESEARCH PROJECTS AGENCY (DA... | 257 |
1 | DEPT OF THE AIR FORCE | 89 |
2 | DEPT OF THE NAVY | 1 |
# Count the sub-award rows per sub-awardee across the cleaned dataset.
clean_df['subawardee_name'].value_counts()
ALLIANT TECHSYSTEMS OPERATIONS LLC 25 DUCOMMUN LABARGE TECHNOLOGIES, INC. 22 PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC 16 DYNETICS TECHNICAL SOLUTIONS, INC. 13 A. P. I. INCORPORATED 12 .. CARLETON TECHNOLOGIES INC 1 MORGAN ADVANCED CERAMICS, INC. 1 GRAY'S ENGINEERING & CONSULTING, INC. 1 PORT ELECTRONICS CORP. 1 ROCKWELL COLLINS, INC. 1 Name: subawardee_name, Length: 79, dtype: int64
# Collapse the data to one row per sub-awardee parent company.
# NOTE(review): GroupBy.first() takes the first non-null value of each column,
# so a row may combine values from different sub-awards - confirm this is intended.
by_parent = clean_df.groupby('subawardee_parent_name')
first_per_parent = by_parent.first()
contractors = first_per_parent.reset_index()
contractors.head()
subawardee_parent_name | prime_award_unique_key | prime_award_piid | prime_award_amount | prime_award_base_action_date | prime_award_base_action_date_fiscal_year | prime_award_latest_action_date | prime_award_latest_action_date_fiscal_year | prime_award_period_of_performance_start_date | prime_award_period_of_performance_current_end_date | ... | subaward_primary_place_of_performance_city_name | subaward_primary_place_of_performance_state_code | subaward_primary_place_of_performance_state_name | subaward_primary_place_of_performance_address_zip_code | subaward_primary_place_of_performance_congressional_district | subaward_primary_place_of_performance_country_code | subaward_primary_place_of_performance_country_name | subaward_description | usaspending_permalink | subaward_fsrs_report_last_modified_date | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | AEROJET ROCKETDYNE HOLDINGS, INC. | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | 174746702.0 | 2016-10-31 | 2017 | 2021-09-15 | 2021 | 2016-10-31 | 2022-03-31 | ... | BRISTOW | VA | Virginia | 201361152 | 11 | USA | UNITED STATES | Cost Plus Fixed Fee | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2017-09-27 14:39:26+00 |
1 | AI CONVOY HOLDCO LIMITED | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | 174746702.0 | 2016-10-31 | 2017 | 2021-09-15 | 2021 | 2016-10-31 | 2022-03-31 | ... | ORCHARD PARK | NY | New York | 141274121 | 27 | USA | UNITED STATES | Tech/Eng Services. | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2020-11-17 10:56:12+00 |
2 | AI Convoy & Cy S.C.A. | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | 174746702.0 | 2016-10-31 | 2017 | 2021-09-15 | 2021 | 2016-10-31 | 2022-03-31 | ... | ORCHARD PARK | NY | New York | 141274121 | 27 | USA | UNITED STATES | Tech/Eng Services. | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2021-11-16 13:35:00+00 |
3 | ALLIED MOTION TECHNOLOGIES INC. | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | 174746702.0 | 2016-10-31 | 2017 | 2021-09-15 | 2021 | 2016-10-31 | 2022-03-31 | ... | TULSA | OK | Oklahoma | 741463638 | 01 | USA | UNITED STATES | Firm Fixed Price | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2018-12-14 17:39:50+00 |
4 | AMPHENOL CORPORATION | CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- | HR001117C0025 | 174746702.0 | 2016-10-31 | 2017 | 2021-09-15 | 2021 | 2016-10-31 | 2022-03-31 | ... | DEPEW | NY | New York | 140432417 | 27 | USA | UNITED STATES | Accelerometers, CableMulticonductor. | https://www.usaspending.gov/award/CONT_AWD_HR0... | 2021-11-16 13:35:00+00 |
5 rows × 88 columns
# Narrow the contractors table down to the four location / company-name
# columns that the pair lists further down are built from.
network_columns = [
    'subaward_primary_place_of_performance_state_name',
    'subawardee_parent_name',
    'subawardee_name',
    'subaward_primary_place_of_performance_country_name',
]
network = pd.DataFrame(contractors[network_columns])
network.head()
subaward_primary_place_of_performance_state_name | subawardee_parent_name | subawardee_name | subaward_primary_place_of_performance_country_name | |
---|---|---|---|---|
0 | Virginia | AEROJET ROCKETDYNE HOLDINGS, INC. | AEROJET ROCKETDYNE, INC. | UNITED STATES |
1 | New York | AI CONVOY HOLDCO LIMITED | COBHAM MISSION SYSTEMS ORCHARD PARK INC. | UNITED STATES |
2 | New York | AI Convoy & Cy S.C.A. | COBHAM MISSION SYSTEMS ORCHARD PARK INC. | UNITED STATES |
3 | Oklahoma | ALLIED MOTION TECHNOLOGIES INC. | EMOTEQ CORPORATION | UNITED STATES |
4 | New York | AMPHENOL CORPORATION | PCB PIEZOTRONICS, INC. | UNITED STATES |
# Count how many rows fall in each place-of-performance state and turn the
# resulting Series into a two-column DataFrame for display.
(
    network['subaward_primary_place_of_performance_state_name']
    .value_counts()
    .reset_index()
)
index | subaward_primary_place_of_performance_state_name | |
---|---|---|
0 | California | 9 |
1 | Arizona | 7 |
2 | Pennsylvania | 5 |
3 | New York | 4 |
4 | Maryland | 3 |
5 | Ohio | 3 |
6 | Missouri | 3 |
7 | Virginia | 2 |
8 | Colorado | 2 |
9 | Tennessee | 2 |
10 | Connecticut | 2 |
11 | Alabama | 2 |
12 | Iowa | 2 |
13 | North Carolina | 1 |
14 | Oregon | 1 |
15 | Utah | 1 |
16 | Wisconsin | 1 |
17 | Minnesota | 1 |
18 | Oklahoma | 1 |
19 | Florida | 1 |
20 | Massachusetts | 1 |
21 | Illinois | 1 |
# Build one [country, state] pair per row of `network`.
# zip() walks both columns by position, so the result does not depend on
# `network` having a default 0..n-1 index (the previous `series[i]` lookups
# were label-based and would fail or misalign on a filtered/re-indexed frame).
nodes1 = [
    [country, state]
    for country, state in zip(
        network['subaward_primary_place_of_performance_country_name'],
        network['subaward_primary_place_of_performance_state_name'],
    )
]
nodes1
[['UNITED STATES', 'Virginia'], ['UNITED STATES', 'New York'], ['UNITED STATES', 'New York'], ['UNITED STATES', 'Oklahoma'], ['UNITED STATES', 'New York'], ['UNITED STATES', 'California'], ['UNITED STATES', 'Arizona'], ['UNITED STATES', 'Arizona'], ['UNITED STATES', 'Maryland'], ['UNITED STATES', 'Wisconsin'], ['UNITED STATES', 'Iowa'], ['UNITED STATES', 'Oregon'], ['UNITED STATES', 'Pennsylvania'], ['UNITED STATES', 'North Carolina'], ['UNITED STATES', 'Arizona'], ['UNITED STATES', 'Pennsylvania'], ['UNITED STATES', 'California'], ['UNITED STATES', 'Alabama'], ['UNITED STATES', 'Missouri'], ['UNITED STATES', 'Missouri'], ['UNITED STATES', 'Ohio'], ['UNITED STATES', 'Ohio'], ['UNITED STATES', 'Connecticut'], ['UNITED STATES', 'Utah'], ['UNITED STATES', 'Connecticut'], ['UNITED STATES', 'Tennessee'], ['UNITED STATES', 'California'], ['UNITED STATES', 'California'], ['UNITED STATES', 'Minnesota'], ['UNITED STATES', 'Arizona'], ['UNITED STATES', 'Colorado'], ['UNITED STATES', 'Florida'], ['UNITED STATES', 'Colorado'], ['UNITED STATES', 'California'], ['UNITED STATES', 'California'], ['UNITED STATES', 'Alabama'], ['UNITED STATES', 'California'], ['UNITED STATES', 'California'], ['UNITED STATES', 'New York'], ['UNITED STATES', 'Pennsylvania'], ['UNITED STATES', 'Maryland'], ['UNITED STATES', 'Maryland'], ['UNITED STATES', 'Massachusetts'], ['UNITED STATES', 'Ohio'], ['UNITED STATES', 'Iowa'], ['UNITED STATES', 'Arizona'], ['UNITED STATES', 'Illinois'], ['UNITED STATES', 'Arizona'], ['UNITED STATES', 'Virginia'], ['UNITED STATES', 'Tennessee'], ['UNITED STATES', 'Arizona'], ['UNITED STATES', 'Pennsylvania'], ['UNITED STATES', 'Pennsylvania'], ['UNITED STATES', 'California'], ['UNITED STATES', 'Missouri']]
# Build one [state, parent company] pair per row of `network`.
# zip() walks both columns by position, so the result does not depend on
# `network` having a default 0..n-1 index (the previous `series[i]` lookups
# were label-based and would fail or misalign on a filtered/re-indexed frame).
nodes = [
    [state, parent]
    for state, parent in zip(
        network['subaward_primary_place_of_performance_state_name'],
        network['subawardee_parent_name'],
    )
]
nodes
[['Virginia', 'AEROJET ROCKETDYNE HOLDINGS, INC.'], ['New York', 'AI CONVOY HOLDCO LIMITED'], ['New York', 'AI Convoy & Cy S.C.A.'], ['Oklahoma', 'ALLIED MOTION TECHNOLOGIES INC.'], ['New York', 'AMPHENOL CORPORATION'], ['California', 'AMRO FABRICATING CORPORATION'], ['Arizona', 'APPLIED TECHNICAL SERVICES, LLC'], ['Arizona', 'ARLINGTON CAPITAL PARTNERS IV, L.P.'], ['Maryland', 'ASB AEROSPATIALE BATTERIES'], ['Wisconsin', 'BADGER METER, INC.'], ['Iowa', 'BAE SYSTEMS PLC'], ['Oregon', 'BERKSHIRE HATHAWAY INC.'], ['Pennsylvania', 'CONCURRENT TECHNOLOGIES CORPORATION'], ['North Carolina', 'CORVID TECHNOLOGIES LLC'], ['Arizona', 'CREATION TECHNOLOGIES INC'], ['Pennsylvania', 'CURTISS-WRIGHT CORPORATION'], ['California', 'DIVERSIFIED TECHNICAL SYSTEMS, INC.'], ['Alabama', 'DYNETICS, INC.'], ['Missouri', 'Ducommun Incorporated'], ['Missouri', 'EAGLEPICHER TECHNOLOGIES, LLC'], ['Ohio', 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.'], ['Ohio', 'ELEMENT MATERIALS TECHNOLOGY GROUP LIMITED'], ['Connecticut', 'ENSIGN-BICKFORD INDUSTRIES, INC.'], ['Utah', 'Ems Holdco, Inc.'], ['Connecticut', 'Ensign-Bickford Industries, Inc.'], ['Tennessee', 'Etex'], ['California', 'Fortive Corporation'], ['California', 'GLENAIR, INC.'], ['Minnesota', 'HONEYWELL INTERNATIONAL INC.'], ['Arizona', 'Imaginetics Holdings LLC'], ['Colorado', 'KEYSIGHT TECHNOLOGIES, INC.'], ['Florida', 'KRATOS DEFENSE & SECURITY SOLUTIONS, INC.'], ['Colorado', 'Keystone Holdings Group, LLC'], ['California', 'L3 TECHNOLOGIES, INC.'], ['California', 'L3HARRIS TECHNOLOGIES, INC.'], ['Alabama', 'LEIDOS HOLDINGS, INC.'], ['California', 'MARVIN ENGINEERING CO., INC.'], ['California', 'MORGAN ADVANCED MATERIALS PLC'], ['New York', 'MTS SYSTEMS CORPORATION'], ['Pennsylvania', 'NICOMATIC'], ['Maryland', 'NORTHROP GRUMMAN CORPORATION'], ['Maryland', 'ORBITAL ATK, INC.'], ['Massachusetts', 'PARKER-HANNIFIN CORPORATION'], ['Ohio', 'QUASONIX, LLC'], ['Iowa', 'ROCKWELL COLLINS, INC.'], ['Arizona', 'Radius Aerospace, Inc.'], 
['Illinois', 'STANLEY MACHINING & TOOL CORP.'], ['Arizona', 'Samuel, Son & Co., Limited'], ['Virginia', 'TE Connectivity Ltd.'], ['Tennessee', 'TEVET, LLC'], ['Arizona', 'TRIUMPH GROUP, INC.'], ['Pennsylvania', 'The Jordan Company L P'], ['Pennsylvania', 'ULTRA ELECTRONICS HOLDINGS PLC'], ['California', 'VISHAY PRECISION GROUP, INC.'], ['Missouri', 'Vectra Co.']]
# Build one [parent company, subawardee] pair per row of `network`.
# zip() walks both columns by position, so the result does not depend on
# `network` having a default 0..n-1 index (the previous `series[i]` lookups
# were label-based and would fail or misalign on a filtered/re-indexed frame).
leaves = [
    [parent, subawardee]
    for parent, subawardee in zip(
        network['subawardee_parent_name'],
        network['subawardee_name'],
    )
]
leaves
[['AEROJET ROCKETDYNE HOLDINGS, INC.', 'AEROJET ROCKETDYNE, INC.'], ['AI CONVOY HOLDCO LIMITED', 'COBHAM MISSION SYSTEMS ORCHARD PARK INC.'], ['AI Convoy & Cy S.C.A.', 'COBHAM MISSION SYSTEMS ORCHARD PARK INC.'], ['ALLIED MOTION TECHNOLOGIES INC.', 'EMOTEQ CORPORATION'], ['AMPHENOL CORPORATION', 'PCB PIEZOTRONICS, INC.'], ['AMRO FABRICATING CORPORATION', 'AMRO FABRICATING CORPORATION'], ['APPLIED TECHNICAL SERVICES, LLC', "GRAY'S ENGINEERING & CONSULTING, LLC"], ['ARLINGTON CAPITAL PARTNERS IV, L.P.', 'RADIUS AEROSPACE, INC.'], ['ASB AEROSPATIALE BATTERIES', 'ADVANCED THERMAL BATTERIES INC.'], ['BADGER METER, INC.', 'BADGER METER, INC.'], ['BAE SYSTEMS PLC', 'BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS INTEGRATION INC.'], ['BERKSHIRE HATHAWAY INC.', 'PCC STRUCTURALS, INC.'], ['CONCURRENT TECHNOLOGIES CORPORATION', 'CONCURRENT TECHNOLOGIES CORPORATION'], ['CORVID TECHNOLOGIES LLC', 'CORVID TECHNOLOGIES LLC'], ['CREATION TECHNOLOGIES INC', "GRAY'S ENGINEERING & CONSULTING, INC."], ['CURTISS-WRIGHT CORPORATION', 'TELETRONICS TECHNOLOGY CORPORATION'], ['DIVERSIFIED TECHNICAL SYSTEMS, INC.', 'DIVERSIFIED TECHNICAL SYSTEMS, INC.'], ['DYNETICS, INC.', 'DYNETICS TECHNICAL SOLUTIONS, INC.'], ['Ducommun Incorporated', 'DUCOMMUN LABARGE TECHNOLOGIES, INC.'], ['EAGLEPICHER TECHNOLOGIES, LLC', 'EAGLEPICHER TECHNOLOGIES, LLC'], ['ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.', 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.'], ['ELEMENT MATERIALS TECHNOLOGY GROUP LIMITED', 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.'], ['ENSIGN-BICKFORD INDUSTRIES, INC.', 'ENSIGN-BICKFORD AEROSPACE & DEFENSE COMPANY'], ['Ems Holdco, Inc.', 'SPARTRONICS LOGAN, LLC'], ['Ensign-Bickford Industries, Inc.', 'ENSIGN-BICKFORD AEROSPACE & DEFENSE COMPANY'], ['Etex', 'PROMAT INC'], ['Fortive Corporation', 'PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC'], ['GLENAIR, INC.', 'GLENAIR, INC.'], ['HONEYWELL INTERNATIONAL INC.', 'HONEYWELL INTERNATIONAL INC.'], ['Imaginetics Holdings LLC', 
'AZMARK AERO SYSTEMS, LLC'], ['KEYSIGHT TECHNOLOGIES, INC.', 'KEYSIGHT TECHNOLOGIES, INC.'], ['KRATOS DEFENSE & SECURITY SOLUTIONS, INC.', 'MICRO SYSTEMS, INC.'], ['Keystone Holdings Group, LLC', 'COORSTEK, INC.'], ['L3 TECHNOLOGIES, INC.', 'L3 TECHNOLOGIES, INC.'], ['L3HARRIS TECHNOLOGIES, INC.', 'L3 TECHNOLOGIES, INC.'], ['LEIDOS HOLDINGS, INC.', 'DYNETICS TECHNICAL SOLUTIONS, INC.'], ['MARVIN ENGINEERING CO., INC.', 'MARVIN ENGINEERING CO., INC.'], ['MORGAN ADVANCED MATERIALS PLC', 'MORGAN ADVANCED CERAMICS, INC'], ['MTS SYSTEMS CORPORATION', 'PCB PIEZOTRONICS, INC.'], ['NICOMATIC', 'NICOMATIC, L.P.'], ['NORTHROP GRUMMAN CORPORATION', 'ALLIANT TECHSYSTEMS OPERATIONS LLC'], ['ORBITAL ATK, INC.', 'ALLIANT TECHSYSTEMS OPERATIONS LLC'], ['PARKER-HANNIFIN CORPORATION', 'PARKER-HANNIFIN CORPORATION'], ['QUASONIX, LLC', 'QUASONIX, LLC'], ['ROCKWELL COLLINS, INC.', 'ROCKWELL COLLINS, INC.'], ['Radius Aerospace, Inc.', 'RADIUS AEROSPACE, INC.'], ['STANLEY MACHINING & TOOL CORP.', 'STANLEY MACHINING & TOOL CORP.'], ['Samuel, Son & Co., Limited', 'CAID INDUSTRIES, INC'], ['TE Connectivity Ltd.', 'MEASUREMENT SPECIALTIES, INC.'], ['TEVET, LLC', 'TEVET, LLC'], ['TRIUMPH GROUP, INC.', 'TRIUMPH ENGINEERED SOLUTIONS, INC.'], ['The Jordan Company L P', 'ARCH GLOBAL PRECISION - HUNTINGDON VALLEY, LLC'], ['ULTRA ELECTRONICS HOLDINGS PLC', 'HERLEY INDUSTRIES, INC.'], ['VISHAY PRECISION GROUP, INC.', 'DIVERSIFIED TECHNICAL SYSTEMS, INC.'], ['Vectra Co.', 'EAGLEPICHER TECHNOLOGIES, LLC']]