Loading the data set

In [ ]:
import pandas as pd
df= pd.read_csv('/content/Dataset_Contract_Sub-Awards.csv')
cols= df.columns.tolist()
cols
Out[ ]:
['prime_award_unique_key',
 'prime_award_piid',
 'prime_award_parent_piid',
 'prime_award_amount',
 'prime_award_disaster_emergency_fund_codes',
 'prime_award_outlayed_amount_funded_by_COVID-19_supplementals',
 'prime_award_obligated_amount_funded_by_COVID-19_supplementals',
 'prime_award_base_action_date',
 'prime_award_base_action_date_fiscal_year',
 'prime_award_latest_action_date',
 'prime_award_latest_action_date_fiscal_year',
 'prime_award_period_of_performance_start_date',
 'prime_award_period_of_performance_current_end_date',
 'prime_award_period_of_performance_potential_end_date',
 'prime_award_awarding_agency_code',
 'prime_award_awarding_agency_name',
 'prime_award_awarding_sub_agency_code',
 'prime_award_awarding_sub_agency_name',
 'prime_award_awarding_office_code',
 'prime_award_awarding_office_name',
 'prime_award_funding_agency_code',
 'prime_award_funding_agency_name',
 'prime_award_funding_sub_agency_code',
 'prime_award_funding_sub_agency_name',
 'prime_award_funding_office_code',
 'prime_award_funding_office_name',
 'prime_award_treasury_accounts_funding_this_award',
 'prime_award_federal_accounts_funding_this_award',
 'prime_award_object_classes_funding_this_award',
 'prime_award_program_activities_funding_this_award',
 'prime_awardee_duns',
 'prime_awardee_uei',
 'prime_awardee_name',
 'prime_awardee_dba_name',
 'prime_awardee_parent_duns',
 'prime_awardee_parent_uei',
 'prime_awardee_parent_name',
 'prime_awardee_country_code',
 'prime_awardee_country_name',
 'prime_awardee_address_line_1',
 'prime_awardee_city_name',
 'prime_awardee_county_name',
 'prime_awardee_state_code',
 'prime_awardee_state_name',
 'prime_awardee_zip_code',
 'prime_awardee_congressional_district',
 'prime_awardee_foreign_postal_code',
 'prime_awardee_business_types',
 'prime_award_primary_place_of_performance_city_name',
 'prime_award_primary_place_of_performance_state_code',
 'prime_award_primary_place_of_performance_state_name',
 'prime_award_primary_place_of_performance_address_zip_code',
 'prime_award_primary_place_of_performance_congressional_district',
 'prime_award_primary_place_of_performance_country_code',
 'prime_award_primary_place_of_performance_country_name',
 'prime_award_description',
 'prime_award_project_title',
 'prime_award_naics_code',
 'prime_award_naics_description',
 'prime_award_national_interest_action_code',
 'prime_award_national_interest_action',
 'subaward_type',
 'subaward_fsrs_report_id',
 'subaward_fsrs_report_year',
 'subaward_fsrs_report_month',
 'subaward_number',
 'subaward_amount',
 'subaward_action_date',
 'subaward_action_date_fiscal_year',
 'subawardee_duns',
 'subawardee_name',
 'subawardee_dba_name',
 'subawardee_parent_duns',
 'subawardee_parent_name',
 'subawardee_country_code',
 'subawardee_country_name',
 'subawardee_address_line_1',
 'subawardee_city_name',
 'subawardee_state_code',
 'subawardee_state_name',
 'subawardee_zip_code',
 'subawardee_congressional_district',
 'subawardee_foreign_postal_code',
 'subawardee_business_types',
 'subaward_primary_place_of_performance_address_line_1',
 'subaward_primary_place_of_performance_city_name',
 'subaward_primary_place_of_performance_state_code',
 'subaward_primary_place_of_performance_state_name',
 'subaward_primary_place_of_performance_address_zip_code',
 'subaward_primary_place_of_performance_congressional_district',
 'subaward_primary_place_of_performance_country_code',
 'subaward_primary_place_of_performance_country_name',
 'subaward_description',
 'subawardee_highly_compensated_officer_1_name',
 'subawardee_highly_compensated_officer_1_amount',
 'subawardee_highly_compensated_officer_2_name',
 'subawardee_highly_compensated_officer_2_amount',
 'subawardee_highly_compensated_officer_3_name',
 'subawardee_highly_compensated_officer_3_amount',
 'subawardee_highly_compensated_officer_4_name',
 'subawardee_highly_compensated_officer_4_amount',
 'subawardee_highly_compensated_officer_5_name',
 'subawardee_highly_compensated_officer_5_amount',
 'usaspending_permalink',
 'subaward_fsrs_report_last_modified_date']

View first 5 rows of the dataset

In [ ]:
df.head()
Out[ ]:
prime_award_unique_key prime_award_piid prime_award_parent_piid prime_award_amount prime_award_disaster_emergency_fund_codes prime_award_outlayed_amount_funded_by_COVID-19_supplementals prime_award_obligated_amount_funded_by_COVID-19_supplementals prime_award_base_action_date prime_award_base_action_date_fiscal_year prime_award_latest_action_date ... subawardee_highly_compensated_officer_2_name subawardee_highly_compensated_officer_2_amount subawardee_highly_compensated_officer_3_name subawardee_highly_compensated_officer_3_amount subawardee_highly_compensated_officer_4_name subawardee_highly_compensated_officer_4_amount subawardee_highly_compensated_officer_5_name subawardee_highly_compensated_officer_5_amount usaspending_permalink subaward_fsrs_report_last_modified_date
0 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2021-11-16 13:35:00+00
1 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2020-11-17 10:56:12+00
2 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2018-07-09 19:26:13+00
3 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2018-02-15 14:22:36+00
4 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2018-03-26 19:23:55+00

5 rows × 105 columns

Remove any duplicate value present in the data set

In [ ]:
df=df.drop_duplicates()
df.head()
Out[ ]:
prime_award_unique_key prime_award_piid prime_award_parent_piid prime_award_amount prime_award_disaster_emergency_fund_codes prime_award_outlayed_amount_funded_by_COVID-19_supplementals prime_award_obligated_amount_funded_by_COVID-19_supplementals prime_award_base_action_date prime_award_base_action_date_fiscal_year prime_award_latest_action_date ... subawardee_highly_compensated_officer_2_name subawardee_highly_compensated_officer_2_amount subawardee_highly_compensated_officer_3_name subawardee_highly_compensated_officer_3_amount subawardee_highly_compensated_officer_4_name subawardee_highly_compensated_officer_4_amount subawardee_highly_compensated_officer_5_name subawardee_highly_compensated_officer_5_amount usaspending_permalink subaward_fsrs_report_last_modified_date
0 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2021-11-16 13:35:00+00
1 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2020-11-17 10:56:12+00
2 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2018-07-09 19:26:13+00
3 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2018-02-15 14:22:36+00
4 CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 NaN 174746702.0 NaN NaN NaN 2016-10-31 2017 2021-09-15 ... NaN NaN NaN NaN NaN NaN NaN NaN https://www.usaspending.gov/award/CONT_AWD_HR0... 2018-03-26 19:23:55+00

5 rows × 105 columns

Data cleaning: Check for column with insignificant amount of data/ missing values or columns with no data at all

In [ ]:
def describe_nan(df):
    return pd.DataFrame([(i, df[df[i].isna()].shape[0],df[df[i].isna()].shape[0]/df.shape[0]) for i in df.columns], columns=['column', 'nan_counts', 'nan_rate'])

missing_value_count= describe_nan(df)
missing_value_count
Out[ ]:
column nan_counts nan_rate
0 prime_award_unique_key 0 0.000000
1 prime_award_piid 0 0.000000
2 prime_award_parent_piid 347 1.000000
3 prime_award_amount 0 0.000000
4 prime_award_disaster_emergency_fund_codes 329 0.948127
... ... ... ...
100 subawardee_highly_compensated_officer_4_amount 329 0.948127
101 subawardee_highly_compensated_officer_5_name 326 0.939481
102 subawardee_highly_compensated_officer_5_amount 329 0.948127
103 usaspending_permalink 0 0.000000
104 subaward_fsrs_report_last_modified_date 0 0.000000

105 rows × 3 columns

We can see that many of the columns are completely empty. Hence, we remove such columns

In [ ]:
### Removing columns with more than 90% missing data 
major_data_missing_cols= missing_value_count[missing_value_count['nan_rate']>0.9]['column'].to_list()
major_data_missing_cols
Out[ ]:
['prime_award_parent_piid',
 'prime_award_disaster_emergency_fund_codes',
 'prime_award_outlayed_amount_funded_by_COVID-19_supplementals',
 'prime_award_obligated_amount_funded_by_COVID-19_supplementals',
 'prime_awardee_foreign_postal_code',
 'subawardee_foreign_postal_code',
 'subaward_primary_place_of_performance_address_line_1',
 'subawardee_highly_compensated_officer_1_name',
 'subawardee_highly_compensated_officer_1_amount',
 'subawardee_highly_compensated_officer_2_name',
 'subawardee_highly_compensated_officer_2_amount',
 'subawardee_highly_compensated_officer_3_name',
 'subawardee_highly_compensated_officer_3_amount',
 'subawardee_highly_compensated_officer_4_name',
 'subawardee_highly_compensated_officer_4_amount',
 'subawardee_highly_compensated_officer_5_name',
 'subawardee_highly_compensated_officer_5_amount']
In [ ]:
df= df.drop(major_data_missing_cols, axis=1)
cols= df.columns.tolist()
cols
Out[ ]:
['prime_award_unique_key',
 'prime_award_piid',
 'prime_award_amount',
 'prime_award_base_action_date',
 'prime_award_base_action_date_fiscal_year',
 'prime_award_latest_action_date',
 'prime_award_latest_action_date_fiscal_year',
 'prime_award_period_of_performance_start_date',
 'prime_award_period_of_performance_current_end_date',
 'prime_award_period_of_performance_potential_end_date',
 'prime_award_awarding_agency_code',
 'prime_award_awarding_agency_name',
 'prime_award_awarding_sub_agency_code',
 'prime_award_awarding_sub_agency_name',
 'prime_award_awarding_office_code',
 'prime_award_awarding_office_name',
 'prime_award_funding_agency_code',
 'prime_award_funding_agency_name',
 'prime_award_funding_sub_agency_code',
 'prime_award_funding_sub_agency_name',
 'prime_award_funding_office_code',
 'prime_award_funding_office_name',
 'prime_award_treasury_accounts_funding_this_award',
 'prime_award_federal_accounts_funding_this_award',
 'prime_award_object_classes_funding_this_award',
 'prime_award_program_activities_funding_this_award',
 'prime_awardee_duns',
 'prime_awardee_uei',
 'prime_awardee_name',
 'prime_awardee_dba_name',
 'prime_awardee_parent_duns',
 'prime_awardee_parent_uei',
 'prime_awardee_parent_name',
 'prime_awardee_country_code',
 'prime_awardee_country_name',
 'prime_awardee_address_line_1',
 'prime_awardee_city_name',
 'prime_awardee_county_name',
 'prime_awardee_state_code',
 'prime_awardee_state_name',
 'prime_awardee_zip_code',
 'prime_awardee_congressional_district',
 'prime_awardee_business_types',
 'prime_award_primary_place_of_performance_city_name',
 'prime_award_primary_place_of_performance_state_code',
 'prime_award_primary_place_of_performance_state_name',
 'prime_award_primary_place_of_performance_address_zip_code',
 'prime_award_primary_place_of_performance_congressional_district',
 'prime_award_primary_place_of_performance_country_code',
 'prime_award_primary_place_of_performance_country_name',
 'prime_award_description',
 'prime_award_project_title',
 'prime_award_naics_code',
 'prime_award_naics_description',
 'prime_award_national_interest_action_code',
 'prime_award_national_interest_action',
 'subaward_type',
 'subaward_fsrs_report_id',
 'subaward_fsrs_report_year',
 'subaward_fsrs_report_month',
 'subaward_number',
 'subaward_amount',
 'subaward_action_date',
 'subaward_action_date_fiscal_year',
 'subawardee_duns',
 'subawardee_name',
 'subawardee_dba_name',
 'subawardee_parent_duns',
 'subawardee_parent_name',
 'subawardee_country_code',
 'subawardee_country_name',
 'subawardee_address_line_1',
 'subawardee_city_name',
 'subawardee_state_code',
 'subawardee_state_name',
 'subawardee_zip_code',
 'subawardee_congressional_district',
 'subawardee_business_types',
 'subaward_primary_place_of_performance_city_name',
 'subaward_primary_place_of_performance_state_code',
 'subaward_primary_place_of_performance_state_name',
 'subaward_primary_place_of_performance_address_zip_code',
 'subaward_primary_place_of_performance_congressional_district',
 'subaward_primary_place_of_performance_country_code',
 'subaward_primary_place_of_performance_country_name',
 'subaward_description',
 'usaspending_permalink',
 'subaward_fsrs_report_last_modified_date']

Making copy of the dataframe to avoid losing original data

In [ ]:
clean_df= df

BASIC TEXT EXPLORATION AND GETTING DATA FOR HIGHCHARTS

Find the funding offices which provide awards

In [ ]:
clean_df['prime_award_funding_office_name'].value_counts()
Out[ ]:
DEF ADVANCED RESEARCH PROJECTS AGCY    257
AFRL RWP                                54
AFRL RQH         HIGH SPEED SYS DIV     29
AFRL RW                                  6
OFFICE OF NAVAL RESEARCH                 1
Name: prime_award_funding_office_name, dtype: int64

Explore the different project titles and see the ones with most awards

In [ ]:
projects= pd.DataFrame(clean_df['prime_award_project_title'].value_counts().reset_index())
projects
Out[ ]:
index prime_award_project_title
0 HYPERSONIC AIR BREAT 207
1 AMS: ADV PROGRAMS 126
2 AMS: ADV PROGRAMS; AMS:AAWS 6
3 AMS: ADV PROGRAMS/RMS: NBI 5
4 AMS:HYPERSONICS 2
5 AMS:AAWS 1
In [ ]:
projects['prime_award_project_title']= (projects['prime_award_project_title']/347)*100
projects
Out[ ]:
index prime_award_project_title
0 HYPERSONIC AIR BREAT 59.654179
1 AMS: ADV PROGRAMS 36.311239
2 AMS: ADV PROGRAMS; AMS:AAWS 1.729107
3 AMS: ADV PROGRAMS/RMS: NBI 1.440922
4 AMS:HYPERSONICS 0.576369
5 AMS:AAWS 0.288184
In [ ]:
projects['index'].to_list()
Out[ ]:
['HYPERSONIC AIR BREAT',
 'AMS: ADV PROGRAMS',
 'AMS: ADV PROGRAMS; AMS:AAWS',
 'AMS: ADV PROGRAMS/RMS: NBI',
 'AMS:HYPERSONICS',
 'AMS:AAWS']

Look at the company and parent company working on the AMS:AAWS project since only o the companies are working on it which stands out.

In [ ]:
print(clean_df['subawardee_parent_name'][clean_df['prime_award_project_title']=='AMS:AAWS'])
print(clean_df['subawardee_name'][clean_df['prime_award_project_title']=='AMS:AAWS'])
61    ORBITAL ATK, INC.
Name: subawardee_parent_name, dtype: object
61    ALLIANT TECHSYSTEMS OPERATIONS LLC
Name: subawardee_name, dtype: object

Let's look at the prime award descriptions

In [ ]:
clean_df['prime_award_naics_description'].value_counts()
Out[ ]:
RESEARCH AND DEVELOPMENT IN THE PHYSICAL, ENGINEERING, AND LIFE SCIENCES (EXCEPT BIOTECHNOLOGY)    347
Name: prime_award_naics_description, dtype: int64

We can see that all the awards fall into the R&D category only. This insight is even more important since the scope of losing this important data to a cyberattack is zero.

Let's look at the different subawardee names with the number of awards granted to each

In [ ]:
sub=pd.DataFrame(clean_df['subawardee_name'].value_counts().reset_index())
sub
Out[ ]:
index subawardee_name
0 ALLIANT TECHSYSTEMS OPERATIONS LLC 25
1 DUCOMMUN LABARGE TECHNOLOGIES, INC. 22
2 PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY... 16
3 DYNETICS TECHNICAL SOLUTIONS, INC. 13
4 A. P. I. INCORPORATED 12
... ... ...
74 CARLETON TECHNOLOGIES INC 1
75 MORGAN ADVANCED CERAMICS, INC. 1
76 GRAY'S ENGINEERING & CONSULTING, INC. 1
77 PORT ELECTRONICS CORP. 1
78 ROCKWELL COLLINS, INC. 1

79 rows × 2 columns

In [ ]:
sub['index'].to_list()
Out[ ]:
['ALLIANT TECHSYSTEMS OPERATIONS LLC',
 'DUCOMMUN LABARGE TECHNOLOGIES, INC.',
 'PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC',
 'DYNETICS TECHNICAL SOLUTIONS, INC.',
 'A. P. I. INCORPORATED',
 'STANLEY MACHINING & TOOL CORP.',
 'TRI MODELS, INC.',
 'UNI-CAST, INC.',
 'MEASUREMENT SPECIALTIES, INC.',
 'L3 TECHNOLOGIES, INC.',
 'EAGLEPICHER TECHNOLOGIES, LLC',
 'ALLCOMP INC.',
 'MARVIN ENGINEERING CO., INC.',
 'ENSIGN-BICKFORD AEROSPACE & DEFENSE COMPANY',
 'MICRO CRAFT, INC.',
 'KEYSIGHT TECHNOLOGIES, INC.',
 'VENTURA AEROSPACE, INC.',
 'INOVAR, INC.',
 'PRAXIS RESOURCES INC.',
 'PARKER-HANNIFIN CORPORATION',
 'HI-TECH MACHINING & ENGINEERING, L.L.C.',
 'TELETRONICS TECHNOLOGY CORPORATION',
 "JANSEN'S AIRCRAFT SYSTEMS CONTROLS, INC.",
 'AZMARK AERO SYSTEMS, LLC',
 'ORBITAL SCIENCES CORPORATION',
 'RADIUS AEROSPACE, INC.',
 'HERLEY INDUSTRIES, INC.',
 'PCC STRUCTURALS, INC.',
 'SPARTRONICS LOGAN, LLC',
 'PORT ELECTRONICS CORPORATION',
 'MORGAN ADVANCED CERAMICS, INC',
 'ATK SPACE SYSTEMS INC.',
 'AMRO FABRICATING CORPORATION',
 'PARALLEL VENTURES, INC.',
 'QUASONIX, LLC',
 'BADGER METER, INC.',
 'CONCURRENT TECHNOLOGIES CORPORATION',
 'PROMAT INC',
 'HONEYWELL INTERNATIONAL INC.',
 'GLENAIR, INC.',
 'KLUNE INDUSTRIES, INC.',
 'PCB PIEZOTRONICS, INC.',
 'SOUTHERN GEAR & MACHINE, INC.',
 'KIRSH MANUFACTURING, INC.',
 'AEROJET ROCKETDYNE, INC.',
 'ADVANCED THERMAL BATTERIES INC.',
 'DYTRAN INSTRUMENTS INC.',
 'CAID INDUSTRIES, INC',
 'SPACE VECTOR CORPORATION',
 'CAMI RESEARCH, INC.',
 'TEVET, LLC',
 'CICOIL, LLC',
 'DIVERSIFIED TECHNICAL SYSTEMS, INC.',
 'BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS INTEGRATION INC.',
 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.',
 'EMOTEQ CORPORATION',
 'DESIGNLINX HARDWARE SOLUTIONS, INC.',
 'COBHAM MISSION SYSTEMS ORCHARD PARK INC.',
 'ARCH GLOBAL PRECISION - HUNTINGDON VALLEY, LLC',
 'NICOMATIC, L.P.',
 'MICRO SYSTEMS, INC.',
 'LABARGE ACQUISITION COMPANY, INC.',
 'AEROSPEC, INC.',
 'CORVID TECHNOLOGIES LLC',
 'ORBITAL SCIENCES LLC',
 'ADVANCED MATERIALS TECHNOLOGIES, LLC',
 'COORSTEK, INC.',
 'SHELLI INDUSTRIES LLC',
 "GRAY'S ENGINEERING & CONSULTING, LLC",
 'UNI-CAST, LLC',
 'TRIUMPH ENGINEERED SOLUTIONS, INC.',
 'GLOBE MOTORS, INC.',
 'DYNETICS, INC.',
 'DESIGNLINX HARDWARE SOLUTIONS, LLC',
 'CARLETON TECHNOLOGIES INC',
 'MORGAN ADVANCED CERAMICS, INC.',
 "GRAY'S ENGINEERING & CONSULTING, INC.",
 'PORT ELECTRONICS CORP.',
 'ROCKWELL COLLINS, INC.']
In [ ]:
sub['subawardee_name'].to_list()
Out[ ]:
[25,
 22,
 16,
 13,
 12,
 11,
 10,
 8,
 8,
 8,
 8,
 7,
 7,
 7,
 6,
 6,
 6,
 6,
 5,
 5,
 5,
 5,
 5,
 5,
 4,
 4,
 4,
 4,
 4,
 4,
 4,
 4,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1]

Let's look at the subawardee parent names now and the number of awards granted to each

In [ ]:
imp_sub= pd.DataFrame(df['subawardee_parent_name'].value_counts().reset_index())
imp_sub.head()
Out[ ]:
index subawardee_parent_name
0 Ducommun Incorporated 24
1 NORTHROP GRUMMAN CORPORATION 18
2 ORBITAL ATK, INC. 16
3 Fortive Corporation 16
4 STANLEY MACHINING & TOOL CORP. 11
In [ ]:
imp_sub['index'].to_list()
Out[ ]:
['Ducommun Incorporated',
 'NORTHROP GRUMMAN CORPORATION',
 'ORBITAL ATK, INC.',
 'Fortive Corporation',
 'STANLEY MACHINING & TOOL CORP.',
 'LEIDOS HOLDINGS, INC.',
 'TE Connectivity Ltd.',
 'EAGLEPICHER TECHNOLOGIES, LLC',
 'MARVIN ENGINEERING CO., INC.',
 'BERKSHIRE HATHAWAY INC.',
 'DYNETICS, INC.',
 'L3HARRIS TECHNOLOGIES, INC.',
 'KEYSIGHT TECHNOLOGIES, INC.',
 'CURTISS-WRIGHT CORPORATION',
 'PARKER-HANNIFIN CORPORATION',
 'MORGAN ADVANCED MATERIALS PLC',
 'Imaginetics Holdings LLC',
 'ULTRA ELECTRONICS HOLDINGS PLC',
 'Ensign-Bickford Industries, Inc.',
 'Ems Holdco, Inc.',
 'AMRO FABRICATING CORPORATION',
 'GLENAIR, INC.',
 'ASB AEROSPATIALE BATTERIES',
 'HONEYWELL INTERNATIONAL INC.',
 'ALLIED MOTION TECHNOLOGIES INC.',
 'BADGER METER, INC.',
 'Samuel, Son & Co., Limited',
 'QUASONIX, LLC',
 'Etex',
 'ENSIGN-BICKFORD INDUSTRIES, INC.',
 'AEROJET ROCKETDYNE HOLDINGS, INC.',
 'CONCURRENT TECHNOLOGIES CORPORATION',
 'MTS SYSTEMS CORPORATION',
 'BAE SYSTEMS PLC',
 'TEVET, LLC',
 'KRATOS DEFENSE & SECURITY SOLUTIONS, INC.',
 'Keystone Holdings Group, LLC',
 'NICOMATIC',
 'ARLINGTON CAPITAL PARTNERS IV, L.P.',
 'L3 TECHNOLOGIES, INC.',
 'CORVID TECHNOLOGIES LLC',
 'The Jordan Company L P',
 'Radius Aerospace, Inc.',
 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.',
 'DIVERSIFIED TECHNICAL SYSTEMS, INC.',
 'VISHAY PRECISION GROUP, INC.',
 'AMPHENOL CORPORATION',
 'TRIUMPH GROUP, INC.',
 'ELEMENT MATERIALS TECHNOLOGY GROUP LIMITED',
 'CREATION TECHNOLOGIES INC',
 'AI Convoy & Cy S.C.A.',
 'AI CONVOY HOLDCO LIMITED',
 'APPLIED TECHNICAL SERVICES, LLC',
 'ROCKWELL COLLINS, INC.',
 'Vectra Co.']
In [ ]:
imp_sub['subawardee_parent_name'].to_list()
Out[ ]:
[24,
 18,
 16,
 16,
 11,
 8,
 8,
 7,
 7,
 7,
 6,
 6,
 6,
 5,
 5,
 5,
 5,
 4,
 4,
 4,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 3,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1]

Exploring the different types of subawardee bussines types

In [ ]:
clean_df['subawardee_business_types'].value_counts()
Out[ ]:
For-Profit Organization,Manufacturer of Goods                                                                                                                                                                                                                                     140
For-Profit Organization,Limited Liability Company,Manufacturer of Goods                                                                                                                                                                                                            28
For-Profit Organization,S Corporation                                                                                                                                                                                                                                              25
For-Profit Organization                                                                                                                                                                                                                                                            24
For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods                                                                                                                                                                                                            21
For-Profit Organization,Manufacturer of Goods,S Corporation                                                                                                                                                                                                                        18
For-Profit Organization,Manufacturer of Goods,Woman-Owned Business                                                                                                                                                                                                                 13
For-Profit Organization,S Corporation,Veteran Owned Business                                                                                                                                                                                                                       12
For-Profit Organization,Limited Liability Company                                                                                                                                                                                                                                  11
Contracts and Grants,For-Profit Organization,Manufacturer of Goods                                                                                                                                                                                                                  9
For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business                                                                                                                                                                      5
Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business                                                                                                                                      5
Contracts,For-Profit Organization,Manufacturer of Goods                                                                                                                                                                                                                             4
Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business      4
For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm                                                                                                                                                                                 4
For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm                                                                                                                                                                                                           3
Nonprofit Organization                                                                                                                                                                                                                                                              3
For-Profit Organization,Foreign Owned and Located                                                                                                                                                                                                                                   2
For-Profit Organization,Limited Liability Company,SBA Certified Hub Zone Firm,Service Disabled Veteran Owned,Veteran Owned Business                                                                                                                                                 2
For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business                                                                                                                                                                                           2
For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods,Self-Certified Small Disadvantaged Business                                                                                                                                                                 2
For-Profit Organization,Veteran Owned Business                                                                                                                                                                                                                                      2
For-Profit Organization,Manufacturer of Goods,Service Disabled Veteran Owned,Veteran Owned Business                                                                                                                                                                                 2
Contracts and Grants,For-Profit Organization,Limited Liability Company                                                                                                                                                                                                              1
For-Profit Organization,Manufacturer of Goods,Veteran Owned Business                                                                                                                                                                                                                1
Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business                                  1
Contracts and Grants,For-Profit Organization,Limited Liability Company,Veteran Owned Business                                                                                                                                                                                       1
For-Profit Organization,Limited Liability Company,Woman-Owned Business                                                                                                                                                                                                              1
Contracts,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Other than one of the preceding,S Corporation                                                                                                                                                       1
Name: subawardee_business_types, dtype: int64

Preparing data for word cloud

In [ ]:
subawardee_biz_desc=' '.join(clean_df['subawardee_business_types'])
subawardee_biz_desc
Out[ ]:
'For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Limited Liability Company,Veteran Owned Business For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation Contracts and Grants,For-Profit Organization,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization Economically Disadvantaged Women-Owned Small Business,For-Profit Organization,Minority-Owned business,Native American Owned,SBA Certified Hub Zone Firm,Self-Certified Small Disadvantaged Business,Service Disabled Veteran Owned,Veteran Owned Business,Woman-Owned Business For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business,Woman-Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Other than one of the preceding,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,Service Disabled Veteran Owned,Veteran Owned Business For-Profit Organization,Manufacturer of Goods,Service Disabled Veteran Owned,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Veteran Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Veteran Owned Business For-Profit Organization,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Limited Liability Company,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization Contracts and Grants,For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Contracts,For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation Nonprofit Organization For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Nonprofit Organization Nonprofit Organization For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,S Corporation Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company,SBA Certified Hub Zone Firm,Service Disabled Veteran Owned,Veteran Owned Business For-Profit Organization,Limited Liability Company,SBA Certified Hub Zone Firm,Service Disabled Veteran Owned,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization For-Profit Organization,S Corporation For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Limited Liability Company For-Profit Organization,Limited Liability Company For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Self-Certified Small Disadvantaged Business Asian-Pacific American Owned,For-Profit Organization,Manufacturer of Goods,Minority-Owned business,Self-Certified Small Disadvantaged Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located For-Profit Organization,Foreign Owned and Located For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization For-Profit Organization For-Profit Organization,Manufacturer of Goods,SBA Certified Hub Zone Firm For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,Woman-Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Manufacturer of Goods For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Manufacturer of Goods,S Corporation For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,Limited Liability Company,Manufacturer of Goods For-Profit Organization,S Corporation For-Profit Organization,S Corporation For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,S Corporation,Veteran Owned Business For-Profit Organization,Limited Liability Company,Woman-Owned Business For-Profit Organization,Limited Liability Company,Manufacturer of Goods Contracts and Grants,For-Profit Organization,Manufacturer of Goods For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods,Self-Certified Small Disadvantaged Business For-Profit Organization,Foreign Owned and Located,Manufacturer of Goods,Self-Certified Small Disadvantaged Business'

Identifying important contractors based on the critical technologies they work with (either supply or input)

In [ ]:
clean_df['subaward_description'].to_list()
Out[ ]:
['Detonator&Initiator, Fuselage, Gen Structural Assys, Molded Rubber&O Ring, Non-complex Machined, NRE - Other, Seals, Tech/Eng Services, Wire Cable.',
 'Detonator&Initiator, Fuselage, Gen Structural Assys, Molded Rubber&O Ring, Non-complex Machined, NRE - Other, Seals, Tech/Eng Services, Wire Cable.',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'NRE - Other.',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'Cost Plus Fixed Fee',
 'NRE - Other.',
 'Cost Plus Fixed Fee',
 'Detonator&Initiator, NRE - Engineering, NRE - Other, NRE - Qualification, S&A Devices.',
 'Detonator&Initiator, NRE - Engineering, NRE - Other, NRE - Qualification, S&A Devices.',
 'Firm Fixed Price',
 'NRE - Other.',
 'NRE - Other.',
 'Cost Plus Fixed Fee',
 'Firm Fixed Price',
 'FinsWings&Boattails, NRE - Other, Pyrotechnic Fuses, Rocket Motors.',
 'FinsWings&Boattails, NRE - Other, Pyrotechnic Fuses, Rocket Motors.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Explosive Cut Device, NRE - Engineering, NRE - Other.',
 'Explosive Cut Device, NRE - Engineering, NRE - Other.',
 'Couplers, Gen Structural Assys, NRE - Other, Nuts.',
 'Couplers, Gen Structural Assys, NRE - Other, Nuts.',
 'Firm Fixed Price',
 'EnvTestEq(Shock/etc), NRE - Engineering, Tech/Eng Services.',
 'EnvTestEq(Shock/etc), NRE - Engineering, Tech/Eng Services.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Encoders, NRE - Other.',
 'Encoders, NRE - Other.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Fuselage, Gen Structural Assys, NRE - Other.',
 'Fuselage, Gen Structural Assys, NRE - Other.',
 'Firm Fixed Price',
 'Cost Plus Fixed Fee',
 'Multi-Function Assys.',
 'Multi-Function Assys.',
 'Testing (Non-Prod).',
 'Testing (Non-Prod).',
 'Firm Fixed Price',
 'NRE - Data Items, NRE - Engineering, NRE - Qualification, Pumps, Tech/Eng Services.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Gen Structural Assys, NRE - Other, Valves.',
 'Gen Structural Assys, NRE - Other, Valves.',
 'Cable Assemblies RF, CableAssy&HarnMulti, NRE - Other.',
 'Cost Plus Fixed Fee',
 'Time & Material',
 'Cable Assemblies RF, CableAssy&HarnMulti, NRE - Other.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Alum Invest Casting, NRE - Engineering, NRE - Other.',
 'Alum Invest Casting, NRE - Engineering, NRE - Other.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Time & Material',
 'Tech/Eng Services.',
 'Tech/Eng Services.',
 'NRE - Data Items, NRE - Engineering, NRE - Qualification, Pumps, Tech/Eng Services.',
 'NRE - Engineering, Titanium Invest Cast.',
 'NRE - Engineering, Titanium Invest Cast.',
 'Firm Fixed Price',
 'Cost Plus Fixed Fee',
 'Firm Fixed Price',
 'NRE - Other.',
 'NRE - Other.',
 'Firm Fixed Price',
 'Tech/Eng Services.',
 'Tech/Eng Services.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Time & Material',
 'FinsWings&Boattails.',
 'FinsWings&Boattails.',
 'Firm Fixed Price',
 'Gen Structural Assys, NRE - Engineering.',
 'Gen Structural Assys, NRE - Engineering.',
 'Firm Fixed Price',
 'Time & Material',
 'Firm Fixed Price',
 'Explosive Cut Device.',
 'Explosive Cut Device.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Cost Plus Fixed Fee',
 'NRE - Engineering, Receivers.',
 'NRE - Engineering, Receivers.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'NRE - Other.',
 "Metal Shp'g Containr.",
 "Metal Shp'g Containr.",
 'NRE - Other.',
 'NRE - Other.',
 'Firm Fixed Price',
 'Missile Antenna &Ped.',
 'Missile Antenna &Ped.',
 'AlarmBuzzerSensor, EnvTestEq(Shock/etc).',
 'AlarmBuzzerSensor, EnvTestEq(Shock/etc).',
 'Missile Antenna &Ped, NRE - Engineering, NRE - Other.',
 'Missile Antenna &Ped, NRE - Engineering, NRE - Other.',
 'Firm Fixed Price',
 'Iron Batteries.',
 'Iron Batteries.',
 'Firm Fixed Price',
 'Time & Material',
 "Custom CCA's, NRE - Other.",
 'Firm Fixed Price',
 "Custom CCA's, NRE - Other.",
 'Gen Structural Assys.',
 'Gen Structural Assys.',
 'Test Equipment.',
 'Test Equipment.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Transducers.',
 'Firm Fixed Price',
 'Chargers, Lithium Batteries, NRE - Other.',
 'Chargers, Lithium Batteries, NRE - Other.',
 'NRE - Other.',
 'Transducers.',
 'NRE - Other.',
 'NRE - Other.',
 'Iron Batteries, NRE - Other.',
 'Firm Fixed Price',
 'Iron Batteries, NRE - Other.',
 'Firm Fixed Price',
 'Accelerometers, Amplifiers, Cable/CableAssyHV, Non-complex Machined.',
 'Accelerometers, Amplifiers, Cable/CableAssyHV, Non-complex Machined.',
 'Firm Fixed Price',
 'Cost Plus Fixed Fee',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'NRE - Other.',
 'Iron Batteries.',
 'Iron Batteries.',
 'Firm Fixed Price',
 'Test Equipment.',
 'Test Equipment.',
 'Firm Fixed Price',
 'Services: Nonproduct.',
 'Services: Nonproduct.',
 'Firm Fixed Price',
 'Measuring Devices.',
 'Measuring Devices.',
 'Firm Fixed Price',
 'Gen Structural Assys, NRE - Other.',
 'Gen Structural Assys, NRE - Other.',
 'Measuring Devices.',
 'Measuring Devices.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Launchers&Cannisters.',
 'Firm Fixed Price',
 'Launchers&Cannisters.',
 'Machine Shop Work.',
 'Machine Shop Work.',
 'Firm Fixed Price',
 'NRE - Other, T/E Rental/Lease.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Gen Structural Assys, Non-complex Machined.',
 'Gen Structural Assys, Non-complex Machined.',
 'NRE - Other, Titanium Plate.',
 'NRE - Other, Titanium Plate.',
 'Gears, Precision Machined.',
 'Gears, Precision Machined.',
 'NRE - Other.',
 'Firm Fixed Price',
 'NRE - Other.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'NRE - Other.',
 'Bolts, Launchers&Cannisters.',
 'Bolts, Launchers&Cannisters.',
 'FinsWings&Boattails.',
 'FinsWings&Boattails.',
 'Firm Fixed Price',
 "Custom CCA's, NRE - Other.",
 "Custom CCA's, NRE - Other.",
 'Missile Antenna &Ped, NRE - Other.',
 'Missile Antenna &Ped, NRE - Other.',
 'Firm Fixed Price',
 'Gen Structural Assys, Non-complex Machined.',
 'Gen Structural Assys, Non-complex Machined.',
 'Firm Fixed Price',
 'Iron Batteries.',
 'Firm Fixed Price',
 'CableAssy&HarnMulti, NRE - Other.',
 'CableAssy&HarnMulti, NRE - Other.',
 'Firm Fixed Price',
 'NRE - Other, T/E Rental/Lease.',
 'Firm Fixed Price',
 'Gen Structural Assys, NRE - Engineering.',
 'Gen Structural Assys, NRE - Engineering.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Time & Material',
 'Gen Structural Assys.',
 'Gen Structural Assys.',
 'Gen Structural Assys, NRE - Engineering.',
 'Gen Structural Assys, NRE - Engineering.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Time & Material',
 'Firm Fixed Price',
 'Firm Fixed Price',
 "Custom CCA's.",
 "Custom CCA's.",
 "Custom CCA's.",
 "Custom CCA's.",
 'CableAssy&HarnMulti, NRE - Other.',
 'CableAssy&HarnMulti, NRE - Other.',
 'NRE - Other.',
 'NRE - Other.',
 'Major Assemblies.',
 'Major Assemblies.',
 "Custom CCA's, NRE - Other.",
 "Custom CCA's, NRE - Other.",
 'Transmitters.',
 'Transmitters.',
 'Firm Fixed Price',
 'Missile Antenna &Ped.',
 'Missile Antenna &Ped.',
 'Non-complex Machined, Precision Machined.',
 'Non-complex Machined, Precision Machined.',
 'Firm Fixed Price',
 'T/E Rental/Lease.',
 'T/E Rental/Lease.',
 'IMUs IRUs.',
 'IMUs IRUs.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Test Equipment.',
 'Test Equipment.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Test Equipment.',
 'Firm Fixed Price',
 'Test Equipment.',
 'Firm Fixed Price',
 'NRE - Engineering.',
 'NRE - Engineering.',
 'Non-complex ShtMetal.',
 'Non-complex ShtMetal.',
 'Test Equipment.',
 'Test Equipment.',
 'Firm Fixed Price',
 'Gen Structural Assys.',
 'Gen Structural Assys.',
 'NRE - Other, Protect&Dust Covers, Rectanglar Connector, S&A Devices.',
 'NRE - Other, Protect&Dust Covers, Rectanglar Connector, S&A Devices.',
 'Firm Fixed Price',
 'Tech/Eng Services.',
 'Time & Material',
 'Tech/Eng Services.',
 'NRE - Other.',
 'NRE - Other.',
 'Firm Fixed Price',
 'CableAssy&HarnMulti, NRE - Other.',
 'Fasteners & Hardware.',
 'Fasteners & Hardware.',
 'Firm Fixed Price',
 'Measuring Devices, NRE - Other.',
 'Measuring Devices, NRE - Other.',
 'Firm Fixed Price',
 'Shafts.',
 'Firm Fixed Price',
 'Testing (Non-Prod).',
 'Testing (Non-Prod).',
 'CableAssy&HarnMulti.',
 'GPS Receivers.',
 'GPS Receivers.',
 'Major Assemblies.',
 'Major Assemblies.',
 'Integrtd Electr Assy, NRE - Data Items.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Encoders.',
 'Encoders.',
 'Clamps, Washers.',
 'Clamps, Washers.',
 'Accelerometers, CableMulticonductor.',
 'CableAssy&HarnMulti.',
 'Machine Shop Work.',
 'Firm Fixed Price',
 'Composites.',
 'Composites.',
 'Accelerometers, CableMulticonductor.',
 'Wire Cable.',
 'Wire Cable.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Encoders.',
 'Encoders.',
 'Clamps, Non-complex Machined, Protect&Dust Covers.',
 'Clamps, Non-complex Machined, Protect&Dust Covers.',
 'Non-complex Machined.',
 'Non-complex Machined.',
 'AC-DC Power Supplies, Adaptors, Backshells, CableAssy&HarnMulti, Chargers, Custom - Computer SW, Filter Pin Connector, Flex Assy(w/Connect), Lithium Batteries, Microprocessors.',
 'AC-DC Power Supplies, Adaptors, Backshells, CableAssy&HarnMulti, Chargers, Custom - Computer SW, Filter Pin Connector, Flex Assy(w/Connect), Lithium Batteries, Microprocessors.',
 'Amplifiers.',
 'CableAssy&HarnMulti, NRE - Other.',
 'CableAssy&HarnMulti, NRE - Other.',
 'Major Assemblies.',
 'Major Assemblies.',
 'Firm Fixed Price',
 'Test Equipment.',
 'Test Equipment.',
 'Firm Fixed Price',
 'Lithium Batteries.',
 'Firm Fixed Price',
 'Firm Fixed Price',
 'Firm Fixed Price']

Identify states involved with Critical Technologies

In [ ]:
ctech= clean_df[clean_df['subaward_description'].str.contains('Batteries|batteries|Sensors|sensors|sensor|Sensor|Detonator&Initiaor|explosive|Explosive|Missile|missile|explosives|Explosives|Launchers&Cannisters|transmitters|Transmitters|Transmitter|Receivers|Receiver|receiver|Encoders|Encoder')==True]

ctech['subaward_primary_place_of_performance_state_name'].value_counts()
Out[ ]:
California       16
Arizona           6
Missouri          6
Pennsylvania      4
Massachusetts     2
Virginia          2
Maryland          2
Ohio              2
Iowa              2
Name: subaward_primary_place_of_performance_state_name, dtype: int64

Batteries

In [ ]:
batteries_sensors=clean_df[clean_df['subaward_description'].str.contains('Batteries|batteries|Sensors|sensors|sensor|Sensor')==True]
pd.DataFrame(batteries_sensors[['subawardee_name','subaward_primary_place_of_performance_city_name',
                   'subaward_primary_place_of_performance_state_name']]).drop_duplicates()
Out[ ]:
subawardee_name subaward_primary_place_of_performance_city_name subaward_primary_place_of_performance_state_name
116 MEASUREMENT SPECIALTIES, INC. HAMPTON Virginia
121 EAGLEPICHER TECHNOLOGIES, LLC JOPLIN Missouri
122 EAGLEPICHER TECHNOLOGIES, LLC Joplin Missouri
140 SPACE VECTOR CORPORATION CHATSWORTH California
159 ADVANCED THERMAL BATTERIES INC. WESTMINSTER Maryland
333 DIVERSIFIED TECHNICAL SYSTEMS, INC. SEAL BEACH California
In [ ]:
batteries_sensors['subawardee_name'].value_counts()
Out[ ]:
EAGLEPICHER TECHNOLOGIES, LLC          6
MEASUREMENT SPECIALTIES, INC.          2
SPACE VECTOR CORPORATION               2
ADVANCED THERMAL BATTERIES INC.        2
DIVERSIFIED TECHNICAL SYSTEMS, INC.    2
Name: subawardee_name, dtype: int64

Explosives

In [ ]:
explosives=clean_df[clean_df['subaward_description'].str.contains('Detonator&Initiaor|explosive|Explosive|Missile|missile|explosives|Explosives|Launchers&Cannisters')==True]

pd.DataFrame(explosives[['subawardee_name','subaward_primary_place_of_performance_city_name',
                   'subaward_primary_place_of_performance_state_name']]).drop_duplicates()
Out[ ]:
subawardee_name subaward_primary_place_of_performance_city_name subaward_primary_place_of_performance_state_name
33 PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY... CHANDLER Arizona
114 PORT ELECTRONICS CORPORATION LAWRENCE Massachusetts
118 MORGAN ADVANCED CERAMICS, INC HAYWARD California
177 MARVIN ENGINEERING CO., INC. INGLEWOOD California
202 HI-TECH MACHINING & ENGINEERING, L.L.C. TUCSON Arizona
209 ATK SPACE SYSTEMS INC. SAN DIEGO California
252 ALLCOMP INC. CITY OF INDUSTRY California
In [ ]:
explosives['subawardee_name'].value_counts()
Out[ ]:
PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC    4
PORT ELECTRONICS CORPORATION                                       2
MORGAN ADVANCED CERAMICS, INC                                      2
MARVIN ENGINEERING CO., INC.                                       2
HI-TECH MACHINING & ENGINEERING, L.L.C.                            2
ATK SPACE SYSTEMS INC.                                             2
ALLCOMP INC.                                                       2
Name: subawardee_name, dtype: int64

Radio Frequency Devices

In [ ]:
rf=clean_df[clean_df['subaward_description'].str.contains('transmitters|Transmitters|Transmitter|Receivers|Receiver|receiver|Encoders|Encoder')==True]

pd.DataFrame(rf[['subawardee_name','subaward_primary_place_of_performance_city_name',
                   'subaward_primary_place_of_performance_state_name']]).drop_duplicates()
Out[ ]:
subawardee_name subaward_primary_place_of_performance_city_name subaward_primary_place_of_performance_state_name
42 L3 TECHNOLOGIES, INC. SAN DIEGO California
104 HERLEY INDUSTRIES, INC. LANCASTER Pennsylvania
249 QUASONIX, LLC WEST CHESTER Ohio
304 BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS... CEDAR RAPIDS Iowa
311 L3 TECHNOLOGIES, INC. BRISTOL Pennsylvania
In [ ]:
rf['subawardee_name'].value_counts()
Out[ ]:
L3 TECHNOLOGIES, INC.                                              6
HERLEY INDUSTRIES, INC.                                            2
QUASONIX, LLC                                                      2
BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS INTEGRATION INC.    2
Name: subawardee_name, dtype: int64

How long do the contracts run on an average? Which are the longest and smallest duration contracts?

In [ ]:
contract_duration= df[['prime_award_period_of_performance_start_date',
                       'prime_award_period_of_performance_potential_end_date',
                       'prime_award_funding_office_name','prime_award_project_title',
                       'subawardee_name','subawardee_parent_name','prime_award_primary_place_of_performance_state_name']]
contract_duration.info()
<class 'pandas.core.frame.DataFrame'>
Int64Index: 347 entries, 0 to 347
Data columns (total 7 columns):
 #   Column                                                Non-Null Count  Dtype 
---  ------                                                --------------  ----- 
 0   prime_award_period_of_performance_start_date          347 non-null    object
 1   prime_award_period_of_performance_potential_end_date  347 non-null    object
 2   prime_award_funding_office_name                       347 non-null    object
 3   prime_award_project_title                             347 non-null    object
 4   subawardee_name                                       347 non-null    object
 5   subawardee_parent_name                                242 non-null    object
 6   prime_award_primary_place_of_performance_state_name   347 non-null    object
dtypes: object(7)
memory usage: 21.7+ KB

Convert Dates to appropriate column types

In [ ]:
contract_duration['prime_award_period_of_performance_start_date'] = pd.to_datetime(
    contract_duration['prime_award_period_of_performance_start_date'], format='%Y-%m-%d')

contract_duration['prime_award_period_of_performance_potential_end_date'] = pd.to_datetime(
    contract_duration['prime_award_period_of_performance_potential_end_date'], format='%Y-%m-%d')

contract_duration.head()
/usr/local/lib/python3.7/dist-packages/ipykernel_launcher.py:2: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  
/usr/local/lib/python3.7/dist-packages/ipykernel_launcher.py:5: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  """
Out[ ]:
prime_award_period_of_performance_start_date prime_award_period_of_performance_potential_end_date prime_award_funding_office_name prime_award_project_title subawardee_name subawardee_parent_name prime_award_primary_place_of_performance_state_name
0 2016-10-31 2022-03-31 DEF ADVANCED RESEARCH PROJECTS AGCY HYPERSONIC AIR BREAT ALLIANT TECHSYSTEMS OPERATIONS LLC NORTHROP GRUMMAN CORPORATION Arizona
1 2016-10-31 2022-03-31 DEF ADVANCED RESEARCH PROJECTS AGCY HYPERSONIC AIR BREAT ALLIANT TECHSYSTEMS OPERATIONS LLC NORTHROP GRUMMAN CORPORATION Arizona
2 2016-10-31 2022-03-31 AFRL RWP AMS: ADV PROGRAMS ALLIANT TECHSYSTEMS OPERATIONS LLC ORBITAL ATK, INC. Arizona
3 2016-10-31 2022-03-31 AFRL RQH HIGH SPEED SYS DIV AMS: ADV PROGRAMS ALLIANT TECHSYSTEMS OPERATIONS LLC ORBITAL ATK, INC. Arizona
4 2016-10-31 2022-03-31 DEF ADVANCED RESEARCH PROJECTS AGCY AMS: ADV PROGRAMS ALLIANT TECHSYSTEMS OPERATIONS LLC ORBITAL ATK, INC. Arizona

Calculate the number of days that it takes for each contract to be completed

In [ ]:
contract_duration['duration']= contract_duration['prime_award_period_of_performance_potential_end_date']- contract_duration['prime_award_period_of_performance_start_date']
contract_duration.head()
Out[ ]:
prime_award_period_of_performance_start_date prime_award_period_of_performance_potential_end_date prime_award_funding_office_name prime_award_project_title subawardee_name subawardee_parent_name prime_award_primary_place_of_performance_state_name duration
0 2016-10-31 2022-03-31 DEF ADVANCED RESEARCH PROJECTS AGCY HYPERSONIC AIR BREAT ALLIANT TECHSYSTEMS OPERATIONS LLC NORTHROP GRUMMAN CORPORATION Arizona 1977 days
2 2016-10-31 2022-03-31 AFRL RWP AMS: ADV PROGRAMS ALLIANT TECHSYSTEMS OPERATIONS LLC ORBITAL ATK, INC. Arizona 1977 days
3 2016-10-31 2022-03-31 AFRL RQH HIGH SPEED SYS DIV AMS: ADV PROGRAMS ALLIANT TECHSYSTEMS OPERATIONS LLC ORBITAL ATK, INC. Arizona 1977 days
4 2016-10-31 2022-03-31 DEF ADVANCED RESEARCH PROJECTS AGCY AMS: ADV PROGRAMS ALLIANT TECHSYSTEMS OPERATIONS LLC ORBITAL ATK, INC. Arizona 1977 days
6 2016-10-31 2022-03-31 AFRL RWP AMS: ADV PROGRAMS ALLIANT TECHSYSTEMS OPERATIONS LLC NORTHROP GRUMMAN CORPORATION Arizona 1977 days
In [ ]:
contract_duration['duration'].describe()
Out[ ]:
count                   171
mean     1977 days 00:00:00
std         0 days 00:00:00
min      1977 days 00:00:00
25%      1977 days 00:00:00
50%      1977 days 00:00:00
75%      1977 days 00:00:00
max      1977 days 00:00:00
Name: duration, dtype: object

It seems that all the contracts last for about 5.4 years which is again a significant long time for hackers to knwo about the companies and hack into the systems

Q: How many contracts have each agency funded?

In [ ]:
contract_count_agency= pd.DataFrame(clean_df['prime_award_funding_sub_agency_name'].value_counts().reset_index())
contract_count_agency
Out[ ]:
index prime_award_funding_sub_agency_name
0 DEFENSE ADVANCED RESEARCH PROJECTS AGENCY (DA... 257
1 DEPT OF THE AIR FORCE 89
2 DEPT OF THE NAVY 1
In [ ]:
clean_df['subawardee_name'].value_counts()
Out[ ]:
ALLIANT TECHSYSTEMS OPERATIONS LLC                                 25
DUCOMMUN LABARGE TECHNOLOGIES, INC.                                22
PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC    16
DYNETICS TECHNICAL SOLUTIONS, INC.                                 13
A. P. I. INCORPORATED                                              12
                                                                   ..
CARLETON TECHNOLOGIES INC                                           1
MORGAN ADVANCED CERAMICS, INC.                                      1
GRAY'S ENGINEERING & CONSULTING, INC.                               1
PORT ELECTRONICS CORP.                                              1
ROCKWELL COLLINS, INC.                                              1
Name: subawardee_name, Length: 79, dtype: int64

Group subcontractors by parent name

In [ ]:
contractors= clean_df.groupby('subawardee_parent_name').first().reset_index()
contractors.head()
Out[ ]:
subawardee_parent_name prime_award_unique_key prime_award_piid prime_award_amount prime_award_base_action_date prime_award_base_action_date_fiscal_year prime_award_latest_action_date prime_award_latest_action_date_fiscal_year prime_award_period_of_performance_start_date prime_award_period_of_performance_current_end_date ... subaward_primary_place_of_performance_city_name subaward_primary_place_of_performance_state_code subaward_primary_place_of_performance_state_name subaward_primary_place_of_performance_address_zip_code subaward_primary_place_of_performance_congressional_district subaward_primary_place_of_performance_country_code subaward_primary_place_of_performance_country_name subaward_description usaspending_permalink subaward_fsrs_report_last_modified_date
0 AEROJET ROCKETDYNE HOLDINGS, INC. CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 174746702.0 2016-10-31 2017 2021-09-15 2021 2016-10-31 2022-03-31 ... BRISTOW VA Virginia 201361152 11 USA UNITED STATES Cost Plus Fixed Fee https://www.usaspending.gov/award/CONT_AWD_HR0... 2017-09-27 14:39:26+00
1 AI CONVOY HOLDCO LIMITED CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 174746702.0 2016-10-31 2017 2021-09-15 2021 2016-10-31 2022-03-31 ... ORCHARD PARK NY New York 141274121 27 USA UNITED STATES Tech/Eng Services. https://www.usaspending.gov/award/CONT_AWD_HR0... 2020-11-17 10:56:12+00
2 AI Convoy & Cy S.C.A. CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 174746702.0 2016-10-31 2017 2021-09-15 2021 2016-10-31 2022-03-31 ... ORCHARD PARK NY New York 141274121 27 USA UNITED STATES Tech/Eng Services. https://www.usaspending.gov/award/CONT_AWD_HR0... 2021-11-16 13:35:00+00
3 ALLIED MOTION TECHNOLOGIES INC. CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 174746702.0 2016-10-31 2017 2021-09-15 2021 2016-10-31 2022-03-31 ... TULSA OK Oklahoma 741463638 01 USA UNITED STATES Firm Fixed Price https://www.usaspending.gov/award/CONT_AWD_HR0... 2018-12-14 17:39:50+00
4 AMPHENOL CORPORATION CONT_AWD_HR001117C0025_9700_-NONE-_-NONE- HR001117C0025 174746702.0 2016-10-31 2017 2021-09-15 2021 2016-10-31 2022-03-31 ... DEPEW NY New York 140432417 27 USA UNITED STATES Accelerometers, CableMulticonductor. https://www.usaspending.gov/award/CONT_AWD_HR0... 2021-11-16 13:35:00+00

5 rows × 88 columns

Preparing data for the network graph

In [ ]:
network=pd.DataFrame(contractors[['subaward_primary_place_of_performance_state_name',
             'subawardee_parent_name','subawardee_name',
             'subaward_primary_place_of_performance_country_name'
             ]])
network.head()
Out[ ]:
subaward_primary_place_of_performance_state_name subawardee_parent_name subawardee_name subaward_primary_place_of_performance_country_name
0 Virginia AEROJET ROCKETDYNE HOLDINGS, INC. AEROJET ROCKETDYNE, INC. UNITED STATES
1 New York AI CONVOY HOLDCO LIMITED COBHAM MISSION SYSTEMS ORCHARD PARK INC. UNITED STATES
2 New York AI Convoy & Cy S.C.A. COBHAM MISSION SYSTEMS ORCHARD PARK INC. UNITED STATES
3 Oklahoma ALLIED MOTION TECHNOLOGIES INC. EMOTEQ CORPORATION UNITED STATES
4 New York AMPHENOL CORPORATION PCB PIEZOTRONICS, INC. UNITED STATES
In [ ]:
network['subaward_primary_place_of_performance_state_name'].value_counts().reset_index()
Out[ ]:
index subaward_primary_place_of_performance_state_name
0 California 9
1 Arizona 7
2 Pennsylvania 5
3 New York 4
4 Maryland 3
5 Ohio 3
6 Missouri 3
7 Virginia 2
8 Colorado 2
9 Tennessee 2
10 Connecticut 2
11 Alabama 2
12 Iowa 2
13 North Carolina 1
14 Oregon 1
15 Utah 1
16 Wisconsin 1
17 Minnesota 1
18 Oklahoma 1
19 Florida 1
20 Massachusetts 1
21 Illinois 1
In [ ]:
nodes1=[]

for i in range(0,len(network['subaward_primary_place_of_performance_state_name'])):
  state= network['subaward_primary_place_of_performance_country_name'][i]
  parent=network['subaward_primary_place_of_performance_state_name'][i]
  connection=[state, parent]
  nodes1.append(connection)


nodes1
Out[ ]:
[['UNITED STATES', 'Virginia'],
 ['UNITED STATES', 'New York'],
 ['UNITED STATES', 'New York'],
 ['UNITED STATES', 'Oklahoma'],
 ['UNITED STATES', 'New York'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'Arizona'],
 ['UNITED STATES', 'Arizona'],
 ['UNITED STATES', 'Maryland'],
 ['UNITED STATES', 'Wisconsin'],
 ['UNITED STATES', 'Iowa'],
 ['UNITED STATES', 'Oregon'],
 ['UNITED STATES', 'Pennsylvania'],
 ['UNITED STATES', 'North Carolina'],
 ['UNITED STATES', 'Arizona'],
 ['UNITED STATES', 'Pennsylvania'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'Alabama'],
 ['UNITED STATES', 'Missouri'],
 ['UNITED STATES', 'Missouri'],
 ['UNITED STATES', 'Ohio'],
 ['UNITED STATES', 'Ohio'],
 ['UNITED STATES', 'Connecticut'],
 ['UNITED STATES', 'Utah'],
 ['UNITED STATES', 'Connecticut'],
 ['UNITED STATES', 'Tennessee'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'Minnesota'],
 ['UNITED STATES', 'Arizona'],
 ['UNITED STATES', 'Colorado'],
 ['UNITED STATES', 'Florida'],
 ['UNITED STATES', 'Colorado'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'Alabama'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'New York'],
 ['UNITED STATES', 'Pennsylvania'],
 ['UNITED STATES', 'Maryland'],
 ['UNITED STATES', 'Maryland'],
 ['UNITED STATES', 'Massachusetts'],
 ['UNITED STATES', 'Ohio'],
 ['UNITED STATES', 'Iowa'],
 ['UNITED STATES', 'Arizona'],
 ['UNITED STATES', 'Illinois'],
 ['UNITED STATES', 'Arizona'],
 ['UNITED STATES', 'Virginia'],
 ['UNITED STATES', 'Tennessee'],
 ['UNITED STATES', 'Arizona'],
 ['UNITED STATES', 'Pennsylvania'],
 ['UNITED STATES', 'Pennsylvania'],
 ['UNITED STATES', 'California'],
 ['UNITED STATES', 'Missouri']]
In [ ]:
nodes=[]

for i in range(0,len(network['subaward_primary_place_of_performance_state_name'])):
  state= network['subaward_primary_place_of_performance_state_name'][i]
  parent=network['subawardee_parent_name'][i]
  connection=[state, parent]
  nodes.append(connection)


nodes
Out[ ]:
[['Virginia', 'AEROJET ROCKETDYNE HOLDINGS, INC.'],
 ['New York', 'AI CONVOY HOLDCO LIMITED'],
 ['New York', 'AI Convoy & Cy S.C.A.'],
 ['Oklahoma', 'ALLIED MOTION TECHNOLOGIES INC.'],
 ['New York', 'AMPHENOL CORPORATION'],
 ['California', 'AMRO FABRICATING CORPORATION'],
 ['Arizona', 'APPLIED TECHNICAL SERVICES, LLC'],
 ['Arizona', 'ARLINGTON CAPITAL PARTNERS IV, L.P.'],
 ['Maryland', 'ASB AEROSPATIALE BATTERIES'],
 ['Wisconsin', 'BADGER METER, INC.'],
 ['Iowa', 'BAE SYSTEMS PLC'],
 ['Oregon', 'BERKSHIRE HATHAWAY INC.'],
 ['Pennsylvania', 'CONCURRENT TECHNOLOGIES CORPORATION'],
 ['North Carolina', 'CORVID TECHNOLOGIES LLC'],
 ['Arizona', 'CREATION TECHNOLOGIES INC'],
 ['Pennsylvania', 'CURTISS-WRIGHT CORPORATION'],
 ['California', 'DIVERSIFIED TECHNICAL SYSTEMS, INC.'],
 ['Alabama', 'DYNETICS, INC.'],
 ['Missouri', 'Ducommun Incorporated'],
 ['Missouri', 'EAGLEPICHER TECHNOLOGIES, LLC'],
 ['Ohio', 'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.'],
 ['Ohio', 'ELEMENT MATERIALS TECHNOLOGY GROUP LIMITED'],
 ['Connecticut', 'ENSIGN-BICKFORD INDUSTRIES, INC.'],
 ['Utah', 'Ems Holdco, Inc.'],
 ['Connecticut', 'Ensign-Bickford Industries, Inc.'],
 ['Tennessee', 'Etex'],
 ['California', 'Fortive Corporation'],
 ['California', 'GLENAIR, INC.'],
 ['Minnesota', 'HONEYWELL INTERNATIONAL INC.'],
 ['Arizona', 'Imaginetics Holdings LLC'],
 ['Colorado', 'KEYSIGHT TECHNOLOGIES, INC.'],
 ['Florida', 'KRATOS DEFENSE & SECURITY SOLUTIONS, INC.'],
 ['Colorado', 'Keystone Holdings Group, LLC'],
 ['California', 'L3 TECHNOLOGIES, INC.'],
 ['California', 'L3HARRIS TECHNOLOGIES, INC.'],
 ['Alabama', 'LEIDOS HOLDINGS, INC.'],
 ['California', 'MARVIN ENGINEERING CO., INC.'],
 ['California', 'MORGAN ADVANCED MATERIALS PLC'],
 ['New York', 'MTS SYSTEMS CORPORATION'],
 ['Pennsylvania', 'NICOMATIC'],
 ['Maryland', 'NORTHROP GRUMMAN CORPORATION'],
 ['Maryland', 'ORBITAL ATK, INC.'],
 ['Massachusetts', 'PARKER-HANNIFIN CORPORATION'],
 ['Ohio', 'QUASONIX, LLC'],
 ['Iowa', 'ROCKWELL COLLINS, INC.'],
 ['Arizona', 'Radius Aerospace, Inc.'],
 ['Illinois', 'STANLEY MACHINING & TOOL CORP.'],
 ['Arizona', 'Samuel, Son & Co., Limited'],
 ['Virginia', 'TE Connectivity Ltd.'],
 ['Tennessee', 'TEVET, LLC'],
 ['Arizona', 'TRIUMPH GROUP, INC.'],
 ['Pennsylvania', 'The Jordan Company L P'],
 ['Pennsylvania', 'ULTRA ELECTRONICS HOLDINGS PLC'],
 ['California', 'VISHAY PRECISION GROUP, INC.'],
 ['Missouri', 'Vectra Co.']]
In [ ]:
leaves=[]
for i in range(0,len(network['subawardee_parent_name'])):
  state= network['subawardee_parent_name'][i]
  parent=network['subawardee_name'][i]
  connection=[state, parent]
  leaves.append(connection)

leaves
Out[ ]:
[['AEROJET ROCKETDYNE HOLDINGS, INC.', 'AEROJET ROCKETDYNE, INC.'],
 ['AI CONVOY HOLDCO LIMITED', 'COBHAM MISSION SYSTEMS ORCHARD PARK INC.'],
 ['AI Convoy & Cy S.C.A.', 'COBHAM MISSION SYSTEMS ORCHARD PARK INC.'],
 ['ALLIED MOTION TECHNOLOGIES INC.', 'EMOTEQ CORPORATION'],
 ['AMPHENOL CORPORATION', 'PCB PIEZOTRONICS, INC.'],
 ['AMRO FABRICATING CORPORATION', 'AMRO FABRICATING CORPORATION'],
 ['APPLIED TECHNICAL SERVICES, LLC', "GRAY'S ENGINEERING & CONSULTING, LLC"],
 ['ARLINGTON CAPITAL PARTNERS IV, L.P.', 'RADIUS AEROSPACE, INC.'],
 ['ASB AEROSPATIALE BATTERIES', 'ADVANCED THERMAL BATTERIES INC.'],
 ['BADGER METER, INC.', 'BADGER METER, INC.'],
 ['BAE SYSTEMS PLC',
  'BAE SYSTEMS INFORMATION AND ELECTRONIC SYSTEMS INTEGRATION INC.'],
 ['BERKSHIRE HATHAWAY INC.', 'PCC STRUCTURALS, INC.'],
 ['CONCURRENT TECHNOLOGIES CORPORATION',
  'CONCURRENT TECHNOLOGIES CORPORATION'],
 ['CORVID TECHNOLOGIES LLC', 'CORVID TECHNOLOGIES LLC'],
 ['CREATION TECHNOLOGIES INC', "GRAY'S ENGINEERING & CONSULTING, INC."],
 ['CURTISS-WRIGHT CORPORATION', 'TELETRONICS TECHNOLOGY CORPORATION'],
 ['DIVERSIFIED TECHNICAL SYSTEMS, INC.',
  'DIVERSIFIED TECHNICAL SYSTEMS, INC.'],
 ['DYNETICS, INC.', 'DYNETICS TECHNICAL SOLUTIONS, INC.'],
 ['Ducommun Incorporated', 'DUCOMMUN LABARGE TECHNOLOGIES, INC.'],
 ['EAGLEPICHER TECHNOLOGIES, LLC', 'EAGLEPICHER TECHNOLOGIES, LLC'],
 ['ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.',
  'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.'],
 ['ELEMENT MATERIALS TECHNOLOGY GROUP LIMITED',
  'ELEMENT MATERIALS TECHNOLOGY CINCINNATI INC.'],
 ['ENSIGN-BICKFORD INDUSTRIES, INC.',
  'ENSIGN-BICKFORD AEROSPACE & DEFENSE COMPANY'],
 ['Ems Holdco, Inc.', 'SPARTRONICS LOGAN, LLC'],
 ['Ensign-Bickford Industries, Inc.',
  'ENSIGN-BICKFORD AEROSPACE & DEFENSE COMPANY'],
 ['Etex', 'PROMAT INC'],
 ['Fortive Corporation',
  'PACIFIC SCIENTIFIC ENERGETIC MATERIALS COMPANY (CALIFORNIA) LLC'],
 ['GLENAIR, INC.', 'GLENAIR, INC.'],
 ['HONEYWELL INTERNATIONAL INC.', 'HONEYWELL INTERNATIONAL INC.'],
 ['Imaginetics Holdings LLC', 'AZMARK AERO SYSTEMS, LLC'],
 ['KEYSIGHT TECHNOLOGIES, INC.', 'KEYSIGHT TECHNOLOGIES, INC.'],
 ['KRATOS DEFENSE & SECURITY SOLUTIONS, INC.', 'MICRO SYSTEMS, INC.'],
 ['Keystone Holdings Group, LLC', 'COORSTEK, INC.'],
 ['L3 TECHNOLOGIES, INC.', 'L3 TECHNOLOGIES, INC.'],
 ['L3HARRIS TECHNOLOGIES, INC.', 'L3 TECHNOLOGIES, INC.'],
 ['LEIDOS HOLDINGS, INC.', 'DYNETICS TECHNICAL SOLUTIONS, INC.'],
 ['MARVIN ENGINEERING CO., INC.', 'MARVIN ENGINEERING CO., INC.'],
 ['MORGAN ADVANCED MATERIALS PLC', 'MORGAN ADVANCED CERAMICS, INC'],
 ['MTS SYSTEMS CORPORATION', 'PCB PIEZOTRONICS, INC.'],
 ['NICOMATIC', 'NICOMATIC, L.P.'],
 ['NORTHROP GRUMMAN CORPORATION', 'ALLIANT TECHSYSTEMS OPERATIONS LLC'],
 ['ORBITAL ATK, INC.', 'ALLIANT TECHSYSTEMS OPERATIONS LLC'],
 ['PARKER-HANNIFIN CORPORATION', 'PARKER-HANNIFIN CORPORATION'],
 ['QUASONIX, LLC', 'QUASONIX, LLC'],
 ['ROCKWELL COLLINS, INC.', 'ROCKWELL COLLINS, INC.'],
 ['Radius Aerospace, Inc.', 'RADIUS AEROSPACE, INC.'],
 ['STANLEY MACHINING & TOOL CORP.', 'STANLEY MACHINING & TOOL CORP.'],
 ['Samuel, Son & Co., Limited', 'CAID INDUSTRIES, INC'],
 ['TE Connectivity Ltd.', 'MEASUREMENT SPECIALTIES, INC.'],
 ['TEVET, LLC', 'TEVET, LLC'],
 ['TRIUMPH GROUP, INC.', 'TRIUMPH ENGINEERED SOLUTIONS, INC.'],
 ['The Jordan Company L P', 'ARCH GLOBAL PRECISION - HUNTINGDON VALLEY, LLC'],
 ['ULTRA ELECTRONICS HOLDINGS PLC', 'HERLEY INDUSTRIES, INC.'],
 ['VISHAY PRECISION GROUP, INC.', 'DIVERSIFIED TECHNICAL SYSTEMS, INC.'],
 ['Vectra Co.', 'EAGLEPICHER TECHNOLOGIES, LLC']]