# You are on page 1 of 1

import pandas as pd

def to_integer_strings(column, divisor=None):
    """Return *column* as whole-number strings, with missing values as '0'.

    Args:
        column: Series of numeric text (or numbers); may contain missing
            values.
        divisor: When given, every value is divided by it and rounded to the
            nearest integer before the cast. When omitted, a value with a
            fractional part still raises ``TypeError`` from the ``Int64``
            cast, so malformed identifiers are not silently altered.

    Returns:
        A Series of strings such as ``'123'``.
    """
    # Cast before filling so the fill value is never inserted into a
    # text-typed column.
    numeric = column.astype('float').fillna(0.0)
    if divisor is not None:
        # Divide (rather than multiply by a reciprocal such as 0.001) and
        # round: the nullable Int64 cast rejects any float that is not
        # exactly integral.  Series.round rounds exact halves to even.
        numeric = (numeric / divisor).round()
    return numeric.astype('Int64').astype(str)


def normalize_processed_firme(frame):
    """Return a copy of *frame* with CUI, CAEN and turnover normalised.

    'CUI' and 'CAEN' become integer strings; 'Cifra de afacere' is divided
    by 1000, rounded, and stored as an integer string.  Missing values in
    all three columns become '0'.  The input frame is left untouched.
    """
    result = frame.copy()
    for name in ('CUI', 'CAEN'):
        result[name] = to_integer_strings(result[name])
    result['Cifra de afacere'] = to_integer_strings(
        result['Cifra de afacere'], divisor=1000
    )
    return result


def select_firme_neradiate(processed, neradiate):
    """Return the rows of *processed* whose 'CUI' occurs in *neradiate*['CUI']."""
    return processed.loc[processed['CUI'].isin(neradiate['CUI'])]


def main():
    """Read both CSV inputs, keep the matching companies, write the workbook."""
    processed_firme = pd.read_csv(
        'processed_valid_phone_numbers_all_years.csv',
        sep=',',
        dtype=str,
    )
    firme_neradiate = pd.read_csv(
        '3firme_neradiate_cu_sediu.csv',
        sep='^',
        encoding='ISO-8859-1',
        index_col=False,
        dtype=str,
    )

    processed_firme = normalize_processed_firme(processed_firme)
    matched = select_firme_neradiate(processed_firme, firme_neradiate)
    matched.to_excel('firme_neradiate_processed.xlsx', index=False)


if __name__ == '__main__':
    main()

# You might also like