27 lines
		
	
	
		
			551 B
		
	
	
	
		
			Python
		
	
	
	
			
		
		
	
	
			27 lines
		
	
	
		
			551 B
		
	
	
	
		
			Python
		
	
	
	
# %%
 | 
						|
import pandas as pd
 | 
						|
 | 
						|
# %%
 | 
						|
data_path = '../../data_preprocess/exports/preprocessed_data.csv'
 | 
						|
full_df = pd.read_csv(data_path, skipinitialspace=True)
 | 
						|
 | 
						|
# %%
 | 
						|
df_in = full_df[full_df['MDM']].reset_index(drop=True)
 | 
						|
# %%
 | 
						|
df_out = full_df[~full_df['MDM']].reset_index(drop=True)
 | 
						|
# %%
 | 
						|
label_counts_in = df_in['unit'].value_counts()
 | 
						|
print(label_counts_in.to_string())
 | 
						|
 | 
						|
# %%
 | 
						|
label_counts_out = df_out['unit'].value_counts()
 | 
						|
print(label_counts_out.to_string())
 | 
						|
 | 
						|
 | 
						|
# %%
 | 
						|
label_counts_out['NOVALUE']/len(df_out)
 | 
						|
 | 
						|
# %%
 | 
						|
label_counts_in['NOVALUE']/len(df_out)
 | 
						|
# %%
 |