Skip to content

Instantly share code, notes, and snippets.

View mepsrajput's full-sized avatar
🎯
Focusing

Pradeep Singh mepsrajput

🎯
Focusing
View GitHub Profile
@mepsrajput
mepsrajput / simple_freq_procedure.sas
Last active April 14, 2022 14:52
Simple proc freq
/* Import the CSV */
/* Bind the fileref Gov_C to the CSV path, then load that file into the
   data set WORK.Gov_C_SAS; GETNAMES=YES asks PROC IMPORT to take the
   variable names from the file's first record. */
FILENAME Gov_C "/folders/myfolders/Assignments/governors_county.csv";
PROC IMPORT DATAFILE=Gov_C DBMS=CSV OUT=WORK.Gov_C_SAS;
GETNAMES=YES;
RUN;
/* freq procedure */
/* NOTE(review): no TABLES or RUN statement follows this PROC FREQ line in
   the listing -- the step looks truncated; confirm against the full
   program before relying on it. */
proc freq data=Gov_C_SAS;
# Import Pandas
import pandas as pd

# Import CSV (path is relative to the notebook's working directory)
data = pd.read_csv("../input/us-election-2020/governors_county.csv")

# Frequencies in Actual Order: count rows per state, then order the result
# by state label instead of by count.
datax = data['state'].value_counts().sort_index()
# Create a dataframe
# NOTE(review): no dataframe construction follows this comment in the
# listing -- the cell looks truncated; confirm against the full script.
/* One-way frequency table of state, levels listed from most to least frequent */
PROC FREQ DATA=Gov_C_SAS ORDER=FREQ;
    TABLES state;
RUN;
# Count rows per state; value_counts() already returns the counts sorted
# from most to least frequent.
datax = data['state'].value_counts()

# Assemble a frequency table: count, percent of total, and the running
# (cumulative) count and percent, with percentages rounded to 2 decimals.
datay = pd.DataFrame({
    'state': datax.index,
    'Frequency': datax.values,
    'Percent': ((datax.values / datax.values.sum()) * 100).round(2),
    # Column labels spelled out in full (previously truncated to
    # 'Cumulative Frequenc' / 'Cumulative Percen').
    'Cumulative Frequency': datax.values.cumsum(),
    'Cumulative Percent': ((datax.values.cumsum() / datax.values.sum()) * 100).round(2),
})
datay
/* Frequencies of state only: NOPERCENT and NOCUM drop the percent and cumulative columns */
PROC FREQ DATA=Gov_C_SAS;
    TABLES state / NOPERCENT NOCUM;
RUN;
# Per-state row counts, ordered by state label rather than by count.
datax = data['state'].value_counts().sort_index()

# Two-column table: the state label and how many rows carry it.
datay = pd.DataFrame({'state': datax.index, 'Frequency': datax.to_numpy()})
datay
/* county-by-state crosstab; NOROW, NOCOL and NOPERCENT leave only the cell counts */
PROC FREQ DATA=Gov_C_SAS;
    TABLES county*state / NOROW NOCOL NOPERCENT;
RUN;
# Cross-tabulate county (rows) against state (columns) as counts, with an
# extra 'Total' row and column holding the margins.
datab = pd.crosstab(
    index=data['county'],
    columns=data['state'],
    margins=True,
    margins_name='Total',
)
datab
/* Frequencies of GENRE; the MISSING option counts missing values as a level of their own */
PROC FREQ DATA=Gov_C_SAS;
    TABLES GENRE / MISSING;
RUN;
# Count rows per GENRE value; dropna=False keeps NaN as a category of its own.
datax = data['GENRE'].value_counts(dropna=False)

# Frequency table with percent of total plus running count and running
# percent, percentages rounded to 2 decimals.
datay = pd.DataFrame({
    'GENRE': datax.index,
    'Frequency': datax.to_numpy(),
    'Percent': (datax.to_numpy() / datax.sum() * 100).round(2),
    'Cumulative Frequency': datax.cumsum().to_numpy(),
    'Cumulative Percent': (datax.cumsum().to_numpy() / datax.sum() * 100).round(2),
})
datay