我正在使用带 SUM 统计量的 PROC SUMMARY 来查看某些事物的频率。我的数据集只有 160 个观测值,但遇到的问题是频率之和为 161。我仔细检查了原始数据集,确实是 160 个观测值,所有值也都在,但不知道是什么让频率之和变成了 161。
以下是我试过的代码:
/* Build DiseaseFreq: one row per distinct (still unsplit) value of
   Concomitant_Disease in CAS.PreOp, with Freq = number of source rows
   that carry that value. */
PROC SQL;
    CREATE TABLE DiseaseFreq AS
        SELECT
            p.Concomitant_Disease,
            COUNT(*) AS Freq
        FROM CAS.PreOp AS p
        GROUP BY p.Concomitant_Disease;
QUIT;
/* Split each delimited Concomitant_Disease value from DiseaseFreq into one
   output row per disease name (delimiters: ~ ^ ,), normalised with
   PROPCASE + STRIP. Only the split name and Freq are kept; the name is
   renamed back to Concomitant_Disease on output.

   Every row written for a source value carries that value's full Freq.
   A value that lists k diseases is therefore output k times, so the total
   of Freq over Disease counts disease mentions, not source rows, and can
   exceed the number of rows in CAS.PreOp. */
DATA Disease (KEEP=var freq RENAME=(var=Concomitant_Disease));
    SET DiseaseFreq;
    /* Only the new character variable needs a length. Freq keeps the length
       it has in DiseaseFreq; shortening it to 3 bytes would make large
       counts inexact.
       NOTE(review): names longer than 25 characters are truncated - confirm
       25 is enough for the longest disease name. */
    LENGTH var $25;
    /* COUNTW gives the token count up front (0 for a missing value), so a
       blank token in the middle of the list no longer ends the loop early
       and hides the diseases that follow it. */
    DO i = 1 TO COUNTW(Concomitant_Disease, "~^,");
        var = STRIP(PROPCASE(SCAN(Concomitant_Disease, i, "~^,")));
        /* Skip tokens that are blank (e.g. "A, ,B" or trailing padding). */
        IF NOT MISSING(var) THEN OUTPUT;
    END;
RUN;
/* Collapse Disease to one total per disease name by summing Freq into the
   Count dataset. NWAY is not specified, so Count also contains the overall
   total row (_TYPE_=0) in addition to the per-disease rows (_TYPE_=1);
   adding up the Freq column of Count would double-count. */
PROC SUMMARY DATA=Disease;
    CLASS Concomitant_Disease;
    VAR Freq;
    OUTPUT OUT=Count
           SUM(Freq)=Freq;
RUN;