# Compute, over the distinct (user_id, date) rows of `nowcoder`, the share of
# rows for which the same user also has a row dated exactly one day earlier,
# and print it rounded to two decimals.
# NOTE(review): this looks like a next-day retention rate -- confirm against
# the problem statement this script was written for.

# Keep only the columns the calculation needs. The explicit .copy() makes this
# an independent frame, so the column assignment below does not write into a
# slice of the original table (avoids pandas' SettingWithCopyWarning).
nowcoder = nowcoder[['user_id', 'date']].copy()

# Normalise to plain calendar dates (time of day dropped) so that several
# records on the same day compare equal.
nowcoder['date'] = pd.to_datetime(nowcoder['date']).dt.date

# De-duplicate: at most one row per (user_id, date).
nowcoder = nowcoder.drop_duplicates()

# Work on a separate copy for the right-hand side of the self-join.
df = nowcoder.copy(deep=True)

# Follow the SQL-style self-join approach: shift every date forward by one
# day, so a right-hand row matches the left-hand row of the following day.
df['last_date'] = df['date'] + timedelta(days=1)

# Left join keeps every (user_id, date) row; `date_y` / `last_date` are NaN
# when the user has no row on the preceding day.
df1 = pd.merge(
    nowcoder,
    df,
    left_on=['user_id', 'date'],
    right_on=['user_id', 'last_date'],
    how='left',
)[['user_id', 'date_x', 'date_y', 'last_date']]

# Rows that found a match on the preceding day.
df2 = df1.dropna()

# Guard the division so an empty table prints 0.0 instead of raising
# ZeroDivisionError.
print(round(len(df2) / len(df1), 2) if len(df1) else 0.0)