博文

目前显示的是 2023 年 6 月的博文

pandas 计算年龄，并分组计算非重复计数和年龄小于 7 岁的非重复计数

import pandas as pd import numpy as np import janitor sc = (     pd . read_excel ( "/mnt/c/Users/xuefeng/Downloads/非重卡删除.xlsx" , dtype = { 'SC_GLDW_BM' : 'object' , 'YM_BM' : 'object' }).clean_names() ) (     sc .query( 'ym_mc.str.startswith("新冠")' )     .astype({ 'sc_gldw_bm' : 'string' })     .assign( shi = lambda x : x .sc_gldw_bm.str[ 0 : 4 ])     .groupby( 'shi' )     .agg( count = ( 'shi' , 'count' ))     .reset_index()     .sort_values( 'shi' )     .to_excel( "/mnt/c/Users/xuefeng/Downloads/非重卡删除1.xlsx" ) ) test = (     sc .assign( xian = sc .sc_gldw_bm.str[: 6 ], shi = sc .sc_gldw_bm.str.slice( 0 , 4 ), csrq = sc .zjhm.str[ 6 : 14 ])     .query( "sc_gldw_bm.str.startswith('6211') & csrq.str.len()==8 & csrq.str.slice(0,2) in ('19','20')" )     .assign( age = lambda x :( pd . to_datetime ( x .jz_sj) - pd . to_da