目录
dataframe
def merge2Date(year, month, day, hour, minute):
    """Combine separate date/time components into one ``datetime``.

    Each component is passed through ``int()`` first, so numeric strings
    and floats are accepted as well as integers.

    Args:
        year, month, day, hour, minute: Components of the timestamp.

    Returns:
        A naive ``datetime`` with seconds set to zero.

    Raises:
        ValueError: If a component cannot be converted to ``int`` or is
            out of range for ``datetime``.
    """
    return datetime(*(int(part) for part in (year, month, day, hour, minute)))
# Build a 'cdate' column by calling merge2Date on every row's
# year/month/day/hour/minute fields (axis=1 applies the function row-wise).
# NOTE(review): pd.to_datetime on these five columns may be a faster,
# vectorized alternative -- confirm behaviour on your data before switching.
Train_data['cdate'] = Train_data.apply(
    lambda rec: merge2Date(rec.year, rec.month, rec.day, rec.hour, rec.minute),
    axis=1,
)
# Convert the column to a numeric dtype, round to 0 decimals, then cast to int.
df_bar['insize_k'] = pd.to_numeric(df_bar['insize_k']).round(0).astype(int)
# New column from a 20x1 array of random integers drawn from 1..4
# (the upper bound 5 is exclusive); [0] selects that single column.
df['gene1_old'] = pd.DataFrame(np.random.randint(1, 5, (20, 1)))[0]
# Distinct values found in the 'gene' column.
df['gene'].unique()
# Number of occurrences of each distinct value in the column.
df[col_name].value_counts()
# Walk the frame row by row; iterrows() yields (index label, row) pairs.
for index, row in df.iterrows():
    print(index)  # print the index label of each row
# Copy the index into a regular column named 'index'.
df['index'] = df.index
# Remove the column 'colName' from the frame.
del df['colName']
# Use "Column" as the index, modifying df in place.
df.set_index(["Column"], inplace=True)
# Rename column 'a' to 'A'. Without inplace=True this returns a new
# DataFrame, so assign the result if the renamed frame should be kept.
df.rename(columns={'a':'A'})
# Select only columns 'a' and 'b'.
df[['a', 'b']]
# Join the two frames on their shared 'gene' column
# (pandas' default join type is an inner join).
df0 = pd.merge(df_tmp, df_tmp2, on='gene')
统计方法实现
import statsmodels.api as sm
# Multiple-testing correction of the p-values in df['p'] using the
# function's default settings. The call returns four items: the
# reject flags, the corrected p-values, and the Sidak- and
# Bonferroni-corrected alpha levels.
(reject, pvals_corrected, alphacSidak, alphacBonf) = sm.stats.multipletests(
    df['p']
)
文件操作
语法操作
def foo(var, x, y):
    """Apply the binary arithmetic operator named by ``var`` to ``x`` and ``y``.

    Args:
        var: One of ``'+'``, ``'-'``, ``'*'`` or ``'/'``.
        x: Left operand.
        y: Right operand.

    Returns:
        The result of ``x <op> y``; ``'/'`` is true division.

    Raises:
        KeyError: If ``var`` is not one of the supported operator symbols.
        ZeroDivisionError: If ``var`` is ``'/'`` and ``y`` is zero.
    """
    import operator  # local import keeps this snippet self-contained

    # Dispatch table: operator symbol -> callable implementing it.
    operations = {
        '+': operator.add,
        '-': operator.sub,
        '*': operator.mul,
        '/': operator.truediv,
    }
    return operations[var](x, y)
## dic.items() yields the dictionary's entries as (key, value) tuples.
## The key= function picks element [1] of each tuple (the value) as the
## sort key; reverse=True orders the result from largest to smallest.
tmp = sorted(dic.items(), key=lambda pair: pair[1], reverse=True)
网页操作
import html
def make_element(name, value, **attrs):
    """Build a markup element string with escaped content and attributes.

    Args:
        name: Tag name; inserted verbatim (not escaped or validated).
        value: Element content; converted with ``str()`` and HTML-escaped.
        **attrs: Attribute names mapped to their values. Values are
            converted with ``str()`` and HTML-escaped (quotes included) so
            they cannot break out of the surrounding double quotes.
            Attribute names are inserted verbatim.

    Returns:
        A string of the form ``<name attr="value" ...>content</name>``.
    """
    attr_str = ''.join(
        ' {}="{}"'.format(key, html.escape(str(val), quote=True))
        for key, val in attrs.items()
    )
    return '<{name}{attrs}>{value}</{name}>'.format(
        name=name,
        attrs=attr_str,
        value=html.escape(str(value)),
    )
# Example
# Creates '<item size="large" quantity="6">Albatross</item>'
make_element('item', 'Albatross', size='large', quantity=6)
# Creates '<p>&lt;spam&gt;</p>' (the element content is HTML-escaped)
make_element('p', '<spam>')
网友评论