|
|

楼主 |
发表于 2019-10-24 09:41:34
|
显示全部楼层
import pandas as pd
import numpy as np
from collections import Counter
from sklearn import preprocessing
import scipy
import sys
#查找路径
import os
def _is_genotype(value):
    """Return True when *value* is a two-character genotype string such as "AG"."""
    return isinstance(value, str) and len(value) == 2


def recode_column(column):
    """Recode one genotype column as a count of non-major alleles (0, 1 or 2).

    The major allele is the single character that occurs most often across
    all genotypes of the column (ties go to the allele seen first).  Each
    genotype is then replaced by the number of its characters that differ
    from the major allele, so for a biallelic marker:

    * homozygous major  -> 0
    * heterozygous      -> 1
    * homozygous minor  -> 2

    Missing values stay missing.  A column that contains anything other than
    two-character strings (for example a sample-ID column) is returned
    unchanged instead of raising.

    Args:
        column: a pandas Series holding the genotypes of one marker.

    Returns:
        A new Series with the same index; the input is never modified.
    """
    observed = column.dropna()
    if observed.empty or not all(_is_genotype(value) for value in observed):
        return column

    genotype_counts = Counter(observed)

    # Allele frequencies are weighted by how many samples carry each genotype.
    allele_counts = Counter()
    for genotype, n_samples in genotype_counts.items():
        for allele in genotype:
            allele_counts[allele] += n_samples

    # max() keeps the first maximal key, so ties fall to the first-seen allele.
    major_allele = max(allele_counts, key=allele_counts.get)

    codes = {
        genotype: sum(allele != major_allele for allele in genotype)
        for genotype in genotype_counts
    }
    recoded = column.map(codes)
    if column.isna().any():
        # Nullable integers keep the codes integral next to missing values.
        recoded = recoded.astype("Int64")
    return recoded


def recode_genotypes(genotypes):
    """Return a copy of *genotypes* with every genotype column recoded to 0/1/2.

    Columns are assigned back on a copy rather than edited through
    ``frame[col].replace(..., inplace=True)``, because that chained in-place
    form does not reliably write through to the parent DataFrame.

    Args:
        genotypes: DataFrame with one column per marker.

    Returns:
        A new DataFrame with the same index and columns.
    """
    recoded = genotypes.copy()
    for marker in recoded.columns:
        recoded[marker] = recode_column(recoded[marker])
    return recoded


def main():
    """Read ``genotype.csv``, recode it and write the result to ``rename.csv``."""
    # Show the working directory, since both file names are relative to it.
    print(os.path.abspath('.'))

    # Load the genotype table; the first row holds the column names.
    genotypes = pd.read_csv("genotype.csv", header=0)
    print(genotypes)
    print(genotypes.columns)

    recode_genotypes(genotypes).to_csv('rename.csv')


if __name__ == "__main__":
    main()
|
|