# Small sample table (one header line plus three rows) used by the examples below.
# NOTE(review): the later read_csv call uses sep="\t", so the two fields on each
# line are presumably separated by a tab character - confirm the whitespace
# survived copy/paste before running.
data='''taxonomy coverage
ko04141,map04141 338.586386
ko00970,map00970 338.586386
ko00970,map00970 338.586386'''
# IPython %store magic: writes the string held in `data` to the file test_data.txt.
%store data >test_data.txt
Writing 'data' (str) to file 'test_data.txt'.
import pandas as pd
# Load the tab-delimited sample file into a DataFrame, then display it.
df51 = pd.read_table("test_data.txt", sep="\t")
df51
| | taxonomy | coverage |
|---|---|---|
| 0 | ko04141,map04141 | 338.586386 |
| 1 | ko00970,map00970 | 338.586386 |
| 2 | ko00970,map00970 | 338.586386 |
def split_at_comma_n_get_2nd(item: str) -> str:
    """Return the second comma-separated field of ``item``.

    Args:
        item: A string with at least one comma, e.g. ``"ko04141,map04141"``.

    Returns:
        The text between the first comma and the next comma (or the end of
        the string when there is only one comma).

    Raises:
        IndexError: If ``item`` contains no comma, so there is no second field.
    """
    parts = item.split(",")
    return parts[1]
# Replace each taxonomy entry with its second comma-separated field, then display.
df51["taxonomy"] = df51["taxonomy"].apply(split_at_comma_n_get_2nd)
df51
| | taxonomy | coverage |
|---|---|---|
| 0 | map04141 | 338.586386 |
| 1 | map00970 | 338.586386 |
| 2 | map00970 | 338.586386 |
# reset back to 'unfixed'
import pandas as pd
# Reload the file, then keep only the second comma-separated field of each
# taxonomy entry using an inline lambda, and display the result.
df51 = pd.read_table("test_data.txt", sep="\t")
df51["taxonomy"] = df51["taxonomy"].apply(lambda entry: entry.split(',')[1])
df51
| | taxonomy | coverage |
|---|---|---|
| 0 | map04141 | 338.586386 |
| 1 | map00970 | 338.586386 |
| 2 | map00970 | 338.586386 |