import sys
import pandas as pd
import numpy as np
import itertools as it
import zipfile
import re
#adding the lib path
sys.path.append('/Users/abhishek/dev/appys/lib/')
import utils
# Presets: directory that holds the expression data for this analysis.
data_dir = "/Users/abhishek/apratap_bt/projects/PCBC_integrative_analysis/data/"

# Ask the project-local helper for the expression files found at data_dir
# that match the 'genes.fpkm_tracking' pattern.
fpkm_files = utils.get_FilesList(
    data_dir,
    pattern='genes.fpkm_tracking',
)
# Output: [get_FilesList]: Found 8 files at /Users/abhishek/apratap_bt/projects/PCBC_integrative_analysis/data/
# Summarize the per-sample tracking files into a single table: rows follow the
# index (first column) of the tracking files, and each column holds the 'FPKM'
# values of one sample. The table is then written out as a tab-separated file.
if not fpkm_files:
    # With no input there is no index to build the table on; fail with a
    # clear message instead of an obscure pandas constructor error.
    raise ValueError("no genes.fpkm_tracking files found; nothing to summarize")

fpkms = {}
index = None
for fpkm_file in fpkm_files:
    # Sample name = third '_'-separated field of path component 7.
    # NOTE(review): presumably component 7 is the entry directly below the
    # data directory for the absolute paths used here -- confirm if the data
    # directory is ever moved. Two files yielding the same sample name would
    # overwrite each other in `fpkms`.
    sample_name = fpkm_file.split('/')[7].split('_')[2]

    # DataFrame.from_csv was removed in pandas 1.0. read_csv with index_col=0
    # keeps the first column as the row index as from_csv did (from_csv also
    # attempted date parsing of the index, which is not wanted here).
    df = pd.read_csv(fpkm_file, sep="\t", header=0, index_col=0)

    # The FPKM values are stored positionally and labelled with a single
    # shared index below, so every file must list its rows in the same order;
    # otherwise values would be attributed to the wrong rows.
    if index is not None and not df.index.equals(index):
        raise ValueError(
            "row index of %s does not match the previously read files"
            % fpkm_file
        )

    fpkms[sample_name] = df['FPKM'].values
    index = df.index

# One column per sample, labelled with the (shared) row index.
df = pd.DataFrame(fpkms, index=index)
df.to_csv(
    '/Users/abhishek/apratap_bt/projects/PCBC_integrative_analysis/data/summarized_expression_calls.tsv',
    sep="\t",
    header=True,
)