I am working on attribution modelling on millions of records so want to parallelize this function on pandas dataframe
from multiprocessing import Pool
def paths_gen(df):
for p in df.index:
for q in df.columns[:-1]:
if df.at[p,q]!='empty':
df.at[p,'Path']= str(df.at[p,'Path'])+str(df.at[p,q])+' > '
return df
pool = Pool(4)
results=pool.map(paths_gen,data)
But its stuck forever can anybody help me