Preprocess the CPTAC dataset for benchmarking

cptac_bench_preprocess(data, idcol = "protein_Id")