PhosMap

Running

App Files Files Community

liuzan committed on Aug 23, 2023

Commit

7491e03

1 Parent(s): ba9ea8f

Upload 73 files

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +10 -0
Dockerfile +14 -0
README.md +12 -0
backend/FUNCTIONS.R +1275 -0
backend/analysis.R +0 -0
backend/fill_missing_values.R +41 -0
backend/get_aligned_seq_for_mea02.R +60 -0
backend/get_normalized_data_of_psites3.R +149 -0
backend/get_normalized_data_of_psites4.R +192 -0
backend/import_extract.R +23 -0
backend/preprocess.R +27 -0
backend/visualization_deps_with_scatter02.R +117 -0
examplefile/Clinicaltest.csv +40 -0
examplefile/analysistools/Clinical_for_Demo.csv +40 -0
examplefile/analysistools/Clinical_for_Pre.csv +10 -0
examplefile/analysistools/Clinicaltest.csv +6 -0
examplefile/analysistools/PreNormBasedProSummary.csv +0 -0
examplefile/analysistools/phosphorylation_exp_design_info.txt +40 -0
examplefile/data_frame_normalization_with_control_no_pair.csv +0 -0
examplefile/download/anaysis_demo.zip +3 -0
examplefile/download/mascot_xml.zip +3 -0
examplefile/download/motif_kinase_relation.xlsx +0 -0
examplefile/download/phosphorylation_peptide_txt.zip +3 -0
examplefile/download/profiling_gene_txt.zip +3 -0
examplefile/mascot/phosphorylation_exp_design_info.txt +10 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027015_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027016_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027017_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027031_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027032_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027033_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027046_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027047_peptide.txt +0 -0
examplefile/mascot/phosphorylation_peptide_txt/Exp027048_peptide.txt +0 -0
examplefile/mascot/profiling_exp_design_info.txt +7 -0
examplefile/mascot/profiling_gene_txt/Exp026982_gene.txt +0 -0
examplefile/mascot/profiling_gene_txt/Exp026983_gene.txt +0 -0
examplefile/mascot/profiling_gene_txt/Exp026995_gene.txt +0 -0
examplefile/mascot/profiling_gene_txt/Exp026996_gene.txt +0 -0
examplefile/mascot/profiling_gene_txt/Exp027008_gene.txt +0 -0
examplefile/mascot/profiling_gene_txt/Exp027009_gene.txt +0 -0
examplefile/maxquant/Phospho (STY)Sites.txt +0 -0
examplefile/maxquant/phosphorylation_exp_design_info.txt +10 -0
examplefile/maxquant/profiling_exp_design_info.txt +7 -0
examplefile/maxquant/proteinGroups.txt +0 -0
examplefile/motifanalysis.csv +0 -0
examplefile/phosphorylation_exp_design_info.txt +40 -0
examplefile/root/mascot/mascot_xml/Exp027015/Exp027015_F1_R1.txt +3 -0
examplefile/root/mascot/mascot_xml/Exp027016/Exp027016_F1_R1.txt +3 -0
examplefile/root/mascot/mascot_xml/Exp027017/Exp027017_F1_R1.txt +3 -0

.gitattributes CHANGED Viewed

@@ -42,3 +42,13 @@ PhosMap_datasets/motif_library/refseq/rattus/STY_background_of_refseq_rattus_for
 PhosMap_datasets/motif_library/uniprot/human/STY_background_of_uniprot_human_for_motif_enrichment.txt filter=lfs diff=lfs merge=lfs -text
 PhosMap_datasets/motif_library/uniprot/mouse/STY_background_of_uniprot_mouse_for_motif_enrichment.txt filter=lfs diff=lfs merge=lfs -text
 PhosMap_datasets/motif_library/uniprot/rattus/STY_background_of_uniprot_rattus_for_motif_enrichment.txt filter=lfs diff=lfs merge=lfs -text

 PhosMap_datasets/motif_library/uniprot/human/STY_background_of_uniprot_human_for_motif_enrichment.txt filter=lfs diff=lfs merge=lfs -text
 PhosMap_datasets/motif_library/uniprot/mouse/STY_background_of_uniprot_mouse_for_motif_enrichment.txt filter=lfs diff=lfs merge=lfs -text
 PhosMap_datasets/motif_library/uniprot/rattus/STY_background_of_uniprot_rattus_for_motif_enrichment.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027015/Exp027015_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027016/Exp027016_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027017/Exp027017_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027031/Exp027031_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027032/Exp027032_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027033/Exp027033_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027046/Exp027046_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027047/Exp027047_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+examplefile/root/mascot/mascot_xml/Exp027048/Exp027048_F1_R1.txt filter=lfs diff=lfs merge=lfs -text
+www/manual.pdf filter=lfs diff=lfs merge=lfs -text

Dockerfile ADDED Viewed

	@@ -0,0 +1,14 @@

+FROM liuzandh/phosmap:1.0.0
+RUN useradd -m -u 1000 user
+USER user
+ENV HOME=/home/user \
+	PATH=/home/user/.local/bin:$PATH
+WORKDIR $HOME/app
+COPY --chown=user . $HOME/app
+CMD ["R", "--quiet", "-e", "shiny::runApp(host='0.0.0.0', port=7860)"]

README.md ADDED Viewed

	@@ -0,0 +1,12 @@

+---
+title: PhosMap
+emoji: 📚
+colorFrom: blue
+colorTo: yellow
+sdk: docker
+pinned: false
+duplicated_from: posit/shiny-for-r-template
+license: mit
+---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

backend/FUNCTIONS.R ADDED Viewed

	@@ -0,0 +1,1275 @@

+#' Extract phosphosite confidence scores from Mascot XML exports.
+#'
+#' Reads the experiment codes from the design file, checks that every code has
+#' an entry in `mascot_xml_dir`, and runs the `XMLParser_mascot_dat.py` script
+#' shipped with the PhosMap package once per experiment. A tab-separated
+#' status log (one row per experiment: success / warning / error) is written
+#' to a `log` directory next to the design file.
+#'
+#' Progress is reported through withProgress()/incProgress(), so the function
+#' presumably has to run inside a Shiny session -- TODO confirm.
+#'
+#' @param phosphorylation_exp_design_info_file_path Path to a tab-separated
+#'   design file with an `Experiment_Code` column.
+#' @param mascot_xml_dir Directory holding one entry per experiment code.
+#' @param mascot_txt_dir Output directory handed to the parser; created when
+#'   it does not exist.
+#' @return Called for its side effects (parser output and the log file).
+extract_psites_score <- function(
+    phosphorylation_exp_design_info_file_path,
+    mascot_xml_dir,
+    mascot_txt_dir
+){
+  requireNamespace('utils')
+  withProgress(message = "Start extracting the confidence of Psites from mascot.xml", detail = "This may take a while...", value = 0, {
+    # mustWork = FALSE: missing paths are reported by the explicit checks below
+    # instead of by a normalizePath() warning.
+    phosphorylation_exp_design_info_file_path <- normalizePath(phosphorylation_exp_design_info_file_path, mustWork = FALSE)
+    if (!file.exists(phosphorylation_exp_design_info_file_path)) {
+      stop(phosphorylation_exp_design_info_file_path, ' -> ', 'No the file.')
+    }
+    mascot_xml_dir <- normalizePath(mascot_xml_dir, mustWork = FALSE)
+    if (!file.exists(mascot_xml_dir)) {
+      stop(mascot_xml_dir, ' -> ', 'No the directory.')
+    }
+    mascot_xml_dir_files <- list.files(mascot_xml_dir)
+    mascot_txt_dir <- normalizePath(mascot_txt_dir, mustWork = FALSE)
+    if (!file.exists(mascot_txt_dir)) {
+      cat('\n', mascot_txt_dir, ' -> ', 'No the directory, create it.')
+      dir.create(mascot_txt_dir, recursive = TRUE)
+    }
+    command <- "python"
+    # Location of the python script shipped with the PhosMap package.
+    path2script <- system.file("src", "XMLParser_mascot_dat.py", package = "PhosMap")
+    if (!nzchar(path2script)) {
+      # system.file() returns "" when the file (or the package) is missing.
+      stop('XMLParser_mascot_dat.py was not found in the installed PhosMap package.')
+    }
+    path2script <- normalizePath(path2script, mustWork = FALSE)
+    # Get experiment codes from the design file.
+    experiment_code <- utils::read.table(phosphorylation_exp_design_info_file_path,
+                                         sep = '\t',
+                                         header = TRUE)
+    experiment_code <- as.vector(unlist(experiment_code$Experiment_Code))
+    # Every experiment code must have a matching entry in mascot_xml_dir.
+    experiment_match_index <- match(experiment_code, mascot_xml_dir_files)
+    na_experiments <- experiment_code[is.na(experiment_match_index)]
+    if(length(na_experiments)>0){
+      stop('The following experiments do not exist in ', mascot_xml_dir, ': ',
+           paste(na_experiments, collapse = ', '))
+    }
+    experiment_code_count <- length(experiment_code)
+    if (experiment_code_count < 1) {
+      stop('No experiments in ', phosphorylation_exp_design_info_file_path)
+    }
+    cat('\n Start extracting the confidence of Psites from mascot.xml.')
+    cat('\n Total ', experiment_code_count, ' experiment(s).')
+    cat('\n It will take a little while.')
+    parent_dir <- normalizePath(dirname(phosphorylation_exp_design_info_file_path))
+    log_dir <- normalizePath(file.path(parent_dir, 'log'), mustWork = FALSE)
+    if (!file.exists(log_dir)) {
+      cat('\n', log_dir, ' -> ', 'No the directory, create it.')
+      dir.create(log_dir)
+    }
+    # One row per experiment, allocated up front instead of rbind() in a loop.
+    log_df <- matrix(NA_character_, nrow = experiment_code_count, ncol = 2,
+                     dimnames = list(NULL, c('Exp_no', 'Status')))
+    for(i in seq_len(experiment_code_count)){
+      experiment_code_i <- experiment_code[i]
+      # system2() pastes args into one command line without quoting them, so
+      # quote each argument to keep paths containing spaces intact.
+      allArgs <- shQuote(c(path2script, experiment_code_i, mascot_xml_dir, mascot_txt_dir))
+      log_df[i, ] <- tryCatch(
+        {
+          # With stdout = TRUE a non-zero exit status is signalled as a warning,
+          # which the handler below records.
+          system2(command, args = allArgs, stdout = TRUE)
+          cat('\n', i, '->', experiment_code_i, '->', 'success', '\n')
+          c(experiment_code_i, 'success')
+        },
+        warning = function(w){
+          cat('\n', i, '->', experiment_code_i, '->', 'warning', '\n')
+          print(w)
+          c(experiment_code_i, 'warning')
+        },
+        error = function(e){
+          cat('\n', i, '->', experiment_code_i, '->', 'error', '\n')
+          print(e)
+          c(experiment_code_i, 'error')
+        }
+      )
+      # Scalar step: each experiment advances the bar by 1/n.
+      incProgress(1/experiment_code_count, detail = paste0('\n Completed file: ', i, '/', experiment_code_count))
+    }
+    # Explicit format keeps ':' out of the file name (not valid on Windows).
+    now_time <- format(Sys.time(), '%Y-%m-%d %H-%M-%S')
+    log_df_file_name <- paste(now_time, 'log_of_extract_psites_score.txt')
+    log_df_file_path <- normalizePath(file.path(log_dir, log_df_file_name), mustWork = FALSE)
+    utils::write.table(log_df, log_df_file_path, sep = '\t', row.names = FALSE, quote = FALSE)
+    cat('\n Program finish, please see result log to check status.', '->', log_df_file_path)
+  })
+}
+#' Read the files in a directory that belong to the given experiments.
+#'
+#' The file format is decided from the suffix of the first file in the
+#' directory (as returned by get_file_suffix()): 'txt' files are read as
+#' tab-separated, anything else as comma-separated. A file's ID is its name
+#' without the suffix; its experiment code is the part of the ID before the
+#' first '_'.
+#'
+#' @param specific_dir Directory to read from.
+#' @param experiment_ID Experiment codes; results are returned in this order.
+#' @return A list with `file_data_list` (one character/numeric matrix per
+#'   experiment, named by file ID) and `file_ID` (the matched file IDs).
+get_file_info_from_dir <- function(specific_dir, experiment_ID){
+  requireNamespace('utils')
+  withProgress(message = 'Reading peptide identification files', style = "notification", detail = "processing...", value = 0,{
+    all_files <- list.files(specific_dir)
+    if(length(all_files) == 0){
+      stop('The directory of ', specific_dir, ' has no files.')
+    }
+    file_suffix <- get_file_suffix(all_files[1])
+    if(file_suffix=='txt'){
+      read_file_function <- utils::read.table
+      sep <- '\t'
+    }else{
+      read_file_function <- utils::read.csv
+      sep <- ','
+    }
+    # Text before the first literal occurrence of `sep`. fixed = TRUE matters:
+    # as a regex, '.txt' would also match e.g. 'atxt' inside a file name.
+    text_before <- function(x, sep){
+      vapply(strsplit(x, split = sep, fixed = TRUE),
+             function(parts) parts[1], character(1), USE.NAMES = FALSE)
+    }
+    all_files_ID <- text_before(all_files, paste0('.', file_suffix))
+    all_files_ID_code <- text_before(all_files_ID, '_')
+    all_files_paths <- normalizePath(file.path(specific_dir, all_files))
+    index_of_match <- match(experiment_ID, all_files_ID_code)
+    missing_experiments <- experiment_ID[is.na(index_of_match)]
+    if(length(missing_experiments) > 0){
+      # Fail with the experiment names instead of a read error on an NA path.
+      stop('No file found in ', specific_dir, ' for experiment(s): ',
+           paste(missing_experiments, collapse = ', '))
+    }
+    matched_all_files_paths <- all_files_paths[index_of_match]
+    matched_all_files_ID <- all_files_ID[index_of_match]
+    matched_all_files_count <- length(matched_all_files_paths)
+    file_data_list <- vector('list', matched_all_files_count)
+    cat('\n Total file: ', matched_all_files_count)
+    for(i in seq_len(matched_all_files_count)){
+      # Read the batch data and keep each file as a matrix.
+      cat('\n completed: ', i, '/', matched_all_files_count)
+      file_data_list[[i]] <- as.matrix(read_file_function(matched_all_files_paths[i], header = TRUE, sep = sep))
+      incProgress(1/matched_all_files_count, detail = paste0('\n completed: ', i, '/', matched_all_files_count))
+    }
+    names(file_data_list) <- matched_all_files_ID
+    list(file_data_list=file_data_list, file_ID=matched_all_files_ID)
+  })
+}
+# Filter each experiment's peptide table and collect its quantification values.
+#
+# For every entry of `files`, peptides are kept when Ion.Score >= min_score and
+# FDR < min_FDR. When `qc` is TRUE, the peptides are further restricted to
+# those whose first column matches the first column of a site-score row whose
+# pep_var_mod_conf contains '%'.
+#
+# Columns read from each peptide table: Ion.Score, FDR, Area, PSMs, Sequence,
+# Protein.Groups.Accessions, Modification.
+# Column read from each site-score table: pep_var_mod_conf.
+#
+# Returns a list of three per-experiment lists:
+#   peptide_df_with_area_psm_list - data frames with <id>_Area and <id>_PSMs
+#   ID_of_seq_gi_site_list        - 'Sequence||Accessions||Modification' keys
+#   ID_DF_list                    - the key (column "ID") plus the two values
+get_list_with_filtered_sites <- function(peptide_id, files, files_site_score, qc, min_score, min_FDR){
+  withProgress(message = 'Reading psites QC files', style = "notification", detail = "processing...", value = 0,{
+    n_files <- length(peptide_id)
+    quant_list <- list()
+    key_list <- list()
+    keyed_quant_list <- list()
+    cat('\n Total file: ', n_files)
+    for(k in seq_len(n_files)){
+      cat('\n completed: ',k,'/',n_files)
+      peptides <- data.frame(files[[k]])
+      # Score / FDR thresholds; which() drops rows where the test is NA.
+      ion_score <- as.numeric(as.vector(peptides$Ion.Score))
+      fdr <- as.numeric(as.vector(peptides$FDR))
+      peptides <- peptides[which(ion_score >= min_score & fdr < min_FDR), ]
+      if(qc){
+        # Only site-score rows that actually carry a confidence percentage.
+        site_scores <- as.data.frame(files_site_score[[k]])
+        site_scores <- site_scores[which(grepl('%', site_scores$pep_var_mod_conf)),]
+        # Keep the peptides those rows point at; unmatched rows are ignored.
+        hits <- match(as.vector(site_scores[,1]), as.vector(peptides[,1]))
+        hits <- hits[!is.na(hits)]
+        peptides <- peptides[hits,]
+      }
+      quant_names <- paste(peptide_id[k], c('Area', 'PSMs'), sep = '_')
+      quant <- data.frame(as.numeric(as.vector(peptides$Area)),
+                          as.numeric(as.vector(peptides$PSMs)))
+      colnames(quant) <- quant_names
+      key <- paste(as.vector(peptides$Sequence),
+                   as.vector(peptides$Protein.Groups.Accessions),
+                   as.vector(peptides$Modification),
+                   sep = '||')
+      keyed_quant <- data.frame(key, quant)
+      colnames(keyed_quant) <- c("ID", quant_names)
+      quant_list[[k]] <- quant
+      key_list[[k]] <- key
+      keyed_quant_list[[k]] <- keyed_quant
+      incProgress(1/n_files, detail = paste0('\n completed: ',k,'/',n_files))
+    }
+    list(
+      peptide_df_with_area_psm_list = quant_list,
+      ID_of_seq_gi_site_list = key_list,
+      ID_DF_list = keyed_quant_list
+    )
+  })
+}
+#' Quality-filter peptide identifications and merge them across experiments.
+#'
+#' Runs four steps under one progress bar:
+#'   1. read the peptide identification files,
+#'   2. read the phosphosite score (QC) files,
+#'   3. filter the peptides with get_list_with_filtered_sites(),
+#'   4. merge all experiments with get_merged_phospho_df(), drop the PSM
+#'      columns and order the value columns as in the design file.
+#'
+#' @param firmiana_peptide_dir Directory with the peptide identification files.
+#' @param psites_score_dir Directory with the phosphosite score files.
+#' @param phospho_experiment_design_file_path Tab-separated design file with
+#'   an `Experiment_Code` column.
+#' @param qc,min_score,min_FDR Passed on to get_list_with_filtered_sites().
+#' @return A data frame whose first column is the merged peptide ID and whose
+#'   remaining columns are named by experiment code, in design-file order.
+pre_process_filter_psites <- function(firmiana_peptide_dir, psites_score_dir,
+                                      phospho_experiment_design_file_path, qc,
+                                      min_score = 20, min_FDR = 0.01) {
+  requireNamespace('utils')
+  # Local variant of get_file_info_from_dir() that reports its progress as
+  # 'Reading psites QC files'.
+  read_psites_qc_files <- function(specific_dir, experiment_ID){
+    withProgress(message = 'Reading psites QC files', style = "notification", detail = "processing...", value = 0,{
+      all_files <- list.files(specific_dir)
+      if(length(all_files) == 0){
+        stop('The directory of ', specific_dir, ' has no files.')
+      }
+      # The format of all files is decided from the suffix of the first one.
+      file_suffix <- get_file_suffix(all_files[1])
+      if(file_suffix=='txt'){
+        read_file_function <- utils::read.table
+        sep <- '\t'
+      }else{
+        read_file_function <- utils::read.csv
+        sep <- ','
+      }
+      # Text before the first literal occurrence of `sep` (no regex matching).
+      text_before <- function(x, sep){
+        vapply(strsplit(x, split = sep, fixed = TRUE),
+               function(parts) parts[1], character(1), USE.NAMES = FALSE)
+      }
+      all_files_ID <- text_before(all_files, paste0('.', file_suffix))
+      all_files_ID_code <- text_before(all_files_ID, '_')
+      all_files_paths <- normalizePath(file.path(specific_dir, all_files))
+      index_of_match <- match(experiment_ID, all_files_ID_code)
+      if(anyNA(index_of_match)){
+        stop('No file found in ', specific_dir, ' for experiment(s): ',
+             paste(experiment_ID[is.na(index_of_match)], collapse = ', '))
+      }
+      matched_all_files_paths <- all_files_paths[index_of_match]
+      matched_all_files_ID <- all_files_ID[index_of_match]
+      matched_all_files_count <- length(matched_all_files_paths)
+      file_data_list <- vector('list', matched_all_files_count)
+      cat('\n Total file: ', matched_all_files_count)
+      for(i in seq_len(matched_all_files_count)){
+        cat('\n completed: ', i, '/', matched_all_files_count)
+        file_data_list[[i]] <- as.matrix(read_file_function(matched_all_files_paths[i], header = TRUE, sep = sep))
+        incProgress(1/matched_all_files_count, detail = paste0('\n completed: ', i, '/', matched_all_files_count))
+      }
+      names(file_data_list) <- matched_all_files_ID
+      list(file_data_list=file_data_list, file_ID=matched_all_files_ID)
+    })
+  }
+  withProgress(message = 'Step2:QC and Merging', style = "notification", detail = "processing...", value = 0, max = 4,{
+    PEPTIDE_DIR <- normalizePath(firmiana_peptide_dir, mustWork = FALSE)
+    if(!file.exists(firmiana_peptide_dir)){
+      stop(firmiana_peptide_dir, ' -> ', 'No the directory.')
+    }
+    PSITES_WITH_SCORE_DIR <- normalizePath(psites_score_dir, mustWork = FALSE)
+    if(!file.exists(psites_score_dir)){
+      stop(psites_score_dir, ' -> ', 'No the directory.')
+    }
+    phospho_experiment_design_file_path <- normalizePath(phospho_experiment_design_file_path, mustWork = FALSE)
+    if(!file.exists(phospho_experiment_design_file_path)){
+      stop(phospho_experiment_design_file_path, ' -> ', 'No the file')
+    }
+    # The design file fixes the order of the experiments in the merged result.
+    phospho_experiment_design_file <- utils::read.table(phospho_experiment_design_file_path, sep = '\t',
+                                                        header = TRUE, stringsAsFactors = FALSE)
+    phospho_experiment_ID <- as.vector(unlist(phospho_experiment_design_file$Experiment_Code))
+
+    #### (1) Read the peptide identification files ####
+    result_list_from_PEPTIDE_DIR <- get_file_info_from_dir(PEPTIDE_DIR, phospho_experiment_ID)
+    files <- result_list_from_PEPTIDE_DIR$file_data_list
+    peptide.id <- result_list_from_PEPTIDE_DIR$file_ID
+    incProgress(1, detail = '')
+
+    #### (2) Read the phosphosite score files ####
+    # NOTE(review): these files are read even when qc is FALSE -- confirm that
+    # callers always provide a populated directory.
+    cat('\n The 2nd step: read psites QC files.')
+    files_site_score <- read_psites_qc_files(PSITES_WITH_SCORE_DIR,
+                                             phospho_experiment_ID)$file_data_list
+    incProgress(1, detail = '')
+
+    #### (3) Filter peptides on identification and site quality ####
+    cat('\n The 3rd step: filter peptides based on site quality.')
+    result_list_with_filtered_sites <- get_list_with_filtered_sites(peptide.id, files,
+                                                                    files_site_score, qc,
+                                                                    min_score, min_FDR)
+    peptide_df_with_area_psm_list <- result_list_with_filtered_sites$peptide_df_with_area_psm_list # area, psm
+    ID_of_seq_gi_site_list <- result_list_with_filtered_sites$ID_of_seq_gi_site_list # seq_gi_psite
+    ID_DF_list <- result_list_with_filtered_sites$ID_DF_list # seq_gi_psite, area, psm
+    incProgress(1, detail = '')
+
+    #### (4) Based on unique peptide, merge all experiments ####
+    cat('\n The 4th step: merge data based on peptides (unique ID).')
+    withProgress(message = 'Merging data based on peptides (unique ID)', style = "notification", detail = "processing...", value = 0,{
+      merge_df_with_phospho_peptides <- get_merged_phospho_df(peptide.id,
+                                                              peptide_df_with_area_psm_list,
+                                                              ID_of_seq_gi_site_list, ID_DF_list)
+      # Drop the PSM columns. The guard matters: indexing with -integer(0)
+      # would drop every column instead of none.
+      index_of_PSMs <- grep('_PSMs', colnames(merge_df_with_phospho_peptides))
+      if(length(index_of_PSMs) > 0){
+        merge_df_with_phospho_peptides <- merge_df_with_phospho_peptides[, -index_of_PSMs, drop = FALSE]
+      }
+      merge_df_with_phospho_peptides_colnames <- colnames(merge_df_with_phospho_peptides)
+      ID <- as.vector(merge_df_with_phospho_peptides[,1])
+      # drop = FALSE keeps the column structure when there is one experiment.
+      Value <- merge_df_with_phospho_peptides[, -1, drop = FALSE]
+      # The experiment code is the part of a value column name before the first '_'.
+      Value_colnames_ID <- vapply(strsplit(colnames(Value), split = '_', fixed = TRUE),
+                                  function(parts) parts[1], character(1), USE.NAMES = FALSE)
+      index_of_match <- match(phospho_experiment_ID, Value_colnames_ID)
+      if(anyNA(index_of_match)){
+        stop('No quantification column found for experiment(s): ',
+             paste(phospho_experiment_ID[is.na(index_of_match)], collapse = ', '))
+      }
+      Value <- Value[, index_of_match, drop = FALSE]
+      merge_df_with_phospho_peptides <- data.frame(ID, Value)
+      colnames(merge_df_with_phospho_peptides) <- c(merge_df_with_phospho_peptides_colnames[1], phospho_experiment_ID)
+      incProgress(1, detail = 'finishing...')
+    })
+    merge_df_with_phospho_peptides
+  })
+}
+#' Split the merged peptide IDs and map their protein IDs to gene symbols.
+#'
+#' The `ID_of_seq_gi_site` column ('Sequence||ProteinID||Modification') is
+#' split into its three parts, and each protein ID (several may be joined by
+#' ';') is looked up in the ID conversion table
+#' `./PhosMap_datasets/id_coversion_table/<species>_ID.txt`. Rows for which no
+#' gene symbol is found are dropped.
+#'
+#' @param merge_df_with_phospho_peptides Data frame whose first column is
+#'   `ID_of_seq_gi_site`, followed by the quantification columns.
+#' @param species Selects the conversion table file.
+#' @param id_type Column of the conversion table that holds the protein IDs.
+#'   For 'RefSeq_Protein_GI' a 'gi|' prefix is stripped before the lookup.
+#' @return Data frame with columns Sequence, ID, Modification, GeneSymbol and
+#'   the quantification columns of the input.
+get_combined_data_frame02 <- function(merge_df_with_phospho_peptides, species = 'human', id_type = 'RefSeq_Protein_GI'
+){
+  # Read library file, map GI to Gene Symbol
+  requireNamespace('utils')
+  requireNamespace('stringr')
+  cat('\n The 5th step: write the data frame with symbols mapping to genes.')
+  withProgress(message = 'Writing the data frame with symbols mapping to genes', style = "notification", detail = "This may take a while...", value = 0,{
+    id_coversion_table_dir <- "./PhosMap_datasets/id_coversion_table/"
+    id_coversion_table <- utils::read.table(paste0(id_coversion_table_dir, species, "_ID.txt"), sep = '\t', header = TRUE)
+    cat('\n The 5th step is running.')
+    if(is.null(merge_df_with_phospho_peptides$ID_of_seq_gi_site)){
+      stop('merge_df_with_phospho_peptides has no ID_of_seq_gi_site column.')
+    }
+    # Split the ID string: sequence, accession, modification.
+    seq_gi_site_vector <- as.vector(merge_df_with_phospho_peptides$ID_of_seq_gi_site)
+    id_parts <- strsplit(seq_gi_site_vector, split = "||", fixed = TRUE)
+    nth_part <- function(n){
+      vapply(id_parts, function(parts) parts[n], character(1), USE.NAMES = FALSE)
+    }
+    Sequence <- nth_part(1)
+    ID <- nth_part(2)
+    Modification <- nth_part(3)
+    ##########################################################################################################
+    # id_types <- c('GeneID', 'RefSeq_Protein_GI', 'RefSeq_Protein_Accession', 'Uniprot_Protein_Accession')
+    # Build a named vector: names are protein IDs, values are gene symbols.
+    MappingDf <- id_coversion_table[, c('GeneSymbol', id_type)]
+    id_column <- as.vector(unlist(MappingDf[,2]))
+    invalid_index <- which(id_column == '' | id_column == '-')
+    if(length(invalid_index)>0){
+      MappingDf <- MappingDf[-invalid_index,]
+    }
+    MappingDf_row <- nrow(MappingDf)
+    cat('\n', 'Construct dictionary based on GeneSymbol and specific ID.')
+    cat('\n', 'The total:', MappingDf_row)
+    # One table cell may list several IDs separated by '; '. Building the
+    # dictionary in one vectorised pass avoids growing it row by row (which is
+    # quadratic) and copes with an empty table.
+    ids_per_symbol <- strsplit(as.character(MappingDf[[2]]), split = '; ')
+    mapping_dict <- rep(as.character(MappingDf[[1]]), lengths(ids_per_symbol))
+    names(mapping_dict) <- unlist(ids_per_symbol)
+    cat('\n', 'Completed:', MappingDf_row, '/', MappingDf_row)
+    incProgress(0.5, detail = paste0('\n', 'Completed:', MappingDf_row, '/', MappingDf_row))
+    ##########################################################################################################
+    strip_gi_prefix <- id_type == 'RefSeq_Protein_GI'
+    GeneSymbol <- vapply(strsplit(ID, split = ";", fixed = TRUE), function(gi_all){
+      lookup_keys <- gi_all
+      if(strip_gi_prefix){
+        lookup_keys <- stringr::str_replace_all(lookup_keys, 'gi[|]', '')
+      }
+      symbols <- unname(mapping_dict[lookup_keys])
+      symbols <- unique(symbols[!is.na(symbols)])
+      if(length(symbols) == 0){
+        return(NA_character_)
+      }
+      if(length(symbols) == 1){
+        return(symbols)
+      }
+      # NOTE(review): when the IDs map to several symbols the original IDs,
+      # not the symbols, are returned -- kept as is; confirm this is intended.
+      paste(gi_all, collapse = ';')
+    }, character(1), USE.NAMES = FALSE)
+    # sequenceID, accession, modification, symbol, quantification values.
+    # drop = FALSE keeps the column name when there is a single value column.
+    df_of_combination <- data.frame(Sequence, ID, Modification, GeneSymbol,
+                                    merge_df_with_phospho_peptides[, -1, drop = FALSE])
+    index_of_NonNA <- which(!is.na(GeneSymbol))
+    df_of_combination <- df_of_combination[index_of_NonNA,]
+    cat('\n The 5th step is over ^_^.')
+    cat('\n The 5th step: write the data frame with symbols mapping to genes.')
+    incProgress(1, detail = 'Please wait a moment')
+  })
+  return(df_of_combination)
+}
+get_summary_with_unique_sites02 <- function(combined_df_with_mapped_gene_symbol, species = 'human', fasta_type = 'refseq'
+){
+  requireNamespace('utils')
+  requireNamespace('stringr')
+  # unique phosphorylation sites
+  withProgress(message = 'Constructing the data frame with unique phosphorylation site for each protein sequence', style = "notification", detail = "This may take a while...", value = 0,{
+    cat('\n The 6th step: construct the data frame with unique phosphorylation site for each protein sequence.')
+    path <- "./PhosMap_datasets/fasta_library/"
+    fasta_data <- utils::read.table(paste0(path, fasta_type, "/", species, "/", species, "_", fasta_type, "_fasta.txt"), header=TRUE, sep="\t")
+    id_data <- combined_df_with_mapped_gene_symbol
+    # Keep peptides assigned to unique protein
+    id_data_only_peptide2gi <- id_data[which(!grepl(';', as.vector(id_data$ID))),]
+    for(j in 1:2){
+      if(j == 1){
+        withProgress(message = 'Getting modification index in protein sequence. ', style = "notification", detail = "This may take a while...", value = 0,{
+          get_modification_index <- function(id_data_only_peptide2gi, fasta_data){
+            # 1
+            # Get modification index in protein sequence.
+            cat('\n', 'Get modification index in protein sequence.')
+            id_data_only_peptide2gi_row <- nrow(id_data_only_peptide2gi)
+            modification_index_in_protein_seq_list <- list()
+            for(i in seq_len(id_data_only_peptide2gi_row)){
+              peptide_seq <- as.vector(id_data_only_peptide2gi$Sequence[i])
+              peptide_id <- as.vector(id_data_only_peptide2gi$ID[i])
+              modification_index_in_peptide_seq <- unlist(gregexpr("[a-z]", peptide_seq))
+              protein_seq <- as.vector(fasta_data$Sequence[which(fasta_data$ID==peptide_id)])
+              first_index_of_peptide2protein <- unlist(gregexpr(toupper(peptide_seq), protein_seq))
+              modification_index_in_protein_seq <- NULL
+              for(elemt in first_index_of_peptide2protein){
+                tmp_modification_index_in_protein_seq <- elemt + modification_index_in_peptide_seq -1
+                modification_index_in_protein_seq <- c(modification_index_in_protein_seq,
+                                                       tmp_modification_index_in_protein_seq)
+              }
+              modification_index_in_protein_seq_list[[i]] <- modification_index_in_protein_seq
+              if(i%%500==0 | i==id_data_only_peptide2gi_row ){
+                cat('\n completed: ', i, '/', id_data_only_peptide2gi_row)
+              }
+              incProgress(1/id_data_only_peptide2gi_row, detail = paste0('\n', 'Completed:', i, '/', id_data_only_peptide2gi_row))
+            }
+            return(modification_index_in_protein_seq_list)
+          }
+          # Determine locations of the psites each peptide mapped to protein squence.
+          modification_index_in_protein_seq_list <- get_modification_index(id_data_only_peptide2gi,
+                                                                           fasta_data)
+          proteins_in_id_data_only_peptide2gi <- as.vector(id_data_only_peptide2gi$ID)
+          sequences_in_id_data_only_peptide2gi <- as.vector(id_data_only_peptide2gi$Sequence)
+          value_in_id_data_only_peptide2gi <- id_data_only_peptide2gi[, -c(seq_len(4))]
+          unique_proteins <- unique(proteins_in_id_data_only_peptide2gi)
+          unique_protein_count <- length(unique_proteins)
+        })
+      }
+      if(j == 2){
+        # Show psites and modifications of one protein, merge the values with the same modification type.
+        cat('\n', 'Map phosphorylation sites to protein sequence and eliminate redundancy.')
+        withProgress(message = 'Mapping phosphorylation sites to protein sequence and eliminate redundancy. ', style = "notification", detail = "This may take a while...", value = 0,{
+          system.time({
+            summary_df_of_unique_proteins_with_sites <- c()
+            for(i in seq_len(unique_protein_count)){
+              df_with_AAs_i <- get_df_with_AAs_i(unique_proteins,
+                                                 i,
+                                                 id_data_only_peptide2gi,
+                                                 proteins_in_id_data_only_peptide2gi,
+                                                 sequences_in_id_data_only_peptide2gi,
+                                                 modification_index_in_protein_seq_list)
+              summary_df_of_unique_protein_with_sites <- get_unique_AAs_i_df(df_with_AAs_i)
+              summary_df_of_unique_proteins_with_sites <- rbind(
+                summary_df_of_unique_proteins_with_sites,
+                summary_df_of_unique_protein_with_sites
+              )
+              if(i%%500==0 | i == unique_protein_count){
+                cat('\n completed: ', i, '/', unique_protein_count)
+              }
+              incProgress(1/unique_protein_count, detail = paste0('\n', 'Completed:', i, '/', unique_protein_count))
+              summary_df_of_unique_proteins_with_sites_rownames <- paste(as.vector(summary_df_of_unique_proteins_with_sites$ID),
+                                                                         as.vector(summary_df_of_unique_proteins_with_sites$AA_in_protein),
+                                                                         sep = '_')
+              rownames(summary_df_of_unique_proteins_with_sites) <- summary_df_of_unique_proteins_with_sites_rownames
+              summary_df_of_unique_proteins_with_sites_colnames <- colnames(summary_df_of_unique_proteins_with_sites)
+              index_of_PSMs <- which(grepl('_PSMs', summary_df_of_unique_proteins_with_sites_colnames))
+              if(length(index_of_PSMs)>0){
+                summary_df_of_unique_proteins_with_sites <- summary_df_of_unique_proteins_with_sites[,-index_of_PSMs]
+              }
+              summary_df_of_unique_proteins_with_sites$GeneSymbol <- apply(data.frame(summary_df_of_unique_proteins_with_sites$GeneSymbol),
+                                                                           1,
+                                                                           function(x){
+                                                                             if(grepl('||', x)){
+                                                                               x <- as.vector(x)
+                                                                               x <- strsplit(x, split = '||', fixed = TRUE)
+                                                                               x[[1]][1]
+                                                                             }
+                                                                           })
+            }
+          })
+        })
+      }
+      incProgress(1/2, detail = paste0('\n '))
+    }
+    cat('\n The 6th step: construct over.')
+  })
+  return(summary_df_of_unique_proteins_with_sites)
+}
+# Merge the per-experiment gene profiling tables exported from Firmiana into
+# one Symbol x experiment iBAQ table.
+#
+# Args:
+#   firmiana_gene_dir: directory with one '<Experiment_Code>_*.txt' table per
+#     experiment (the text before the first '_' of a file name is its code).
+#   US_cutoff: keep rows whose 14th column (renamed USPeptide_Num) is >= this.
+#   experiment_gene_file_path: tab-separated file with an 'Experiment_Code'
+#     column; its order fixes the column order of the result.
+# Returns:
+#   data.frame with 'Symbol' followed by one iBAQ column per experiment code;
+#   symbols absent from an experiment get 0.
+# Note: withProgress()/incProgress() are not defined in this block (presumably
+# Shiny's), so a progress-capable session is assumed.
+merge_profiling_file_from_Firmiana <- function(firmiana_gene_dir, US_cutoff = 1, experiment_gene_file_path){
+  requireNamespace('utils')
+  withProgress(message = 'Step5 : Normalization [Normalizing phosphoproteomics data based on proteomics data.] ', style = "notification", detail = "processing...", value = 0,{
+    DATA_DIR <- normalizePath(firmiana_gene_dir, mustWork = FALSE)
+    if(!file.exists(DATA_DIR)){
+      cat(DATA_DIR, ' -> ', 'No the file')
+      stop('Directory not found: ', DATA_DIR)
+    }
+    # Anchored pattern: the original '.txt' matched any name containing "<char>txt".
+    file_names <- list.files(path = DATA_DIR, pattern = '\\.txt$')
+    file_names_count <- length(file_names)
+    # Fixed: the original tested length(file_names_count), which is always 1.
+    if(file_names_count < 1){
+      stop('The directory of ', DATA_DIR, ' has no files.')
+    }
+    exp_names <- vapply(strsplit(file_names, split = '_'), function(parts){ parts[1] }, character(1))
+    # NOTE(review): stringsAsFactors = NA is kept from the original; NA is not a documented value for this argument.
+    experiment_code <- utils::read.table(experiment_gene_file_path, header = TRUE, sep = '\t', stringsAsFactors = NA)
+    experiment_code <- as.vector(unlist(experiment_code$Experiment_Code))
+    index_of_match <- match(experiment_code, exp_names)
+    na_experiment_code <- experiment_code[is.na(index_of_match)]
+    if(length(na_experiment_code) > 0){
+      cat(
+        '\n',
+        na_experiment_code,
+        'not in',
+        DATA_DIR
+      )
+      stop('Experiment code(s) without a profiling file in ', DATA_DIR, ': ', paste(na_experiment_code, collapse = ', '))
+    }
+    # Keep only the files named in the design file, in design-file order.
+    exp_names <- exp_names[index_of_match]
+    file_names <- file_names[index_of_match]
+    file_names_count <- length(file_names)
+    if(file_names_count < 1){
+      stop('No experiment codes found in ', experiment_gene_file_path)
+    }
+    # Table headers of input data
+    # "Gene.ID" "Symbol" "Annotation"  "Modification" "Description"
+    # "Protein.GI" "Protein.Num" "Area" "FoT.1e.6." "iBAQ"
+    # "Peptide.Num" "Unique.Peptide.Num"  "Strict.Peptide.Num"  "US.Peptide.Num"  "Identified.Proteins.Num"
+    # "Unique.Proteins.Num"
+    # New table headers of input data
+    file_data_colnames <- c(
+      "Gene_ID", "Symbol", "Annotation", "Modification", "Description",
+      "Protein_GI",  "Protein_Num", "Area", "FoT5", "iBAQ",
+      "Peptide_Num", "UPeptide_Num",  "SPeptide_Num",  "USPeptide_Num",  "Identified_Proteins_Num", "Unique_Proteins_Num"
+    )
+    kept_colnames <- c(
+      "Symbol", "iBAQ", "USPeptide_Num"
+    )
+    kept_colnames_index <- match(kept_colnames, file_data_colnames)
+    cat('\n Merge profiling files downloaded from Firmiana.')
+    cat('\n Total files: ', file_names_count)
+    data_list <- vector('list', file_names_count)
+    for(i in seq_len(file_names_count)){
+      file_path <- normalizePath(file.path(DATA_DIR, file_names[i]))
+      file_data <- utils::read.delim(file_path, header = TRUE, stringsAsFactors = NA, sep = '\t')
+      colnames(file_data) <- file_data_colnames
+      file_data <- file_data[, kept_colnames_index]
+      # Filter on USPeptide_Num, then keep only Symbol and iBAQ.
+      file_data <- file_data[which(file_data$USPeptide_Num >= US_cutoff), c(1,2)]
+      colnames(file_data) <- c('Symbol', paste(exp_names[i], 'iBAQ', sep = '_'))
+      data_list[[i]] <- file_data
+      cat('\n Read and filter: ', i, '/', file_names_count)
+      # Fixed: the original passed the vector 1/seq_len(n) as the increment.
+      incProgress(1/file_names_count, detail = paste0('\n Read and filter: ', i, '/', file_names_count))
+    }
+    names(data_list) <- exp_names
+    data_list_count <- length(data_list)
+    merge_df <- data_list[[1]]
+    cat('\n merge_complete: ', 1, '/', data_list_count)
+    # Full outer join on Symbol, one experiment at a time.
+    for(i in seq_len(data_list_count)[-1]){
+      merge_df <- merge(merge_df, data_list[[i]], by = 'Symbol', all = TRUE)
+      cat('\n merge_complete: ', i, '/', data_list_count)
+      incProgress(1/data_list_count, detail = paste0('\n merge_complete: ', i, '/', data_list_count))
+    }
+    Symbol <- as.vector(merge_df[,1])
+    Value <- as.matrix(merge_df[, -1, drop = FALSE])
+    # Symbols missing from an experiment come out of the join as NA; report them as 0.
+    Value[is.na(Value)] <- 0
+    colnames(Value) <- exp_names
+    merge_df_no_NA <- data.frame(Symbol, Value)
+    incProgress(1/2, detail = '')
+  })
+  return(merge_df_no_NA)
+}
+# Scale every sample column so that its positive values sum to 1e5.
+#
+# Args:
+#   data_frame: first column holds identifiers, remaining columns hold one
+#     sample each.
+#   experiment_code_file_path: tab-separated file with an 'Experiment_Code'
+#     column; the codes become the sample column names of the result.
+# Returns:
+#   data.frame with the identifier column followed by the scaled samples.
+#   Values that are not > 0 are left untouched.
+get_normalized_data_FOT5 <- function(data_frame, experiment_code_file_path
+){
+  requireNamespace('utils')
+  # cat('\n The 7th step: Normalize data and filter data only including phosphorylation site.')
+  cat('Normalize proteomics data based on the total sum (x 1e5).')
+  experiment_code <- utils::read.table(experiment_code_file_path, header = TRUE, sep = '\t', stringsAsFactors = NA)
+  experiment_code <- as.vector(unlist(experiment_code$Experiment_Code))
+  data_frame_colnames <- colnames(data_frame)
+  ID <- as.vector(data_frame[,1])
+  # drop = FALSE keeps a one-sample table two-dimensional; without it ncol()
+  # was NULL and the loop below failed.
+  Value_FOT5 <- data_frame[, -1, drop = FALSE]
+  for(i in seq_len(ncol(Value_FOT5))){
+    x <- Value_FOT5[,i]
+    valid_index <- which(x>0)
+    if(length(valid_index) > 0){
+      valid_x <- x[valid_index]
+      Value_FOT5[valid_index,i] <- valid_x/sum(valid_x)*1e5
+    }
+  }
+  data_frame_normaliation <- data.frame(ID, Value_FOT5)
+  colnames(data_frame_normaliation) <- c(data_frame_colnames[1], experiment_code)
+  return(data_frame_normaliation)
+}
+# Keep the fraction of rows whose row maximum is largest.
+#
+# Args:
+#   phospho_data: table whose first three columns are annotation; the row
+#     maximum is taken over the remaining columns.
+#   percent_of_kept_sites: fraction of rows to keep (rounded to a row count).
+# Returns:
+#   The kept rows of phospho_data, ordered by decreasing row maximum.
+keep_psites_with_max_in_topX2 <- function(phospho_data, percent_of_kept_sites = 3/4){
+  cutoff_label <- paste0('top', percent_of_kept_sites*100, '%')
+  cat('\n The 8th step: filter psites with row maximum in', cutoff_label, '.')
+  intensity <- phospho_data[,-c(1,2,3)]
+  row_peak <- apply(intensity, 1, function(row_values){
+    max(as.vector(unlist(row_values)))
+  })
+  n_keep <- round(nrow(intensity)*percent_of_kept_sites)
+  ranked_rows <- order(row_peak, decreasing = TRUE)
+  top_sites <- phospho_data[ranked_rows[seq_len(n_keep)],]
+  cat('\n The 8th step: filter over with ', cutoff_label, ' cutoff.')
+  return(top_sites)
+}
+# Differential analysis with limma for the first pairwise contrast.
+#
+# Args:
+#   expr_data_frame: first column holds identifiers, remaining columns hold
+#     one sample each.
+#   group: group label of every sample column, used to build the design.
+#   comparison_factor: group names; every later name is contrasted against
+#     every earlier one ("later-earlier").
+#   log2_label: TRUE when the values are already log2; otherwise log2 is
+#     applied here.
+#   adjust_method: multiple-testing adjustment handed to limma::topTable().
+# Returns:
+#   data.frame(ID, logFC, pvalue) for the first contrast only (coef = 1);
+#   pvalue is the adjusted p-value and ID is the row name reported by topTable.
+analysis_deps_limma2 <- function(expr_data_frame, group, comparison_factor,
+                                 log2_label = FALSE, adjust_method = 'BH'){
+  requireNamespace('limma')
+  requireNamespace('stats')
+  # Everything except the identifier column is the expression table.
+  expr_values <- expr_data_frame[,-1]
+  if(!log2_label){
+    expr_values <- log2(expr_values) # have to log
+  }
+  # Rows with zero variance across samples are removed before fitting.
+  row_variance <- apply(expr_values, 1, stats::var)
+  constant_rows <- which(row_variance == 0)
+  if(length(constant_rows) > 0){
+    expr_values <- expr_values[-constant_rows,]
+  }
+  design <- stats::model.matrix(~ 0 + group)
+  cat('\n', 'The matrix of experiment design.')
+  print(design)
+  colnames(design) <- levels(factor(group))
+  rownames(design) <- colnames(expr_values)
+  n_levels <- length(comparison_factor)
+  if(n_levels < 2){
+    cat('\n', 'Do not construct pairwise comparison pattern.')
+    stop('')
+  }
+  # For each control (earlier name) list every later name as treatment.
+  comparison_statement <- unlist(lapply(seq_len(n_levels - 1), function(ctrl_idx){
+    treat_idx <- (ctrl_idx + 1):n_levels
+    paste(comparison_factor[treat_idx], '-', comparison_factor[ctrl_idx], sep = '')
+  }))
+  cat('\n', 'The combination of pairwise comparison(s).')
+  cat('\n', comparison_statement, '\n')
+  contrast.matrix <- limma::makeContrasts(contrasts = comparison_statement, levels = design)
+  cat('\n', 'The matrix of comparison statement, compare other groups with control.')
+  print(contrast.matrix)
+  # Linear model fit, contrast fit, then empirical Bayes moderation (no trend).
+  fitted_contrasts <- limma::eBayes(
+    limma::contrasts.fit(limma::lmFit(expr_values, design), contrast.matrix)
+  )
+  # logFC = log(a/b) = log(a) - log(b)
+  top_table <- limma::topTable(fitted_contrasts, coef = 1, adjust.method = adjust_method, p.value = 1, number = Inf)
+  top_table <- stats::na.omit(top_table)
+  result_df <- data.frame(
+    ID = rownames(top_table),
+    logFC = top_table$logFC, # log2
+    pvalue = top_table$adj.P.Val
+  )
+  return(result_df)
+}
+# Differential analysis with SAM (package samr).
+#
+# Args:
+#   expr_data_frame: first column holds identifiers, remaining columns hold
+#     one sample each.
+#   group: group label of every sample column (coerced with as.factor()).
+#   log2_label: TRUE when the values are already log2; otherwise log2 is
+#     applied here.
+#   nperms, rand: passed to samr::samr() as nperms and random.seed.
+#   minFDR: the first delta whose 5th delta-table column is below this value
+#     is used as cutoff.
+#   samr_plot: draw samr::samr.plot() for the chosen delta.
+# Returns:
+#   list(genes_up_df = ..., genes_down_df = ...); an element is NULL when the
+#   corresponding gene set is empty. The original built this list with `<-`
+#   inside list(), which left it unnamed; positional access still works.
+analysis_deps_sam2 <- function(expr_data_frame, group, log2_label = FALSE,
+                               nperms = 100, rand = NULL, minFDR = 0.05,
+                               samr_plot = TRUE){
+  requireNamespace('samr')
+  requireNamespace('stats')
+  expr_ID <- as.vector(expr_data_frame[,1])
+  # Start from the raw values so the already-logged case is defined as well.
+  expr_Valule <- expr_data_frame[,-1]
+  if(!log2_label){
+    expr_Valule <- log2(expr_Valule) # have to log
+  }
+  # Rows with zero variance across samples are removed.
+  row_variance <- apply(expr_Valule, 1, stats::var)
+  constant_rows <- which(row_variance == 0)
+  if(length(constant_rows)>0){
+    expr_ID <- expr_ID[-constant_rows]
+    expr_Valule <- expr_Valule[-constant_rows,]
+  }
+  # Coerce once: nlevels() on a plain character/numeric vector is 0, which made
+  # the original reject every non-factor group.
+  group_factor <- as.factor(group)
+  group_nlevels <- nlevels(group_factor)
+  if(group_nlevels < 2){
+    cat('\n', 'Groups are fewer than two.', '\n')
+    stop('At least two groups are required.')
+  }
+  # construct the samr data
+  sam_data <- list(x = as.matrix(expr_Valule), y = as.numeric(group_factor),
+                   geneid = expr_ID, genenames = expr_ID, logged2=TRUE)
+  resp_type <- if(group_nlevels == 2) "Two class unpaired" else "Multiclass"
+  cat('\n', resp_type, '\n')
+  samr_obj <- samr::samr(sam_data, resp.type = resp_type, nperms = nperms, random.seed = rand)
+  # Compute the delta values
+  delta_table <- samr::samr.compute.delta.table(samr_obj)
+  # Determine a FDR cut-off
+  index_less_than_min_FDR <- which(delta_table[,5] < minFDR)
+  if(length(index_less_than_min_FDR) < 1){
+    cat('\n', 'Not found appropiate cutoff less than specific minimum FDR.')
+    stop('No delta with FDR below ', minFDR, ' was found.')
+  }
+  delta <- delta_table[index_less_than_min_FDR[1],1]
+  if(samr_plot){
+    cat('\n', 'Plot samr plot to view DEPs (or DEGs) distribution.')
+    samr::samr.plot(samr_obj, delta)
+  }
+  # Extract significant genes at the cut-off delta
+  siggenes_table <- samr::samr.compute.siggenes.table(samr_obj, delta, sam_data, delta_table, all.genes = FALSE)
+  # Shared formatter for the up and down tables: keep column 3 and columns
+  # 7..end, rename the first kept column to 'ID' and the last to 'qvalue',
+  # and divide that last column by 100.
+  format_siggenes <- function(gene_count, gene_table){
+    if(gene_count > 0){
+      genes_df <- data.frame(gene_table)
+      genes_df <- genes_df[,c(3,7:ncol(genes_df))]
+      last_col <- ncol(genes_df)
+      genes_df[,last_col] <- as.numeric(genes_df[,last_col])/100
+      colnames(genes_df) <- c('ID', colnames(genes_df)[-c(1,last_col)], 'qvalue')
+      genes_df
+    }else{
+      NULL
+    }
+  }
+  sam_result_list <- list(
+    genes_up_df = format_siggenes(siggenes_table$ngenes.up, siggenes_table$genes.up),
+    genes_down_df = format_siggenes(siggenes_table$ngenes.lo, siggenes_table$genes.lo)
+  )
+  return(sam_result_list)
+}
+get_summary_from_ksea2 <- function(  # Run KSEA on every ratio column of ptypes_data and collect per-kinase summary tables.
+    ptypes_data,  # first column: site IDs; remaining columns: one ratio column per experiment
+    species = 'human',  # selects the kinase-substrate table read from ./PhosMap_datasets/
+    log2_label = TRUE,  # FALSE: the ratio columns are log2-transformed below
+    ratio_cutoff = 3  # forwarded unchanged to get_substrate_expr_df()
+){
+  requireNamespace('utils')
+  withProgress(message = "Running KSEA", style = "notification", detail = "processing...",{  # withProgress()/incProgress() are not defined here (presumably Shiny's) - confirm
+    # read relationship of kinase-substrate provided by PhosMap
+    # KSRR: kinase substrate regulation relationship
+    # A data frame containing the kinase-substrate relationship; it consists of "kinase", "substrate", "site", "sequence" and "predicted" columns.
+    KSRR_FILE_PATH <- paste0("./PhosMap_datasets/kinase_substrate_regulation_relationship_table/", species, "/", species, "_ksrr.csv")  # path is relative to the working directory
+    kinase_substrate_regulation_relationship <- utils::read.csv(KSRR_FILE_PATH, header = TRUE, sep= ",", stringsAsFactors = NA)
+    ID <- as.vector(ptypes_data[,1])
+    ptypes_data_ratio <- ptypes_data[,-1]
+    if(!log2_label){
+      ptypes_data_ratio <- log2(ptypes_data_ratio)
+    }
+    ptypes_data_ratio_colnames <- colnames(ptypes_data_ratio)
+    ksea_es_list <- list()  # filled in the loop but not read again in this function
+    ksea_pvalue_list <- list()
+    ksea_regulons_list <- list()
+    ksea_activity_list <- list()
+    ksea_trans_list <- list()
+    ptypes_data_exp_count <- ncol(ptypes_data_ratio)
+    cat('\n Starting KSEA')
+    for(i in seq_len(ptypes_data_exp_count)){  # one KSEA run per experiment column
+      cat('\n completing: ', i, '/', ptypes_data_exp_count)
+      ptypes_data_ratio_in_single_exp <- as.numeric(unlist(ptypes_data_ratio[,i]))
+      ksea_result_list_i <- get_ksea_result_list(  # helper defined outside this block
+        ptypes_data_ratio_in_single_exp, ID,
+        kinase_substrate_regulation_relationship,
+        ksea_activity_i_pvalue = 0.05
+      )
+      ksea_es_list[[i]] <- ksea_result_list_i$ksea_es_i_non_NA  # NOTE(review): a NULL element would not be stored by [[i]] <-; confirm the helper never returns NULL fields
+      ksea_pvalue_list[[i]] <- ksea_result_list_i$ksea_pvalue_i_non_NA
+      ksea_regulons_list[[i]] <- ksea_result_list_i$ksea_regulons_i_non_NA
+      ksea_activity_list[[i]] <- ksea_result_list_i$ksea_activity_i
+      ksea_trans_list[[i]] <- ksea_result_list_i$ksea_trans_i
+      cat('\n completed: ', i, '/', ptypes_data_exp_count)
+      incProgress(1/ptypes_data_exp_count, detail = paste0("\n completed: ", i, "/",ptypes_data_exp_count))
+    }
+    cat('\n Ending KSEA')
+    cat('\n Extracting information data frame derived from KSEA')
+    cat('\n ********** Regulation direction from KSEA **********')
+    cat('\n ********** Pvalue from KSEA **********')
+    cat('\n ********** Activity from KSEA **********')
+    cat('\n ********** Kinase_site_substrate quantification matrix after KSEA **********')
+    cat('\n')
+    ksea_regulons <- unique(unlist(ksea_regulons_list))  # union of the regulons reported across all experiments
+    ksea_regulons_count <- length(ksea_regulons)  # not used below
+    # enrichment score from ksea
+    # pvalue from ksea
+    # regulons (kinase) from ksea
+    # kinase activity based on pvalue and enrichment score computed by ksea
+    # regulation direction: 1 = activate, 0 = no work, -1 = suppress
+    ksea_regulons_regulation_direction_df <- get_ksea_regulons_info(ksea_regulons, ksea_trans_list, ksea_trans_list,  # NOTE(review): ksea_trans_list is passed as both 2nd and 3rd argument; the next two calls vary only the 3rd
+                                                                    ptypes_data_ratio_colnames)
+    ksea_regulons_pvalue_df <- get_ksea_regulons_info(ksea_regulons, ksea_trans_list, ksea_pvalue_list,
+                                                      ptypes_data_ratio_colnames)
+    ksea_regulons_activity_df <- get_ksea_regulons_info(ksea_regulons, ksea_trans_list, ksea_activity_list,
+                                                        ptypes_data_ratio_colnames)
+    ksea_kinase_site_substrate_original_ratio_df <- get_substrate_expr_df(ID,  # helper defined outside this block
+                                                                          kinase_substrate_regulation_relationship,
+                                                                          ksea_regulons,
+                                                                          ptypes_data_ratio,
+                                                                          ratio_cutoff)
+    summary_df_list_from_ksea <- list(
+      ksea_regulons_regulation_direction_df = ksea_regulons_regulation_direction_df, # regulation direction: 1 = activate, 0 = no work, -1 = suppress
+      ksea_regulons_pvalue_df = ksea_regulons_pvalue_df, # pvalue from ksea
+      ksea_regulons_activity_df = ksea_regulons_activity_df, # kinase activity based on pvalue and enrichment score computed by ksea
+      ksea_kinase_site_substrate_original_ratio_df = ksea_kinase_site_substrate_original_ratio_df # result of get_substrate_expr_df() for the regulons found above
+    )
+    cat('\n KSEA OK! ^_^')
+    return(summary_df_list_from_ksea)  # evaluated inside the withProgress() expression; NOTE(review): confirm it propagates as this function's value
+  })
+}
+# Run motif enrichment for every residue type (S, T, Y) that occurs in
+# AA_in_protein.
+#
+# Args:
+#   foreground, background: sequence sets handed to get_motifs_list().
+#   AA_in_protein: site labels; a residue letter is used as motif centre when
+#     it matches at least one label.
+#   motifx_pvalue: p-value cutoff handed to get_motifs_list().
+# Returns:
+#   Whatever get_motifs_list() returns; the value is also printed.
+mea_based_on_background <- function(foreground, AA_in_protein, background, motifx_pvalue){
+  residue_candidates <- c('S', 'T', 'Y')
+  center_vector <- NULL
+  for(idx in seq_along(residue_candidates)){
+    cat(idx)
+    residue <- residue_candidates[idx]
+    # Keep the residue only when some site label contains it.
+    if(any(grepl(residue, AA_in_protein))){
+      center_vector <- c(center_vector, residue)
+    }
+  }
+  cat('Start executing motifx and find motif pattern. \n')
+  cat('Foreground sequences: ', length(foreground), '.\n', sep = '')
+  cat('Background sequences: ', length(background), '.\n', sep = '')
+  cat('Phosphorylation: [', center_vector, '] exists in foreground.\n', sep = '')
+  cat('Motifx pvalue cutoff: ', motifx_pvalue, '.\n', sep = '')
+  motifs_list <- get_motifs_list(foreground, background, center_vector, motifx_pvalue)
+  cat('Motifx analysis OK! ^_^', '\n')
+  print(motifs_list)
+  cat('\n')
+  return(motifs_list)
+}
+# Collect the motif summary of every centre residue that yields one.
+#
+# Args:
+#   foreground, background: sequence sets handed to
+#     get_motif_analysis_summary().
+#   center_vector: centre residues to try, in order.
+#   motifx_pvalue: used as min_pvalue of get_motif_analysis_summary().
+# Returns:
+#   A list named by centre residue holding the non-NULL summaries, or NULL
+#   when no residue produced a summary.
+get_motifs_list <- function(foreground, background, center_vector, motifx_pvalue){
+  found_motifs <- list()
+  found_centers <- NULL
+  n_centers <- length(center_vector)
+  for(idx in seq_len(n_centers)){
+    cat(n_centers)
+    cat(idx)
+    residue <- center_vector[idx]
+    residue_motifs <- get_motif_analysis_summary(foreground, background, center = residue, min_sequence_count = 1, min_pvalue = motifx_pvalue)
+    if(is.null(residue_motifs)){
+      next
+    }
+    found_motifs[[length(found_motifs) + 1]] <- residue_motifs
+    found_centers <- c(found_centers, residue)
+  }
+  if(length(found_motifs) == 0){
+    return(NULL)
+  }
+  names(found_motifs) <- found_centers
+  return(found_motifs)
+}
+# Repeatedly search for a motif pattern, removing matched sequences from both
+# pools after each hit, and tabulate the hits.
+#
+# Args:
+#   foreground, background: sequence sets; first passed through
+#     check_mea_input().
+#   center: centre residue of the motif.
+#   min_sequence_count: the search stops once fewer foreground sequences
+#     remain; also forwarded to seach_motif_pattern().
+#   min_pvalue: forwarded to seach_motif_pattern().
+# Returns:
+#   data.frame with one row per motif (motif, score, foreground/background
+#   matches and sizes, fold_increase), or NULL when nothing was found.
+get_motif_analysis_summary <- function(
+    foreground,
+    background,
+    center='S',
+    min_sequence_count = 1,
+    min_pvalue = 0.01
+){
+  checked_input <- check_mea_input(foreground, background, center)
+  fg_pool <- checked_input$foreground
+  bg_pool <- checked_input$background
+  hits <- list()
+  repeat{
+    if(length(fg_pool) < min_sequence_count){
+      break
+    }
+    hit <- seach_motif_pattern(
+      fg_pool,
+      bg_pool,
+      min_sequence_count = min_sequence_count,
+      min_pvalue = min_pvalue,
+      center = center,
+      width = checked_input$width
+    )
+    if(is.null(hit)){
+      break
+    }
+    hits[[length(hits) + 1]] <- hit
+    # Sequences explained by this motif are excluded from the next round.
+    fg_pool <- fg_pool[!grepl(hit$motif_pattern, fg_pool)]
+    bg_pool <- bg_pool[!grepl(hit$motif_pattern, bg_pool)]
+  }
+  if(length(hits) == 0){
+    return(NULL)
+  }
+  summry_list <- data.frame(
+    motif = vapply(hits, function(h){h$motif_pattern}, character(1)),
+    score = vapply(hits, function(h){h$motif_pattern_score}, numeric(1)),
+    foreground_matches = vapply(hits, function(h){h$foreground_matches}, numeric(1)),
+    foreground_size = vapply(hits, function(h){h$foreground_size}, numeric(1)),
+    background_matches = vapply(hits, function(h){h$background_matches}, numeric(1)),
+    background_size = vapply(hits, function(h){h$background_size}, numeric(1))
+  )
+  # Fold increase = foreground match rate over background match rate.
+  fg_rate <- summry_list$foreground_matches/summry_list$foreground_size
+  bg_rate <- summry_list$background_matches/summry_list$background_size
+  summry_list$fold_increase <- fg_rate/bg_rate
+  return(summry_list)
+}
+# Filter, normalise and impute a phosphosite table.
+#
+# Args:
+#   data_frame: first six columns are annotation (must include
+#     'AA_in_protein'); the remaining columns hold one sample each, with 0
+#     meaning "missing".
+#   experiment_code_file_path: tab-separated file with an 'Experiment_Code'
+#     column; only the number of codes is used here.
+#   nathreshold: a row is kept when its number of zeros is at most
+#     (number of experiment codes - nathreshold), floored at 0.
+#   normmethod: "global" divides each column by its sum, "median" by its
+#     median (both x 1e5); any other value leaves the values unscaled.
+#   imputemethod: "0" keeps zeros, "minimum" replaces them with the smallest
+#     non-zero value, "minimum/10" with a tenth of it.
+#   topN: when not NA, only the topN largest values of each column are kept
+#     (the rest are set to 0) before scaling.
+#   mod_types: residue letters to keep; matched against the upper-cased
+#     AA_in_protein. The original accepted this argument but always used S/T/Y.
+# Returns:
+#   list(ptypes_area_df_with_id, ptypes_fot5_df_with_id): annotation plus raw
+#   values, and annotation plus normalised/imputed values.
+get_normalized_data_of_psites2 <- function(data_frame, experiment_code_file_path, nathreshold, normmethod = "global", imputemethod = "minimum/10", topN = NA, mod_types = c('S', 'T', 'Y')){
+  requireNamespace('utils')
+  requireNamespace('stats')
+  experiment_code <- utils::read.table(experiment_code_file_path, header = TRUE, sep = '\t', stringsAsFactors = NA)
+  nathreshold <- length(experiment_code$Experiment_Code) - nathreshold
+  if(nathreshold < 0) {
+    nathreshold <- 0
+  }
+  # Count zeros per row in one pass; this also handles a zero-row table, which
+  # the original 1:nrow() loop did not.
+  zero_count <- rowSums(data_frame[, -seq_len(6), drop = FALSE] == 0)
+  data_frame <- data_frame[zero_count <= nathreshold, , drop = FALSE]
+  cat('\n The 7th step is running.')
+  summary_df_ID_Info <- data_frame[, seq_len(6)]
+  summary_df_ID_Info$AA_in_protein <- toupper(summary_df_ID_Info$AA_in_protein)
+  # drop = FALSE keeps a single sample column two-dimensional.
+  summary_df_Value <- data_frame[, -seq_len(6), drop = FALSE]
+  cat('\n Filtering data only including S/T/Y modifications.')
+  ptype_pattern <- paste(toupper(mod_types), collapse = '|')
+  index_of_ptypes <- which(grepl(ptype_pattern, summary_df_ID_Info$AA_in_protein))
+  if(length(index_of_ptypes) < 1){
+    stop('No data with modifications taking place on ', paste(mod_types, collapse = '|'))
+  }
+  ptypes_id_df <- summary_df_ID_Info[index_of_ptypes,]
+  ptypes_value <- summary_df_Value[index_of_ptypes, , drop = FALSE]
+  Value_FOT5 <- ptypes_value
+  if(normmethod %in% c("global", "median")){
+    for(i in seq_len(ncol(Value_FOT5))){
+      x <- as.vector(unlist(ptypes_value[,i]))
+      if(!is.na(topN)){
+        # Cap topN at the column length: the original indexed past the end,
+        # which put NA into a negative subscript and failed.
+        x_order_top <- order(x, decreasing = TRUE)[seq_len(min(topN, length(x)))]
+        x[setdiff(seq_along(x), x_order_top)] <- 0
+      }
+      # NOTE(review): with "median" a column that is mostly zeros has median 0
+      # and yields Inf/NaN; unchanged from the original.
+      scale_by <- if(normmethod == "global") sum(x) else stats::median(x)
+      Value_FOT5[,i] <- x/scale_by*1e5
+    }
+  }
+  ptypes_value_FOT5 <- as.matrix(Value_FOT5)
+  index_of_zero <- which(ptypes_value_FOT5==0)
+  non_zero_values <- ptypes_value_FOT5[!is.na(ptypes_value_FOT5) & ptypes_value_FOT5 != 0]
+  # Impute only when there is something to fill and something to fill it
+  # with; the original called min() on an empty vector otherwise.
+  if(length(index_of_zero) > 0 && length(non_zero_values) > 0){
+    if(imputemethod=="minimum"){
+      ptypes_value_FOT5[index_of_zero] <- min(non_zero_values)
+    }else if(imputemethod=="minimum/10"){
+      ptypes_value_FOT5[index_of_zero] <- min(non_zero_values)*0.1
+    }
+  }
+  ptypes_df_list <- list(
+    ptypes_area_df_with_id = data.frame(ptypes_id_df, ptypes_value),
+    ptypes_fot5_df_with_id = data.frame(ptypes_id_df, ptypes_value_FOT5)
+  )
+  cat('\n The 7th step is over ^_^.')
+  return(ptypes_df_list)
+}
+# Normalise every sample column over its positive values, then impute zeros.
+#
+# Args:
+#   data_frame: first column holds identifiers, remaining columns hold one
+#     sample each.
+#   experiment_code_file_path: tab-separated file with an 'Experiment_Code'
+#     column; the codes become the sample column names of the result.
+#   normmethod: "global" divides the positive values of a column by their
+#     sum, "median" by their median (both x 1e5); any other value leaves the
+#     values unscaled.
+#   imputemethod: "0" keeps zeros, "minimum" replaces them with the smallest
+#     non-zero value of the whole table, "minimum/10" with a tenth of it.
+# Returns:
+#   data.frame with the identifier column followed by the processed samples.
+get_normalized_data_FOT52 <- function(data_frame, experiment_code_file_path, normmethod = "global", imputemethod = "minimum/10"){
+  requireNamespace('utils')
+  requireNamespace('stats')
+  cat('\n The 7th step: Normalize data and filter data only including phosphorylation site.')
+  experiment_code <- utils::read.table(experiment_code_file_path, header = TRUE, sep = '\t', stringsAsFactors = NA)
+  experiment_code <- as.vector(unlist(experiment_code$Experiment_Code))
+  data_frame_colnames <- colnames(data_frame)
+  ID <- as.vector(data_frame[,1])
+  # drop = FALSE keeps a one-sample table two-dimensional; without it ncol()
+  # was NULL and the loop below failed.
+  Value_FOT5 <- data_frame[, -1, drop = FALSE]
+  if(normmethod %in% c("global", "median")){
+    for(i in seq_len(ncol(Value_FOT5))){
+      x <- Value_FOT5[,i]
+      valid_index <- which(x>0)
+      if(length(valid_index) > 0){
+        valid_x <- x[valid_index]
+        scale_by <- if(normmethod == "global") sum(valid_x) else stats::median(valid_x)
+        Value_FOT5[valid_index,i] <- valid_x/scale_by*1e5
+      }
+    }
+  }
+  Value_FOT5 <- as.matrix(Value_FOT5)
+  index_of_zero <- which(Value_FOT5==0)
+  non_zero_values <- Value_FOT5[!is.na(Value_FOT5) & Value_FOT5 != 0]
+  # Impute only when there is something to fill and something to fill it
+  # with; the original called min() on an empty vector otherwise.
+  if(length(index_of_zero) > 0 && length(non_zero_values) > 0){
+    if(imputemethod=="minimum"){
+      Value_FOT5[index_of_zero] <- min(non_zero_values)
+    }else if(imputemethod=="minimum/10"){
+      Value_FOT5[index_of_zero] <- min(non_zero_values)*0.1
+    }
+  }
+  data_frame_normaliation <- data.frame(ID, Value_FOT5)
+  colnames(data_frame_normaliation) <- c(data_frame_colnames[1], experiment_code)
+  return(data_frame_normaliation)
+}

backend/analysis.R ADDED Viewed

File without changes

backend/fill_missing_values.R ADDED Viewed

	@@ -0,0 +1,41 @@

+# Replace the NA cells of a numeric table with the chosen imputation method.
+#
+# Args:
+#   nadata: numeric data.frame or matrix that may contain NA.
+#   method: one of "none" (NA -> 0), "minimum", "minimum/10", "bpca", "lls",
+#     "impseq", "impseqrob", "knnmethod", "colmedian", "rowmedian".
+# Returns:
+#   The imputed table. An unrecognised method, or "lls" on data without NA,
+#   returns nadata unchanged.
+# Package functions are namespace-qualified: the original called them bare
+# while the matching library() lines were commented out, so it only worked
+# when the packages happened to be attached elsewhere.
+fill_missing_values <- function(nadata, method) {
+  df <- df1 <- nadata
+  if (method == "none") {
+    df[is.na(df)] <- 0
+  } else if (method == "minimum") {
+    df[is.na(df)] <- min(df1, na.rm = TRUE)
+  } else if (method == "minimum/10") {
+    df[is.na(df)] <- min(df1, na.rm = TRUE) / 10
+  } else if (method == "bpca") {
+    # take medium time
+    bpca_fit <- pcaMethods::pca(as.matrix(df1), nPcs = ncol(df1)-1, method = "bpca", maxSteps =100)
+    df <- pcaMethods::completeObs(bpca_fit)
+  } else if (method == "lls" && anyNA(df1)) {
+    # take long time; llsImpute is given the transposed table
+    lls_fit <- pcaMethods::llsImpute(t(df1), k = 10, allVariables = TRUE)
+    df <- t(pcaMethods::completeObs(lls_fit))
+  } else if (method == "impseq") {
+    df <- rrcovNA::impSeq(df1)
+  } else if(method == "impseqrob"){
+    df <- rrcovNA::impSeqRob(df1, alpha = 0.9)$x
+  } else if(method == "knnmethod"){
+    df <- impute::impute.knn(as.matrix(df1), k = 10, rowmax = 1, colmax = 1)$data
+  } else if(method == "colmedian"){
+    df <- e1071::impute(df1, what = "median")
+  } else if(method == "rowmedian"){
+    # column-median imputation of the transposed table, transposed back
+    df <- t(e1071::impute(t(df1), what = "median"))
+  }
+  return(df)
+}

backend/get_aligned_seq_for_mea02.R ADDED Viewed

	@@ -0,0 +1,60 @@

+# Cut a window around every phosphosite out of its protein sequence, padding
+# with '_' where the window runs past either end of the protein.
+#
+# Args:
+#   ID: protein identifiers, looked up in the first column of the fasta table.
+#   Sequence: peptide sequences, copied to the output unchanged.
+#   AA_in_protein: site labels such as "S123"; the number after the first
+#     S/T/Y is taken as the position in the protein.
+#   fixed_length: window width; floor(fixed_length/2) residues are taken on
+#     each side of the site, so the window is fixed_length wide when odd.
+#   species, fasta_type: select the fasta table under
+#     ./PhosMap_datasets/fasta_library/ (relative to the working directory).
+# Returns:
+#   data.frame(ID, Sequence, AA_in_protein, aligned_seq); aligned_seq is NA
+#   when the protein is not in the fasta table or the position cannot be read.
+# Changes from the original: padding is computed per side so the site stays
+# centred when both ends are truncated (str_pad "both" split it evenly); the
+# first fasta match is used when an ID occurs more than once; the result is
+# preallocated; base string functions replace stringr.
+get_aligned_seq_for_mea02 <- function(ID, Sequence, AA_in_protein, fixed_length, species = 'human', fasta_type = 'refseq'){
+  requireNamespace('utils')
+  cat('Aligned sequence based on fasta library for motif enrichment anlysis.\n')
+  fasta_library_dir <- "./PhosMap_datasets/fasta_library/"
+  fasta_data <- utils::read.table((paste0(fasta_library_dir, fasta_type, "/", species, "/", species, "_", fasta_type, "_fasta.txt")), sep = '\t', header = TRUE)
+  border_limit <- floor(fixed_length/2)
+  GI_nrow <- length(ID)
+  cat('Pre-align:', GI_nrow, 'phos-pepitdes.\n')
+  cat('Fixed sequence length is ', fixed_length, '.\n', sep = '')
+  cat('It needs few time.\n')
+  # Row of each protein in the fasta table (NA when absent).
+  fasta_index <- match(as.character(ID), as.character(fasta_data[,1]))
+  # Second piece after splitting on S/T/Y, e.g. "S123" -> c("", "123") -> 123.
+  loc_index <- vapply(strsplit(as.character(AA_in_protein), "[STY]"), function(pieces){
+    suppressWarnings(as.numeric(pieces[2]))
+  }, numeric(1))
+  aligned_seq <- rep(NA_character_, GI_nrow)
+  for(i in seq_len(GI_nrow)){
+    if(!is.na(fasta_index[i]) && !is.na(loc_index[i])){
+      refseq <- as.character(fasta_data[fasta_index[i], 2])
+      refseq_len <- nchar(refseq)
+      left_limit <- loc_index[i] - border_limit
+      right_limit <- loc_index[i] + border_limit
+      # Pad each side by exactly the amount the window overshoots there.
+      left_pad <- max(0, 1 - left_limit)
+      right_pad <- max(0, right_limit - refseq_len)
+      aligned_seq[i] <- paste0(
+        strrep('_', left_pad),
+        substr(refseq, max(left_limit, 1), min(right_limit, refseq_len)),
+        strrep('_', right_pad)
+      )
+    }
+    if(i %% 5000 == 0){
+      cat('Aligned:', i, 'phos-pepitdes.\n')
+    }
+    if(i == GI_nrow){
+      cat('Aligned:', i, 'phos-pepitdes.\n')
+      cat('Finish OK! ^_^\n')
+    }
+  }
+  cat('\n')
+  aligned_sequence_df_based_on_fasta_library <- data.frame(ID, Sequence, AA_in_protein, aligned_seq)
+  return(aligned_sequence_df_based_on_fasta_library)
+}

backend/get_normalized_data_of_psites3.R ADDED Viewed

	@@ -0,0 +1,149 @@

+#' Filter, normalise and impute a phosphosite intensity table
+#'
+#' Steps, in order: (1) drop rows with too many zero intensities, (2) keep
+#' rows whose `AA_in_protein` label contains one of `mod_types`, (3) scale
+#' every sample column, (4) treat zeros as missing and impute them.
+#'
+#' @param data_frame Data frame whose first six columns are identifier
+#'   columns (one of them named `AA_in_protein`) and whose remaining columns
+#'   are per-sample intensities.
+#' @param experiment_code_file_path Tab-separated file with a header and an
+#'   `Experiment_Code` column; only its number of rows is used.
+#' @param nathreshold A row is kept when its number of zero cells is at most
+#'   `max(number of experiment codes - nathreshold, 0)`.
+#' @param normmethod `"global"` divides each column by its sum, `"median"`
+#'   by its median (both times 1e5). Any other value leaves values unscaled.
+#' @param imputemethod One of `"none"`, `"minimum"`, `"minimum/10"`, `"bpca"`,
+#'   `"lls"`, `"impseq"`, `"impseqrob"`, `"knnmethod"`, `"colmedian"`,
+#'   `"rowmedian"`. Any other value leaves missing values as `NA`.
+#' @param topN If not `NA`, only the `topN` largest values of each column are
+#'   kept (the rest are set to zero) before scaling.
+#' @param mod_types Residue codes to keep; matched as fixed, upper-cased
+#'   substrings of the upper-cased `AA_in_protein` label.
+#' @return A list with `ptypes_area_df_with_id` (filtered raw values) and
+#'   `ptypes_fot5_df_with_id` (scaled and imputed values), each prefixed with
+#'   the six identifier columns.
+get_normalized_data_of_psites3 <- function(data_frame, experiment_code_file_path, nathreshold, normmethod = "global", imputemethod = "minimum/10", topN = NA, mod_types = c('S', 'T', 'Y')){
+  requireNamespace('utils')
+  experiment_code <- utils::read.table(experiment_code_file_path, header = TRUE, sep = '\t', stringsAsFactors = FALSE)
+  # Convert the threshold into the maximum number of zero cells allowed per row.
+  # NOTE(review): this reads as "at least `nathreshold` quantified samples"
+  # only if there is one value column per experiment code - confirm.
+  max_zero_count <- max(length(experiment_code$Experiment_Code) - nathreshold, 0)
+  zero_count <- rowSums(data_frame[, -seq_len(6), drop = FALSE] == 0)
+  data_frame <- data_frame[zero_count <= max_zero_count, ]
+  cat('\n The 7th step is running.')
+  summary_df_ID_Info <- data_frame[, seq_len(6)]
+  summary_df_ID_Info$AA_in_protein <- toupper(summary_df_ID_Info$AA_in_protein)
+  # drop = FALSE keeps a data frame even when there is a single sample column.
+  summary_df_Value <- data_frame[, -(seq_len(6)), drop = FALSE]
+  cat('\n Filtering data only including ', paste(mod_types, collapse = '/'), ' modifications.', sep = '')
+  # Honour `mod_types`: a row is kept when its label contains any of them.
+  has_mod_type <- Reduce(
+    `|`,
+    lapply(toupper(mod_types), function(m) grepl(m, summary_df_ID_Info$AA_in_protein, fixed = TRUE)),
+    rep(FALSE, nrow(summary_df_ID_Info))
+  )
+  index_of_ptypes <- which(has_mod_type)
+  if(length(index_of_ptypes) == 0){
+    stop('No data with modifications taking place on ', paste(mod_types, collapse = '|'), call. = FALSE)
+  }
+  ptypes_id_df <- summary_df_ID_Info[index_of_ptypes,]
+  ptypes_value <- summary_df_Value[index_of_ptypes, , drop = FALSE]
+  # Scale one sample column; unknown `normmethod` values return it untouched.
+  scale_column <- function(x){
+    x <- as.vector(unlist(x))
+    if(!(normmethod %in% c("global", "median"))){
+      return(x)
+    }
+    if(!is.na(topN)){
+      # head() copes with topN exceeding the number of rows, and setdiff()
+      # avoids the empty-negative-subscript trap when topN is 0.
+      top_rows <- utils::head(order(x, decreasing = TRUE), topN)
+      x[setdiff(seq_along(x), top_rows)] <- 0
+    }
+    denominator <- if(normmethod == "global") sum(x) else stats::median(x)
+    x/denominator*1e5
+  }
+  Value_FOT5 <- ptypes_value
+  Value_FOT5[] <- lapply(ptypes_value, scale_column)
+  ptypes_value_FOT5 <- as.data.frame(as.matrix(Value_FOT5))
+  # Zero intensities are treated as missing values from here on.
+  ptypes_value_FOT5[ptypes_value_FOT5 == 0] <- NA
+  # Impute missing values. Backends are called through their namespaces so
+  # the result does not depend on which packages happen to be attached.
+  fill_missing_values01 <- function(nadata, method) {
+    switch(
+      method,
+      "none" = {
+        nadata[is.na(nadata)] <- 0
+        nadata
+      },
+      "minimum" = {
+        nadata[is.na(nadata)] <- min(nadata, na.rm = TRUE)
+        nadata
+      },
+      "minimum/10" = {
+        nadata[is.na(nadata)] <- min(nadata, na.rm = TRUE) / 10
+        nadata
+      },
+      # take medium time
+      "bpca" = pcaMethods::completeObs(
+        pcaMethods::pca(as.matrix(nadata), nPcs = ncol(nadata)-1, method = "bpca", maxSteps = 100)
+      ),
+      # take long time
+      "lls" = t(pcaMethods::completeObs(
+        pcaMethods::llsImpute(t(nadata), k = 10, allVariables = TRUE)
+      )),
+      "impseq" = rrcovNA::impSeq(nadata),
+      "impseqrob" = rrcovNA::impSeqRob(nadata, alpha = 0.9)$x,
+      "knnmethod" = impute::impute.knn(as.matrix(nadata), k = 10, rowmax = 1, colmax = 1)$data,
+      "colmedian" = e1071::impute(nadata, what = "median"),
+      "rowmedian" = t(e1071::impute(t(nadata), what = "median")),
+      # Unknown method: leave the missing values in place.
+      nadata
+    )
+  }
+  ptypes_value_FOT5 <- fill_missing_values01(ptypes_value_FOT5, imputemethod)
+  ptypes_df_list <- list(
+    ptypes_area_df_with_id = data.frame(ptypes_id_df, ptypes_value),
+    ptypes_fot5_df_with_id = data.frame(ptypes_id_df, ptypes_value_FOT5)
+  )
+  cat('\n The 7th step is over ^_^.')
+  return(ptypes_df_list)
+}

backend/get_normalized_data_of_psites4.R ADDED Viewed

	@@ -0,0 +1,192 @@

+#' Filter, normalise and impute a phosphosite table group by group
+#'
+#' Same filtering and scaling as the ungrouped variant: (1) drop rows with too
+#' many zero intensities, (2) keep rows whose `AA_in_protein` label contains
+#' one of `mod_types`, (3) scale every sample column, (4) treat zeros as
+#' missing. Missing values are then imputed separately for the samples of
+#' each experimental group by calling `fill_missing_values(group_data,
+#' method = imputemethod)`, which must be defined elsewhere, and the groups
+#' are column-bound back together in the order of `unique(design_file$Group)`.
+#'
+#' @param data_frame Data frame whose first six columns are identifier
+#'   columns (one of them named `AA_in_protein`) and whose remaining columns
+#'   are per-sample intensities named by sample code.
+#' @param experiment_code_file_path Tab-separated file with a header and an
+#'   `Experiment_Code` column; only its number of rows is used.
+#' @param nathreshold A row is kept when its number of zero cells is at most
+#'   `max(number of experiment codes - nathreshold, 0)`.
+#' @param normmethod `"global"` divides each column by its sum, `"median"`
+#'   by its median (both times 1e5). Any other value leaves values unscaled.
+#' @param imputemethod Method name forwarded to `fill_missing_values()`.
+#' @param topN If not `NA`, only the `topN` largest values of each column are
+#'   kept (the rest are set to zero) before scaling.
+#' @param mod_types Residue codes to keep; matched as fixed, upper-cased
+#'   substrings of the upper-cased `AA_in_protein` label.
+#' @param design_file Data frame whose first column holds the sample codes
+#'   (column names of `data_frame`) and which has a `Group` column.
+#' @return A list with `ptypes_area_df_with_id` and `ptypes_fot5_df_with_id`,
+#'   or an empty list when `imputemethod` is one of `"bpca"`, `"rowmedian"`,
+#'   `"lls"`, `"knnmethod"` and some group contains a missing value.
+get_normalized_data_of_psites4 <- function(data_frame, experiment_code_file_path, nathreshold, normmethod = "global", imputemethod = "minimum/10", topN = NA, mod_types = c('S', 'T', 'Y'), design_file){
+  requireNamespace('utils')
+  experiment_code <- utils::read.table(experiment_code_file_path, header = TRUE, sep = '\t', stringsAsFactors = FALSE)
+  # Convert the threshold into the maximum number of zero cells allowed per row.
+  max_zero_count <- max(length(experiment_code$Experiment_Code) - nathreshold, 0)
+  zero_count <- rowSums(data_frame[, -seq_len(6), drop = FALSE] == 0)
+  data_frame <- data_frame[zero_count <= max_zero_count, ]
+  cat('\n The 7th step is running.')
+  summary_df_ID_Info <- data_frame[, seq_len(6)]
+  summary_df_ID_Info$AA_in_protein <- toupper(summary_df_ID_Info$AA_in_protein)
+  # drop = FALSE keeps a data frame even when there is a single sample column.
+  summary_df_Value <- data_frame[, -(seq_len(6)), drop = FALSE]
+  cat('\n Filtering data only including ', paste(mod_types, collapse = '/'), ' modifications.', sep = '')
+  # Honour `mod_types`: a row is kept when its label contains any of them.
+  has_mod_type <- Reduce(
+    `|`,
+    lapply(toupper(mod_types), function(m) grepl(m, summary_df_ID_Info$AA_in_protein, fixed = TRUE)),
+    rep(FALSE, nrow(summary_df_ID_Info))
+  )
+  index_of_ptypes <- which(has_mod_type)
+  if(length(index_of_ptypes) == 0){
+    stop('No data with modifications taking place on ', paste(mod_types, collapse = '|'), call. = FALSE)
+  }
+  ptypes_id_df <- summary_df_ID_Info[index_of_ptypes,]
+  ptypes_value <- summary_df_Value[index_of_ptypes, , drop = FALSE]
+  # Scale one sample column; unknown `normmethod` values return it untouched.
+  scale_column <- function(x){
+    x <- as.vector(unlist(x))
+    if(!(normmethod %in% c("global", "median"))){
+      return(x)
+    }
+    if(!is.na(topN)){
+      # head() copes with topN exceeding the number of rows, and setdiff()
+      # avoids the empty-negative-subscript trap when topN is 0.
+      top_rows <- utils::head(order(x, decreasing = TRUE), topN)
+      x[setdiff(seq_along(x), top_rows)] <- 0
+    }
+    denominator <- if(normmethod == "global") sum(x) else stats::median(x)
+    x/denominator*1e5
+  }
+  Value_FOT5 <- ptypes_value
+  Value_FOT5[] <- lapply(ptypes_value, scale_column)
+  ptypes_value_FOT5 <- as.data.frame(as.matrix(Value_FOT5))
+  # Zero intensities are treated as missing values from here on.
+  ptypes_value_FOT5[ptypes_value_FOT5 == 0] <- NA
+  # Split the sample columns by experimental group. Sample codes are coerced
+  # to character so a factor column selects by name rather than by its
+  # integer codes; drop = FALSE keeps single-sample groups as data frames.
+  sample_codes <- as.character(design_file[[1]])
+  group_data_list <- lapply(unique(design_file$Group), function(group){
+    samples <- sample_codes[which(design_file$Group == group)]
+    ptypes_value_FOT5[, samples, drop = FALSE]
+  })
+  if (imputemethod %in% c('bpca', 'rowmedian', 'lls', 'knnmethod')) {
+    # These methods are refused as soon as any group holds a missing value.
+    # NOTE(review): the check fires on ANY missing cell, which means these
+    # methods only run when there is nothing to impute; rows that are
+    # entirely missing within a group may have been the intended condition -
+    # confirm with the author before changing.
+    group_has_missing <- vapply(group_data_list, function(group_data) any(is.na(group_data)), logical(1))
+    if (any(group_has_missing)) {
+      return(list())
+    }
+  }
+  # Impute each group on its own, then bind the groups back together. A local
+  # list is used so a global object called `result_list` cannot leak in.
+  filled_group_list <- lapply(group_data_list, function(group_data){
+    fill_missing_values(group_data, method = imputemethod)
+  })
+  ptypes_value_FOT5 <- Reduce(cbind, filled_group_list)
+  ptypes_df_list <- list(
+    ptypes_area_df_with_id = data.frame(ptypes_id_df, ptypes_value),
+    ptypes_fot5_df_with_id = data.frame(ptypes_id_df, ptypes_value_FOT5)
+  )
+  cat('\n The 7th step is over ^_^.')
+  return(ptypes_df_list)
+}

backend/import_extract.R ADDED Viewed

	@@ -0,0 +1,23 @@

+# Extract an uploaded zip archive into `pathname` and return the normalized
+# path of the folder named after the archive.
+#   inputfile: list-like upload record; `$datapath` is the archive on disk and
+#              `$name` is its original file name.
+#   pathname:  directory the archive is extracted into.
+# The folder name is the upload name minus its last four characters, so the
+# name is expected to end in a four-character suffix such as ".zip".
+get_file_path <- function(inputfile, pathname) {
+  zip::unzip(inputfile$datapath, exdir = pathname)
+  archive_name <- inputfile$name
+  folder_name <- substr(archive_name, 1, nchar(archive_name) - 4)
+  extracted_dir <- paste0(pathname, "/", folder_name)
+  normalizePath(extracted_dir)
+}
+# List the entries found under `path` with their last four characters (for
+# example a ".txt" suffix) removed.
+#   path:  directory to inspect.
+#   depth: when equal to 2, the entries of `path` are treated as directories
+#          and the names inside all of them are listed; any other value lists
+#          `path` itself.
+# Returns a character vector of the truncated names.
+get_target_name <- function(path, depth) {
+  if (depth == 2) {
+    # TRUE instead of T: `T` is an ordinary variable that can be reassigned.
+    path <- normalizePath(list.files(path, full.names = TRUE))
+  }
+  entries <- list.files(path)
+  substring(entries, 0, nchar(entries) - 4)
+}

backend/preprocess.R ADDED Viewed

	@@ -0,0 +1,27 @@

+# imageMap <- function(inputId, imgsrc, opts) {
+#   areas <- lapply(names(opts), function(n)
+#     shiny::tags$area(title=n, coords=opts[[n]],
+#                      href="#", shape="poly"))
+#   js <- paste0("$(document).on('click', 'map area', function(evt) {
+#   evt.preventDefault();
+#   var val = evt.target.title;
+#   Shiny.onInputChange('", inputId, "', val);})")
+#   list(
+#     shiny::tags$img(src=imgsrc, usemap=paste0("#", inputId),
+#                     shiny::tags$head(tags$script(shiny::HTML(js)))),
+#     shiny::tags$map(name=inputId, areas))
+# }
+# Build an HTML image with a clickable <map> overlay.
+#   inputId: name of the <map>; the image refers to it through `usemap`.
+#   imgsrc:  value of the image's `src` attribute.
+#   opts:    named list; each name becomes the title of one polygon <area>
+#            and each value its `coords` attribute.
+# Returns a list of two shiny tags: the <img> (carrying the click-handler
+# script in a <head> tag) and the <map>.
+imageMap <- function(inputId, imgsrc, opts) {
+  areas <- lapply(names(opts), function(n)
+    shiny::tags$area(title=n, coords=opts[[n]],
+                     href="#", shape="poly"))
+  # NOTE(review): the handler below calls print('hello') and never uses
+  # `val`; the commented-out earlier version reported the clicked title to
+  # Shiny instead. This looks like a debugging stub - confirm intent.
+  js <- paste0("$(document).on('click', 'map area', function(evt) {
+  evt.preventDefault();
+  var val = evt.target.title;
+  print('hello');})")
+  # `tags` is namespace-qualified everywhere so the function also works when
+  # shiny is loaded but not attached.
+  list(
+    shiny::tags$img(src=imgsrc, usemap=paste0("#", inputId),
+                    shiny::tags$head(shiny::tags$script(shiny::HTML(js)))),
+    shiny::tags$map(name=inputId, areas))
+}

backend/visualization_deps_with_scatter02.R ADDED Viewed

	@@ -0,0 +1,117 @@

+#' Visualize differentially expressed results with scatter
+#'
+#' Draws a volcano plot (log2 fold change against -log10 p-value) with
+#' ggplot2. Points beyond both cutoffs are coloured as up- or down-regulated,
+#' and dashed guide lines mark the cutoffs.
+#'
+#' @param deps_data a data frame containing ID, logFC and pvalue.
+#' @param minFC a numeric for the minimum fold change; guide lines are drawn
+#'   at plus and minus `abs(log2(minFC))`.
+#' @param minPvalue a numeric for the significance cutoff; a guide line is
+#'   drawn at `-log10(minPvalue)`.
+#' @param main an overall title for the plot.
+#' @param show_text a boolean value representing whether or not the text is showed, the default is FALSE.
+#' @param min_up_text number of top-ranked up-regulated IDs considered for
+#'   labelling. An ID is labelled when it is among the `min_up_text` largest
+#'   fold changes and among the `min_up_text` smallest p-values of the
+#'   up-regulated set.
+#' @param min_down_text the same cutoff for down-regulated IDs.
+#'
+#' @author Dongdong Zhan and Mengsha Tong
+#' @export
+#'
+#'
+#' @return A ggplot object showing the differentially expressed results.
+#'
+#' @examples
+#' \dontrun{
+#' ftp_url <- "ftp://111.198.139.72:4000/pub/PhosMap_datasets/function_demo_data/visualization_deps_with_scatter.RData"
+#' load_data <- load_data_with_ftp(ftp_url, 'RData')
+#' writeBin(load_data, "visualization_deps_with_scatter.RData")
+#' load("visualization_deps_with_scatter.RData")
+#'
+#' visualization_deps_with_scatter02(limma_results_df, minFC = 2,
+#'   minPvalue = 0.05, main = 'Differentially expressed proteins  \n with limma',
+#'   show_text = TRUE, min_up_text = 70, min_down_text = 70
+#' )
+#' }
+#'
+visualization_deps_with_scatter02 <- function(
+    deps_data,
+    minFC = 2,
+    minPvalue = 0.05,
+    main = 'Differentially expressed proteins',
+    show_text = FALSE,
+    min_up_text = 15,
+    min_down_text = 15
+){
+  # Cutoffs on the plotted scales, derived from the arguments instead of
+  # being hard-coded.
+  fc_cutoff <- abs(log2(minFC))
+  p_cutoff <- -log10(minPvalue)
+  neg_log_p <- -log10(deps_data$pvalue)
+  # Classify every row; rows with missing values stay in the "none" class.
+  is_significant <- !is.na(neg_log_p) & neg_log_p > p_cutoff
+  is_up <- is_significant & !is.na(deps_data$logFC) & deps_data$logFC > fc_cutoff
+  is_down <- is_significant & !is.na(deps_data$logFC) & deps_data$logFC < -fc_cutoff
+  regulation <- rep('none', nrow(deps_data))
+  regulation[is_up] <- 'up'
+  regulation[is_down] <- 'down'
+  deps_data$regulation <- factor(regulation, levels = c('down', 'none', 'up'))
+  p <- ggplot2::ggplot(
+    deps_data, ggplot2::aes(x = logFC, y = -log10(pvalue))) +
+    # The colour aesthetic is what gives the manual palette something to act on.
+    ggplot2::geom_point(ggplot2::aes(color = regulation), alpha=0.4, size=3.5) +
+    ggplot2::scale_color_manual(
+      values=c(down = "#546de5", none = "#d2dae2", up = "#ff4757"),
+      drop = FALSE) +
+    # Guide lines at the fold-change and significance cutoffs.
+    ggplot2::geom_vline(xintercept=c(-fc_cutoff, fc_cutoff),lty=4,col="black",lwd=0.8) +
+    ggplot2::geom_hline(yintercept = p_cutoff,lty=4,col="black",lwd=0.8) +
+    # Axis labels and title.
+    ggplot2::labs(x="log2(fold change)",
+         y="-log10 (p-value)",
+         title = main) +
+    ggplot2::theme_bw()+
+    # Legend and title placement.
+    ggplot2::theme(plot.title = ggplot2::element_text(hjust = 0.5),
+          legend.position="right",
+          legend.title = ggplot2::element_blank())
+  if (isTRUE(show_text) && "ID" %in% names(deps_data)) {
+    # Rows ranked in the top `n` both by fold change and by significance.
+    pick_label_rows <- function(rows, n, fc_decreasing) {
+      if (length(rows) == 0 || is.na(n) || n < 1) {
+        return(integer(0))
+      }
+      by_fc <- utils::head(rows[order(deps_data$logFC[rows], decreasing = fc_decreasing)], n)
+      by_p <- utils::head(rows[order(neg_log_p[rows], decreasing = TRUE)], n)
+      intersect(by_fc, by_p)
+    }
+    label_rows <- c(
+      pick_label_rows(which(is_up), min_up_text, TRUE),
+      pick_label_rows(which(is_down), min_down_text, FALSE)
+    )
+    if (length(label_rows) > 0) {
+      p <- p + ggplot2::geom_text(
+        data = deps_data[label_rows, , drop = FALSE],
+        ggplot2::aes(label = ID),
+        vjust = -0.8, size = 2.5)
+    }
+  }
+  p
+}

examplefile/Clinicaltest.csv ADDED Viewed

	@@ -0,0 +1,40 @@

+PatientID,status,time
+Exp027012,0,1290
+Exp027013,0,1187
+Exp027014,1,1106
+Exp027015,1,1264
+Exp027016,1,948
+Exp027017,0,1401
+Exp027018,1,961
+Exp027019,0,1867
+Exp027020,1,986
+Exp027021,0,1593
+Exp027022,1,566
+Exp027023,1,1353
+Exp027024,0,1592
+Exp027025,0,1468
+Exp027026,1,120
+Exp027027,1,145
+Exp027028,0,1471
+Exp027029,1,507
+Exp027030,1,1294
+Exp027031,1,317
+Exp027032,1,235
+Exp027033,0,1186
+Exp027034,1,1204
+Exp027035,0,1253
+Exp027036,1,659
+Exp027037,0,1177
+Exp027038,1,807
+Exp027039,1,238
+Exp027040,1,498
+Exp027041,0,781
+Exp027042,1,497
+Exp027043,1,424
+Exp027044,1,407
+Exp027045,1,1421
+Exp027046,0,1386
+Exp027047,0,1390
+Exp027048,0,1348
+Exp027049,0,716
+Exp027050,0,1250

examplefile/analysistools/Clinical_for_Demo.csv ADDED Viewed

	@@ -0,0 +1,40 @@

+PatientID,status,time
+Exp027012,0,1290
+Exp027013,0,1187
+Exp027014,1,1106
+Exp027015,1,1264
+Exp027016,1,948
+Exp027017,0,1401
+Exp027018,1,961
+Exp027019,0,1867
+Exp027020,1,986
+Exp027021,0,1593
+Exp027022,1,566
+Exp027023,1,1353
+Exp027024,0,1592
+Exp027025,0,1468
+Exp027026,1,120
+Exp027027,1,145
+Exp027028,0,1471
+Exp027029,1,507
+Exp027030,1,1294
+Exp027031,1,317
+Exp027032,1,235
+Exp027033,0,1186
+Exp027034,1,1204
+Exp027035,0,1253
+Exp027036,1,659
+Exp027037,0,1177
+Exp027038,1,807
+Exp027039,1,238
+Exp027040,1,498
+Exp027041,0,781
+Exp027042,1,497
+Exp027043,1,424
+Exp027044,1,407
+Exp027045,1,1421
+Exp027046,0,1386
+Exp027047,0,1390
+Exp027048,0,1348
+Exp027049,0,716
+Exp027050,0,1250

examplefile/analysistools/Clinical_for_Pre.csv ADDED Viewed

	@@ -0,0 +1,10 @@

+PatientID,status,time
+Exp027015,1,1264
+Exp027016,1,948
+Exp027017,0,1401
+Exp027031,1,317
+Exp027032,1,235
+Exp027033,0,1186
+Exp027046,0,1386
+Exp027047,0,1390
+Exp027048,0,1348

examplefile/analysistools/Clinicaltest.csv ADDED Viewed

	@@ -0,0 +1,6 @@

+PatientID,status,time
+Exp027012,0,1290
+Exp027020,1,986
+Exp027028,0,1471
+Exp027036,1,659
+Exp027044,1,407

examplefile/analysistools/PreNormBasedProSummary.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/analysistools/phosphorylation_exp_design_info.txt ADDED Viewed

	@@ -0,0 +1,40 @@

+Experiment_Code	Group	Description
+Exp027012	0	ctr_0h_R1_IMAC_1.raw
+Exp027013	0	ctr_0h_R1_IMAC_2.raw
+Exp027014	0	ctr_0h_R1_IMAC_3.raw
+Exp027015	0	ctr_0h_R2_IMAC_1.raw
+Exp027016	0	ctr_0h_R2_IMAC_2.raw
+Exp027017	0	ctr_0h_R2_IMAC_3.raw
+Exp027018	0	ctr_0h_R3_IMAC_1.raw
+Exp027019	0	ctr_0h_R3_IMAC_2.raw
+Exp027020	2	PLX_2h_R1_IMAC_1.raw
+Exp027021	2	PLX_2h_R1_IMAC_2.raw
+Exp027022	2	PLX_2h_R1_IMAC_3.raw
+Exp027023	2	PLX_2h_R2_IMAC_2.raw
+Exp027024	2	PLX_2h_R2_IMAC_3.raw
+Exp027025	2	PLX_2h_R3_IMAC_1.raw
+Exp027026	2	PLX_2h_R3_IMAC_2.raw
+Exp027027	2	PLX_2h_R3_IMAC_3.raw
+Exp027028	6	PLX_6h_R1_IMAC_1.raw
+Exp027029	6	PLX_6h_R1_IMAC_2.raw
+Exp027030	6	PLX_6h_R1_IMAC_3.raw
+Exp027031	6	PLX_6h_R2_IMAC_1.raw
+Exp027032	6	PLX_6h_R2_IMAC_2.raw
+Exp027033	6	PLX_6h_R2_IMAC_3.raw
+Exp027034	6	PLX_6h_R3_IMAC_1.raw
+Exp027035	6	PLX_6h_R3_IMAC_2.raw
+Exp027036	24	PLX_24h_R1_IMAC_1.raw
+Exp027037	24	PLX_24h_R1_IMAC_2.raw
+Exp027038	24	PLX_24h_R1_IMAC_3.raw
+Exp027039	24	PLX_24h_R2_IMAC_1.raw
+Exp027040	24	PLX_24h_R2_IMAC_2.raw
+Exp027041	24	PLX_24h_R2_IMAC_3.raw
+Exp027042	24	PLX_24h_R3_IMAC_1.raw
+Exp027043	24	PLX_24h_R3_IMAC_3.raw
+Exp027044	48	PLX_48h_R1_IMAC_2.raw
+Exp027045	48	PLX_48h_R1_IMAC_3.raw
+Exp027046	48	PLX_48h_R2_IMAC_1.raw
+Exp027047	48	PLX_48h_R2_IMAC_2.raw
+Exp027048	48	PLX_48h_R2_IMAC_3.raw
+Exp027049	48	PLX_48h_R3_IMAC_1.raw
+Exp027050	48	PLX_48h_R3_IMAC_2.raw

examplefile/data_frame_normalization_with_control_no_pair.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/download/anaysis_demo.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:23bba0455c82f9d839711c3239ef883b8e86a45d20dd5ab18758ab4e19bc8b02
+size 407517

examplefile/download/mascot_xml.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e52baf8a2cb215e2c42e8470f29382a0ca5ce7ed5f19c4104d2d16c557b87c9
+size 21818471

examplefile/download/motif_kinase_relation.xlsx ADDED Viewed

Binary file (40.8 kB). View file

examplefile/download/phosphorylation_peptide_txt.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aebf94fc6d5de4b116fbeb89856cbed50a34bf37d81e92dbce12d61cb60a53ee
+size 3944372

examplefile/download/profiling_gene_txt.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e35cbdc0f2bbb77e85a421ec390f3a7e105ba86ab66e498561b7e802c86908c5
+size 1384071

examplefile/mascot/phosphorylation_exp_design_info.txt ADDED Viewed

	@@ -0,0 +1,10 @@

+Experiment_Code	Group	Description
+Exp027015	0	ctr_0h_R2_IMAC_1.raw
+Exp027016	0	ctr_0h_R2_IMAC_2.raw
+Exp027017	0	ctr_0h_R2_IMAC_3.raw
+Exp027031	6	PLX_6h_R2_IMAC_1.raw
+Exp027032	6	PLX_6h_R2_IMAC_2.raw
+Exp027033	6	PLX_6h_R2_IMAC_3.raw
+Exp027046	48	PLX_48h_R2_IMAC_1.raw
+Exp027047	48	PLX_48h_R2_IMAC_2.raw
+Exp027048	48	PLX_48h_R2_IMAC_3.raw

examplefile/mascot/phosphorylation_peptide_txt/Exp027015_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027016_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027017_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027031_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027032_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027033_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027046_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027047_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/phosphorylation_peptide_txt/Exp027048_peptide.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/profiling_exp_design_info.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+Experiment_Code	Group	Description
+Exp026982	0	ctr_0h_R2_injection_1.raw
+Exp026983	0	ctr_0h_R2_injection_2.raw
+Exp026995	6	PLX_6h_R2_injection_1.raw
+Exp026996	6	PLX_6h_R2_injection_2.raw
+Exp027008	48	PLX_48h_R2_injection_1.raw
+Exp027009	48	PLX_48h_R2_injection_4.raw

examplefile/mascot/profiling_gene_txt/Exp026982_gene.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/profiling_gene_txt/Exp026983_gene.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/profiling_gene_txt/Exp026995_gene.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/profiling_gene_txt/Exp026996_gene.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/profiling_gene_txt/Exp027008_gene.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/mascot/profiling_gene_txt/Exp027009_gene.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/maxquant/Phospho (STY)Sites.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/maxquant/phosphorylation_exp_design_info.txt ADDED Viewed

	@@ -0,0 +1,10 @@

+Experiment_Code	Group	Description
+Exp027015	0	ctr_0h_R2_IMAC_1.raw
+Exp027016	0	ctr_0h_R2_IMAC_2.raw
+Exp027017	0	ctr_0h_R2_IMAC_3.raw
+Exp027031	6	PLX_6h_R2_IMAC_1.raw
+Exp027032	6	PLX_6h_R2_IMAC_2.raw
+Exp027033	6	PLX_6h_R2_IMAC_3.raw
+Exp027046	48	PLX_48h_R2_IMAC_1.raw
+Exp027047	48	PLX_48h_R2_IMAC_2.raw
+Exp027048	48	PLX_48h_R2_IMAC_3.raw

examplefile/maxquant/profiling_exp_design_info.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+Experiment_Code	Group	Description
+Exp026982	0	ctr_0h_R2_injection_1.raw
+Exp026983	0	ctr_0h_R2_injection_2.raw
+Exp026995	6	PLX_6h_R2_injection_1.raw
+Exp026996	6	PLX_6h_R2_injection_2.raw
+Exp027008	48	PLX_48h_R2_injection_1.raw
+Exp027009	48	PLX_48h_R2_injection_4.raw

examplefile/maxquant/proteinGroups.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/motifanalysis.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

examplefile/phosphorylation_exp_design_info.txt ADDED Viewed

	@@ -0,0 +1,40 @@

+Experiment_Code	Group	Description
+Exp027012	0	ctr_0h_R1_IMAC_1.raw
+Exp027013	0	ctr_0h_R1_IMAC_2.raw
+Exp027014	0	ctr_0h_R1_IMAC_3.raw
+Exp027015	0	ctr_0h_R2_IMAC_1.raw
+Exp027016	0	ctr_0h_R2_IMAC_2.raw
+Exp027017	0	ctr_0h_R2_IMAC_3.raw
+Exp027018	0	ctr_0h_R3_IMAC_1.raw
+Exp027019	0	ctr_0h_R3_IMAC_2.raw
+Exp027020	2	PLX_2h_R1_IMAC_1.raw
+Exp027021	2	PLX_2h_R1_IMAC_2.raw
+Exp027022	2	PLX_2h_R1_IMAC_3.raw
+Exp027023	2	PLX_2h_R2_IMAC_2.raw
+Exp027024	2	PLX_2h_R2_IMAC_3.raw
+Exp027025	2	PLX_2h_R3_IMAC_1.raw
+Exp027026	2	PLX_2h_R3_IMAC_2.raw
+Exp027027	2	PLX_2h_R3_IMAC_3.raw
+Exp027028	6	PLX_6h_R1_IMAC_1.raw
+Exp027029	6	PLX_6h_R1_IMAC_2.raw
+Exp027030	6	PLX_6h_R1_IMAC_3.raw
+Exp027031	6	PLX_6h_R2_IMAC_1.raw
+Exp027032	6	PLX_6h_R2_IMAC_2.raw
+Exp027033	6	PLX_6h_R2_IMAC_3.raw
+Exp027034	6	PLX_6h_R3_IMAC_1.raw
+Exp027035	6	PLX_6h_R3_IMAC_2.raw
+Exp027036	24	PLX_24h_R1_IMAC_1.raw
+Exp027037	24	PLX_24h_R1_IMAC_2.raw
+Exp027038	24	PLX_24h_R1_IMAC_3.raw
+Exp027039	24	PLX_24h_R2_IMAC_1.raw
+Exp027040	24	PLX_24h_R2_IMAC_2.raw
+Exp027041	24	PLX_24h_R2_IMAC_3.raw
+Exp027042	24	PLX_24h_R3_IMAC_1.raw
+Exp027043	24	PLX_24h_R3_IMAC_3.raw
+Exp027044	48	PLX_48h_R1_IMAC_2.raw
+Exp027045	48	PLX_48h_R1_IMAC_3.raw
+Exp027046	48	PLX_48h_R2_IMAC_1.raw
+Exp027047	48	PLX_48h_R2_IMAC_2.raw
+Exp027048	48	PLX_48h_R2_IMAC_3.raw
+Exp027049	48	PLX_48h_R3_IMAC_1.raw
+Exp027050	48	PLX_48h_R3_IMAC_2.raw

examplefile/root/mascot/mascot_xml/Exp027015/Exp027015_F1_R1.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bbe17096e89e287b9984b93499f376f814bb9b263d4ae3128fe3c13c40d4df26
+size 42212493

examplefile/root/mascot/mascot_xml/Exp027016/Exp027016_F1_R1.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b81689b2f7d4e3e41f1a4edd9ed80b01f7a29901b7d745601be70aa15611a825
+size 38644883

examplefile/root/mascot/mascot_xml/Exp027017/Exp027017_F1_R1.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5cbcc19156bbb4f0e2a92c5dca4fc2d5d01d4ac6c0d210ee28639b2d559b252
+size 39234041