[1] "libdir: /xchip/tcga/gdac_prod/applications/process_mgmt/firehose_task_registry/tcga-gdac/ClinicalAnalysisAllGenes_new/broadinstitute.org/cancer.genome.analysis/00333/69/"
[1] "op: MUTATION_RATE"
[1] "dfn: /xchip/cga/gdac-prod/tcga-gdac/jobResults/MutSigRun/LUAD-TP/20177982/iteration1/LUAD-TP.patients.counts_and_rates.txt"
[1] "cfn: /xchip/cga/gdac-prod/tcga-gdac/jobResults/Append_Data/LUAD-TP/19775350/LUAD-TP.merged_data.txt"
[1] "gv: ALL"
[1] "gfn: "
[1] "sfn: "
[1] "fv: ALL"
[1] "ofn: "
[1] "dx: "
[1] "cfn"
[1] "/xchip/cga/gdac-prod/tcga-gdac/jobResults/Append_Data/LUAD-TP/19775350/LUAD-TP.merged_data.txt"
[1] "ok3"

nSamples in clinical file=521, in expression file=545, common to both=492
Number of genes in original expression dataset=2
[1] "ALL"
[1] "data2feature, selection=ALL"
 [1] "YEARS_TO_BIRTH"                      
 [2] "VITAL_STATUS"                        
 [3] "DAYS_TO_DEATH"                       
 [4] "DAYS_TO_LAST_FOLLOWUP"               
 [5] "TUMOR_TISSUE_SITE"                   
 [6] "PATHOLOGIC_STAGE"                    
 [7] "PATHOLOGY_T_STAGE"                   
 [8] "PATHOLOGY_N_STAGE"                   
 [9] "PATHOLOGY_M_STAGE"                   
[10] "GENDER"                              
[11] "DATE_OF_INITIAL_PATHOLOGIC_DIAGNOSIS"
[12] "DAYS_TO_LAST_KNOWN_ALIVE"            
[13] "RADIATION_THERAPY"                   
[14] "KARNOFSKY_PERFORMANCE_SCORE"         
[15] "HISTOLOGICAL_TYPE"                   
[16] "NUMBER_PACK_YEARS_SMOKED"            
[17] "YEAR_OF_TOBACCO_SMOKING_ONSET"       
[18] "RESIDUAL_TUMOR"                      
[19] "RACE"                                
[20] "ETHNICITY"                           

Input Data has 20 rows and 492 columns.

[1] "Last Follow UP"
Variable 1:'YEARS_TO_BIRTH':	nDistinctValues=50,	numeric=TRUE,	binary=FALSE,	exclude=FALSE.
Variable 2:'VITAL_STATUS':	nDistinctValues=2,	numeric=TRUE,	binary=TRUE,	exclude=FALSE.
Variable 3:'DAYS_TO_DEATH':	nDistinctValues=150,	numeric=TRUE,	binary=FALSE,	exclude=TRUE.
[1] "exclude grep('DAYS_?TO', vnms) to deal with survival parameters seperately"
Variable 4:'DAYS_TO_LAST_FOLLOWUP':	nDistinctValues=311,	numeric=TRUE,	binary=FALSE,	exclude=TRUE.
[1] "exclude grep('FOLLOWUP', vnms) to deal with survival parameters seperately"
Variable 5:'TUMOR_TISSUE_SITE':	nDistinctValues=1,	numeric=FALSE,	binary=FALSE,	exclude=TRUE.
[1] "TUMOR_TISSUE_SITE is excluded in the analysis because there is no more than two cases of (unique non-NA values)"
Variable 6:'PATHOLOGIC_STAGE':	nDistinctValues=8,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 7:'PATHOLOGY_T_STAGE':	nDistinctValues=9,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 8:'PATHOLOGY_N_STAGE':	nDistinctValues=5,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 9:'PATHOLOGY_M_STAGE':	nDistinctValues=5,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 10:'GENDER':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 11:'DATE_OF_INITIAL_PATHOLOGIC_DIAGNOSIS':	nDistinctValues=22,	numeric=TRUE,	binary=FALSE,	exclude=TRUE.
[1] "exclude grep('DATE', vnms) to deal with survival parameters seperately"
Variable 12:'DAYS_TO_LAST_KNOWN_ALIVE':	nDistinctValues=23,	numeric=TRUE,	binary=FALSE,	exclude=TRUE.
[1] "exclude grep('DAYS_?TO', vnms) to deal with survival parameters seperately"
Variable 13:'RADIATION_THERAPY':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 14:'KARNOFSKY_PERFORMANCE_SCORE':	nDistinctValues=9,	numeric=TRUE,	binary=FALSE,	exclude=FALSE.
Variable 15:'HISTOLOGICAL_TYPE':	nDistinctValues=11,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 16:'NUMBER_PACK_YEARS_SMOKED':	nDistinctValues=91,	numeric=TRUE,	binary=FALSE,	exclude=FALSE.
Variable 17:'YEAR_OF_TOBACCO_SMOKING_ONSET':	nDistinctValues=57,	numeric=TRUE,	binary=FALSE,	exclude=FALSE.
Variable 18:'RESIDUAL_TUMOR':	nDistinctValues=4,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 19:'RACE':	nDistinctValues=4,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 20:'ETHNICITY':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
[1] "## **** detect survival parameters (defined in index such as ind_OS, ind_MFS, ind_RFS, ind_RFS, ind_BCR and ind_d2ssd) *** ##"
[1] "detected survival parameters using [ind_OS, overall_survival]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_OS, curated_overall_survival]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_TCGAOS]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survivial parameters using [ind_MFS]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_RFS]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_BCR]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_Progression]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [index_additional_survival_time]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using condition: [is.null(surv.mat)&&(selection=='SURV')]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "************ conversion from categorical data to rank data ********** "
[1] "PATHOLOGY_T_STAGE is converted to numeric rank data using modified categoies"
[1] "PATHOLOGY_N_STAGE is converted to numeric rank data using modified categoies"
[1] "PATHOLOGY_M_STAGE is converted to rank data using modified categoies"
[1] "****** SUMMARY ***** "
Output Data has 492 columns, 1 survival variables, and 14 non-survival variables.
[1] "* survival variables: "
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "* non-survival variables: "
 [1] "YEARS_TO_BIRTH"                "PATHOLOGIC_STAGE"             
 [3] "PATHOLOGY_T_STAGE"             "PATHOLOGY_N_STAGE"            
 [5] "PATHOLOGY_M_STAGE"             "GENDER"                       
 [7] "RADIATION_THERAPY"             "KARNOFSKY_PERFORMANCE_SCORE"  
 [9] "HISTOLOGICAL_TYPE"             "NUMBER_PACK_YEARS_SMOKED"     
[11] "YEAR_OF_TOBACCO_SMOKING_ONSET" "RESIDUAL_TUMOR"               
[13] "RACE"                          "ETHNICITY"                    
[1] "changed to 15 non-survival variables adding another age variable for linear regression analysis on mutaion rate."
[1] "DAYS_TO_DEATH_OR_LAST_FUP"
[1] "DAYS_TO_DEATH_OR_LAST_FUP"
[1] "D"                         "DAYS_TO_DEATH_OR_LAST_FUP"
[3] "Month"                    
[1] "check if there is any case_to_report in survival time data or not"
[1] "alarming case(s) exist!"
[1] "[  1  ] case_to_report(s) is(are) excluded in survival analysis"
AGE, nv=50, binary=FALSE, numeric=TRUE
AGE_mutation.rate, nv=50, binary=FALSE, numeric=TRUE
$MUTATIONRATE_NONSYNONYMOUS

Call:
lm(formula = as.numeric(i) ~ vv)

Residuals:
       Min         1Q     Median         3Q        Max 
-9.496e-06 -5.328e-06 -2.116e-06  2.712e-06  4.047e-05 

Coefficients:
              Estimate Std. Error t value Pr(>|t|)    
(Intercept)  1.475e-05  2.542e-06   5.802 1.22e-08 ***
vv          -1.028e-07  3.831e-08  -2.684  0.00754 ** 
---
Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1 

Residual standard error: 7.982e-06 on 459 degrees of freedom
  (31 observations deleted due to missingness)
Multiple R-squared: 0.01545,	Adjusted R-squared: 0.0133 
F-statistic: 7.202 on 1 and 459 DF,  p-value: 0.007544 


$MUTATIONRATE_SILENT

Call:
lm(formula = as.numeric(i) ~ vv)

Residuals:
       Min         1Q     Median         3Q        Max 
-2.757e-06 -1.491e-06 -6.320e-07  7.602e-07  9.918e-06 

Coefficients:
              Estimate Std. Error t value Pr(>|t|)    
(Intercept)  4.174e-06  7.109e-07   5.871 8.33e-09 ***
vv          -2.882e-08  1.071e-08  -2.690   0.0074 ** 
---
Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1 

Residual standard error: 2.232e-06 on 459 degrees of freedom
  (31 observations deleted due to missingness)
Multiple R-squared: 0.01552,	Adjusted R-squared: 0.01338 
F-statistic: 7.237 on 1 and 459 DF,  p-value: 0.0074 


PATHOLOGIC_STAGE, nv=8, binary=FALSE, numeric=FALSE
PATHOLOGY_T_STAGE, nv=4, binary=FALSE, numeric=TRUE
[1] "PATHOLOGY_T_STAGE"
[1] "num to class table"
vv1
 T1  T2  T3  T4 
158 270  43  18 
PATHOLOGY_N_STAGE, nv=4, binary=FALSE, numeric=TRUE
[1] "PATHOLOGY_N_STAGE"
[1] "num to class table"
vv1
 N0  N1  N2  N3 
315  91  72   2 
PATHOLOGY_M_STAGE, nv=2, binary=FALSE, numeric=TRUE
GENDER, nv=2, binary=FALSE, numeric=FALSE
RADIATION_THERAPY, nv=2, binary=FALSE, numeric=FALSE
KARNOFSKY_PERFORMANCE_SCORE, nv=9, binary=FALSE, numeric=TRUE
HISTOLOGICAL_TYPE, nv=11, binary=FALSE, numeric=FALSE
NUMBER_PACK_YEARS_SMOKED, nv=91, binary=FALSE, numeric=TRUE
YEAR_OF_TOBACCO_SMOKING_ONSET, nv=57, binary=FALSE, numeric=TRUE
RESIDUAL_TUMOR, nv=4, binary=FALSE, numeric=FALSE
RACE, nv=4, binary=FALSE, numeric=FALSE
ETHNICITY, nv=2, binary=FALSE, numeric=FALSE
[1] "saved param, results, example.expr in analysis.result.Rdata "
