[1] "libdir: /xchip/tcga/gdac_prod/applications/process_mgmt/firehose_task_registry/tcga-gdac/ClinicalAnalysisAllGenes_new/broadinstitute.org/cancer.genome.analysis/00333/74/"
[1] "op: MUTATION_RATE"
[1] "dfn: /xchip/cga/gdac-prod/tcga-gdac/jobResults/MutSigRun/THCA-TP/22985931/THCA-TP.patients.counts_and_rates.txt"
[1] "cfn: /xchip/cga/gdac-prod/tcga-gdac/jobResults/Append_Data/THCA-TP/22507188/THCA-TP.merged_data.txt"
[1] "gv: ALL"
[1] "gfn: "
[1] "sfn: "
[1] "fv: ALL"
[1] "ofn: "
[1] "dx: "
[1] "cfn"
[1] "/xchip/cga/gdac-prod/tcga-gdac/jobResults/Append_Data/THCA-TP/22507188/THCA-TP.merged_data.txt"
[1] "ok3"

nSamples in clinical file=503, in expression file=496, common to both=492
Number of genes in original expression dataset=2
[1] "ALL"
[1] "data2feature, selection=ALL"
 [1] "YEARS_TO_BIRTH"                      
 [2] "VITAL_STATUS"                        
 [3] "DAYS_TO_DEATH"                       
 [4] "DAYS_TO_LAST_FOLLOWUP"               
 [5] "TUMOR_TISSUE_SITE"                   
 [6] "PATHOLOGIC_STAGE"                    
 [7] "PATHOLOGY_T_STAGE"                   
 [8] "PATHOLOGY_N_STAGE"                   
 [9] "PATHOLOGY_M_STAGE"                   
[10] "GENDER"                              
[11] "DATE_OF_INITIAL_PATHOLOGIC_DIAGNOSIS"
[12] "RADIATION_THERAPY"                   
[13] "HISTOLOGICAL_TYPE"                   
[14] "RADIATION_EXPOSURE"                  
[15] "EXTRATHYROIDAL_EXTENSION"            
[16] "RESIDUAL_TUMOR"                      
[17] "NUMBER_OF_LYMPH_NODES"               
[18] "MULTIFOCALITY"                       
[19] "TUMOR_SIZE"                          
[20] "RACE"                                
[21] "ETHNICITY"                           

Input Data has 21 rows and 492 columns.

[1] "Last Follow UP"
Variable 1:'YEARS_TO_BIRTH':	nDistinctValues=72,	numeric=TRUE,	binary=FALSE,	exclude=FALSE.
Variable 2:'VITAL_STATUS':	nDistinctValues=2,	numeric=TRUE,	binary=TRUE,	exclude=FALSE.
Variable 3:'DAYS_TO_DEATH':	nDistinctValues=14,	numeric=TRUE,	binary=FALSE,	exclude=TRUE.
[1] "exclude grep('DAYS_?TO', vnms) to deal with survival parameters seperately"
Variable 4:'DAYS_TO_LAST_FOLLOWUP':	nDistinctValues=431,	numeric=TRUE,	binary=FALSE,	exclude=TRUE.
[1] "exclude grep('FOLLOWUP', vnms) to deal with survival parameters seperately"
Variable 5:'TUMOR_TISSUE_SITE':	nDistinctValues=1,	numeric=FALSE,	binary=FALSE,	exclude=TRUE.
[1] "TUMOR_TISSUE_SITE is excluded in the analysis because there is no more than two cases of (unique non-NA values)"
Variable 6:'PATHOLOGIC_STAGE':	nDistinctValues=6,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 7:'PATHOLOGY_T_STAGE':	nDistinctValues=8,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 8:'PATHOLOGY_N_STAGE':	nDistinctValues=5,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 9:'PATHOLOGY_M_STAGE':	nDistinctValues=3,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 10:'GENDER':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 11:'DATE_OF_INITIAL_PATHOLOGIC_DIAGNOSIS':	nDistinctValues=19,	numeric=TRUE,	binary=FALSE,	exclude=TRUE.
[1] "exclude grep('DATE', vnms) to deal with survival parameters seperately"
Variable 12:'RADIATION_THERAPY':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 13:'HISTOLOGICAL_TYPE':	nDistinctValues=4,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 14:'RADIATION_EXPOSURE':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 15:'EXTRATHYROIDAL_EXTENSION':	nDistinctValues=4,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 16:'RESIDUAL_TUMOR':	nDistinctValues=4,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 17:'NUMBER_OF_LYMPH_NODES':	nDistinctValues=29,	numeric=TRUE,	binary=FALSE,	exclude=FALSE.
Variable 18:'MULTIFOCALITY':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 19:'TUMOR_SIZE':	nDistinctValues=61,	numeric=TRUE,	binary=FALSE,	exclude=FALSE.
Variable 20:'RACE':	nDistinctValues=4,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
Variable 21:'ETHNICITY':	nDistinctValues=2,	numeric=FALSE,	binary=FALSE,	exclude=FALSE.
[1] "## **** detect survival parameters (defined in index such as ind_OS, ind_MFS, ind_RFS, ind_RFS, ind_BCR and ind_d2ssd) *** ##"
[1] "detected survival parameters using [ind_OS, overall_survival]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_OS, curated_overall_survival]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_TCGAOS]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survivial parameters using [ind_MFS]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_RFS]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_BCR]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [ind_Progression]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using [index_additional_survival_time]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "detected survival parameters using condition: [is.null(surv.mat)&&(selection=='SURV')]"
[1] "survival parameters accumulated so far"
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "************ conversion from categorical data to rank data ********** "
[1] "PATHOLOGY_T_STAGE is converted to numeric rank data using modified categoies"
[1] "PATHOLOGY_N_STAGE is converted to numeric rank data using modified categoies"
[1] "PATHOLOGY_M_STAGE is converted to rank data using modified categoies"
[1] "****** SUMMARY ***** "
Output Data has 492 columns, 1 survival variables, and 16 non-survival variables.
[1] "* survival variables: "
[1] "DAYS_TO_DEATH_OR_LAST_FUP" "VITAL_STATUS"             
[1] "* non-survival variables: "
 [1] "YEARS_TO_BIRTH"           "PATHOLOGIC_STAGE"        
 [3] "PATHOLOGY_T_STAGE"        "PATHOLOGY_N_STAGE"       
 [5] "PATHOLOGY_M_STAGE"        "GENDER"                  
 [7] "RADIATION_THERAPY"        "HISTOLOGICAL_TYPE"       
 [9] "RADIATION_EXPOSURE"       "EXTRATHYROIDAL_EXTENSION"
[11] "RESIDUAL_TUMOR"           "NUMBER_OF_LYMPH_NODES"   
[13] "MULTIFOCALITY"            "TUMOR_SIZE"              
[15] "RACE"                     "ETHNICITY"               
[1] "changed to 17 non-survival variables adding another age variable for linear regression analysis on mutaion rate."
[1] "DAYS_TO_DEATH_OR_LAST_FUP"
[1] "DAYS_TO_DEATH_OR_LAST_FUP"
[1] "D"                         "DAYS_TO_DEATH_OR_LAST_FUP"
[3] "Month"                    
[1] "check if there is any case_to_report in survival time data or not"
[1] "alarming case(s) exist!"
[1] "[  1  ] case_to_report(s) is(are) excluded in survival analysis"
AGE, nv=72, binary=FALSE, numeric=TRUE
AGE_mutation.rate, nv=72, binary=FALSE, numeric=TRUE
$MUTATIONRATE_NONSYNONYMOUS

Call:
lm(formula = as.numeric(i) ~ vv)

Residuals:
       Min         1Q     Median         3Q        Max 
-5.304e-07 -1.457e-07 -3.570e-08  9.585e-08  1.424e-06 

Coefficients:
             Estimate Std. Error t value Pr(>|t|)    
(Intercept) 5.717e-08  3.405e-08   1.679   0.0937 .  
vv          6.998e-09  6.841e-10  10.230   <2e-16 ***
---
Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1 

Residual standard error: 2.381e-07 on 490 degrees of freedom
Multiple R-squared: 0.176,	Adjusted R-squared: 0.1743 
F-statistic: 104.6 on 1 and 490 DF,  p-value: < 2.2e-16 


$MUTATIONRATE_SILENT

Call:
lm(formula = as.numeric(i) ~ vv)

Residuals:
       Min         1Q     Median         3Q        Max 
-2.235e-07 -6.251e-08 -1.827e-08  4.376e-08  6.981e-07 

Coefficients:
             Estimate Std. Error t value Pr(>|t|)    
(Intercept) 4.329e-09  1.393e-08   0.311    0.756    
vv          2.520e-09  2.800e-10   8.999   <2e-16 ***
---
Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1 

Residual standard error: 9.745e-08 on 490 degrees of freedom
Multiple R-squared: 0.1418,	Adjusted R-squared: 0.1401 
F-statistic: 80.99 on 1 and 490 DF,  p-value: < 2.2e-16 


PATHOLOGIC_STAGE, nv=6, binary=FALSE, numeric=FALSE
PATHOLOGY_T_STAGE, nv=4, binary=FALSE, numeric=TRUE
[1] "PATHOLOGY_T_STAGE"
[1] "num to class table"
vv1
 T1  T2  T3  T4 
141 162 164  23 
PATHOLOGY_N_STAGE, nv=2, binary=FALSE, numeric=TRUE
PATHOLOGY_M_STAGE, nv=2, binary=FALSE, numeric=TRUE
GENDER, nv=2, binary=FALSE, numeric=FALSE
RADIATION_THERAPY, nv=2, binary=FALSE, numeric=FALSE
HISTOLOGICAL_TYPE, nv=4, binary=FALSE, numeric=FALSE
RADIATION_EXPOSURE, nv=2, binary=FALSE, numeric=FALSE
EXTRATHYROIDAL_EXTENSION, nv=4, binary=FALSE, numeric=FALSE
RESIDUAL_TUMOR, nv=4, binary=FALSE, numeric=FALSE
NUMBER_OF_LYMPH_NODES, nv=29, binary=FALSE, numeric=TRUE
MULTIFOCALITY, nv=2, binary=FALSE, numeric=FALSE
TUMOR_SIZE, nv=61, binary=FALSE, numeric=TRUE
RACE, nv=4, binary=FALSE, numeric=FALSE
ETHNICITY, nv=2, binary=FALSE, numeric=FALSE
[1] "saved param, results, example.expr in analysis.result.Rdata "
