Rows: 1,152
Columns: 27
Groups: disease [3]
$ primary_diagnosis <chr> "C34.1", "C34.1", "C34.3", "C34.1", "C34.1…
$ tumor_stage <chr> "stage ia", "stage ib", "stage ib", "stage…
$ age_at_diagnosis <dbl> 24477, 26615, 28171, 27154, 23370, 19025, …
$ vital_status <fct> dead, dead, dead, alive, alive, dead, dead…
$ morphology <chr> "8070/3", "8070/3", "8070/3", "8083/3", "8…
$ days_to_death <dbl> 371, 136, 2304, NA, NA, 345, 716, 2803, 97…
$ state <chr> "live", "live", "live", "live", "live", "l…
$ tissue_or_organ_of_origin <chr> "C34.1", "C34.1", "C34.3", "C34.1", "C34.1…
$ days_to_birth <dbl> -24477, -26615, -28171, -27154, -23370, -1…
$ site_of_resection_or_biopsy <chr> "C34.1", "C34.1", "C34.3", "C34.1", "C34.1…
$ days_to_last_follow_up <dbl> NA, NA, 2099, 3747, 3576, NA, NA, 1810, 95…
$ cigarettes_per_day <dbl> 10.9589041, 2.1917808, 1.6438356, 1.095890…
$ years_smoked <dbl> NA, NA, NA, NA, NA, NA, NA, NA, NA, 26, NA…
$ gender <fct> male, male, female, male, female, male, ma…
$ year_of_birth <dbl> 1936, 1931, 1927, 1930, 1942, 1953, 1932, …
$ race <chr> "white", "asian", "white", "white", "not r…
$ ethnicity <chr> "not hispanic or latino", "not hispanic or…
$ year_of_death <dbl> 2004, 2003, NA, NA, NA, 2005, 2006, NA, NA…
$ bcr_patient_barcode <chr> "TCGA-18-3406", "TCGA-18-3407", "TCGA-18-3…
$ disease <chr> "LUSC", "LUSC", "LUSC", "LUSC", "LUSC", "L…
$ alive <lgl> FALSE, FALSE, FALSE, TRUE, TRUE, FALSE, FA…
$ alive2 <dbl> 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, …
$ cigarettes_total <dbl> 268241.10, 58334.25, 46308.49, 29757.81, 6…
$ cigarettes_high <dbl> 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, …
$ disease_fac <fct> LUSC, LUSC, LUSC, LUSC, LUSC, LUSC, LUSC, …
$ days_to_last_follow_up2 <dbl> 0, 0, 2099, 3747, 3576, 0, 0, 1810, 956, 7…
$ stage_category <chr> "i", "i", "i", "i", "other", "i", "other",…