我正试图在泰坦尼克号数据集上运行 SVM,但在调用 predict 函数时遇到了问题。

# Fit an SVM classifier on the training data.
# NOTE(review): svm() is presumably e1071::svm — no library() call is visible
# here, confirm which package provides it.
svm.iceberg <- svm(
  Survived ~ Pclass + Sex + SibSp + Parch + Ticket + Fare + Cabin +
    Embarked + Surname + Age_Range,
  data = train.iceberg
)

# Score the test set with the fitted model.
svm.prediction <- predict(svm.iceberg, newdata = test.iceberg)

我收到以下错误:

Error in names(ret2) <- rowns :'names' attribute [418] must be the same length as the vector [0]

我认为这个错误是因为我把训练集和测试集中某些变量的因子水平设成了相同的(这是我使用的代码):

# Re-encode the high-cardinality factors of the test set with the training
# set's levels so both data frames share identical level sets.
# NOTE: any test value that is not among the training levels becomes NA.
test.iceberg$Name <- factor(
  test.iceberg$Name,
  levels = levels(train.iceberg$Name)
)
test.iceberg$Ticket <- factor(
  test.iceberg$Ticket,
  levels = levels(train.iceberg$Ticket)
)
test.iceberg$Cabin <- factor(
  test.iceberg$Cabin,
  levels = levels(train.iceberg$Cabin)
)
# Surname has to be re-levelled from the test set's own Surname column (not
# Ticket): ticket strings matched against surname levels come out as NA.
test.iceberg$Surname <- factor(
  test.iceberg$Surname,
  levels = levels(train.iceberg$Surname)
)

这是训练集数据框:

str(train.iceberg)
'data.frame':   891 obs. of  14 variables:
 $ PassengerId: int  1 2 3 4 5 6 7 8 9 10 ...
 $ Survived   : int  0 1 1 1 0 0 0 0 1 1 ...
 $ Pclass     : Factor w/ 3 levels "1","2","3": 3 1 3 1 3 3 1 3 3 2 ...
 $ Name       : Factor w/ 891 levels "Abbing, Mr. Anthony",..: 109 191 354 273 16 555 516 625 413 577 ...
 $ Sex        : Factor w/ 2 levels "female","male": 2 1 1 1 2 2 2 2 1 1 ...
 $ Age        : num  22 38 26 35 35 NA 54 2 27 14 ...
 $ SibSp      : int  1 1 0 1 0 0 0 3 0 1 ...
 $ Parch      : int  0 0 0 0 0 0 0 1 2 0 ...
 $ Ticket     : Factor w/ 681 levels "110152","110413",..: 524 597 670 50 473 276 86 396 345 133 ...
 $ Fare       : num  7.25 71.28 7.92 53.1 8.05 ...
 $ Cabin      : Factor w/ 147 levels "A10","A14","A16",..: NA 82 NA 56 NA NA 130 NA NA NA ...
 $ Embarked   : Factor w/ 3 levels "C","Q","S": 3 1 3 3 3 2 3 3 3 1 ...
 $ Surname    : Factor w/ 667 levels "Abbing","Abbott",..: 74 137 252 199 12 410 379 464 293 427 ...
 $ Age_Range  : num  4 4 4 4 4 NA 4 2 4 3 ...

这导致了测试数据框中的大量NA,如下所示:

> str(test.iceberg) #
'data.frame':   418 obs. of  14 variables:
 $ PassengerId: int  892 893 894 895 896 897 898 899 900 901 ...
 $ Survived   : int  NA NA NA NA NA NA NA NA NA NA ...
 $ Pclass     : Factor w/ 3 levels "1","2","3": 3 3 2 3 3 3 3 2 3 3 ...
 $ Name       : Factor w/ 891 levels "Abbing, Mr. Anthony",..: 434 NA NA NA NA NA 178 NA NA NA ...
 $ Sex        : Factor w/ 2 levels "female","male": 2 1 2 2 1 2 1 2 1 2 ...
 $ Age        : num  34 47 62 27 22 14 30 26 18 21 ...
 $ SibSp      : int  0 1 0 0 1 0 0 1 0 2 ...
 $ Parch      : int  0 0 0 0 1 0 0 1 0 0 ...
 $ Ticket     : Factor w/ 681 levels "110152","110413",..: NA NA NA NA 252 NA NA 159 NA 520 ...
 $ Fare       : num  7.83 7 9.69 8.66 12.29 ...
 $ Cabin      : Factor w/ 147 levels "A10","A14","A16",..: NA NA NA NA NA NA NA NA NA NA ...
 $ Embarked   : Factor w/ 3 levels "C","Q","S": 2 3 2 3 3 3 2 3 1 3 ...
 $ Surname    : Factor w/ 667 levels "Abbing","Abbott",..: NA NA NA NA NA NA NA NA NA NA ...
 $ Age_Range  : num  5 6 8 5 5 3 5 5 3 5 ...

以下是数据示例:

# Dump the first 100 training rows (unused factor levels dropped) as a
# reproducible R expression.
dput(droplevels(head(train.iceberg, 100)))

structure(list(PassengerId = 1:100, Survived = c(0L, 1L, 1L, 
1L, 0L, 0L, 0L, 0L, 1L, 1L, 1L, 1L, 0L, 0L, 0L, 1L, 0L, 1L, 0L, 
1L, 0L, 1L, 1L, 1L, 0L, 1L, 0L, 0L, 1L, 0L, 0L, 1L, 1L, 0L, 0L, 
0L, 1L, 0L, 0L, 1L, 0L, 0L, 0L, 1L, 1L, 0L, 0L, 1L, 0L, 0L, 0L, 
0L, 1L, 1L, 0L, 1L, 1L, 0L, 1L, 0L, 0L, 1L, 0L, 0L, 0L, 1L, 1L, 
0L, 1L, 0L, 0L, 0L, 0L, 0L, 1L, 0L, 0L, 0L, 1L, 1L, 0L, 1L, 1L, 
0L, 1L, 1L, 0L, 0L, 1L, 0L, 0L, 0L, 0L, 0L, 0L, 0L, 0L, 1L, 1L, 
0L), Pclass = structure(c(3L, 1L, 3L, 1L, 3L, 3L, 1L, 3L, 3L, 
2L, 3L, 1L, 3L, 3L, 3L, 2L, 3L, 2L, 3L, 3L, 2L, 2L, 3L, 1L, 3L, 
3L, 3L, 1L, 3L, 3L, 1L, 1L, 3L, 2L, 1L, 1L, 3L, 3L, 3L, 3L, 3L, 
2L, 3L, 2L, 3L, 3L, 3L, 3L, 3L, 3L, 3L, 3L, 1L, 2L, 1L, 1L, 2L, 
3L, 2L, 3L, 3L, 1L, 1L, 3L, 1L, 3L, 2L, 3L, 3L, 3L, 2L, 3L, 2L, 
3L, 3L, 3L, 3L, 3L, 2L, 3L, 3L, 3L, 3L, 1L, 2L, 3L, 3L, 3L, 1L, 
3L, 3L, 3L, 1L, 3L, 3L, 3L, 1L, 1L, 2L, 2L), .Label = c("1", 
"2", "3"), class = "factor"), Name = structure(c(12L, 22L, 41L, 
32L, 2L, 61L, 56L, 72L, 48L, 64L, 79L, 11L, 80L, 4L, 95L, 42L, 
75L, 99L, 94L, 55L, 33L, 9L, 58L, 86L, 73L, 7L, 27L, 31L, 70L, 
90L, 92L, 87L, 34L, 98L, 59L, 43L, 54L, 14L, 93L, 65L, 1L, 91L, 
51L, 52L, 24L, 76L, 53L, 69L, 78L, 6L, 74L, 66L, 39L, 28L, 71L, 
100L, 77L, 67L, 97L, 36L, 83L, 45L, 40L, 84L, 89L, 62L, 68L, 
21L, 3L, 50L, 47L, 37L, 44L, 19L, 10L, 60L, 88L, 63L, 13L, 26L, 
96L, 81L, 57L, 15L, 46L, 8L, 29L, 85L, 30L, 16L, 18L, 5L, 17L, 
23L, 20L, 82L, 35L, 38L, 25L, 49L), .Label = c("Ahlin, Mrs. Johan (Johanna Persdotter Larsson)", 
"Allen, Mr. William Henry", "Andersson, Miss. Erna Alexandra", 
"Andersson, Mr. Anders Johan", "Andreasson, Mr. Paul Edvin", 
"Arnold-Franchi, Mrs. Josef (Josefine Franchi)", "Asplund, Mrs. Carl Oscar (Selma Augusta Emilia Johansson)", 
"Backstrom, Mrs. Karl Alfred (Maria Mathilda Gustafsson)", "Beesley, Mr. Lawrence", 
"Bing, Mr. Lee", "Bonnell, Miss. Elizabeth", "Braund, Mr. Owen Harris", 
"Caldwell, Master. Alden Gates", "Cann, Mr. Ernest Charles", 
"Carrau, Mr. Francisco M", "Celotti, Mr. Francesco", "Chaffee, Mr. Herbert Fuller", 
"Christmann, Mr. Emil", "Chronopoulos, Mr. Apostolos", "Coxon, Mr. Daniel", 
"Crease, Mr. Ernest James", "Cumings, Mrs. John Bradley (Florence Briggs Thayer)", 
"Dean, Mr. Bertram Frank", "Devaney, Miss. Margaret Delia", "Doling, Mrs. John T (Ada Julia Bone)", 
"Dowdell, Miss. Elizabeth", "Emir, Mr. Farred Chehab", "Faunthorpe, Mrs. Lizzie (Elizabeth Anne Wilkinson)", 
"Ford, Mr. William Neal", "Fortune, Miss. Mabel Helen", "Fortune, Mr. Charles Alexander", 
"Futrelle, Mrs. Jacques Heath (Lily May Peel)", "Fynney, Mr. Joseph J", 
"Glynn, Miss. Mary Agatha", "Goldschmidt, Mr. George B", "Goodwin, Master. William Frederick", 
"Goodwin, Miss. Lillian Amy", "Greenfield, Mr. William Bertram", 
"Harper, Mrs. Henry Sleeper (Myna Haxtun)", "Harris, Mr. Henry Birkhardt", 
"Heikkinen, Miss. Laina", "Hewlett, Mrs. (Mary D Kingcome) ", 
"Holverson, Mr. Alexander Oskar", "Hood, Mr. Ambrose Jr", "Icard, Miss. Amelie", 
"Ilett, Miss. Bertha", "Jenkin, Mr. Stephen Curnow", "Johnson, Mrs. Oscar W (Elisabeth Vilhelmina Berg)", 
"Kantor, Mr. Sinai", "Kink, Mr. Vincenz", "Kraeff, Mr. Theodor", 
"Laroche, Miss. Simonne Marie Anne Andree", "Lennon, Mr. Denis", 
"Mamee, Mr. Hanna", "Masselmani, Mrs. Fatima", "McCarthy, Mr. Timothy J", 
"McDermott, Miss. Brigdet Delia", "McGowan, Miss. Anna \"Annie\"", 
"Meyer, Mr. Edgar Joseph", "Moen, Mr. Sigurd Hansen", "Moran, Mr. James", 
"Moubarek, Master. Gerios", "Moutal, Mr. Rahamin Haim", "Nasser, Mrs. Nicholas (Adele Achem)", 
"Nicola-Yarred, Miss. Jamila", "Nosworthy, Mr. Richard Cater", 
"Novel, Mr. Mansouer", "Nye, Mrs. (Elizabeth Ramell)", "O'Driscoll, Miss. Bridget", 
"O'Dwyer, Miss. Ellen \"Nellie\"", "Ostby, Mr. Engelhart Cornelius", 
"Palsson, Master. Gosta Leonard", "Palsson, Miss. Torborg Danira", 
"Panula, Master. Juha Niilo", "Rice, Master. Eugene", "Rogers, Mr. William John", 
"Rugg, Miss. Emily", "Samaan, Mr. Youssef", "Sandstrom, Miss. Marguerite Rut", 
"Saundercock, Mr. William Henry", "Sheerlinck, Mr. Jan Baptist", 
"Shorney, Mr. Charles Joseph", "Sirayanian, Mr. Orsen", "Skoog, Master. Harald", 
"Slocovski, Mr. Selman Francis", "Sloper, Mr. William Thompson", 
"Spencer, Mrs. William Augustus (Marie Eugenie)", "Staneff, Mr. Ivan", 
"Stewart, Mr. Albert A", "Todoroff, Mr. Lalio", "Turpin, Mrs. William John Robert (Dorothy Ann Wonnacott)", 
"Uruchurtu, Don. Manuel E", "Vander Planke, Miss. Augusta Maria", 
"Vander Planke, Mrs. Julius (Emelia Maria Vandemoortele)", "Vestrom, Miss. Hulda Amanda Adolfina", 
"Waelens, Mr. Achille", "West, Miss. Constance Mirium", "Wheadon, Mr. Edward H", 
"Williams, Mr. Charles Eugene", "Woolner, Mr. Hugh"), class = "factor"), 
    Sex = structure(c(2L, 1L, 1L, 1L, 2L, 2L, 2L, 2L, 1L, 1L, 
    1L, 1L, 2L, 2L, 1L, 1L, 2L, 2L, 1L, 1L, 2L, 2L, 1L, 2L, 1L, 
    1L, 2L, 2L, 1L, 2L, 2L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 1L, 1L, 
    1L, 1L, 2L, 1L, 1L, 2L, 2L, 1L, 2L, 1L, 2L, 2L, 1L, 1L, 2L, 
    2L, 1L, 2L, 1L, 2L, 2L, 1L, 2L, 2L, 2L, 2L, 1L, 2L, 1L, 2L, 
    2L, 1L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 1L, 2L, 2L, 1L, 2L, 1L, 
    1L, 2L, 2L, 1L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 1L, 2L
    ), .Label = c("female", "male"), class = "factor"), Age = c(22, 
    38, 26, 35, 35, NA, 54, 2, 27, 14, 4, 58, 20, 39, 14, 55, 
    2, NA, 31, NA, 35, 34, 15, 28, 8, 38, NA, 19, NA, NA, 40, 
    NA, NA, 66, 28, 42, NA, 21, 18, 14, 40, 27, NA, 3, 19, NA, 
    NA, NA, NA, 18, 7, 21, 49, 29, 65, NA, 21, 28, 5, 11, 22, 
    38, 45, 4, NA, NA, 29, 19, 17, 26, 32, 16, 21, 26, 32, 25, 
    NA, NA, 1, 30, 22, 29, NA, 28, 17, 33, 16, NA, 23, 24, 29, 
    20, 46, 26, 59, NA, 71, 23, 34, 34), SibSp = c(1L, 1L, 0L, 
    1L, 0L, 0L, 0L, 3L, 0L, 1L, 1L, 0L, 0L, 1L, 0L, 0L, 4L, 0L, 
    1L, 0L, 0L, 0L, 0L, 0L, 3L, 1L, 0L, 3L, 0L, 0L, 0L, 1L, 0L, 
    0L, 1L, 1L, 0L, 0L, 2L, 1L, 1L, 1L, 0L, 1L, 0L, 0L, 1L, 0L, 
    2L, 1L, 4L, 0L, 1L, 1L, 0L, 0L, 0L, 0L, 1L, 5L, 0L, 0L, 1L, 
    3L, 0L, 1L, 0L, 0L, 4L, 2L, 0L, 5L, 0L, 1L, 0L, 0L, 0L, 0L, 
    0L, 0L, 0L, 0L, 0L, 0L, 0L, 3L, 1L, 0L, 3L, 0L, 0L, 0L, 1L, 
    1L, 0L, 0L, 0L, 0L, 0L, 1L), Parch = c(0L, 0L, 0L, 0L, 0L, 
    0L, 0L, 1L, 2L, 0L, 1L, 0L, 0L, 5L, 0L, 0L, 1L, 0L, 0L, 0L, 
    0L, 0L, 0L, 0L, 1L, 5L, 0L, 2L, 0L, 0L, 0L, 0L, 0L, 0L, 0L, 
    0L, 0L, 0L, 0L, 0L, 0L, 0L, 0L, 2L, 0L, 0L, 0L, 0L, 0L, 0L, 
    1L, 0L, 0L, 0L, 1L, 0L, 0L, 0L, 2L, 2L, 0L, 0L, 0L, 2L, 0L, 
    1L, 0L, 0L, 2L, 0L, 0L, 2L, 0L, 0L, 0L, 0L, 0L, 0L, 2L, 0L, 
    0L, 0L, 0L, 0L, 0L, 0L, 3L, 0L, 2L, 0L, 0L, 0L, 0L, 2L, 0L, 
    0L, 0L, 1L, 1L, 0L), Ticket = structure(c(71L, 82L, 95L, 
    7L, 64L, 36L, 11L, 58L, 52L, 15L, 88L, 4L, 72L, 49L, 59L, 
    20L, 67L, 18L, 44L, 23L, 16L, 19L, 37L, 5L, 58L, 48L, 22L, 
    13L, 40L, 55L, 83L, 80L, 41L, 74L, 84L, 6L, 28L, 69L, 45L, 
    24L, 68L, 8L, 57L, 92L, 39L, 89L, 63L, 9L, 26L, 56L, 34L, 
    70L, 81L, 31L, 2L, 12L, 76L, 30L, 78L, 79L, 27L, 3L, 62L, 
    50L, 85L, 25L, 75L, 91L, 33L, 35L, 77L, 79L, 90L, 29L, 10L, 
    53L, 54L, 65L, 21L, 61L, 46L, 47L, 38L, 1L, 93L, 32L, 96L, 
    94L, 13L, 42L, 43L, 51L, 97L, 73L, 60L, 66L, 86L, 87L, 14L, 
    17L), .Label = c("113059", "113509", "113572", "113783", 
    "113788", "113789", "113803", "11668", "14311", "1601", "17463", 
    "19947", "19950", "231919", "237736", "239865", "244367", 
    "244373", "248698", "248706", "248738", "2631", "2649", "2651", 
    "2661", "2662", "2669", "2677", "2680", "2697", "2926", "3101278", 
    "3101281", "3101295", "315151", "330877", "330923", "330932", 
    "330958", "330959", "335677", "343275", "343276", "345763", 
    "345764", "345767", "345779", "347077", "347082", "347088", 
    "347466", "347742", "348123", "349208", "349216", "349237", 
    "349253", "349909", "350406", "364500", "364516", "36973", 
    "370371", "373450", "374746", "374910", "382652", "7546", 
    "A./5. 2152", "A/4. 39886", "A/5 21171", "A/5. 2151", "C.A. 2315", 
    "C.A. 24579", "C.A. 29395", "C.A. 31026", "C.A. 33111", "C.A. 34651", 
    "CA 2144", "PC 17569", "PC 17572", "PC 17599", "PC 17601", 
    "PC 17604", "PC 17605", "PC 17754", "PC 17759", "PP 9549", 
    "S.C./A.4. 23567", "S.O.C. 14879", "S.P. 3464", "SC/Paris 2123", 
    "SO/C 14885", "SOTON/OQ 392086", "STON/O2. 3101282", "W./C. 6608", 
    "W.E.P. 5734"), class = "factor"), Fare = c(7.25, 71.2833, 
    7.925, 53.1, 8.05, 8.4583, 51.8625, 21.075, 11.1333, 30.0708, 
    16.7, 26.55, 8.05, 31.275, 7.8542, 16, 29.125, 13, 18, 7.225, 
    26, 13, 8.0292, 35.5, 21.075, 31.3875, 7.225, 263, 7.8792, 
    7.8958, 27.7208, 146.5208, 7.75, 10.5, 82.1708, 52, 7.2292, 
    8.05, 18, 11.2417, 9.475, 21, 7.8958, 41.5792, 7.8792, 8.05, 
    15.5, 7.75, 21.6792, 17.8, 39.6875, 7.8, 76.7292, 26, 61.9792, 
    35.5, 10.5, 7.2292, 27.75, 46.9, 7.2292, 80, 83.475, 27.9, 
    27.7208, 15.2458, 10.5, 8.1583, 7.925, 8.6625, 10.5, 46.9, 
    73.5, 14.4542, 56.4958, 7.65, 7.8958, 8.05, 29, 12.475, 9, 
    9.5, 7.7875, 47.1, 10.5, 15.85, 34.375, 8.05, 263, 8.05, 
    8.05, 7.8542, 61.175, 20.575, 7.25, 8.05, 34.6542, 63.3583, 
    23, 26), Cabin = structure(c(NA, 11L, NA, 7L, NA, NA, 16L, 
    NA, NA, NA, 19L, 6L, NA, NA, NA, NA, NA, NA, NA, NA, NA, 
    14L, NA, 2L, NA, NA, NA, 8L, NA, NA, NA, 5L, NA, NA, NA, 
    NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, 
    NA, NA, 13L, NA, 4L, 9L, NA, NA, NA, NA, NA, 3L, 10L, NA, 
    NA, NA, 18L, NA, NA, NA, NA, NA, NA, NA, NA, 17L, NA, NA, 
    NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, 8L, NA, NA, NA, 15L, 
    NA, NA, NA, 1L, 12L, NA, NA), .Label = c("A5", "A6", "B28", 
    "B30", "B78", "C103", "C123", "C23 C25 C27", "C52", "C83", 
    "C85", "D10 D12", "D33", "D56", "E31", "E46", "F G73", "F33", 
    "G6"), class = "factor"), Embarked = structure(c(3L, 1L, 
    3L, 3L, 3L, 2L, 3L, 3L, 3L, 1L, 3L, 3L, 3L, 3L, 3L, 3L, 2L, 
    3L, 3L, 1L, 3L, 3L, 2L, 3L, 3L, 3L, 1L, 3L, 2L, 3L, 1L, 1L, 
    2L, 3L, 1L, 3L, 1L, 3L, 3L, 1L, 3L, 3L, 1L, 1L, 2L, 3L, 2L, 
    2L, 1L, 3L, 3L, 3L, 1L, 3L, 1L, 3L, 3L, 1L, 3L, 3L, 1L, NA, 
    3L, 3L, 1L, 1L, 3L, 3L, 3L, 3L, 3L, 3L, 3L, 1L, 3L, 3L, 3L, 
    3L, 3L, 3L, 3L, 3L, 2L, 3L, 3L, 3L, 3L, 3L, 3L, 3L, 3L, 3L, 
    3L, 3L, 3L, 3L, 1L, 1L, 3L, 3L), .Label = c("C", "Q", "S"
    ), class = "factor"), Surname = structure(c(11L, 21L, 38L, 
    30L, 2L, 58L, 53L, 69L, 45L, 61L, 75L, 10L, 76L, 3L, 90L, 
    39L, 71L, 94L, 89L, 52L, 31L, 8L, 55L, 82L, 69L, 6L, 26L, 
    29L, 67L, 86L, 88L, 83L, 32L, 93L, 56L, 40L, 51L, 13L, 89L, 
    62L, 1L, 87L, 48L, 49L, 23L, 72L, 50L, 66L, 74L, 5L, 70L, 
    63L, 36L, 27L, 68L, 95L, 73L, 64L, 92L, 34L, 79L, 42L, 37L, 
    80L, 85L, 59L, 65L, 20L, 3L, 47L, 44L, 34L, 41L, 18L, 9L, 
    57L, 84L, 60L, 12L, 25L, 91L, 77L, 54L, 14L, 43L, 7L, 28L, 
    81L, 29L, 15L, 17L, 4L, 16L, 22L, 19L, 78L, 33L, 35L, 24L, 
    46L), .Label = c("Ahlin", "Allen", "Andersson", "Andreasson", 
    "Arnold-Franchi", "Asplund", "Backstrom", "Beesley", "Bing", 
    "Bonnell", "Braund", "Caldwell", "Cann", "Carrau", "Celotti", 
    "Chaffee", "Christmann", "Chronopoulos", "Coxon", "Crease", 
    "Cumings", "Dean", "Devaney", "Doling", "Dowdell", "Emir", 
    "Faunthorpe", "Ford", "Fortune", "Futrelle", "Fynney", "Glynn", 
    "Goldschmidt", "Goodwin", "Greenfield", "Harper", "Harris", 
    "Heikkinen", "Hewlett", "Holverson", "Hood", "Icard", "Ilett", 
    "Jenkin", "Johnson", "Kantor", "Kink", "Kraeff", "Laroche", 
    "Lennon", "Mamee", "Masselmani", "McCarthy", "McDermott", 
    "McGowan", "Meyer", "Moen", "Moran", "Moubarek", "Moutal", 
    "Nasser", "Nicola-Yarred", "Nosworthy", "Novel", "Nye", "O'Driscoll", 
    "O'Dwyer", "Ostby", "Palsson", "Panula", "Rice", "Rogers", 
    "Rugg", "Samaan", "Sandstrom", "Saundercock", "Sheerlinck", 
    "Shorney", "Sirayanian", "Skoog", "Slocovski", "Sloper", 
    "Spencer", "Staneff", "Stewart", "Todoroff", "Turpin", "Uruchurtu", 
    "Vander Planke", "Vestrom", "Waelens", "West", "Wheadon", 
    "Williams", "Woolner"), class = "factor"), Age_Range = c(4, 
    4, 4, 4, 4, NA, 4, 2, 4, 3, 2, 4, 4, 4, 3, 4, 2, NA, 4, NA, 
    4, 4, 3, 4, 2, 4, NA, 3, NA, NA, 6, NA, NA, 8, 5, 6, NA, 
    5, 3, 3, 6, 5, NA, 2, 3, NA, NA, NA, NA, 3, 2, 5, 6, 5, 8, 
    NA, 5, 5, 2, 2, 5, 5, 6, 2, NA, NA, 5, 3, 3, 5, 5, 3, 5, 
    5, 5, 5, NA, NA, 1, 5, 5, 5, NA, 5, 3, 5, 3, NA, 5, 5, 5, 
    5, 6, 5, 7, NA, 9, 5, 5, 5)), .Names = c("PassengerId", "Survived", 
"Pclass", "Name", "Sex", "Age", "SibSp", "Parch", "Ticket", "Fare", 
"Cabin", "Embarked", "Surname", "Age_Range"), row.names = c(NA, 
100L), class = "data.frame")