You are on page 1of 13

Week4_Assignment

Jnana Sagar Pedada

16/04/2022

Load the necessary libraries as well as the data.


library(tidyverse)

## Warning: package 'tidyverse' was built under R version 4.1.3

## -- Attaching packages --------------------------------------- tidyverse


1.3.1 --

## v ggplot2 3.3.5 v purrr 0.3.4


## v tibble 3.1.6 v dplyr 1.0.8
## v tidyr 1.2.0 v stringr 1.4.0
## v readr 2.0.2 v forcats 0.5.1

## -- Conflicts ------------------------------------------
tidyverse_conflicts() --
## x dplyr::filter() masks stats::filter()
## x dplyr::lag() masks stats::lag()

library('caret')

## Loading required package: lattice


##
## Attaching package: 'caret'

## The following object is masked from 'package:purrr':


##
## lift

library(e1071)

# Read the training data; the relative path is resolved against the working directory.
bank_statistics <- read.csv(file = "train.csv")

Take a look at the example data.


# Preview the first six rows (head()'s default) of the raw data.
head(bank_statistics, n = 6L)

## ID_code target var_0 var_1 var_2 var_3 var_4 var_5 var_6


var_7
## 1 train_0 0 8.9255 -6.7863 11.9081 5.0930 11.4607 -9.2834 5.1187
18.6266
## 2 train_1 0 11.5006 -4.1473 13.8588 5.3890 12.3622 7.0433 5.6208
16.5338
## 3 train_2 0 8.6093 -2.7457 12.0805 7.8928 10.5825 -9.0837 6.9427
14.6155
## 4 train_3 0 11.0604 -2.1518 8.9522 7.1957 12.5846 -1.8361 5.8428
14.9250
## 5 train_4 0 9.8369 -1.4834 12.8746 6.6375 12.2772 2.4486 5.9405
19.2514
## 6 train_5 0 11.4763 -2.3182 12.6080 8.6264 10.9621 3.5609 4.5322
15.2255
## var_8 var_9 var_10 var_11 var_12 var_13 var_14 var_15 var_16
## 1 -4.9200 5.7470 2.9252 3.1821 14.0137 0.5745 8.7989 14.5691 5.7487
## 2 3.1468 8.0851 -0.4032 8.0585 14.0239 8.4135 5.4345 13.7003 13.8275
## 3 -4.9193 5.9525 -0.3249 -11.2648 14.1929 7.3124 7.5244 14.6472 7.6782
## 4 -5.8609 8.2450 2.3061 2.8102 13.8463 11.9704 6.4569 14.8372 10.7430
## 5 6.2654 7.6784 -9.4458 -12.1419 13.8481 7.8895 7.7894 15.0553 8.4871
## 6 3.5855 5.9790 0.8010 -0.6192 13.6380 1.2589 8.1939 14.9894 12.0763
## var_17 var_18 var_19 var_20 var_21 var_22 var_23 var_24 var_25
## 1 -7.2393 4.2840 30.7133 10.5350 16.2191 2.5791 2.4716 14.3831 13.4325
## 2 -15.5849 7.8000 28.5708 3.4287 2.7407 8.5524 3.3716 6.9779 13.8910
## 3 -1.7395 4.7011 20.4775 17.7559 18.1377 1.2145 3.5137 5.6777 13.2177
## 4 -0.4299 15.9426 13.7257 20.3010 12.5579 6.8202 2.7229 12.1354 13.7367
## 5 -3.0680 6.5263 11.3152 21.4246 18.9608 10.1102 2.7142 14.2080 13.5433
## 6 -1.4710 6.7341 14.8241 19.7172 11.9882 1.0468 3.8663 4.7252 13.9427
## var_26 var_27 var_28 var_29 var_30 var_31 var_32 var_33 var_34
## 1 -5.1488 -0.4073 4.9306 5.9965 -0.3085 12.9041 -3.8766 16.8911 11.1920
## 2 -11.7684 -2.5586 5.0464 0.5481 -9.2987 7.8755 1.2859 19.3710 11.3702
## 3 -7.9940 -2.9029 5.8463 6.1439 -11.1025 12.4858 -2.2871 19.0422 11.0449
## 4 0.8135 -0.9059 5.9070 2.8407 -15.2398 10.4407 -2.5731 6.1796 10.6093
## 5 3.1736 -3.3423 5.9015 7.9352 -3.1582 9.4668 -0.0083 19.3239 12.4057
## 6 -1.2796 -4.3763 5.1494 0.4124 -5.0732 4.9010 1.5459 15.6423 10.7209
## var_35 var_36 var_37 var_38 var_39 var_40 var_41 var_42 var_43
var_44
## 1 10.5785 0.6764 7.8871 4.6667 3.8743 -5.2387 7.3746 11.5767 12.0446
11.6418
## 2 0.7399 2.7995 5.8434 10.8160 3.6783 -11.1147 1.8730 9.8775 11.7842
1.2444
## 3 4.1087 4.6974 6.9346 10.8917 0.9003 -13.5174 2.2439 11.5283 12.0406
4.1006
## 4 -5.9158 8.1723 2.8521 9.1738 0.6665 -3.8294 -1.0370 11.7770 11.2834
8.0485
## 5 0.6329 2.7922 5.8184 19.3038 1.4450 -5.5963 14.0685 11.9171 11.5111
6.9087
## 6 15.1886 1.8685 7.7223 5.5317 2.2308 2.6553 13.9730 11.5015 11.6891
14.1062
## var_45 var_46 var_47 var_48 var_49 var_50 var_51 var_52 var_53
## 1 -7.0170 5.9226 -14.2136 16.0283 5.3253 12.9194 29.0460 -0.6940 5.1736
## 2 -47.3797 7.3718 0.1948 34.4014 25.7037 11.8343 13.2256 -4.1083 6.6885
## 3 -7.9078 11.1405 -5.7864 20.7477 6.8874 12.9143 19.5856 0.7268 6.4059
## 4 -24.6840 12.7404 -35.1659 0.7613 8.3838 12.6832 9.5503 1.7895 5.2091
## 5 -65.4863 13.8657 0.0444 -0.1346 14.4268 13.3273 10.4857 -1.4367 5.7555
## 6 -44.7257 10.6470 -24.6935 29.9912 13.5894 13.2355 5.5513 -7.7762 5.2399
## var_54 var_55 var_56 var_57 var_58 var_59 var_60 var_61 var_62
## 1 -0.7474 14.8322 11.2668 5.3822 2.0183 10.1166 16.1828 4.9590 2.0771
## 2 -8.0946 18.5995 19.3219 7.0118 1.9210 8.8682 8.0109 -7.2417 1.7944
## 3 9.3124 6.2846 15.6372 5.8200 1.1000 9.1854 12.5963 -10.3734 0.8748
## 4 8.0913 12.3972 14.4698 6.5850 3.3164 9.4638 15.7820 -25.0222 3.4418
## 5 -8.5414 14.1482 16.9840 6.1812 1.9548 9.2048 8.6591 -27.7439 -0.4952
## 6 7.0189 15.2849 11.8258 5.9587 4.7676 8.2253 11.1254 -0.7472 -1.6063
## var_63 var_64 var_65 var_66 var_67 var_68 var_69 var_70 var_71
var_72
## 1 -0.2154 8.6748 9.5319 5.8056 22.4321 5.0109 -4.7010 21.6374 0.5663
5.1999
## 2 -1.3147 8.1042 1.5365 5.4007 7.9344 5.0220 2.2302 40.5632 0.5134
3.1701
## 3 5.8042 3.7163 -1.1016 7.3667 9.8565 5.0228 -5.7828 2.3612 0.8520
6.3577
## 4 -4.3923 8.6464 6.3072 5.6221 23.6143 5.0220 -3.9989 4.0462 0.2500
1.2516
## 5 -1.7839 5.2670 -4.3205 6.9860 1.6184 5.0301 -3.2431 40.1236 0.7737 -
0.7264
## 6 6.0702 6.0604 5.4693 4.9098 14.1160 5.0110 -5.6684 35.2664 0.6780
8.1653
## var_73 var_74 var_75 var_76 var_77 var_78 var_79 var_80 var_81
## 1 8.8600 43.1127 18.3816 -2.3440 23.4104 6.5199 12.1983 13.6468 13.8372
## 2 20.1068 7.7841 7.0529 3.2709 23.4822 5.5075 13.7814 2.5462 18.1782
## 3 12.1719 19.7312 19.4465 4.5048 23.2378 6.3191 12.8046 7.4729 15.7811
## 4 24.4187 4.5290 15.4235 11.6875 23.6273 4.0806 15.2733 0.7839 10.5404
## 5 4.5886 -4.5346 23.3521 1.0273 19.1600 7.1734 14.3937 2.9598 13.3317
## 6 9.9031 10.5392 14.4814 12.7784 17.4977 3.3793 16.0082 -5.4905 15.3766
## var_82 var_83 var_84 var_85 var_86 var_87 var_88 var_89
var_90
## 1 1.3675 2.9423 -4.5213 21.4669 9.3225 16.4597 7.9984 -1.7069 -
21.4494
## 2 0.3683 -4.8210 -5.4850 13.7867 -13.5901 11.0993 7.9022 12.2301
0.4768
## 3 13.3529 10.1852 5.4604 19.0773 -4.4577 9.5413 11.9052 2.1447 -
22.4038
## 4 1.6212 -5.2896 1.6027 17.9762 -2.3174 15.6298 4.5474 7.5509 -
7.5866
## 5 -9.2587 -6.7075 7.8984 14.5265 7.0799 20.1670 8.0053 3.7954 -
39.7997
## 6 1.8135 -1.9153 -8.3058 20.1690 2.6433 19.9457 9.4972 -3.5982 -
1.1717
## var_91 var_92 var_93 var_94 var_95 var_96 var_97 var_98 var_99
## 1 6.7806 11.0924 9.9913 14.8421 0.1812 8.9642 16.2572 2.1743 -3.4132
## 2 6.8852 8.0905 10.9631 11.7569 -1.2722 24.7876 26.6881 1.8944 0.6939
## 3 7.0883 14.1613 10.5080 14.2621 0.2647 20.4031 17.0360 1.6981 -0.0269
## 4 7.0364 14.4027 10.7795 7.2887 -1.0930 11.3596 18.1486 2.8344 1.9480
## 5 7.0065 9.3627 10.4316 14.0553 0.0213 14.7246 35.2988 1.6844 0.6715
## 6 6.9204 8.8093 10.5375 10.2029 1.1735 14.0648 17.9100 0.9217 0.0886
## var_100 var_101 var_102 var_103 var_104 var_105 var_106 var_107 var_108
## 1 9.4763 13.3102 26.5376 1.4403 14.7100 6.0454 9.5426 17.1554 14.1104
## 2 -13.6950 8.4068 35.4734 1.7093 15.1866 2.6227 7.3412 32.0888 13.9550
## 3 -0.3939 12.6317 14.8863 1.3854 15.0284 3.9995 5.3683 8.6273 14.1963
## 4 -19.8592 22.5316 18.6129 1.3512 9.3291 4.2835 10.3907 7.0874 14.3256
## 5 -22.9264 12.3562 17.3410 1.6940 7.1179 5.1934 8.8230 10.6617 14.0837
## 6 -8.3794 19.8236 12.2780 1.6012 15.4090 4.2972 10.5131 16.4164 14.1434
## var_109 var_110 var_111 var_112 var_113 var_114 var_115 var_116 var_117
## 1 24.3627 2.0323 6.7602 3.9141 -0.4851 2.5240 1.5093 2.5516 15.5752
## 2 13.0858 6.6203 7.1051 5.3523 8.5426 3.6159 4.1569 3.0454 7.8522
## 3 20.3882 3.2304 5.7033 4.5255 2.1929 3.1290 2.9044 1.1696 28.7632
## 4 14.4135 4.2827 6.9750 1.6480 11.6896 2.5762 -2.5459 5.3446 38.1015
## 5 28.2749 -0.1937 5.9654 1.0719 7.9923 2.9138 -3.6135 1.4684 25.6795
## 6 23.9731 7.0040 7.1879 3.9414 9.9727 3.6737 0.8970 2.2988 -18.1194
## var_118 var_119 var_120 var_121 var_122 var_123 var_124 var_125 var_126
## 1 -13.4221 7.2739 16.0094 9.7268 0.8897 0.7754 4.2218 12.0039 13.8571
## 2 -11.5100 7.5109 31.5899 9.5018 8.2736 10.1633 0.1225 12.5942 14.5697
## 3 -17.2738 2.1056 21.1613 8.9573 2.7768 -2.1746 3.6932 12.4653 14.1978
## 4 3.5732 5.0988 30.5644 11.3025 3.9618 -8.2464 2.7038 12.3441 12.5431
## 5 13.8224 4.7478 41.1037 12.7140 5.2964 9.7289 3.9370 12.1316 12.5815
## 6 8.6835 -2.8671 11.2701 9.0465 -1.5511 9.9305 4.3756 12.3697 13.0031
## var_127 var_128 var_129 var_130 var_131 var_132 var_133 var_134 var_135
## 1 -0.7338 -1.9245 15.4462 12.8287 0.3587 9.6508 6.5674 5.1726 3.1345
## 2 2.4354 0.8194 16.5346 12.4205 -0.1780 5.7582 7.0513 1.9568 -8.9921
## 3 -2.5511 -0.9479 17.1092 11.5419 0.0975 8.8186 6.6231 3.9358 -11.7218
## 4 -1.3683 3.5974 13.9761 14.3003 1.0486 8.9500 7.1954 -1.1984 1.9586
## 5 7.0642 5.6518 10.9346 11.4266 0.9442 7.7532 6.6173 -6.8304 6.4730
## 6 5.0993 -5.8702 15.0534 12.7212 0.5762 7.0965 6.6143 -8.8256 -0.9844
## var_136 var_137 var_138 var_139 var_140 var_141 var_142 var_143 var_144
## 1 29.4547 31.4045 2.8279 15.6599 8.3307 -5.6011 19.0614 11.2663 8.6989
## 2 9.7797 18.1577 -1.9721 16.1622 3.6937 6.6803 -0.3243 12.2806 8.6086
## 3 24.5437 15.5827 3.8212 8.6674 7.3834 -2.4438 10.2158 7.4844 9.1104
## 4 27.5609 24.6065 -2.8233 8.9821 3.8873 15.9638 10.0142 7.8388 9.9718
## 5 17.1728 25.8128 2.6791 13.9547 6.6289 -4.3965 11.7159 16.1080 7.6874
## 6 26.1603 11.9963 -5.9018 13.3065 4.4419 -0.0496 18.7239 14.1586 9.6607
## var_145 var_146 var_147 var_148 var_149 var_150 var_151 var_152 var_153
## 1 8.3694 11.5659 -16.4727 4.0288 17.9244 18.5177 10.7800 9.0056 16.6964
## 2 11.0738 8.9231 11.7700 4.2578 -4.4223 20.6294 14.8743 9.4317 16.7242
## 3 4.3649 11.4934 1.7624 4.0714 -1.2681 14.3330 8.0088 4.4015 14.1479
## 4 2.9253 10.4994 4.1622 3.7613 2.3701 18.0984 17.1765 7.6508 18.2452
## 5 9.1570 11.5670 -12.7047 3.7574 9.9110 20.1461 1.2995 5.8493 19.8234
## 6 2.6134 12.9650 4.7280 3.9799 1.4462 19.5171 7.5903 5.7223 15.2331
## var_154 var_155 var_156 var_157 var_158 var_159 var_160 var_161
var_162
## 1 10.4838 1.6573 12.1749 -13.1324 17.6054 11.5423 15.4576 5.3133
3.6159
## 2 -0.5687 0.1898 12.2419 -9.6953 22.3949 10.6261 29.4846 5.8683
3.8208
## 3 -5.1747 0.5778 14.5362 -1.7624 33.8820 11.6041 13.2070 5.8442
4.7086
## 4 17.0336 -10.9370 12.0500 -1.2155 19.9750 12.3892 31.8833 5.9684
7.2084
## 5 4.7022 10.6101 13.0021 -12.6068 27.0846 8.0913 33.5107 5.6953
5.4663
## 6 15.4401 -2.0738 12.4068 -16.8151 24.2054 4.9455 16.5552 5.3739
6.4487
## var_163 var_164 var_165 var_166 var_167 var_168 var_169 var_170 var_171
## 1 5.0384 6.6760 12.6644 2.7004 -0.6975 9.5981 5.4879 -4.7645 -8.4254
## 2 15.8348 -5.0121 15.1345 3.2003 9.3192 3.8821 5.7999 5.5378 5.0988
## 3 5.7141 -1.0410 20.5092 3.2790 -5.5952 7.3176 5.7690 -7.0927 -3.9116
## 4 3.8899 -11.0882 17.2502 2.5881 -2.7018 0.5641 5.3430 -7.1541 -6.1920
## 5 18.2201 6.5769 21.2607 3.2304 -1.7759 3.1283 5.5518 1.4493 -2.6627
## 6 11.5631 1.3847 14.9638 2.8455 -9.0953 3.8278 5.9714 -6.1449 -2.0285
## var_172 var_173 var_174 var_175 var_176 var_177 var_178 var_179
var_180
## 1 20.8773 3.1531 18.5618 7.7423 -10.1245 13.7241 -3.5189 1.7202 -
8.4051
## 2 22.0330 5.5134 30.2645 10.4968 -7.2352 16.5721 -7.3477 11.0752 -
5.5937
## 3 7.2569 -5.8234 25.6820 10.9202 -0.3104 8.8438 -9.7009 2.4013 -
4.2935
## 4 18.2366 11.7134 14.7483 8.1013 11.8771 13.9552 -10.4701 5.6961 -
3.7546
## 5 19.8056 2.3705 18.4685 16.3309 -3.3456 13.5261 1.7189 5.1743 -
7.6938
## 6 18.4106 1.4457 21.8853 9.2654 -6.5247 10.7687 -7.6283 1.0208
7.1968
## var_181 var_182 var_183 var_184 var_185 var_186 var_187 var_188
var_189
## 1 9.0164 3.0657 14.3691 25.8398 5.8764 11.8411 -19.7159 17.5743
0.5857
## 2 9.4878 -14.9100 9.4245 22.5441 -4.8622 7.6543 -15.9319 13.3175 -
0.3566
## 3 9.3908 -13.2648 3.1545 23.0866 -5.3000 5.3745 -6.2660 10.1934 -
0.8417
## 4 8.4117 1.8986 7.2601 -0.4639 -0.0498 7.9336 -12.8279 12.4124
1.8489
## 5 9.7685 4.8910 12.2198 11.8503 -7.8931 6.4209 5.9270 16.0201 -
0.2829
## 6 11.1227 2.2257 6.4056 21.0550 -13.6509 4.7691 -8.9114 15.1007
2.4286
## var_190 var_191 var_192 var_193 var_194 var_195 var_196 var_197 var_198
## 1 4.4354 3.9642 3.1364 1.6910 18.5227 -2.3978 7.8784 8.5635 12.7803
## 2 7.6421 7.7214 2.5837 10.9516 15.4305 2.0339 8.1267 8.7889 18.3560
## 3 2.9057 9.7905 1.6704 1.6858 21.6042 3.1417 -6.5213 8.2675 14.7222
## 4 4.4666 4.7433 0.7178 1.4214 23.0347 -1.2706 -2.9275 10.2922 17.9697
## 5 -1.4905 9.5214 -0.1508 9.1942 13.2876 -1.5121 3.9267 9.5031 17.9974
## 6 -6.3068 6.6025 5.2912 0.4403 14.9452 1.0314 -3.6241 9.7670 12.5809
## var_199
## 1 -1.0914
## 2 1.9518
## 3 0.3965
## 4 -8.9996
## 5 -8.8104
## 6 -4.7602

Looking at the sample rows, the first variable, `ID_code`, is only a row identifier and
carries no information for predicting the output variable (`target`), so we remove it.
# Drop the identifier column by name rather than by position, so that running
# this step again (or reordered input columns) cannot remove a real variable.
bank_statistics <- bank_statistics[names(bank_statistics) != "ID_code"]

Check whether the data has any missing values by computing, for each column, the fraction of
its values that are missing.
# Per-column share of NA entries (0 means the column is complete).
vapply(
  bank_statistics,
  function(column) mean(is.na(column)),
  numeric(1)
)

## target var_0 var_1 var_2 var_3 var_4 var_5 var_6 var_7


var_8
## 0 0 0 0 0 0 0 0 0
0
## var_9 var_10 var_11 var_12 var_13 var_14 var_15 var_16 var_17
var_18
## 0 0 0 0 0 0 0 0 0
0
## var_19 var_20 var_21 var_22 var_23 var_24 var_25 var_26 var_27
var_28
## 0 0 0 0 0 0 0 0 0
0
## var_29 var_30 var_31 var_32 var_33 var_34 var_35 var_36 var_37
var_38
## 0 0 0 0 0 0 0 0 0
0
## var_39 var_40 var_41 var_42 var_43 var_44 var_45 var_46 var_47
var_48
## 0 0 0 0 0 0 0 0 0
0
## var_49 var_50 var_51 var_52 var_53 var_54 var_55 var_56 var_57
var_58
## 0 0 0 0 0 0 0 0 0
0
## var_59 var_60 var_61 var_62 var_63 var_64 var_65 var_66 var_67
var_68
## 0 0 0 0 0 0 0 0 0
0
## var_69 var_70 var_71 var_72 var_73 var_74 var_75 var_76 var_77
var_78
## 0 0 0 0 0 0 0 0 0
0
## var_79 var_80 var_81 var_82 var_83 var_84 var_85 var_86 var_87
var_88
## 0 0 0 0 0 0 0 0 0
0
## var_89 var_90 var_91 var_92 var_93 var_94 var_95 var_96 var_97
var_98
## 0 0 0 0 0 0 0 0 0
0
## var_99 var_100 var_101 var_102 var_103 var_104 var_105 var_106 var_107
var_108
## 0 0 0 0 0 0 0 0 0
0
## var_109 var_110 var_111 var_112 var_113 var_114 var_115 var_116 var_117
var_118
## 0 0 0 0 0 0 0 0 0
0
## var_119 var_120 var_121 var_122 var_123 var_124 var_125 var_126 var_127
var_128
## 0 0 0 0 0 0 0 0 0
0
## var_129 var_130 var_131 var_132 var_133 var_134 var_135 var_136 var_137
var_138
## 0 0 0 0 0 0 0 0 0
0
## var_139 var_140 var_141 var_142 var_143 var_144 var_145 var_146 var_147
var_148
## 0 0 0 0 0 0 0 0 0
0
## var_149 var_150 var_151 var_152 var_153 var_154 var_155 var_156 var_157
var_158
## 0 0 0 0 0 0 0 0 0
0
## var_159 var_160 var_161 var_162 var_163 var_164 var_165 var_166 var_167
var_168
## 0 0 0 0 0 0 0 0 0
0
## var_169 var_170 var_171 var_172 var_173 var_174 var_175 var_176 var_177
var_178
## 0 0 0 0 0 0 0 0 0
0
## var_179 var_180 var_181 var_182 var_183 var_184 var_185 var_186 var_187
var_188
## 0 0 0 0 0 0 0 0 0
0
## var_189 var_190 var_191 var_192 var_193 var_194 var_195 var_196 var_197
var_198
## 0 0 0 0 0 0 0 0 0
0
## var_199
## 0

In the data, there are no missing values.


Because we have 200 input variables, we separate the target from the input variables and
apply principal component analysis (PCA) to reduce the number of input variables.
# Separate the response from the predictors by column name. Single-bracket
# indexing keeps Y as a one-column data frame that still carries the "target" name.
Y <- bank_statistics["target"]
X <- bank_statistics[setdiff(names(bank_statistics), "target")]

# PCA on the correlation matrix (cor = TRUE), keeping the component scores.
PrinCompAna <- princomp(X, cor = TRUE, scores = TRUE, covmat = NULL)

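Inspect how much variance each principal component explains. The support vector machine model will then be built with the first three principal components, which together account for only about 1.7% of the total variance.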
# Importance of components only: standard deviation, proportion of variance and
# cumulative proportion. Loadings are left out (the default).
summary(PrinCompAna, loadings = FALSE)

## Importance of components:
## Comp.1 Comp.2 Comp.3 Comp.4
## Standard deviation 1.105719777 1.029822431 1.029429108 1.029245081
## Proportion of Variance 0.006113081 0.005302671 0.005298621 0.005296727
## Cumulative Proportion 0.006113081 0.011415752 0.016714374 0.022011101
## Comp.5 Comp.6 Comp.7 Comp.8
## Standard deviation 1.028391179 1.027880189 1.027567621 1.027060349
## Proportion of Variance 0.005287942 0.005282688 0.005279476 0.005274265
## Cumulative Proportion 0.027299043 0.032581731 0.037861208 0.043135472
## Comp.9 Comp.10 Comp.11 Comp.12
## Standard deviation 1.026221764 1.025946720 1.025236326 1.02468922
## Proportion of Variance 0.005265656 0.005262833 0.005255548 0.00524994
## Cumulative Proportion 0.048401128 0.053663961 0.058919509 0.06416945
## Comp.13 Comp.14 Comp.15 Comp.16
## Standard deviation 1.024306994 1.023413060 1.023309657 1.023233771
## Proportion of Variance 0.005246024 0.005236871 0.005235813 0.005235037
## Cumulative Proportion 0.069415473 0.074652344 0.079888158 0.085123194
## Comp.17 Comp.18 Comp.19 Comp.20
## Standard deviation 1.022474589 1.02213694 1.021691268 1.021593309
## Proportion of Variance 0.005227271 0.00522382 0.005219265 0.005218264
## Cumulative Proportion 0.090350466 0.09557429 0.100793551 0.106011815
## Comp.21 Comp.22 Comp.23 Comp.24
## Standard deviation 1.021270679 1.020801522 1.020518686 1.020040798
## Proportion of Variance 0.005214969 0.005210179 0.005207292 0.005202416
## Cumulative Proportion 0.111226784 0.116436963 0.121644255 0.126846671
## Comp.25 Comp.26 Comp.27 Comp.28
## Standard deviation 1.019779756 1.019264275 1.019116219 1.01907406
## Proportion of Variance 0.005199754 0.005194498 0.005192989 0.00519256
## Cumulative Proportion 0.132046425 0.137240923 0.142433912 0.14762647
## Comp.29 Comp.30 Comp.31 Comp.32
## Standard deviation 1.018573850 1.018183339 1.018125035 1.017674008
## Proportion of Variance 0.005187463 0.005183487 0.005182893 0.005178302
## Cumulative Proportion 0.152813935 0.157997422 0.163180315 0.168358617
## Comp.33 Comp.34 Comp.35 Comp.36
## Standard deviation 1.017245621 1.016780533 1.016496110 1.016461835
## Proportion of Variance 0.005173943 0.005169213 0.005166322 0.005165973
## Cumulative Proportion 0.173532560 0.178701773 0.183868095 0.189034068
## Comp.37 Comp.38 Comp.39 Comp.40
## Standard deviation 1.016112050 1.015851051 1.015350554 1.015219848
## Proportion of Variance 0.005162418 0.005159767 0.005154684 0.005153357
## Cumulative Proportion 0.194196487 0.199356254 0.204510937 0.209664294
## Comp.41 Comp.42 Comp.43 Comp.44
## Standard deviation 1.014838546 1.014393913 1.014158651 1.014012473
## Proportion of Variance 0.005149486 0.005144975 0.005142589 0.005141106
## Cumulative Proportion 0.214813780 0.219958756 0.225101344 0.230242451
## Comp.45 Comp.46 Comp.47 Comp.48
## Standard deviation 1.013610854 1.013356991 1.013096979 1.012820323
## Proportion of Variance 0.005137035 0.005134462 0.005131827 0.005129025
## Cumulative Proportion 0.235379486 0.240513948 0.245645775 0.250774800
## Comp.49 Comp.50 Comp.51 Comp.52
## Standard deviation 1.012704097 1.012436300 1.011836606 1.011706062
## Proportion of Variance 0.005127848 0.005125136 0.005119067 0.005117746
## Cumulative Proportion 0.255902648 0.261027784 0.266146851 0.271264597
## Comp.53 Comp.54 Comp.55 Comp.56
## Standard deviation 1.011570455 1.01143759 1.01088178 1.010575325
## Proportion of Variance 0.005116374 0.00511503 0.00510941 0.005106312
## Cumulative Proportion 0.276380971 0.28149600 0.28660541 0.291711723
## Comp.57 Comp.58 Comp.59 Comp.60
## Standard deviation 1.010532630 1.01026329 1.010079712 1.009774676
## Proportion of Variance 0.005105881 0.00510316 0.005101305 0.005098224
## Cumulative Proportion 0.296817604 0.30192076 0.307022069 0.312120293
## Comp.61 Comp.62 Comp.63 Comp.64
## Standard deviation 1.00948796 1.009225817 1.009070469 1.008761326
## Proportion of Variance 0.00509533 0.005092684 0.005091116 0.005087997
## Cumulative Proportion 0.31721562 0.322308307 0.327399423 0.332487420
## Comp.65 Comp.66 Comp.67 Comp.68
## Standard deviation 1.008359864 1.008017693 1.007888809 1.007549264
## Proportion of Variance 0.005083948 0.005080498 0.005079199 0.005075778
## Cumulative Proportion 0.337571368 0.342651866 0.347731065 0.352806843
## Comp.69 Comp.70 Comp.71 Comp.72
## Standard deviation 1.007177022 1.00686541 1.006768525 1.006323404
## Proportion of Variance 0.005072028 0.00506889 0.005067914 0.005063434
## Cumulative Proportion 0.357878871 0.36294776 0.368015675 0.373079109
## Comp.73 Comp.74 Comp.75 Comp.76
## Standard deviation 1.006203308 1.005898022 1.005621760 1.005434625
## Proportion of Variance 0.005062225 0.005059154 0.005056376 0.005054494
## Cumulative Proportion 0.378141334 0.383200488 0.388256864 0.393311358
## Comp.77 Comp.78 Comp.79 Comp.80
## Standard deviation 1.005193594 1.005056096 1.004629822 1.004335492
## Proportion of Variance 0.005052071 0.005050689 0.005046405 0.005043449
## Cumulative Proportion 0.398363429 0.403414118 0.408460523 0.413503972
## Comp.81 Comp.82 Comp.83 Comp.84
## Standard deviation 1.004246820 1.003960960 1.00388546 1.003389966
## Proportion of Variance 0.005042558 0.005039688 0.00503893 0.005033957
## Cumulative Proportion 0.418546530 0.423586218 0.42862515 0.433659106
## Comp.85 Comp.86 Comp.87 Comp.88
## Standard deviation 1.003027881 1.002843548 1.002692203 1.002394921
## Proportion of Variance 0.005030325 0.005028476 0.005026958 0.005023978
## Cumulative Proportion 0.438689430 0.443717906 0.448744864 0.453768842
## Comp.89 Comp.90 Comp.91 Comp.92
Comp.93
## Standard deviation 1.002129301 1.001959597 1.0017784 1.001399918
1.0013291
## Proportion of Variance 0.005021316 0.005019615 0.0050178 0.005014009
0.0050133
## Cumulative Proportion 0.458790158 0.463809773 0.4688276 0.473841582
0.4788549
## Comp.94 Comp.95 Comp.96 Comp.97
## Standard deviation 1.000906248 1.000564321 1.000319758 1.000246087
## Proportion of Variance 0.005009067 0.005005645 0.005003198 0.005002461
## Cumulative Proportion 0.483863948 0.488869593 0.493872791 0.498875252
## Comp.98 Comp.99 Comp.100 Comp.101
## Standard deviation 0.999843125 0.999293565 0.999202589 0.998936060
## Proportion of Variance 0.004998431 0.004992938 0.004992029 0.004989366
## Cumulative Proportion 0.503873683 0.508866622 0.513858651 0.518848017
## Comp.102 Comp.103 Comp.104 Comp.105
## Standard deviation 0.998748103 0.99861307 0.998331831 0.998149480
## Proportion of Variance 0.004987489 0.00498614 0.004983332 0.004981512
## Cumulative Proportion 0.523835506 0.52882165 0.533804978 0.538786490
## Comp.106 Comp.107 Comp.108 Comp.109
## Standard deviation 0.997771324 0.997668986 0.997339518 0.996849819
## Proportion of Variance 0.004977738 0.004976717 0.004973431 0.004968548
## Cumulative Proportion 0.543764228 0.548740945 0.553714376 0.558682924
## Comp.110 Comp.111 Comp.112 Comp.113
## Standard deviation 0.996723750 0.996441176 0.996258649 0.996082099
## Proportion of Variance 0.004967291 0.004964475 0.004962656 0.004960898
## Cumulative Proportion 0.563650215 0.568614690 0.573577346 0.578538244
## Comp.114 Comp.115 Comp.116 Comp.117
## Standard deviation 0.995765351 0.995622718 0.995382190 0.994997908
## Proportion of Variance 0.004957743 0.004956323 0.004953929 0.004950104
## Cumulative Proportion 0.583495987 0.588452310 0.593406239 0.598356343
## Comp.118 Comp.119 Comp.120 Comp.121
## Standard deviation 0.994868229 0.994660893 0.994424829 0.99402620
## Proportion of Variance 0.004948814 0.004946751 0.004944404 0.00494044
## Cumulative Proportion 0.603305157 0.608251908 0.613196312 0.61813675
## Comp.122 Comp.123 Comp.124 Comp.125
## Standard deviation 0.993908183 0.993571970 0.993493407 0.993088658
## Proportion of Variance 0.004939267 0.004935926 0.004935146 0.004931125
## Cumulative Proportion 0.623076020 0.628011946 0.632947092 0.637878217
## Comp.126 Comp.127 Comp.128 Comp.129
## Standard deviation 0.992966138 0.992702816 0.992625127 0.99220564
## Proportion of Variance 0.004929909 0.004927294 0.004926523 0.00492236
## Cumulative Proportion 0.642808126 0.647735421 0.652661944 0.65758430
## Comp.130 Comp.131 Comp.132 Comp.133
## Standard deviation 0.992042540 0.991908895 0.991439602 0.991234259
## Proportion of Variance 0.004920742 0.004919416 0.004914762 0.004912727
## Cumulative Proportion 0.662505046 0.667424462 0.672339225 0.677251951
## Comp.134 Comp.135 Comp.136 Comp.137
## Standard deviation 0.991050581 0.990732667 0.990468753 0.990376945
## Proportion of Variance 0.004910906 0.004907756 0.004905142 0.004904232
## Cumulative Proportion 0.682162858 0.687070614 0.691975756 0.696879988
## Comp.138 Comp.139 Comp.140 Comp.141
## Standard deviation 0.990043974 0.989915233 0.989638621 0.989350388
## Proportion of Variance 0.004900935 0.004899661 0.004896923 0.004894071
## Cumulative Proportion 0.701780923 0.706680584 0.711577507 0.716471578
## Comp.142 Comp.143 Comp.144 Comp.145
## Standard deviation 0.988808954 0.988676403 0.988471795 0.987895599
## Proportion of Variance 0.004888716 0.004887405 0.004885382 0.004879689
## Cumulative Proportion 0.721360294 0.726247699 0.731133082 0.736012770
## Comp.146 Comp.147 Comp.148 Comp.149
## Standard deviation 0.987489364 0.987237785 0.987163909 0.986930163
## Proportion of Variance 0.004875676 0.004873192 0.004872463 0.004870156
## Cumulative Proportion 0.740888446 0.745761639 0.750634101 0.755504257
## Comp.150 Comp.151 Comp.152 Comp.153
## Standard deviation 0.986730047 0.986360921 0.986046874 0.985848279
## Proportion of Variance 0.004868181 0.004864539 0.004861442 0.004859484
## Cumulative Proportion 0.760372438 0.765236977 0.770098420 0.774957904
## Comp.154 Comp.155 Comp.156 Comp.157
## Standard deviation 0.985601252 0.9854034 0.984950929 0.984777560
## Proportion of Variance 0.004857049 0.0048551 0.004850642 0.004848934
## Cumulative Proportion 0.779814953 0.7846701 0.789520694 0.794369628
## Comp.158 Comp.159 Comp.160 Comp.161
## Standard deviation 0.984524008 0.984393268 0.984114620 0.98396748
## Proportion of Variance 0.004846438 0.004845151 0.004842408 0.00484096
## Cumulative Proportion 0.799216066 0.804061217 0.808903625 0.81374458
## Comp.162 Comp.163 Comp.164 Comp.165
## Standard deviation 0.983431890 0.983259936 0.983081320 0.982790493
## Proportion of Variance 0.004835691 0.004834001 0.004832244 0.004829386
## Cumulative Proportion 0.818580276 0.823414276 0.828246521 0.833075907
## Comp.166 Comp.167 Comp.168 Comp.169
## Standard deviation 0.982689722 0.982193906 0.981566695 0.981350989
## Proportion of Variance 0.004828395 0.004823524 0.004817366 0.004815249
## Cumulative Proportion 0.837904302 0.842727826 0.847545192 0.852360441
## Comp.170 Comp.171 Comp.172 Comp.173
## Standard deviation 0.981156986 0.980937039 0.980634414 0.980446431
## Proportion of Variance 0.004813345 0.004811187 0.004808219 0.004806376
## Cumulative Proportion 0.857173786 0.861984974 0.866793193 0.871599569
## Comp.174 Comp.175 Comp.176 Comp.177
## Standard deviation 0.980058665 0.979885529 0.979669532 0.979178959
## Proportion of Variance 0.004802575 0.004800878 0.004798762 0.004793957
## Cumulative Proportion 0.876402144 0.881203022 0.886001784 0.890795741
## Comp.178 Comp.179 Comp.180 Comp.181
## Standard deviation 0.979123281 0.978591938 0.97813295 0.977674583
## Proportion of Variance 0.004793412 0.004788211 0.00478372 0.004779238
## Cumulative Proportion 0.895589153 0.900377364 0.90516108 0.909940322
## Comp.182 Comp.183 Comp.184 Comp.185
## Standard deviation 0.977534333 0.977241822 0.976819697 0.976228536
## Proportion of Variance 0.004777867 0.004775008 0.004770884 0.004765111
## Cumulative Proportion 0.914718189 0.919493197 0.924264081 0.929029192
## Comp.186 Comp.187 Comp.188 Comp.189
## Standard deviation 0.975882947 0.975736385 0.975336627 0.97489798
## Proportion of Variance 0.004761738 0.004760307 0.004756408 0.00475213
## Cumulative Proportion 0.933790929 0.938551237 0.943307644 0.94805977
## Comp.190 Comp.191 Comp.192 Comp.193
## Standard deviation 0.97444244 0.973860243 0.973657731 0.973090097
## Proportion of Variance 0.00474769 0.004742019 0.004740047 0.004734522
## Cumulative Proportion 0.95280747 0.957549484 0.962289531 0.967024052
## Comp.194 Comp.195 Comp.196 Comp.197
## Standard deviation 0.972756706 0.972401962 0.971319846 0.970912041
## Proportion of Variance 0.004731278 0.004727828 0.004717311 0.004713351
## Cumulative Proportion 0.971755331 0.976483158 0.981200470 0.985913821
## Comp.198 Comp.199 Comp.200
## Standard deviation 0.969434370 0.969170184 0.96857733
## Proportion of Variance 0.004699015 0.004696454 0.00469071
## Cumulative Proportion 0.990612836 0.995309290 1.00000000

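Keep the scores of the first three principal components together with the target, then split the data into training and testing sets, using 50% of the total sample size for training.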
# Keep only the scores on the first three principal components.
X <- PrinCompAna$scores[, 1:3]
# Prepend the target column. X is reused instead of extracting the same scores
# a second time.
PrinCompAna_Info <- cbind(Y, X)

Set the seed to ensure that your partition is repeatable.


# Fraction of rows assigned to the training set; the remaining rows form the
# test set.
train_fraction <- 0.5
size <- floor(train_fraction * nrow(PrinCompAna_Info))

# Seed the RNG immediately before sampling so the partition is reproducible.
set.seed(4)
sample_index <- sample(seq_len(nrow(PrinCompAna_Info)), size = size)

PrinCompAna_trainset <- PrinCompAna_Info[sample_index, ]
PrinCompAna_testset <- PrinCompAna_Info[-sample_index, ]

# Encode the target as a factor in BOTH subsets, with levels taken from the
# full data, so train and test share the same class labels even if one subset
# happens to miss a class.
target_levels <- sort(unique(PrinCompAna_Info[["target"]]))
PrinCompAna_trainset[["target"]] <-
  factor(PrinCompAna_trainset[["target"]], levels = target_levels)
PrinCompAna_testset[["target"]] <-
  factor(PrinCompAna_testset[["target"]], levels = target_levels)

Create a model based on the training data, then evaluate its predictions on the test data.


# Fit a linear-kernel C-classification SVM that predicts `target` from every
# other column of the training set.
SuppVecMac <- svm(
  formula = target ~ .,
  data    = PrinCompAna_trainset,
  type    = 'C-classification',
  kernel  = 'linear'
)

# Predict the class of every held-out row.
testset_predictions <- predict(SuppVecMac, newdata = PrinCompAna_testset)

# Cross-tabulate predictions (rows) against the true labels (columns), then
# let caret derive accuracy, kappa, sensitivity and the other statistics.
testset_confusion <- table(testset_predictions, PrinCompAna_testset$target)
confusionMatrix(testset_confusion)

## Confusion Matrix and Statistics


##
##
## testset_predictions 0 1
## 0 89831 10169
## 1 0 0
##
## Accuracy : 0.8983
## 95% CI : (0.8964, 0.9002)
## No Information Rate : 0.8983
## P-Value [Acc > NIR] : 0.5026
##
## Kappa : 0
##
## Mcnemar's Test P-Value : <2e-16
##
## Sensitivity : 1.0000
## Specificity : 0.0000
## Pos Pred Value : 0.8983
## Neg Pred Value : NaN
## Prevalence : 0.8983
## Detection Rate : 0.8983
## Detection Prevalence : 1.0000
## Balanced Accuracy : 0.5000
##
## 'Positive' Class : 0
##

You might also like