From d94b6c4ab4421b392eafb39a1b0cb87af88b7b5b Mon Sep 17 00:00:00 2001 From: Tanuj Vishnoi Date: Mon, 27 Aug 2018 04:14:10 +0530 Subject: [PATCH] first commit --- .../categorical_data.R | 20 --------- .../data_preprocessing_template.R | 16 ------- Part 1 - Data Preprocessing/missing_data.R | 12 ----- .../Multiple_Linear_Regression.zip | Bin 5501 -> 0 bytes .../Multiple_Linear_Regression/.DS_Store | Bin 6148 -> 0 bytes .../data_preprocessing_template.R | 16 ------- .../data_preprocessing_template.py | 23 ---------- .../multiple_linear_regression.R | 28 ------------ .../multiple_linear_regression.py | 41 ------------------ .../Multiple_Linear_Regression/._.DS_Store | Bin 120 -> 0 bytes .../._50_Startups.csv | Bin 576 -> 0 bytes 11 files changed, 156 deletions(-) delete mode 100644 Part 1 - Data Preprocessing/categorical_data.R delete mode 100644 Part 1 - Data Preprocessing/data_preprocessing_template.R delete mode 100644 Part 1 - Data Preprocessing/missing_data.R delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression.zip delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/Multiple_Linear_Regression/.DS_Store delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/Multiple_Linear_Regression/data_preprocessing_template.R delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/Multiple_Linear_Regression/data_preprocessing_template.py delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/Multiple_Linear_Regression/multiple_linear_regression.R delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/Multiple_Linear_Regression/multiple_linear_regression.py delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/__MACOSX/Multiple_Linear_Regression/._.DS_Store delete mode 100644 Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/__MACOSX/Multiple_Linear_Regression/._50_Startups.csv diff --git a/Part 1 - Data Preprocessing/categorical_data.R b/Part 1 - Data Preprocessing/categorical_data.R deleted file mode 100644 index 84614db..0000000 --- a/Part 1 - Data Preprocessing/categorical_data.R +++ /dev/null @@ -1,20 +0,0 @@ -# Data Preprocessing - -# Importing the dataset -dataset = read.csv('Data.csv') - -# Taking care of missing data -dataset$Age = ifelse(is.na(dataset$Age), - ave(dataset$Age, FUN = function(x) mean(x, na.rm = TRUE)), - dataset$Age) -dataset$Salary = ifelse(is.na(dataset$Salary), - ave(dataset$Salary, FUN = function(x) mean(x, na.rm = TRUE)), - dataset$Salary) - -# Encoding categorical data -dataset$Country = factor(dataset$Country, - levels = c('France', 'Spain', 'Germany'), - labels = c(1, 2, 3)) -dataset$Purchased = factor(dataset$Purchased, - levels = c('No', 'Yes'), - labels = c(0, 1)) \ No newline at end of file diff --git a/Part 1 - Data Preprocessing/data_preprocessing_template.R b/Part 1 - Data Preprocessing/data_preprocessing_template.R deleted file mode 100644 index 73fd269..0000000 --- a/Part 1 - Data Preprocessing/data_preprocessing_template.R +++ /dev/null @@ -1,16 +0,0 @@ -# Data Preprocessing Template - -# Importing the dataset -dataset = read.csv('Data.csv') - -# Splitting the dataset into the Training set and Test set -# install.packages('caTools') -library(caTools) -set.seed(123) -split = sample.split(dataset$DependentVariable, SplitRatio = 0.8) -training_set = subset(dataset, split == TRUE) -test_set = subset(dataset, split == FALSE) - -# Feature Scaling -# training_set = scale(training_set) -# test_set = scale(test_set) \ No newline at end of file diff --git a/Part 1 - Data Preprocessing/missing_data.R b/Part 1 - Data Preprocessing/missing_data.R deleted file mode 100644 index 21baccb..0000000 --- a/Part 1 - Data Preprocessing/missing_data.R +++ /dev/null @@ -1,12 +0,0 @@ -# Data Preprocessing - -# Importing the dataset -dataset = read.csv('Data.csv') - -# Taking care of missing data -dataset$Age = ifelse(is.na(dataset$Age), - ave(dataset$Age, FUN = function(x) mean(x, na.rm = TRUE)), - dataset$Age) -dataset$Salary = ifelse(is.na(dataset$Salary), - ave(dataset$Salary, FUN = function(x) mean(x, na.rm = TRUE)), - dataset$Salary) \ No newline at end of file diff --git a/Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression.zip b/Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression.zip deleted file mode 100644 index c0d35d229fbc625ac31204ed609df2327f187924..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 5501 zcmbVQWmr_}79L7QLE$!%2!tswkKPUl20A&w*cN=GW zOSqDaqot`U9A;_lYU$=?lJW6eAnTCc9qrRtC&sIQz+$kf8Wb033kY>6K~acJ z1~}&A2f5XMA@@9r6F6L1LP}Lb_n1n56piTTCzb#GH8hpKUi$~<{1x%PJBQ<6BC^B( zr=QGCz~oSeRNwiq+edaxueI6aGw0e*DAJcOpy^cT}IYFH+%T( zY4yABx0SkyH`Mw}M{oezS#H;>$%UUMa@oBPb%7-%Dv=fmjMq#hE#>ESDNZOFpg{~37OakcB8!dJ5aUuNe6Cg$m_I^KW%|ZLy8kBpI6=R?xQM@bN)!q)*qzo?K zzGRUAf5S^wNT;L@eWOqfG5DfnccV{Y!)v9(s=WS7%flzUr7|%ClP2qydR+UqOi&KB z+~k@fV^Vw{;!8)0qlZGy!1u|=Q?(XX?ku3|Ag7^BWuRc_)=WIN%OT%oc@Ze2W z=TBO?;6t)zTI_t(J)|X;4n=rRC`Rt-3p;BQV9?KfTQ0F0Yc8HI`Zin{mf?VPq_;3k zd~cp5Ud|vlNTPG9r;}x8uuseXtu$8-opnS$-GiB`E7w>n>ye558z0S=BatdfwcDkI zNwi>08f8u@Uq0@I8NqGaAdhqHIJc>@vX(cjn>L$pi1Tq(&6?_MugP4xJvab5=OD}x z7|X1yIQr5>J*N+A6nqZ1)L_9(Q1l3l z^a>~Fq1W>4HLy!ThGc2^94$o9S}k5Yc(K?WG|_D>&tHoSjT&RMJ^z9hR`C86|43>r z{6;meIDIWn_%?E}*4el4oi1iX^L5HfxP?%ChZPsfdRd6uy@}^s>JYIB;)BzdA zZgX`*`IvdR$#7-0xRcqX&^uNLQjF1hUvl0L_mStR1YQ4AIR}p)}&o&FoAxdT}hgj&8r=Nc>Cmb692t0pQ%H#dlIr$&5-)r@5 zmA4S0rX@~%}6qs zMFraTKkqTcI+^Ua6I%GOZ+|VX-M^ZGY{e%CTmpP8ZcBg6@j+*JerHWAk8K(Z8Qu45 zLmJwPZ+yxLjkS;nC!S3(d6>81nAd2-gMU+Tg6Cm^AJpke1%Mg8J4Er^tG$si$fg8H zE;p|b!(2J%w-KnN72ib7`rTz2uP8P5y23T4>#1=!;&Vnd$tR2Mv{D=BOz#PMk^wQul>Q{ ztl}T8BOy{=?SYTDn?38qAwv4OK)QS@edEfP$XEKeZoO%gmFtGctJvjOz#l=CGX)Zj z)bTUYSP{r~Alyn>Ji1oS%cPSSX#XX2KGRpm001DEC;f+SL4T@b37%cDEKJ=^;m)p> z&aO`8Xffqz4R^P6aJDyfw`6zrMprPjrmD#9IIdt0(W-WhocPUahoE#(o_k%(z4=9B zWXpUv3GZ?FKNd)OVoqtm=9O{>mKc$>bggGiR6%u{A{oTu^*~5^YB4TC_>D1P1Is(f zmme*GVplZw-|U-egU-rX@7>drX@1u;DjBSCb1pdhb@xg|Eiy z4hV^(ohVMTfvJLWV*V*7X8*;B0{_1gVLyF1^8AMngVdDKKCGS70Sbj;F)mM+KnVlN zI7du*kOfi-($=3xTVS|*JFz5$iX6gvK0c~z?W`l|v^7j&*CLwi4~Tt)WI`mhUi;5! z;45&mq+rL!JjrC?u%{(fS!tWf?g@9*;@5jGV?C>nI}A;@CziJ5ov6MU>r*l#n>G9@ z)y<*l3tnVXHgz#!L$MbX3HBpekU@J` zM@&=;#?E_B*|JwFeN{Qn+%0m9(xzIUq27<4%;Dg;VHFDH2 zYm>*llmV-L+p4B?iR3m}GFN!BB{cSjCGF$UibWfZH=l=A3PcnJWBOJl_g4fJ55$oj zL*sQZIS<+A6%*s4sr>C|54m~32H#U}JA+k&D;kYfXN;d{LV_^s47Qp-I(Ol>YTl*2 zs9~#8qSyMA3MaefYpS|Q6d$$W&9C=Ld!A|a62QZ{g=R@UeoAF1o1uwL7Km-V(P>5y8OdVQMNXzC^4{7l_S5fO2v-s^nh63B_qtMat05% z6?+;3!rDTi3kcPEEBQayynu&~m{GuMYdf0FG5VFRxb^Mq^B@{|(|`!0WZS0<>x5B6l^mi)*J z4Z~&%d##^L6i-Uyb^a-pm&?`?u)Ek=ON%uo)87HJ(Oy1N{?~JJ_n~Z4&m&0oj*D@X zh@d(HDhEuX3i9vBWYuCl6`A~J=YcaK^EeH3qgvz=vY{V=2~)NkgAmm&>EJV@f`QS5 z7iwqJ!YIs-S+7%#tflExc~jkgh^*Cr4c?p(ZsKv%?P%(0nck#mhrRUCgx9v zE(H-pC&`FcbX}TzK@7_f)xU3V+~9#hBc4p%&a9=UahS=xOZ6@7W!nD3$rXCskV<_Y zhY>S9-_?L>fTmGCYeC3HG@E;Vz8GNx@R6%E(g;K@uP2C=v~8dzeD zdC1R`a3-p}I@s?GAUtQZ?sZwu=%9Z-IkHxct)>4B{N^N^(3CQH;f77%t?XgsVDQ|* z!rC()O_t>HByLUQ18Fx~W2w~VNJQPxaXpY*h`AJt%1*La=s3W@1Y`ZLfe1b-j~!o- z6$$kBnH@Or*LdUy=Q06o!y1AmQ5PA>WHV}{@82NFi8P5zo5 zXz2n0KSu;-L7ZIRfkfO%h%;9Dcl6)eKiT(loZ9~9e~Er-81Yvoei%ZJ5l*UYmQ#j8 zP{;m^)&EUa1Ah$_PWlpU&}?ljsEg z5}hY^h!#aB3%I~3lSim?a>mBaGKtEKKP;jp(n*VGVQ?}rpSI|L3g0b?sa}J#`@KCods@@P1qyPN}@}|2b diff --git a/Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/Multiple_Linear_Regression/.DS_Store b/Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/Multiple_Linear_Regression/.DS_Store deleted file mode 100644 index 5008ddfcf53c02e82d7eee2e57c38e5672ef89f6..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 6148 zcmeH~Jr2S!425mzP>H1@V-^m;4Wg<&0T*E43hX&L&p$$qDprKhvt+--jT7}7np#A3 zem<@ulZcFPQ@L2!n>{z**++&mCkOWA81W14cNZlEfg7;MkzE(HCqgga^y>{tEnwC%0;vJ&^%eQ zLs35+`xjp>T0$Vqox1Ojhs@R)|o50+1L3ClDI}u^SMB_!U6R09PRZ;$Z`hAt6CfagYwM HE_8JOM2!ci diff --git a/Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/__MACOSX/Multiple_Linear_Regression/._50_Startups.csv b/Part 2 - Regression/Section 5 - Multiple Linear Regression/Multiple_Linear_Regression/__MACOSX/Multiple_Linear_Regression/._50_Startups.csv deleted file mode 100644 index be931daf95f3c13c53fc8494dfff9926ebd65bf7..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 576 zcmcJL%}&BV6oqeVj2ew$qiZ&@E1j19PzVtU7LgDWA^aE*kTQf`1aX>s4H!#kMV7tTrA0rEeQwUrWSXP|do&<~QQ4D~nKbIsLC2by zx0A?pr$}~6rmtT4zgJU>_w=8Q>$Os2}?jfA5WrUDY)lJth6l-2>f5r5)RZ%nGk&`Ma fSvN+hi6mRG%95rvRLL@QMY55jwGgs3&351ub@7Wo