diff --git a/intern-basics/EEG_Alcohol/EEG_ALCOHOLIC_AJAY.ipynb b/intern-basics/EEG_Alcohol/EEG_ALCOHOLIC_AJAY.ipynb
new file mode 100644
index 0000000..69e6bfb
--- /dev/null
+++ b/intern-basics/EEG_Alcohol/EEG_ALCOHOLIC_AJAY.ipynb
@@ -0,0 +1 @@
+{"cells":[{"metadata":{"_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","trusted":true},"cell_type":"code","source":"# This Python 3 environment comes with many helpful analytics libraries installed\n# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python\n# For example, here's several helpful packages to load\n\nimport numpy as np # linear algebra\nimport pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)\n\n# Input data files are available in the read-only \"../input/\" directory\n# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory\n\nimport os\nfor dirname, _, filenames in os.walk('/kaggle/input'):\n for filename in filenames:\n print(os.path.join(dirname, filename))\n\n# You can write up to 5GB to the current directory (/kaggle/working/) that gets preserved as output when you create a version using \"Save & Run All\" \n# You can also write temporary files to /kaggle/temp/, but they won't be saved outside of the current session","execution_count":null,"outputs":[]},{"metadata":{},"cell_type":"markdown","source":"****CODE START****"},{"metadata":{},"cell_type":"markdown","source":"Import necessary libraries"},{"metadata":{"_uuid":"d629ff2d2480ee46fbb7e2d37f6b5fab8052498a","_cell_guid":"79c7e3d0-c299-4dcb-8224-4455121ee9b0","trusted":true},"cell_type":"code","source":"import numpy as np\nimport pandas as pd \nimport os\nimport random\nfrom tqdm import tqdm\nimport matplotlib\nimport seaborn as sns\nimport matplotlib.pyplot as plt\nimport plotly.graph_objs as go\nfrom plotly.offline import init_notebook_mode, iplot\nfrom plotly import tools\nfrom scipy.stats import mannwhitneyu\n\ninit_notebook_mode(connected=True) ## plotly init\nseed = 123\nrandom.seed = seed","execution_count":1,"outputs":[{"output_type":"display_data","data":{"text/html":" \n 
"},"metadata":{}}]},{"metadata":{"trusted":true},"cell_type":"code","source":"filenames_list = os.listdir('../input/Alcoholics/SMNI_CMI_TRAIN/Train/')\n\nData = pd.DataFrame({})\n\nfor file_names in tqdm(filenames_list):\n temp_df = pd.read_csv('../input/Alcoholics/SMNI_CMI_TRAIN/Train/' + file_names)\n Data = Data.append(temp_df)\n","execution_count":2,"outputs":[{"output_type":"stream","text":"100%|██████████| 468/468 [11:27<00:00, 1.47s/it]\n","name":"stderr"}]},{"metadata":{"trusted":true},"cell_type":"code","source":"Data.head(100000)","execution_count":3,"outputs":[{"output_type":"execute_result","execution_count":3,"data":{"text/plain":" Unnamed: 0 trial number sensor position sample num sensor value \\\n0 5 34 FP1 0 2.360 \n1 6 34 FP1 1 2.848 \n2 7 34 FP1 2 1.383 \n3 8 34 FP1 3 -1.546 \n4 9 34 FP1 4 -3.499 \n... ... ... ... ... ... \n1691 1702 71 FZ 155 6.510 \n1692 1703 71 FZ 156 6.022 \n1693 1704 71 FZ 157 5.534 \n1694 1705 71 FZ 158 5.534 \n1695 1706 71 FZ 159 5.046 \n\n subject identifier matching condition channel name time \n0 c S1 obj 0 co2c0000337 0.000000 \n1 c S1 obj 0 co2c0000337 0.003906 \n2 c S1 obj 0 co2c0000337 0.007812 \n3 c S1 obj 0 co2c0000337 0.011719 \n4 c S1 obj 0 co2c0000337 0.015625 \n... ... ... ... ... ... \n1691 a S2 match 6 co2a0000368 0.605469 \n1692 a S2 match 6 co2a0000368 0.609375 \n1693 a S2 match 6 co2a0000368 0.613281 \n1694 a S2 match 6 co2a0000368 0.617188 \n1695 a S2 match 6 co2a0000368 0.621094 \n\n[100000 rows x 10 columns]","text/html":"
\n\n
\n \n
\n
\n
Unnamed: 0
\n
trial number
\n
sensor position
\n
sample num
\n
sensor value
\n
subject identifier
\n
matching condition
\n
channel
\n
name
\n
time
\n
\n \n \n
\n
0
\n
5
\n
34
\n
FP1
\n
0
\n
2.360
\n
c
\n
S1 obj
\n
0
\n
co2c0000337
\n
0.000000
\n
\n
\n
1
\n
6
\n
34
\n
FP1
\n
1
\n
2.848
\n
c
\n
S1 obj
\n
0
\n
co2c0000337
\n
0.003906
\n
\n
\n
2
\n
7
\n
34
\n
FP1
\n
2
\n
1.383
\n
c
\n
S1 obj
\n
0
\n
co2c0000337
\n
0.007812
\n
\n
\n
3
\n
8
\n
34
\n
FP1
\n
3
\n
-1.546
\n
c
\n
S1 obj
\n
0
\n
co2c0000337
\n
0.011719
\n
\n
\n
4
\n
9
\n
34
\n
FP1
\n
4
\n
-3.499
\n
c
\n
S1 obj
\n
0
\n
co2c0000337
\n
0.015625
\n
\n
\n
...
\n
...
\n
...
\n
...
\n
...
\n
...
\n
...
\n
...
\n
...
\n
...
\n
...
\n
\n
\n
1691
\n
1702
\n
71
\n
FZ
\n
155
\n
6.510
\n
a
\n
S2 match
\n
6
\n
co2a0000368
\n
0.605469
\n
\n
\n
1692
\n
1703
\n
71
\n
FZ
\n
156
\n
6.022
\n
a
\n
S2 match
\n
6
\n
co2a0000368
\n
0.609375
\n
\n
\n
1693
\n
1704
\n
71
\n
FZ
\n
157
\n
5.534
\n
a
\n
S2 match
\n
6
\n
co2a0000368
\n
0.613281
\n
\n
\n
1694
\n
1705
\n
71
\n
FZ
\n
158
\n
5.534
\n
a
\n
S2 match
\n
6
\n
co2a0000368
\n
0.617188
\n
\n
\n
1695
\n
1706
\n
71
\n
FZ
\n
159
\n
5.046
\n
a
\n
S2 match
\n
6
\n
co2a0000368
\n
0.621094
\n
\n \n
\n
100000 rows × 10 columns
\n
"},"metadata":{}}]},{"metadata":{},"cell_type":"markdown","source":"**DATA STRUCTURE DETAILS**"},{"metadata":{"trusted":true},"cell_type":"code","source":"print(Data.shape)\nprint(Data.dtypes)","execution_count":4,"outputs":[{"output_type":"stream","text":"(7667712, 10)\nUnnamed: 0 int64\ntrial number int64\nsensor position object\nsample num int64\nsensor value float64\nsubject identifier object\nmatching condition object\nchannel int64\nname object\ntime float64\ndtype: object\n","name":"stdout"}]},{"metadata":{},"cell_type":"markdown","source":"**DATA CLEAN CHECKING**"},{"metadata":{"trusted":true},"cell_type":"code","source":"for col in Data.columns:\n pct_missing = np.mean(Data[col].isnull())\n print('{} - {}%'.format(col, round(pct_missing*100)))","execution_count":5,"outputs":[{"output_type":"stream","text":"Unnamed: 0 - 0.0%\ntrial number - 0.0%\nsensor position - 0.0%\nsample num - 0.0%\nsensor value - 0.0%\nsubject identifier - 0.0%\nmatching condition - 0.0%\nchannel - 0.0%\nname - 0.0%\ntime - 0.0%\n","name":"stdout"}]},{"metadata":{},"cell_type":"markdown","source":"**Dropping necessary columns **"},{"metadata":{"trusted":true},"cell_type":"code","source":"Data=Data.drop(['Unnamed: 0','sensor position','name'],axis = 1) \n\n\n","execution_count":6,"outputs":[]},{"metadata":{"trusted":true},"cell_type":"code","source":"#Importing Data Visualization Libraries seaborn and matplotlib\nimport matplotlib.pyplot as plt\nimport seaborn as sns\nsns.violinplot(x=\"subject identifier\",y=\"sensor value\", hue=\"subject identifier\", data=Data[:1000],color='green'); #Selecting only first 500 columns from Dataset\nplt.show()","execution_count":7,"outputs":[{"output_type":"display_data","data":{"text/plain":"
","image/png":"\n"},"metadata":{"needs_background":"light"}}]},{"metadata":{},"cell_type":"markdown","source":"# Plotting Pairwise Data Relationship"},{"metadata":{"trusted":true},"cell_type":"code","source":"Data_sample = Data[0:100]\n#Data_sample = Data_sample.drop(['trial number'],axis=1)\nData_sample.head()","execution_count":11,"outputs":[{"output_type":"execute_result","execution_count":11,"data":{"text/plain":" trial number sample num sensor value subject identifier \\\n0 34 0 2.360 c \n1 34 1 2.848 c \n2 34 2 1.383 c \n3 34 3 -1.546 c \n4 34 4 -3.499 c \n\n matching condition channel time \n0 S1 obj 0 0.000000 \n1 S1 obj 0 0.003906 \n2 S1 obj 0 0.007812 \n3 S1 obj 0 0.011719 \n4 S1 obj 0 0.015625 ","text/html":"
\n\n
\n \n
\n
\n
trial number
\n
sample num
\n
sensor value
\n
subject identifier
\n
matching condition
\n
channel
\n
time
\n
\n \n \n
\n
0
\n
34
\n
0
\n
2.360
\n
c
\n
S1 obj
\n
0
\n
0.000000
\n
\n
\n
1
\n
34
\n
1
\n
2.848
\n
c
\n
S1 obj
\n
0
\n
0.003906
\n
\n
\n
2
\n
34
\n
2
\n
1.383
\n
c
\n
S1 obj
\n
0
\n
0.007812
\n
\n
\n
3
\n
34
\n
3
\n
-1.546
\n
c
\n
S1 obj
\n
0
\n
0.011719
\n
\n
\n
4
\n
34
\n
4
\n
-3.499
\n
c
\n
S1 obj
\n
0
\n
0.015625
\n
\n \n
\n
"},"metadata":{}}]},{"metadata":{},"cell_type":"markdown","source":"**These graph shows plots of all the selected attributes against each other**"},{"metadata":{"trusted":true},"cell_type":"code","source":"g = sns.PairGrid(Data_sample)\ng.map(plt.scatter ,color=\"orange\")","execution_count":12,"outputs":[{"output_type":"execute_result","execution_count":12,"data":{"text/plain":""},"metadata":{}},{"output_type":"display_data","data":{"text/plain":"
"},"metadata":{}}]},{"metadata":{},"cell_type":"markdown","source":"# Selection of data and target"},{"metadata":{"trusted":true},"cell_type":"code","source":"x= Data.iloc[:, Data.columns != 'subject identifier']\ny= Data.iloc[:, 3]\n# In the above code x represent data and y represent target","execution_count":21,"outputs":[]},{"metadata":{"trusted":true},"cell_type":"code","source":"#import the necessary module to train-test split\n\nfrom sklearn.model_selection import train_test_split\nx_train,x_test,y_train,y_test=train_test_split(x,y,test_size=0.25)\nprint(\"Shape of data training set {}\".format(x_train.shape)) \nprint(\"Shape of data test set {}\".format(x_test.shape)) \nprint(\"Shape of target training set {}\".format(y_train.shape)) \nprint(\"Shape of target test set {}\".format(y_train.shape)) \n","execution_count":22,"outputs":[{"output_type":"stream","text":"Shape of data training set (5750784, 6)\nShape of data test set (1916928, 6)\nShape of target training set (5750784,)\nShape of target test set (5750784,)\n","name":"stdout"}]},{"metadata":{},"cell_type":"markdown","source":"# Various machine learning algorithms"},{"metadata":{},"cell_type":"markdown","source":"1. 
**Logistic Regression**"},{"metadata":{"trusted":true},"cell_type":"code","source":"from sklearn.linear_model import LogisticRegression\nfrom sklearn.metrics import accuracy_score\nfrom sklearn.metrics import confusion_matrix\nlogmodel=LogisticRegression()\nlogmodel.fit(x_train,y_train)\ny_pred=logmodel.predict(x_test)\nprint(y_pred)\n\n\n\n#print the accuracy score\nprint(\"Logistic Regression Accuracy\",accuracy_score(y_test,y_pred,normalize = True))\n\n\n#code for confusion matrix\nconfusion_matrix(y_test,y_pred)\n\n#from yellowbrick.classifier import ClassificationReport\nfrom yellowbrick.classifier import ClassificationReport\n# Instantiate the classification model and visualizer\nvisualizer = ClassificationReport(logmodel, classes=['0','1'])\nvisualizer.fit(x_train, y_train) # Fit the training data to the visualizer\nvisualizer.score(x_test, y_test) # Evaluate the model on the test data\ng = visualizer.poof() # Draw/show/poof the data\n\n\n","execution_count":27,"outputs":[{"output_type":"stream","text":"[0 1 0 ... 1 0 1]\nLogistic Regression Accuracy 0.5578634147970085\n","name":"stdout"},{"output_type":"stream","text":"/opt/conda/lib/python3.7/site-packages/sklearn/base.py:213: FutureWarning:\n\nFrom version 0.24, get_params will raise an AttributeError if a parameter cannot be retrieved as an instance attribute. 
Previously it would return None.\n\n","name":"stderr"},{"output_type":"display_data","data":{"text/plain":"","image/png":"\n"},"metadata":{}}]},{"metadata":{},"cell_type":"markdown","source":"**2.K-Nearest Neighbors**\n\n\nK nearest neighbors is a simple algorithm that stores all available cases and classifies new cases based on a similarity measure "},{"metadata":{"trusted":true},"cell_type":"code","source":"#import the necessary module\nfrom sklearn.neighbors import KNeighborsClassifier\nfrom sklearn.metrics import accuracy_score\nfrom sklearn.metrics import confusion_matrix\n\nlogmodel=KNeighborsClassifier()\nlogmodel.fit(x_train,y_train)\ny_pred=logmodel.predict(x_test)\nprint(y_pred)\n\n\n\n\n#print the accuracy score\nprint(\"K-Nearest Neighbors Accuracy\",accuracy_score(y_test,y_pred,normalize = True))\n\n\n#code for confusion matrix\nconfusion_matrix(y_test,y_pred)\n\nfrom yellowbrick.classifier import ClassificationReport\n# Instantiate the classification model and visualizer\nvisualizer = ClassificationReport(logmodel, classes=['0','1'])\nvisualizer.fit(x_train, y_train) # Fit the training data to the visualizer\nvisualizer.score(x_test, y_test) # Evaluate the model on the test data\ng = visualizer.poof() # Draw/show/poof the data\n\n\n\n","execution_count":28,"outputs":[{"output_type":"stream","text":"[0 0 0 ... 0 0 0]\nK-Nearest Neighbors Accuracy 0.6680809086204594\n","name":"stdout"},{"output_type":"stream","text":"/opt/conda/lib/python3.7/site-packages/sklearn/base.py:213: FutureWarning:\n\nFrom version 0.24, get_params will raise an AttributeError if a parameter cannot be retrieved as an instance attribute. 
Previously it would return None.\n\n","name":"stderr"},{"output_type":"display_data","data":{"text/plain":"","image/png":"\n"},"metadata":{}}]},{"metadata":{},"cell_type":"markdown","source":"**3.Naive Bayes**\n\nNaive-Bayes algorithm calculates the probability of the connection of a feature with a target variable and then it selects the feature with the highest probability."},{"metadata":{"trusted":true},"cell_type":"code","source":"#import the necessary module\nfrom sklearn.naive_bayes import GaussianNB\nfrom sklearn.metrics import accuracy_score\nfrom sklearn.metrics import confusion_matrix\n#Create an object of GaussianNB\ngnb = GaussianNB()\n#train the algorithm on taining data and predict using the testing data\n#Fitting the data\ngnb.fit(x_train,y_train)\n#prediction \ny_pred = gnb.predict(x_test)\nprint(y_pred)\n\n#print the accuracy score\nprint(\"Naive Bayes Accuracy \",accuracy_score(y_test,y_pred,normalize = True))\n\n#Confusion Matrix\nprint(confusion_matrix(y_test,y_pred))\n\n\n\nfrom yellowbrick.classifier import ClassificationReport\n# Instantiate the classification model and visualizer\nvisualizer = ClassificationReport(gnb, classes=['0','1'])\nvisualizer.fit(x_train, y_train) # Fit the training data to the visualizer\nvisualizer.score(x_test, y_test) # Evaluate the model on the test data\ng = visualizer.poof() # Draw/show/poof the data\n","execution_count":24,"outputs":[{"output_type":"stream","text":"[0 1 0 ... 1 0 1]\nNaive Bayes Accuracy 0.5545774280515492\n[[773747 189017]\n [664826 289338]]\n","name":"stdout"},{"output_type":"stream","text":"/opt/conda/lib/python3.7/site-packages/sklearn/utils/deprecation.py:143: FutureWarning:\n\nThe sklearn.metrics.classification module is deprecated in version 0.22 and will be removed in version 0.24. The corresponding classes / functions should instead be imported from sklearn.metrics. 
Anything that cannot be imported from sklearn.metrics is now part of the private API.\n\n/opt/conda/lib/python3.7/site-packages/sklearn/base.py:213: FutureWarning:\n\nFrom version 0.24, get_params will raise an AttributeError if a parameter cannot be retrieved as an instance attribute. Previously it would return None.\n\n","name":"stderr"},{"output_type":"display_data","data":{"text/plain":"","image/png":"\n"},"metadata":{}}]},{"metadata":{"trusted":true},"cell_type":"code","source":"","execution_count":null,"outputs":[]},{"metadata":{},"cell_type":"markdown","source":"**4.Decision Tree**\n\nDecision tree algorithm falls under the category of supervised learning. They can be used to solve both regression and classification problems."},{"metadata":{"trusted":true},"cell_type":"code","source":"#import the necessary module\nfrom sklearn.tree import DecisionTreeClassifier\nfrom sklearn.metrics import accuracy_score\nfrom sklearn.metrics import confusion_matrix\n#Create an object of GaussianNB\ndec_tree = DecisionTreeClassifier(criterion=\"entropy\", max_depth=5)\n#train the algorithm on taining data and predict using the testing data\n#Fitting the data\ndec_tree.fit(x_train,y_train)\n#prediction \npred = dec_tree.predict(x_test)\nprint(pred)\n\n\n\n\n\n#print the accuracy score\nprint(\"Decision Tree Accuracy \",accuracy_score(y_test,pred,normalize = True))\n\n#Confusion Matrix\nprint(confusion_matrix(y_test,pred))\n\n\n\n\n\nfrom yellowbrick.classifier import ClassificationReport\n# Instantiate the classification model and visualizer\nvisualizer = ClassificationReport(dec_tree, classes=['0','1'])\nvisualizer.fit(x_train, y_train) # Fit the training data to the visualizer\nvisualizer.score(x_test, y_test) # Evaluate the model on the test data\ng = visualizer.poof() # Draw/show/poof the data\n\n\n\n\nfrom sklearn import tree\ntree.plot_tree(dec_tree)","execution_count":25,"outputs":[{"output_type":"stream","text":"[0 1 0 ... 
0 1 1]\nDecision Tree Accuracy 0.5911599183693911\n[[781566 181198]\n [602519 351645]]\n","name":"stdout"},{"output_type":"stream","text":"/opt/conda/lib/python3.7/site-packages/sklearn/base.py:213: FutureWarning:\n\nFrom version 0.24, get_params will raise an AttributeError if a parameter cannot be retrieved as an instance attribute. Previously it would return None.\n\n","name":"stderr"},{"output_type":"display_data","data":{"text/plain":"","image/png":"\n"},"metadata":{}},{"output_type":"execute_result","execution_count":25,"data":{"text/plain":"[Text(269.7, 274.065, 'X[0] <= 72.0\\nentropy = 1.0\\nsamples = 5750784\\nvalue = [2887476, 2863308]'),\n Text(251.09999999999997, 224.235, 'X[0] <= 52.0\\nentropy = 0.999\\nsamples = 5578801\\nvalue = [2887476, 2691325]'),\n Text(148.79999999999998, 174.405, 'X[2] <= 6.302\\nentropy = 0.998\\nsamples = 5222385\\nvalue = [2764524, 2457861]'),\n Text(74.39999999999999, 124.57499999999999, 'X[3] <= 0.5\\nentropy = 0.995\\nsamples = 4587657\\nvalue = [2488869, 2098788]'),\n Text(37.199999999999996, 74.745, 'X[0] <= 29.0\\nentropy = 1.0\\nsamples = 1644852\\nvalue = [841369, 803483]'),\n Text(18.599999999999998, 24.914999999999964, 'entropy = 0.995\\nsamples = 1556751\\nvalue = [841369, 715382]'),\n Text(55.8, 24.914999999999964, 'entropy = 0.0\\nsamples = 88101\\nvalue = [0, 88101]'),\n Text(111.6, 74.745, 'X[0] <= 8.0\\nentropy = 0.99\\nsamples = 2942805\\nvalue = [1647500, 1295305]'),\n Text(92.99999999999999, 24.914999999999964, 'entropy = 0.994\\nsamples = 393266\\nvalue = [179283, 213983]'),\n Text(130.2, 24.914999999999964, 'entropy = 0.983\\nsamples = 2549539\\nvalue = [1468217, 1081322]'),\n Text(223.2, 124.57499999999999, 'X[0] <= 29.5\\nentropy = 0.988\\nsamples = 634728\\nvalue = [275655, 359073]'),\n Text(185.99999999999997, 74.745, 'X[0] <= 5.5\\nentropy = 0.994\\nsamples = 485547\\nvalue = [220977, 264570]'),\n Text(167.39999999999998, 24.914999999999964, 'entropy = 0.964\\nsamples = 109714\\nvalue = [42635, 
67079]'),\n Text(204.59999999999997, 24.914999999999964, 'entropy = 0.998\\nsamples = 375833\\nvalue = [178342, 197491]'),\n Text(260.4, 74.745, 'X[3] <= 0.5\\nentropy = 0.948\\nsamples = 149181\\nvalue = [54678, 94503]'),\n Text(241.79999999999998, 24.914999999999964, 'entropy = 0.0\\nsamples = 22281\\nvalue = [0, 22281]'),\n Text(278.99999999999994, 24.914999999999964, 'entropy = 0.986\\nsamples = 126900\\nvalue = [54678, 72222]'),\n Text(353.4, 174.405, 'X[0] <= 54.0\\nentropy = 0.929\\nsamples = 356416\\nvalue = [122952, 233464]'),\n Text(334.79999999999995, 124.57499999999999, 'entropy = 0.0\\nsamples = 49149\\nvalue = [0, 49149]'),\n Text(371.99999999999994, 124.57499999999999, 'X[0] <= 62.0\\nentropy = 0.971\\nsamples = 307267\\nvalue = [122952, 184315]'),\n Text(334.79999999999995, 74.745, 'X[0] <= 58.0\\nentropy = 0.996\\nsamples = 159961\\nvalue = [86183, 73778]'),\n Text(316.2, 24.914999999999964, 'entropy = 0.991\\nsamples = 110691\\nvalue = [49234, 61457]'),\n Text(353.4, 24.914999999999964, 'entropy = 0.811\\nsamples = 49270\\nvalue = [36949, 12321]'),\n Text(409.19999999999993, 74.745, 'X[3] <= 1.5\\nentropy = 0.811\\nsamples = 147306\\nvalue = [36769, 110537]'),\n Text(390.59999999999997, 24.914999999999964, 'entropy = 0.881\\nsamples = 122623\\nvalue = [36769, 85854]'),\n Text(427.79999999999995, 24.914999999999964, 'entropy = 0.0\\nsamples = 24683\\nvalue = [0, 24683]'),\n Text(288.29999999999995, 224.235, 'entropy = 0.0\\nsamples = 171983\\nvalue = [0, 171983]')]"},"metadata":{}},{"output_type":"display_data","data":{"text/plain":"","image/png":"\n"},"metadata":{}}]},{"metadata":{},"cell_type":"markdown","source":"**5.Random Forest**\n\nRandom forest, like its name implies, consists of a large number of individual decision trees that operate as an ensemble. 
Each individual tree in the random forest spits out a class prediction and the class with the most votes becomes our model’s prediction "},{"metadata":{"trusted":true},"cell_type":"code","source":"from sklearn.ensemble import RandomForestClassifier\nfrom sklearn.metrics import accuracy_score\nfrom sklearn.metrics import confusion_matrix\n#Create an object of GaussianNB\nrandom_forest = RandomForestClassifier(criterion=\"entropy\", max_depth=3)\n#train the algorithm on taining data and predict using the testing data\n#Fitting the data\nrandom_forest.fit(x_train,y_train)\n#prediction \npred = random_forest.predict(x_test)\nprint(pred)\n\n\n\n\n\n\n#print the accuracy score\nprint(\"Random Forest Accuracy \",accuracy_score(y_test,pred,normalize = True))\n\n\n\n\n\n#Confusion Matrix\nprint(confusion_matrix(y_test,pred))\n\nfrom yellowbrick.classifier import ClassificationReport\n# Instantiate the classification model and visualizer\nvisualizer = ClassificationReport(random_forest, classes=['0','1'])\nvisualizer.fit(x_train, y_train) # Fit the training data to the visualizer\nvisualizer.score(x_test, y_test) # Evaluate the model on the test data","execution_count":26,"outputs":[{"output_type":"stream","text":"[0 1 0 ... 1 0 1]\nRandom Forest Accuracy 0.5812717013888888\n[[829532 133232]\n [669440 284724]]\n","name":"stdout"},{"output_type":"stream","text":"/opt/conda/lib/python3.7/site-packages/sklearn/base.py:213: FutureWarning:\n\nFrom version 0.24, get_params will raise an AttributeError if a parameter cannot be retrieved as an instance attribute. 
Previously it would return None.\n\n","name":"stderr"},{"output_type":"execute_result","execution_count":26,"data":{"text/plain":"0.5812717013888888"},"metadata":{}},{"output_type":"display_data","data":{"text/plain":"","image/png":"\n"},"metadata":{}}]}],"metadata":{"kernelspec":{"name":"python3","display_name":"Python 3","language":"python"},"language_info":{"name":"python","version":"3.7.6","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"}},"nbformat":4,"nbformat_minor":4}
\ No newline at end of file
diff --git a/intern-basics/EEG_Alcohol/EEG_Alcohol.md b/intern-basics/EEG_Alcohol/EEG_Alcohol.md
new file mode 100644
index 0000000..2575bb1
--- /dev/null
+++ b/intern-basics/EEG_Alcohol/EEG_Alcohol.md
@@ -0,0 +1,51 @@
+# EEG-Alcohol
+
+# Data Set Information:
+This data arises from a large study to examine EEG correlates of genetic predisposition to alcoholism. It contains measurements from 64 electrodes placed on the subjects' scalps, which were sampled at 256 Hz (3.9-msec epoch) for 1 second.
+
+There were two groups of subjects: alcoholic and control. Each subject was exposed to either a single stimulus (S1) or to two stimuli (S1 and S2) which were pictures of objects chosen from the 1980 Snodgrass and Vanderwart picture set. When two stimuli were shown, they were presented in either a matched condition where S1 was identical to S2 or in a non-matched condition where S1 differed from S2.
+
+# Attribute Information
+
+Each trial is stored in its own file and will appear in the following format.
+
+| trial number | sensor position | sample num | sensor value | subject identifier | matching condition | channel | name | time |
+|---|---|---|---|---|---|---|---|---|
+| 0 | FP1 | 0 | -8.921 | a | S1 obj | 0 | co2a0000364 | 0 |
+| 0 | AF8 | 87 | 4.14 | a | S1 obj | 33 | co2a0000364 | 0.33 |
+
+
+The columns of data are:
+
+**the trial number**,
+
+**sensor position**,
+
+**sample number** (0-255),
+
+**sensor value** (in micro volts),
+
+**subject identifier** (alcoholic (a) or control (c)),
+
+**matching condition** (a single object shown (S1 obj), object 2 shown in a matching condition (S2 match), and object 2 shown in a non-matching condition (S2 nomatch)),
+
+**channel number** (0-63),
+
+**name** (a serial code assigned to each subject),
+
+**time** (time of the sample in seconds, i.e. sample num / 256 at the 256 Hz sampling rate)
+
+# Working
+**Subject Identifier** is the label of the data. The dataset was split in a 75-25 ratio using `train_test_split`.
+I used 5 algorithms on the dataset and compared their accuracies:
+- **Logistic Regression** 55.79%
+- **Naive Bayes** 55.46%
+- **K-Nearest Neighbors** 66.81%
+- **Decision Tree** 59.12%
+- **Random Forest** 58.13%
+
+We also used a confusion matrix to evaluate the performance of each algorithm.
+Since K-Nearest Neighbors has the highest accuracy, we will use K-Nearest Neighbors on our data.
+
+
+# Dataset Link - https://www.kaggle.com/nnair25/Alcoholics