Update the grammar and syntax and fix typos (#23)

SirSpidey · stevemart · commit f08d7bf2e902 · 2018-10-12T14:24:13.000-04:00
cc @zmohammad01
diff --git a/tools/getdata.ipynb b/tools/getdata.ipynb
@@ -38,19 +38,19 @@
     "import numpy as np\n",
     "from github import GithubException\n",
     "\n",
-    "#create GitHub Personal access token here https://github.com/settings/tokens\n",
+    "#Create a GitHub personal access token at https://github.com/settings/tokens\n",
     "login = 'YOURLOGIN'\n",
     "token = 'YOURTOKEN'\n",
     "\n",
     "g = github.Github(login, token)\n",
     "repos = []\n",
     "org = g.get_organization('IBM')\n",
     "\n",
-    "#we are only going to look at code with the following extensions, trying changing for other\n",
-    "#programming langauges and for binary classificition (2, not 8, classes)\n",
+    "#We'll look only at code with the following extensions. You can try this with other\n",
+    "#programming languages and for binary classification (2, not 8, classes).\n",
     "targetlangs = ['.go','.java','.js','.m','.py','.sh','.swift','.xml']\n",
     "\n",
-    "#get the list of repos at https://github.com/IBM\n",
+    "#Get the list of repos at https://github.com/IBM.\n",
     "for repo in g.get_organization('IBM').get_repos():\n",
     "    repos.append(repo.name)"
    ]
@@ -536,9 +536,9 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "### Splitting the code into training/testing set.\n",
-    "Here the length of the dataset and it contents can be seen.\n",
-    "Pickle the training/testing sets for the next notebook (mine are included in the github)"
+    "### Split the code into a training and a testing set.\n",
+    "You can see the length of the dataset and its contents.\n",
+    "Pickle the training and testing sets for the next notebook (mine are included in the GitHub repository)."
    ]
   },
   {