|
38 | 38 | "import numpy as np\n",
|
39 | 39 | "from github import GithubException\n",
|
40 | 40 | "\n",
|
41 |
| - "#create GitHub Personal access token here https://github.com/settings/tokens\n", |
| 41 | + "#Create a GitHub personal access token at https://github.com/settings/tokens\n", |
42 | 42 | "login = 'YOURLOGIN'\n",
|
43 | 43 | "token = 'YOURTOKEN'\n",
|
44 | 44 | "\n",
|
45 | 45 | "g = github.Github(login, token)\n",
|
46 | 46 | "repos = []\n",
|
47 | 47 | "org = g.get_organization('IBM')\n",
|
48 | 48 | "\n",
|
49 |
| - "#we are only going to look at code with the following extensions, trying changing for other\n", |
50 |
| - "#programming langauges and for binary classificition (2, not 8, classes)\n", |
| 49 | + "#We'll look only at code with the following extensions. You can try this with other\n", |
| 50 | + "#programming languages and for binary classification (2, not 8, classes).\n", |
51 | 51 | "targetlangs = ['.go','.java','.js','.m','.py','.sh','.swift','.xml']\n",
|
52 | 52 | "\n",
|
53 |
| - "#get the list of repos at https://github.com/IBM\n", |
| 53 | + "#Get the list of repos at https://github.com/IBM.\n", |
54 | 54 | "for repo in g.get_organization('IBM').get_repos():\n",
|
55 | 55 | " repos.append(repo.name)"
|
56 | 56 | ]
|
|
536 | 536 | "cell_type": "markdown",
|
537 | 537 | "metadata": {},
|
538 | 538 | "source": [
|
539 |
| - "### Splitting the code into training/testing set.\n", |
540 |
| - "Here the length of the dataset and it contents can be seen.\n", |
541 |
| - "Pickle the training/testing sets for the next notebook (mine are included in the github)" |
| 539 | + "### Split the code into a training and a testing set.\n", |
| 540 | + "You can see the length of the dataset and its contents.\n", |
| 541 | + "Pickle the training and testing sets for the next notebook (mine are included in the GitHub repository)." |
542 | 542 | ]
|
543 | 543 | },
|
544 | 544 | {
|
|
0 commit comments