# VA ONLINE MEMORIAL - DATA IMPORT & SYNC

## Dependencies
- [Nodejs](https://nodejs.org/en/)
- [PostgreSQL](https://www.postgresql.org/)
- [eslint](http://eslint.org/)

## Configuration
- Edit the configuration in `config/default.json` and the custom environment variable names in `config/custom-environment-variables.json`.
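
This file layout (`config/default.json` plus `config/custom-environment-variables.json`) follows the convention of the [node-config](https://github.com/lorenwest/node-config) module, so settings are presumably read like the minimal sketch below. The key names (`dbConfig.db_url`, `downloadPath`) are illustrative assumptions, not the app's actual schema:

```js
// Hedged sketch: reading settings via node-config.
// Key names below are assumptions for illustration only.
const config = require('config');

const dbUrl = config.get('dbConfig.db_url');     // e.g. a PostgreSQL connection string
const downloadPath = config.get('downloadPath'); // directory for downloaded datasets
console.log(`DB: ${dbUrl}, downloads: ${downloadPath}`);
```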

## Application constants

- Application constants can be configured in `./constants.js`
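
A minimal sketch of what such a constants module might export; the names and values here are purely illustrative assumptions:

```js
// Hypothetical sketch of ./constants.js — names and values are
// illustrative, not the app's real constants.
module.exports = {
  DOWNLOAD_CONCURRENCY: 2,        // parallel dataset downloads
  BATCH_SIZE: 1000,               // rows per bulk insert
  DATASET_FILE_EXTENSION: '.csv', // expected dataset file type
};
```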

## Available tools

- Since the data to download and process is huge, it is better (and safer) to use two separate tools instead of a single script, so that if something goes wrong during processing the damage is contained to that step.

### Download datasets

- Run `npm run download-data` to download all available datasets.
- The datasets will be stored in the configured directory.
- Old data will be replaced.
- This operation does not affect the database.
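
Conceptually, this step is a stream-to-disk loop. A minimal sketch under assumed names (`downloadDataset` is hypothetical; the real tool takes its dataset URLs and target directory from the configuration):

```js
// Hedged sketch: stream one dataset into the configured directory,
// overwriting any previous copy. Names are illustrative.
const fs = require('fs');
const path = require('path');
const https = require('https');

function downloadDataset(url, dir) {
  return new Promise((resolve, reject) => {
    const dest = path.join(dir, path.basename(url));
    const file = fs.createWriteStream(dest); // truncates, so old data is replaced
    https.get(url, (res) => {
      res.pipe(file);
      file.on('finish', () => file.close(() => resolve(dest)));
    }).on('error', reject);
  });
}
```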

### Import data from downloaded files

- Run `npm run import-data` to import all data using the downloaded files from the previous step.
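
Conceptually, the import step parses each CSV file and inserts its rows into PostgreSQL. A minimal sketch assuming the `pg` and `csv-parse` packages and an illustrative table/column layout (the real schema may differ):

```js
// Hedged sketch: load one downloaded CSV into PostgreSQL row by row.
// Table and column names are assumptions for illustration only.
const fs = require('fs');
const { parse } = require('csv-parse');
const { Client } = require('pg');

async function importFile(file) {
  const client = new Client(); // connection settings from PG* env vars
  await client.connect();
  const parser = fs.createReadStream(file).pipe(parse({ columns: true }));
  for await (const row of parser) {
    await client.query(
      'INSERT INTO burials (first_name, last_name) VALUES ($1, $2)',
      [row.d_first_name, row.d_last_name]
    );
  }
  await client.end();
}
```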

## Local Deployment

*Before starting the application, make sure that PostgreSQL is running and that you have configured everything correctly in `config/default.json`.*

- Install dependencies: `npm i`
- Run the lint check: `npm run lint`
- Start the app: `npm start`. This will run all tools in the following sequence:

`npm run download-data` => `npm run import-data`
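
A sketch of how `npm start` might chain the two tools (purely illustrative; the actual wiring lives in `package.json` and the app's entry point):

```js
// Hedged sketch: run the two tools in order, aborting if a step fails.
const { execSync } = require('child_process');

for (const script of ['download-data', 'import-data']) {
  execSync(`npm run ${script}`, { stdio: 'inherit' }); // throws on non-zero exit
}
```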

*The application will print progress information and the results in the terminal.*

## Verification

- To verify that the data has been imported, you can use the [pgAdmin](https://www.pgadmin.org/) tool and browse the database.
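
Alternatively, a quick row count from Node (the table name below is an assumption; substitute whatever tables the import actually creates):

```js
// Hedged sketch: count rows in one imported table via the pg client.
const { Client } = require('pg');

(async () => {
  const client = new Client(); // connection settings from PG* env vars
  await client.connect();
  const { rows } = await client.query('SELECT COUNT(*) AS n FROM burials');
  console.log(`imported rows: ${rows[0].n}`);
  await client.end();
})();
```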

## Notes

- The total size of all datasets is > 1.5GB, so the operation will take quite some time to finish, depending on your internet connection.
- `--max-old-space-size` has been set to *4096MB* so that such huge data files can be parsed/processed without any issues. The app frees the memory right after using the data to prevent memory/heap leaks.
- The dataset for `FOREIGN ADDRESSES` has no header row in its CSV file and a slightly different format (an extra column). The app handles all datasets without any issue (see the sketch below).
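
One way a headerless CSV with an extra column can be handled is by supplying the column names explicitly to the parser. A sketch with assumed file and column names (the real ones may differ):

```js
// Hedged sketch: parse the headerless FOREIGN ADDRESSES file by naming
// the columns up front. File and column names are illustrative assumptions.
const fs = require('fs');
const { parse } = require('csv-parse');

const parser = fs.createReadStream('foreign_addresses.csv').pipe(
  parse({
    // 'country' stands in for the extra column this dataset carries
    columns: ['first_name', 'last_name', 'cemetery', 'foreign_address', 'country'],
  })
);

parser.on('data', (row) => console.log(row.country));
```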