Commit 7f9bf54

Upd fimp and index

1 parent ce546d8

7 files changed: +407 -166 lines

index.html (+45 -27)
@@ -10,17 +10,18 @@
   <link rel="icon" type="image/png" href="https://statsim.com/app/images/favicon-16x16.png" sizes="16x16">
   <style>
     a { color: #3030B7 }
+    .logo { width: 75px; padding: 0; margin: 8px 0 0 0}
     .btn, .port-btn { background: #3030B7 }
     .btn:hover, .port-btn:hover { background: #21218B }
     .file-field .btn { background: #BBB }
     .file-field .btn:hover { background: #AAA }
-    .status-bar { background: #f5f5f5 }
+    .grey-bar { background: #f5f5f5 }
     .spinner-green, .spinner-green-only { border-color: #3030B7 }
   </style>
 </head>
 <body>
 
-  <div class="status-bar">
+  <div class="grey-bar">
     <div class="container">
       <div class="row">
         <div class="col s11" style="font-size: 14px;">
@@ -36,28 +37,31 @@
   <div class="container">
     <div class="row">
       <div class="col m12">
-        <h4>Visualize high-dimensional data</h4>
-        <p>Feature extraction is the process of reducing the number of variables (columns) in a dataset by obtaining a smaller representative set of variables using various methods of dimensionality reduction (<a href="https://en.wikipedia.org/wiki/Dimensionality_reduction">Wiki</a>). Try dimensionality reduction methods in the browser using Vis, a 100% free open-source tool for feature extraction and visualization.</p>
-        <p>Currently supported methods: <i>PCA, t-SNE, UMAP, SOM, Autoencoder</i></p>
+        <img src="vis.png" class="logo" alt="StatSim.Vis">
       </div>
     </div>
     <div class="row">
       <div id="port-container"></div>
     </div>
-    <div class="row">
-      <div class="col m12">
-        <small>
-          All processing and visualization happens in your browser. We don't see, collect or sell data you explore <br>
-          Based on <a href="https://github.com/statsim/port">port</a> and some awesome npm packages:
-          <a href="https://www.npmjs.com/package/ml-js">ml-js</a>,
-          <a href="https://www.npmjs.com/package/tsne">tsne</a>,
-          <a href="https://www.npmjs.com/package/umap-js">umap-js</a>,
-          <a href="https://www.npmjs.com/package/plotly.js">plotly.js</a> and <a href="https://github.com/statsim/vis/blob/master/package.json">other</a>
-        </small>
-        <p>
-          <a class="github-button" href="https://github.com/statsim/vis" data-icon="octicon-star" data-show-count="true" aria-label="Star statsim/vis on GitHub">Star</a>
-          <a class="github-button" href="https://github.com/statsim/vis/issues" data-icon="octicon-issue-opened" data-show-count="true" aria-label="Issue statsim/vis on GitHub">Issue</a>
-        </p>
+  </div>
+  <div class="grey-bar">
+    <div class="container">
+      <div class="row">
+        <div class="col m12">
+          <h4>Visualize high-dimensional data online</h4>
+          <p>
+            Feature extraction is the process of reducing the number of variables (columns) in a dataset by obtaining a smaller representative set of variables using various methods of dimensionality reduction (<a href="https://en.wikipedia.org/wiki/Dimensionality_reduction">Wiki</a>). Try dimensionality reduction methods in the browser using Vis, a 100% free open-source tool for feature extraction and visualization.
+            Supported methods: <i>PCA, t-SNE, UMAP, SOM, Autoencoder</i>
+          </p>
+
+          <small>
+            All processing and visualization happens in your browser. We don't see, collect or sell data you explore <br>
+          </small>
+          <p>
+            <a class="github-button" href="https://github.com/statsim/vis" data-icon="octicon-star" data-show-count="true" aria-label="Star statsim/vis on GitHub">Star</a>
+            <a class="github-button" href="https://github.com/statsim/vis/issues" data-icon="octicon-issue-opened" data-show-count="true" aria-label="Issue statsim/vis on GitHub">Issue</a>
+          </p>
+        </div>
       </div>
     </div>
   </div>
@@ -87,18 +91,32 @@ <h4>Visualize high-dimensional data</h4>
   },
   "inputs": [
     { "type": "file", "name": "File", "reactive": true },
-    { "type": "select", "name": "Dimensions", "options": [2, 3], "default": 2},
-    { "type": "select", "name": "Target variable" },
-    { "type": "select", "name": "Transform", "options": ['None', 'Scale', 'Log'], "default": 'None' },
-    { "type": "select", "name": "Method", "options": ['PCA', 'SOM', 't-SNE', 'UMAP', 'Autoencoder'], "default": "PCA", "onchange": (value) => {
-      if (value === 'PCA') {
-        return {'Steps': {'className': 'hidden'}}
+    { "type": "select", "name": "Target variable", "options": ['None'], "default": 'None' },
+    { "type": "select", "name": "Projection method", "options": ['None', 'PCA', 'SOM', 't-SNE', 'UMAP', 'Autoencoder'], "default": "None", "onchange": (value) => {
+      if (value === 'None') {
+        return {
+          'Steps': {'className': 'hidden'},
+          'Dimensions': {'className': 'hidden'},
+          'Transform': {'className': 'hidden'}
+        }
+      } else if (value === 'PCA') {
+        return {
+          'Steps': {'className': 'hidden'},
+          'Dimensions': {'className': ''},
+          'Transform': {'className': ''}
+        }
       } else {
-        return {'Steps': {'className': ''}}
+        return {
+          'Steps': {'className': ''},
+          'Dimensions': {'className': ''},
+          'Transform': {'className': ''}
+        }
       }
     }},
-    { "type": "select", "name": "Feature importance", "options": ['None', 'Random Forest'], "default": 'None' },
+    { "type": "select", "name": "Dimensions", "options": [2, 3], "default": 2},
+    { "type": "select", "name": "Transform", "options": ['None', 'Scale', 'Log'], "default": 'None' },
     { "type": "int", "name": "Steps", "default": 200},
+    { "type": "select", "name": "Feature importance", "options": ['None', 'Random Forest'], "default": 'None' },
   ]
 }
 })
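For context, the reworked `onchange` handler above returns a map from input names to `{ 'className': ... }` updates, which the Port UI presumably uses to show or hide the corresponding fields. A minimal sketch of that pattern, using a hypothetical `applyFieldUpdates` helper and `field-<name>` element ids rather than Port's actual internals:

// Illustrative only: apply a map like { 'Steps': { 'className': 'hidden' } }
// to wrapper elements assumed to have ids of the form `field-<name>`.
function applyFieldUpdates (updates) {
  Object.keys(updates).forEach(name => {
    const el = document.getElementById('field-' + name)
    if (el) {
      el.className = updates[name]['className']
    }
  })
}

// Example: choosing the 'None' projection hides Steps, Dimensions and Transform
applyFieldUpdates({
  'Steps': { 'className': 'hidden' },
  'Dimensions': { 'className': 'hidden' },
  'Transform': { 'className': 'hidden' }
})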

package-lock.json (+46 -1)

Generated file; diff not rendered.

package.json (+3 -2)
@@ -1,6 +1,6 @@
 {
   "name": "vis",
-  "version": "0.2.0",
+  "version": "0.3.0",
   "description": "Vis. Visualize high-dimensional data",
   "main": "main.js",
   "scripts": {
@@ -34,6 +34,7 @@
     "plotly.js": "^1.53.0",
     "random-forest": "0.0.7",
     "tsne": "^1.0.1",
-    "umap-js": "^1.3.2"
+    "umap-js": "^1.3.2",
+    "vis-network": "^8.5.4"
   }
 }

src/process.js (+90 -70)
@@ -105,78 +105,82 @@ module.exports = class Process {
     console.log('[Vis] Embedding method:', params.method)
 
     let Y
-    if (params.method === 'PCA') {
-      console.log('[Vis] Fitting PCA')
-      const pca = new PCA(X)
-      Y = pca.predict(X, { 'nComponents': nDims}).to2DArray()
-    } else if (params.method === 'SOM') {
-      const som = new SOM(100, 100, { 'iterations': Math.round(params.steps / 10), 'fields': X[0].length})
-      som.train(X)
-      Y = som.predict(X)
-      if (nDims === 3) {
-        Y = Y.map(y => y.concat([0]))
-      }
-    } else if (params.method === 'UMAP') {
-      console.log('[Vis] Fitting UMAP')
-      const umap = new UMAP({ 'nComponents': nDims, 'nEpochs': params.steps })
-      umap.initializeFit(X)
-      for (let i = 0; i < params.steps; i++) {
-        umap.step()
-      }
-      Y = umap.getEmbedding()
-    } else if (params.method === 'Autoencoder') {
-      console.log('[Vis] Fitting Autoencoder')
-      // const ae = new Autoencoder({'nInputs': cols.length, 'nHidden': nDims, 'nLayers': 3, 'activation': 'tanh'})
-      const ae = new Autoencoder({
-        'encoder': [
-          {'nOut': 20, 'activation': 'tanh'},
-          {'nOut': nDims, 'activation': 'sigmoid'}
-        ],
-        'decoder': [
-          {'nOut': 20, 'activation': 'tanh'},
-          {'nOut': cols.length}
-        ]
-      })
-      ae.fit(X, {
-        'iterations': params.steps * 50,
-        'stepSize': 0.005,
-        'batchSize': 20,
-        'method': 'adam'
-      })
-      Y = ae.encode(X)
-
-      impMatrix = []
-
-      console.log('[Vis] Generate importance matrix with Autoencoder')
-      featuresFiltered.forEach((f, fi) => {
-        const impTemp = []
-        const Xr = []
-        X.forEach(x => Xr.push(x.slice(0)))
-        for (let i = Xr.length - 1; i > 0; i--) {
-          const j = Math.floor(Math.random() * (i + 1))
-          const x = Xr[i][fi]
-          Xr[i][fi] = Xr[j][fi]
-          Xr[j][fi] = x
+
+    // Projection
+    if (params.method !== 'None') {
+      if (params.method === 'PCA') {
+        console.log('[Vis] Fitting PCA')
+        const pca = new PCA(X)
+        Y = pca.predict(X, { 'nComponents': nDims}).to2DArray()
+      } else if (params.method === 'SOM') {
+        const som = new SOM(100, 100, { 'iterations': Math.round(params.steps / 10), 'fields': X[0].length})
+        som.train(X)
+        Y = som.predict(X)
+        if (nDims === 3) {
+          Y = Y.map(y => y.concat([0]))
         }
-        const Xp = ae.predict(Xr)
-        featuresFiltered.forEach((ff, ffi) => {
-          const mse = Xp.reduce((a, x, xi) => Math.pow(x[ffi] - X[xi][ffi], 2) + a, 0) / Xp.length
-          impTemp.push(mse)
+      } else if (params.method === 'UMAP') {
+        console.log('[Vis] Fitting UMAP')
+        const umap = new UMAP({ 'nComponents': nDims, 'nEpochs': params.steps })
+        umap.initializeFit(X)
+        for (let i = 0; i < params.steps; i++) {
+          umap.step()
+        }
+        Y = umap.getEmbedding()
+      } else if (params.method === 'Autoencoder') {
+        console.log('[Vis] Fitting Autoencoder')
+        // const ae = new Autoencoder({'nInputs': cols.length, 'nHidden': nDims, 'nLayers': 3, 'activation': 'tanh'})
+        const ae = new Autoencoder({
+          'encoder': [
+            {'nOut': 20, 'activation': 'tanh'},
+            {'nOut': nDims, 'activation': 'sigmoid'}
+          ],
+          'decoder': [
+            {'nOut': 20, 'activation': 'tanh'},
+            {'nOut': cols.length}
+          ]
         })
-        impMatrix.push(impTemp)
-      })
-      console.log('[Vis] Autoencoder importance matrix:', impMatrix)
-      impMatrix = new Matrix(impMatrix).scaleColumns().to2DArray()
-    } else {
-      console.log('[Vis] Fitting t-SNE')
-      const tsne = new TSNE({ 'epsilon': 10, 'dim': nDims })
-      tsne.initDataRaw(X)
-      const steps = params.steps || 100
-      for (let k = 0; k <= steps; k++) {
-        tsne.step()
+        ae.fit(X, {
+          'iterations': params.steps * 50,
+          'stepSize': 0.005,
+          'batchSize': 20,
+          'method': 'adam'
+        })
+        Y = ae.encode(X)
+
+        impMatrix = []
+
+        console.log('[Vis] Generate importance matrix with Autoencoder')
+        featuresFiltered.forEach((f, fi) => {
+          const impTemp = []
+          const Xr = []
+          X.forEach(x => Xr.push(x.slice(0)))
+          for (let i = Xr.length - 1; i > 0; i--) {
+            const j = Math.floor(Math.random() * (i + 1))
+            const x = Xr[i][fi]
+            Xr[i][fi] = Xr[j][fi]
+            Xr[j][fi] = x
+          }
+          const Xp = ae.predict(Xr)
+          featuresFiltered.forEach((ff, ffi) => {
+            const mse = Xp.reduce((a, x, xi) => Math.pow(x[ffi] - X[xi][ffi], 2) + a, 0) / Xp.length
+            impTemp.push(mse)
+          })
+          impMatrix.push(impTemp)
+        })
+        console.log('[Vis] Autoencoder importance matrix:', impMatrix)
+        impMatrix = new Matrix(impMatrix).scaleColumns().to2DArray()
+      } else {
+        console.log('[Vis] Fitting t-SNE')
+        const tsne = new TSNE({ 'epsilon': 10, 'dim': nDims })
+        tsne.initDataRaw(X)
+        const steps = params.steps || 100
+        for (let k = 0; k <= steps; k++) {
+          tsne.step()
+        }
+        Y = tsne.getSolution()
       }
-      Y = tsne.getSolution()
-    }
+    } // End projection
 
     let target
     let colorscale
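Two things happen in this hunk: the embedding code is wrapped in `if (params.method !== 'None')` so projection can be skipped entirely, and the Autoencoder branch keeps building a permutation-style importance matrix (shuffle one input column, re-run the reconstruction, record the per-feature MSE). A standalone sketch of that permutation idea, with a generic `predict` callback standing in for `ae.predict` (illustrative, not the project's API):

// Permutation-style importance sketch: shuffle column `fi`, re-run a model's
// predict function, and measure how much each output column's error grows.
// `predict` is a stand-in for something like ae.predict; X is an array of rows.
function permutationImportance (X, predict) {
  const nFeatures = X[0].length
  const matrix = []
  for (let fi = 0; fi < nFeatures; fi++) {
    const Xr = X.map(row => row.slice(0))
    // Fisher-Yates shuffle of column fi only
    for (let i = Xr.length - 1; i > 0; i--) {
      const j = Math.floor(Math.random() * (i + 1))
      const tmp = Xr[i][fi]
      Xr[i][fi] = Xr[j][fi]
      Xr[j][fi] = tmp
    }
    const Xp = predict(Xr)
    const row = []
    for (let fo = 0; fo < nFeatures; fo++) {
      const mse = Xp.reduce((a, x, xi) => a + Math.pow(x[fo] - X[xi][fo], 2), 0) / Xp.length
      row.push(mse)
    }
    matrix.push(row)
  }
  return matrix // matrix[fi][fo]: reconstruction error in feature fo when feature fi is shuffled
}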
@@ -210,7 +214,7 @@ module.exports = class Process {
       }
     } else {
       console.log('[Vis] No target variable specified')
-      target = Array(Y.length).fill(0)
+      target = Array(X.length).fill(0)
       colorscale = [
         [0, '#8A8DA1'],
         [1, '#8A8DA1']
@@ -234,6 +238,22 @@ module.exports = class Process {
         impTemp.splice(i, 0, 0)
         return impTemp
       })
+    } else if (params.importance === 'Mutual Information') {
+      // impMatrix = []
+      // for (let i = 0; i < featuresFiltered.length; i++) {
+      //   console.log(`Calculating ${i} of ${featuresFiltered.length}`)
+      //   const impMatrixRow = []
+      //   impMatrix.push(impMatrixRow)
+      //   for (let j = 0; j < featuresFiltered.length; j++) {
+      //     if (i === j) {
+      //       impMatrixRow.push(0)
+      //     } else {
+      //       const x = X.map(row => row[i])
+      //       const y = X.map(row => row[j])
+      //       impMatrixRow.push(Funzo(x).map().joint(Funzo(y).map()).mi(2)) //)mid(x, y))
+      //     }
+      //   }
+      // }
     }
   }

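The new 'Mutual Information' importance branch ships commented out and leans on a `Funzo`-based estimator. For orientation only, a self-contained histogram-based MI estimate between two numeric columns might look like the sketch below (the bin count of 10 and natural-log units are arbitrary assumptions, not what the commented-out code computes):

// Illustrative histogram-based mutual information between two numeric arrays.
// Not the Funzo estimator referenced in process.js; bin count is an assumption.
function mutualInformation (x, y, bins = 10) {
  const n = x.length
  const bin = (v, arr) => {
    const min = Math.min(...arr)
    const max = Math.max(...arr)
    const b = Math.floor((v - min) / (max - min + 1e-12) * bins)
    return Math.min(b, bins - 1)
  }
  const pxy = {}
  const px = {}
  const py = {}
  for (let i = 0; i < n; i++) {
    const bx = bin(x[i], x)
    const by = bin(y[i], y)
    pxy[bx + ',' + by] = (pxy[bx + ',' + by] || 0) + 1 / n
    px[bx] = (px[bx] || 0) + 1 / n
    py[by] = (py[by] || 0) + 1 / n
  }
  let mi = 0
  Object.keys(pxy).forEach(key => {
    const [bx, by] = key.split(',')
    mi += pxy[key] * Math.log(pxy[key] / (px[bx] * py[by]))
  })
  return mi // in nats
}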