cpmpercussion
diff --git a/‎notebooks/MDN-RNN-RoboJam-touch-generation.ipynb
+98-42 b/‎notebooks/MDN-RNN-RoboJam-touch-generation.ipynb
+98-42
diff --git a/‎notebooks/MDN-RNN-kanji-generation-example.ipynb
+186-14 b/‎notebooks/MDN-RNN-kanji-generation-example.ipynb
+186-14
diff --git a/‎notebooks/MDN-RNN-time-distributed-MDN-training.ipynb
+10-8 b/‎notebooks/MDN-RNN-time-distributed-MDN-training.ipynb
+10-8
@@ -54,6 +54,24 @@
     "plt.style.use('seaborn-talk')"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Only for GPU use: expose a single CUDA device (index 1) - edit the index to suit your machine.\n",
+    "import os\n",
+    "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"1\"  # set before TensorFlow is imported below\n",
+    "\n",
+    "import tensorflow as tf\n",
+    "config = tf.ConfigProto()\n",
+    "config.gpu_options.allow_growth = True  # allocate GPU memory on demand rather than all up front\n",
+    "sess = tf.Session(config=config)\n",
+    "from keras import backend as K\n",
+    "K.set_session(sess)  # hand the configured session to the Keras backend"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},
@@ -95,83 +113,108 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "def perf_df_to_array(perf_df):\n",
+    "SCALE_FACTOR = 1\n",
+    "\n",
+    "def perf_df_to_array(perf_df, include_moving=False):\n",
     "    \"\"\"Converts a dataframe of a performance into array a,b,dt format.\"\"\"\n",
     "    perf_df['dt'] = perf_df.time.diff()\n",
     "    perf_df.dt = perf_df.dt.fillna(0.0)\n",
     "    # Clean performance data\n",
     "    # Tiny Performance bounds defined to be in [[0,1],[0,1]], edit to fix this.\n",
-    "    perf_df.set_value(perf_df[perf_df.dt > 5].index, 'dt', 5.0)\n",
-    "    perf_df.set_value(perf_df[perf_df.dt < 0].index, 'dt', 0.0)\n",
-    "    perf_df.set_value(perf_df[perf_df.x > 1].index, 'x', 1.0)\n",
-    "    perf_df.set_value(perf_df[perf_df.x < 0].index, 'x', 0.0)\n",
-    "    perf_df.set_value(perf_df[perf_df.y > 1].index, 'y', 1.0)\n",
-    "    perf_df.set_value(perf_df[perf_df.y < 0].index, 'y', 0.0)\n",
-    "    return np.array(perf_df[['x', 'y', 'dt']])\n",
+    "    perf_df.loc[perf_df.dt > 5, 'dt'] = 5.0  # .loc takes a boolean mask; .at is scalar-only\n",
+    "    perf_df.loc[perf_df.dt < 0, 'dt'] = 0.0  # dt clamped to [0, 5]\n",
+    "    perf_df.loc[perf_df.x > 1, 'x'] = 1.0\n",
+    "    perf_df.loc[perf_df.x < 0, 'x'] = 0.0  # x clamped to [0, 1]\n",
+    "    perf_df.loc[perf_df.y > 1, 'y'] = 1.0\n",
+    "    perf_df.loc[perf_df.y < 0, 'y'] = 0.0  # y clamped to [0, 1]\n",
+    "    if include_moving:\n",
+    "        output = np.array(perf_df[['x', 'y', 'dt', 'moving']])  # keep the 'moving' column as a 4th feature\n",
+    "    else:\n",
+    "        output = np.array(perf_df[['x', 'y', 'dt']])\n",
+    "    return output\n",
     "\n",
     "\n",
     "def perf_array_to_df(perf_array):\n",
-    "    \"\"\"Converts an array of a performance (a,b,dt format) into a dataframe.\"\"\"\n",
+    "    \"\"\"Converts an array of a performance (a,b,dt(,moving) format) into a dataframe.\"\"\"\n",
     "    perf_array = perf_array.T\n",
     "    perf_df = pd.DataFrame({'x': perf_array[0], 'y': perf_array[1], 'dt': perf_array[2]})\n",
+    "    if len(perf_array) == 4:  # a 4th row after the transpose is the 'moving' column\n",
+    "        perf_df['moving'] = perf_array[3]\n",
+    "    else:\n",
+    "        # Rule of thumb: touches with dt > 0.1 are taps (moving=0); the rest are moving touches (moving=1).\n",
+    "        perf_df['moving'] = 1\n",
+    "        perf_df.loc[perf_df.dt > 0.1, 'moving'] = 0  # .loc takes a boolean mask; .at is scalar-only\n",
     "    perf_df['time'] = perf_df.dt.cumsum()\n",
     "    perf_df['z'] = 38.0\n",
-    "    # As a rule of thumb, could classify taps with dt>0.1 as taps, dt<0.1 as moving touches.\n",
-    "    perf_df['moving'] = 1\n",
-    "    perf_df.set_value(perf_df[perf_df.dt > 0.1].index, 'moving', 0)\n",
     "    perf_df = perf_df.set_index(['time'])\n",
     "    return perf_df[['x', 'y', 'z', 'moving']]\n",
     "\n",
     "\n",
-    "def random_touch():\n",
+    "def random_touch(with_moving=False):\n",
     "    \"\"\"Generate a random tiny performance touch.\"\"\"\n",
-    "    return np.array([np.random.rand(), np.random.rand(), 0.01])\n",
+    "    touch = [np.random.rand(), np.random.rand(), 0.01]  # x, y, dt\n",
+    "    if with_moving:\n",
+    "        touch.append(0)  # optional 4th value: the 'moving' flag\n",
+    "    return np.array(touch)\n",
     "\n",
     "\n",
-    "def constrain_touch(touch):\n",
+    "def constrain_touch(touch, with_moving=False):\n",
     "    \"\"\"Constrain touch values from the MDRNN\"\"\"\n",
     "    touch[0] = min(max(touch[0], 0.0), 1.0)  # x in [0,1]\n",
     "    touch[1] = min(max(touch[1], 0.0), 1.0)  # y in [0,1]\n",
     "    touch[2] = max(touch[2], 0.001)  # dt # define minimum time step\n",
+    "    if with_moving:\n",
+    "        touch[3] = np.greater(touch[3], 0.5) * 1.0  # threshold the moving value to 0.0 or 1.0\n",
     "    return touch\n",
     "\n",
     "\n",
-    "def generate_random_tiny_performance(model, n_mixtures, first_touch, time_limit=5.0, steps_limit=1000, temp=1.0):\n",
+    "\n",
+    "def generate_random_tiny_performance(model, n_mixtures, first_touch, time_limit=5.0, steps_limit=1000, temp=1.0, sigma_temp=0.0, predict_moving=False):\n",
     "    \"\"\"Generates a tiny performance up to 5 seconds in length.\"\"\"\n",
+    "    if predict_moving:\n",
+    "        out_dim = 4  # x, y, dt, moving\n",
+    "    else:\n",
+    "        out_dim = 3  # x, y, dt\n",
     "    time = 0\n",
     "    steps = 0\n",
     "    previous_touch = first_touch\n",
-    "    performance = [previous_touch.reshape((3,))]\n",
+    "    performance = [previous_touch.reshape((out_dim,))]\n",
     "    while (steps < steps_limit and time < time_limit):\n",
-    "        params = model.predict(previous_touch.reshape(1,1,3))\n",
-    "        previous_touch = mdn.sample_from_output(params[0], 3, n_mixtures, temp=temp)\n",
-    "        output_touch = previous_touch.reshape(3,)\n",
-    "        output_touch = constrain_touch(output_touch)\n",
-    "        performance.append(output_touch.reshape((3,)))\n",
+    "        params = model.predict(previous_touch.reshape(1,1,out_dim) * SCALE_FACTOR)  # scale the touch up for the model\n",
+    "        previous_touch = mdn.sample_from_output(params[0], out_dim, n_mixtures, temp=temp, sigma_temp=sigma_temp) / SCALE_FACTOR  # scale the sample back down\n",
+    "        output_touch = previous_touch.reshape(out_dim,)\n",
+    "        output_touch = constrain_touch(output_touch, with_moving=predict_moving)\n",
+    "        performance.append(output_touch.reshape((out_dim,)))\n",
     "        steps += 1\n",
     "        time += output_touch[2]\n",
     "    return np.array(performance)\n",
     "\n",
     "\n",
-    "def condition_and_generate(model, perf, n_mixtures, time_limit=5.0, steps_limit=1000, temp=1.0):\n",
+    "def condition_and_generate(model, perf, n_mixtures, time_limit=5.0, steps_limit=1000, temp=1.0, sigma_temp=0.0, predict_moving=False):\n",
     "    \"\"\"Conditions the network on an existing tiny performance, then generates a new one.\"\"\"\n",
+    "    if predict_moving:\n",
+    "        out_dim = 4  # x, y, dt, moving\n",
+    "    else:\n",
+    "        out_dim = 3  # x, y, dt\n",
     "    time = 0\n",
     "    steps = 0\n",
     "    # condition\n",
     "    for touch in perf:\n",
-    "        params = model.predict(touch.reshape(1,1,3))\n",
-    "        previous_touch = mdn.sample_from_output(params[0], 3, n_mixtures, temp=temp)\n",
-    "    output = [previous_touch.reshape((3,))]\n",
+    "        params = model.predict(touch.reshape(1, 1, out_dim) * SCALE_FACTOR)\n",
+    "        previous_touch = mdn.sample_from_output(params[0], out_dim, n_mixtures, temp=temp, sigma_temp=sigma_temp) / SCALE_FACTOR\n",
+    "    output = [previous_touch.reshape((out_dim,))]  # built once, from the last conditioning sample\n",
+    "    # generate until the step or time limit is reached\n",
     "    while (steps < steps_limit and time < time_limit):\n",
-    "        params = model.predict(previous_touch.reshape(1,1,3))\n",
-    "        previous_touch = mdn.sample_from_output(params[0], 3, n_mixtures, temp=temp)\n",
-    "        output_touch = previous_touch.reshape(3,)\n",
-    "        output_touch = constrain_touch(output_touch)\n",
-    "        output.append(output_touch.reshape((3,)))\n",
+    "        params = model.predict(previous_touch.reshape(1, 1, out_dim) * SCALE_FACTOR)\n",
+    "        previous_touch = mdn.sample_from_output(params[0], out_dim, n_mixtures, temp=temp, sigma_temp=sigma_temp) / SCALE_FACTOR\n",
+    "        output_touch = previous_touch.reshape(out_dim,)\n",
+    "        output_touch = constrain_touch(output_touch, with_moving=predict_moving)\n",
+    "        output.append(output_touch.reshape((out_dim,)))\n",
     "        steps += 1\n",
     "        time += output_touch[2]\n",
     "    net_output = np.array(output)\n",
     "    return net_output\n",
     "\n",
+    "\n",
     "def divide_performance_into_swipes(perf_df):\n",
     "    \"\"\"Divides a performance into a sequence of swipe dataframes for plotting.\"\"\"\n",
     "    touch_starts = perf_df[perf_df.moving == 0].index\n",
@@ -184,10 +227,15 @@
     "    performance_swipes.append(remainder)\n",
     "    return performance_swipes\n",
     "\n",
-    "def plot_2D(perf_df, name=\"foo\", saving=False):\n",
+    "\n",
+    "input_colour = 'darkblue'\n",
+    "gen_colour = 'firebrick'\n",
+    "\n",
+    "\n",
+    "def plot_2D(perf_df, name=\"foo\", saving=False, figsize=(8, 8)):\n",
     "    \"\"\"Plot a 2D representation of a performance 2D\"\"\"\n",
     "    swipes = divide_performance_into_swipes(perf_df)\n",
-    "    plt.figure(figsize=(8, 8))\n",
+    "    plt.figure(figsize=figsize)\n",
     "    for swipe in swipes:\n",
     "        p = plt.plot(swipe.x, swipe.y, 'o-')\n",
     "        plt.setp(p, color=gen_colour, linewidth=5.0)\n",
@@ -200,10 +248,11 @@
     "        plt.close()\n",
     "    else:\n",
     "        plt.show()\n",
-    "        \n",
-    "def plot_double_2d(perf1, perf2, name=\"foo\", saving=False):\n",
+    "\n",
+    "\n",
+    "def plot_double_2d(perf1, perf2, name=\"foo\", saving=False, figsize=(8, 8)):\n",
     "    \"\"\"Plot two performances in 2D\"\"\"\n",
-    "    plt.figure(figsize=(8, 8))\n",
+    "    plt.figure(figsize=figsize)\n",
     "    swipes = divide_performance_into_swipes(perf1)\n",
     "    for swipe in swipes:\n",
     "        p = plt.plot(swipe.x, swipe.y, 'o-')\n",
@@ -387,10 +436,17 @@
    "outputs": [],
    "source": [
     "# Train the model\n",
-    "history = model.fit(X, y, batch_size=BATCH_SIZE, epochs=EPOCHS, validation_split=VAL_SPLIT)\n",
+    "\n",
+    "# Define callbacks\n",
+    "filepath=\"robojam_mdrnn-E{epoch:02d}-VL{val_loss:.2f}.h5\"\n",
+    "checkpoint = keras.callbacks.ModelCheckpoint(filepath, save_weights_only=True, verbose=1, save_best_only=True, mode='min')\n",
+    "early_stopping = keras.callbacks.EarlyStopping(monitor='val_loss', mode='min', verbose=1, patience=10)\n",
+    "callbacks = [keras.callbacks.TerminateOnNaN(), checkpoint, early_stopping]\n",
+    "\n",
+    "history = model.fit(X, y, batch_size=BATCH_SIZE, epochs=EPOCHS, callbacks=callbacks, validation_split=VAL_SPLIT)\n",
     "\n",
     "# Save the Model\n",
-    "#model.save('robojam-mdn-rnn.h5')  # creates a HDF5 file of the model\n",
+    "model.save('robojam-mdrnn.h5')  # creates a HDF5 file of the model\n",
     "\n",
     "# Plot the loss\n",
     "%matplotlib inline\n",
@@ -428,7 +484,7 @@
     "decoder.summary()\n",
     "\n",
     "# decoder.set_weights(model.get_weights())\n",
-    "decoder.load_weights(\"robojam-mdn-rnn.h5\")"
+    "decoder.load_weights(\"robojam-mdrnn.h5\")"
    ]
   },
   {
@@ -451,7 +507,7 @@
     "ex =  microjam_corpus[t:t+length]  #sequences[600]\n",
     "\n",
     "decoder.reset_states()\n",
-    "p = condition_and_generate(decoder, ex, NUMBER_MIXTURES, temp=0.2)\n",
+    "p = condition_and_generate(decoder, ex, NUMBER_MIXTURES, temp=1.0, sigma_temp=0.05)\n",
     "plot_double_2d(perf_array_to_df(ex), perf_array_to_df(p))"
    ]
   },
@@ -472,7 +528,7 @@
    "source": [
     "decoder.reset_states()\n",
     "t = random_touch()\n",
-    "p = generate_random_tiny_performance(decoder, NUMBER_MIXTURES, t, temp=0.1)\n",
+    "p = generate_random_tiny_performance(decoder, NUMBER_MIXTURES, t, temp=1.1, sigma_temp=0.05)\n",
     "plot_2D(perf_array_to_df(p))"
    ]
   },
@@ -506,7 +562,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.6.6"
+   "version": "3.6.7"
   }
  },
  "nbformat": 4,
 
@@ -203,10 +203,10 @@
    "outputs": [],
    "source": [
     "# Fit the model\n",
-    "filepath=\"kanji_mdnrnn-{epoch:02d}.hdf5\"\n",
-    "checkpoint = keras.callbacks.ModelCheckpoint(filepath, monitor='val_loss', verbose=1, save_best_only=True, mode='min')\n",
-    "callbacks = [keras.callbacks.TerminateOnNaN(), checkpoint]\n",
-    "\n",
+    "filepath=\"kanji_mdnrnn-{epoch:02d}.h5\"\n",
+    "checkpoint = keras.callbacks.ModelCheckpoint(filepath, save_weights_only=True, verbose=1, save_best_only=True, mode='min')\n",
+    "early_stopping = keras.callbacks.EarlyStopping(monitor='val_loss', mode='min', verbose=1, patience=10)\n",
+    "callbacks = [keras.callbacks.TerminateOnNaN(), checkpoint, early_stopping]\n",
     "history = model.fit(X, y, batch_size=BATCH_SIZE, epochs=EPOCHS, callbacks=callbacks, validation_data=(Xval,yval))\n",
     "model.save('kanji_mdnrnn_model_time_distributed.h5')  # creates a HDF5 file 'my_model.h5'"
    ]
@@ -259,7 +259,8 @@
     "decoder.summary()\n",
     "\n",
     "#decoder.load_weights('kanji_mdnrnn_model_time_distributed.h5') # load weights independently from file\n",
-    "decoder.load_weights('kanji_mdnrnn-99.hdf5')"
+    "#decoder.load_weights('kanji_mdnrnn-99.hdf5')\n",
+    "decoder.load_weights('kanji_mdnrnn_model_time_distributed.h5')"
    ]
   },
   {
@@ -397,14 +398,15 @@
    "outputs": [],
    "source": [
     "# Predict a character and plot the result.\n",
-    "temperature = 2 # seems to work well with rather high temperature (2.5)\n",
+    "temperature = 1.5 # seems to work well with rather high temperature (2.5)\n",
+    "sigma_temp = 0.01\n",
     "\n",
     "p = zero_start_position()\n",
     "sketch = [p.reshape(3,)]\n",
     "\n",
     "for i in range(100):\n",
     "    params = decoder.predict(p.reshape(1,1,3))\n",
-    "    p = mdn.sample_from_output(params[0], OUTPUT_DIMENSION, NUMBER_MIXTURES, temp=temperature)\n",
+    "    p = mdn.sample_from_output(params[0], OUTPUT_DIMENSION, NUMBER_MIXTURES, temp=temperature, sigma_temp=sigma_temp)\n",
     "    sketch.append(p.reshape((3,)))\n",
     "\n",
     "sketch = np.array(sketch)\n",
@@ -432,7 +434,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.6.6"
+   "version": "3.6.7"
   }
  },
  "nbformat": 4,