WhoIsJack
diff --git a/‎README.md
+29 b/‎README.md
+29
diff --git a/‎data_gen.ipynb
+345 b/‎data_gen.ipynb
+345
diff --git a/‎example_tree_color.png
31.3 KB b/‎example_tree_color.png
31.3 KB
diff --git a/‎example_tree_outline.png
20.1 KB b/‎example_tree_outline.png
20.1 KB
@@ -0,0 +1,29 @@
+# Track Tree - Epic Tree Timecourse Visualization
+
+by Jonas Hartmann, Gilmour group, EMBL Heidelberg
+
+----
+
+**Info:**
+
+This pipeline reads time course data of a tracked object that divides into multiple objects over time (for example a cell as observed with a fluorescence microscope and tracked by image analysis) and plots the track data as a tree, visualizing measurements as an outline and/or through coloring.
+
+See the `About` section in `track_tree.ipynb` for more information!
+
+----
+
+**Example 1:** Tree with outline and color to represent track measurements
+
+![Example Track Tree with color](example_tree_color.png)
+
+
+**Example 2:** Tree with two outlines to represent track measurements
+
+![Example Track Tree with double-outlines](example_tree_outline.png)
+
+
+
+
+
+
+
@@ -0,0 +1,345 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Track Tree - Example Data Generation\n",
+    "\n",
+    "----\n",
+    "\n",
+    "This generates some random example data to illustrate the \"track tree\" visualization. The values for the two measurement tracks are generated by a pink noise generator. The tree structure is also randomly generated (in a very awkward way that allows very little control). Have fun. "
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Prep"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "### Import modules\n",
+    "from __future__ import division\n",
+    "import os, sys\n",
+    "import warnings\n",
+    "import numpy as np\n",
+    "import matplotlib.pyplot as plt"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "### Seed random generator\n",
+    "# Fixed seed so that Restart & Run All reproduces the same example data;\n",
+    "# change SEED to generate a different random tree.\n",
+    "SEED = 5\n",
+    "np.random.seed(SEED)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Tree Generation"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "### Function to generate two branches from a stem\n",
+    "\n",
+    "def make_branches(ID, IDs):\n",
+    "    \"\"\"Attach two new child tracks to the stem `ID`.\n",
+    "\n",
+    "    ID:  key of the stem in the global `tree` dict\n",
+    "    IDs: list of all IDs issued so far (extended in place)\n",
+    "\n",
+    "    Each child gets the next free ID (last entry of `IDs` plus one), is\n",
+    "    registered in `tree` with `ID` as its stem and no branches yet, and\n",
+    "    is appended to `IDs`. Finally the stem's 'branches' entry is set to\n",
+    "    the list of the two child IDs.\n",
+    "    \"\"\"\n",
+    "\n",
+    "    children = []\n",
+    "    for _ in range(2):\n",
+    "\n",
+    "        # The next free ID directly follows the most recently issued one\n",
+    "        child_ID = IDs[-1] + 1\n",
+    "        tree[child_ID] = {'stem': ID, 'branches': '_none_'}\n",
+    "        IDs.append(child_ID)\n",
+    "        children.append(child_ID)\n",
+    "\n",
+    "    # Update stem\n",
+    "    tree[ID]['branches'] = children"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "### Generate the tree\n",
+    "\n",
+    "# Parameters\n",
+    "max_iter = 10    # number of growth rounds\n",
+    "p_branch = 0.55  # probability that an open stem branches in a round\n",
+    "\n",
+    "# Start by generating the root\n",
+    "tree = { 0 : {'stem'     : '_root_',\n",
+    "              'branches' : '_none_'} }\n",
+    "\n",
+    "# Keep track of IDs\n",
+    "IDs = [0]\n",
+    "\n",
+    "# Iterate\n",
+    "for iterstep in range(max_iter):\n",
+    "\n",
+    "    # For each stem that existed at the start of this round...\n",
+    "    # (iterate over a snapshot of the keys: make_branches adds entries to\n",
+    "    #  tree inside the loop, which raises a RuntimeError when looping over\n",
+    "    #  a live Python 3 dict view)\n",
+    "    for ID in list(tree.keys()):\n",
+    "\n",
+    "        # Skip stems that have already branched or become leaves\n",
+    "        if tree[ID]['branches'] != '_none_':\n",
+    "            continue\n",
+    "\n",
+    "        # Randomly decide if it branches. The root always branches, but the\n",
+    "        # random draw is still made first so the random stream is unchanged.\n",
+    "        if np.random.binomial(1, p_branch) or tree[ID]['stem'] == '_root_':\n",
+    "\n",
+    "            # Create the new branches\n",
+    "            make_branches(ID, IDs)\n",
+    "\n",
+    "        # Otherwise, make it a leaf\n",
+    "        else:\n",
+    "            tree[ID]['branches'] = ['_leaf_', '_leaf_']\n",
+    "\n",
+    "# Clean up final leaves (in case max_iter was reached)\n",
+    "for ID in list(tree.keys()):\n",
+    "    if tree[ID]['branches'] == '_none_':\n",
+    "        tree[ID]['branches'] = ['_leaf_', '_leaf_']"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Track Generation: Indices"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "### Generate length & indices of all tracks\n",
+    "\n",
+    "# Parameters\n",
+    "min_len =  10\n",
+    "max_len = 100\n",
+    "\n",
+    "# Function to recursively assign lengths / indices\n",
+    "def generate_indices(ID):\n",
+    "    \"\"\"Assign time indices to track `ID` and, recursively, to its branches.\n",
+    "\n",
+    "    The track length is drawn with np.random.randint(min_len, max_len).\n",
+    "    The root counts from zero; every other track continues one step after\n",
+    "    the last index of its stem. The result is stored in\n",
+    "    tree[ID]['indices'].\n",
+    "    \"\"\"\n",
+    "\n",
+    "    # Randomly generate length\n",
+    "    n_steps = np.random.randint(min_len, max_len)\n",
+    "\n",
+    "    # Root counts from zero; other tracks start right after their stem ends\n",
+    "    stem_ID = tree[ID]['stem']\n",
+    "    if stem_ID == '_root_':\n",
+    "        tree[ID]['indices'] = np.arange(0, n_steps)\n",
+    "    else:\n",
+    "        tree[ID]['indices'] = np.arange(1, n_steps+1) + tree[stem_ID]['indices'][-1]\n",
+    "\n",
+    "    # Leaves end the recursion\n",
+    "    branches = tree[ID]['branches']\n",
+    "    if branches[0] == '_leaf_':\n",
+    "        return\n",
+    "\n",
+    "    # Generate indices for the branches (recursion)\n",
+    "    generate_indices(branches[0])\n",
+    "    generate_indices(branches[1])\n",
+    "\n",
+    "# Run the function\n",
+    "generate_indices(0)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Track Generation: Measurements"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "### Function to generate pink-noise\n",
+    "#     Adapted from Allen B. Downey,\n",
+    "#     github.com/AllenDowney/ThinkDSP/blob/master/code/voss.ipynb\n",
+    "#     I removed the pandas dependency (at the cost of speed and scaling...)\n",
+    "\n",
+    "def voss(nrows, ncols=16):\n",
+    "    \"\"\"Generates pink noise using the Voss-McCartney algorithm.\n",
+    "\n",
+    "    nrows: number of values to generate\n",
+    "    ncols: number of random sources to add\n",
+    "\n",
+    "    returns: NumPy array of shape (nrows,) holding the sum over all sources\n",
+    "    \"\"\"\n",
+    "\n",
+    "    # Set up the array; nan marks cells that have not received a value yet\n",
+    "    array = np.full((nrows, ncols), np.nan)\n",
+    "\n",
+    "    # Populate first row (first time point)\n",
+    "    array[0, :] = np.random.random(ncols)\n",
+    "\n",
+    "    # Populate first column (highest-freq generator)\n",
+    "    array[:, 0] = np.random.random(nrows)\n",
+    "\n",
+    "    # Compute where changes happen and add new values\n",
+    "    n = nrows  # the total number of changes is nrows\n",
+    "    cols = np.random.geometric(0.5, n)\n",
+    "    cols[cols >= ncols] = 0\n",
+    "    rows = np.random.randint(nrows, size=n)\n",
+    "    array[rows, cols] = np.random.random(n)\n",
+    "\n",
+    "    # Forward-fill the skipped nan values. Each pass copies known values one\n",
+    "    # row further down; row 0 is fully populated, so nan_r-1 never wraps.\n",
+    "    while np.any(np.isnan(array)):\n",
+    "        nan_r, nan_c = np.where(np.isnan(array))\n",
+    "        fillable = np.where(~np.isnan(array[nan_r-1, nan_c]))\n",
+    "        array[nan_r[fillable], nan_c[fillable]] = array[nan_r[fillable]-1, nan_c[fillable]]\n",
+    "\n",
+    "    # Return the sums\n",
+    "    return array.sum(axis=1)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "### Generate two measurements (at different order of magnitude)\n",
+    "\n",
+    "# Measure names paired with the factor their noise track is scaled by\n",
+    "measures = [('measure_1', 1), ('measure_2', 10)]\n",
+    "\n",
+    "# For each branch...\n",
+    "for ID in tree.keys():\n",
+    "    track = tree[ID]\n",
+    "    n_points = track['indices'].shape[0]\n",
+    "\n",
+    "    # One separately generated noise track per measure, as long as the\n",
+    "    # track's index array and scaled by the measure's magnitude\n",
+    "    for m_name, m_magnitude in measures:\n",
+    "        track[m_name] = voss(n_points, ncols=16) * m_magnitude"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Saving Generated Data"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "### Save the tree structure\n",
+    "# Files will be \"ID\\tStem\\tBranch1\\tBranch2\\n\"\n",
+    "\n",
+    "with open(\"tree_struct.txt\",\"w\") as outfile:\n",
+    "\n",
+    "    # Write header\n",
+    "    outfile.write(\"trackID\\tstemID\\tbranchID1\\tbranchID2\\n\")\n",
+    "\n",
+    "    # Iterate over branches in random order\n",
+    "    # (...to better approximate real experimental result lists)\n",
+    "    # The keys are copied into a list first: np.random.shuffle works in\n",
+    "    # place and cannot shuffle a Python 3 dict view.\n",
+    "    shuffled_keys = list(tree.keys())\n",
+    "    np.random.shuffle(shuffled_keys)\n",
+    "    for ID in shuffled_keys:\n",
+    "\n",
+    "        # Write the output (one row per track)\n",
+    "        outfile.write(\"%s\\t%s\\t%s\\t%s\\n\" % (ID,\n",
+    "                                            tree[ID]['stem'],\n",
+    "                                            tree[ID]['branches'][0],\n",
+    "                                            tree[ID]['branches'][1]))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "### Save data tracks\n",
+    "\n",
+    "# Column layout and time axis are the same for every measure\n",
+    "all_IDs = sorted(tree.keys())\n",
+    "header = '\\t'.join([\"index\"]+[str(ID) for ID in all_IDs])\n",
+    "final_index = np.max(np.concatenate([tree[ID]['indices'] for ID in all_IDs]))\n",
+    "\n",
+    "# To write index as d, everything else as f\n",
+    "fmt = ['%d'] + [' %.3f'] * len(all_IDs)\n",
+    "\n",
+    "for m_name in ['measure_1','measure_2']:\n",
+    "\n",
+    "    # Create fname\n",
+    "    fname = \"tracks_\"+m_name+\".txt\"\n",
+    "\n",
+    "    # Create a numpy array containing all track data\n",
+    "    # (nan wherever a track has no value at that time point)\n",
+    "    # Note: first column is the time course index\n",
+    "    track_array = np.full((final_index+1, len(all_IDs)+1), np.nan)\n",
+    "    track_array[:, 0] = np.arange(final_index+1)\n",
+    "    for track_idx,ID in enumerate(all_IDs):\n",
+    "        track_array[tree[ID]['indices'], track_idx+1] = tree[ID][m_name]\n",
+    "\n",
+    "    # Write the file\n",
+    "    np.savetxt(fname, track_array, fmt=fmt, delimiter='\\t', header=header, comments='')"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 2",
+   "language": "python",
+   "name": "python2"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 2
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython2",
+   "version": "2.7.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}