rasdani
diff --git a/‎demo/demo.ipynb
+578-27 b/‎demo/demo.ipynb
+578-27
diff --git a/‎demo/load_from_wandb.ipynb
+21-256 b/‎demo/load_from_wandb.ipynb
+21-256
diff --git a/‎demo/losses_for_different_sequence_lengths.png
2.34 KB b/‎demo/losses_for_different_sequence_lengths.png
2.34 KB
diff --git a/‎demo/losses_over_models_and_sequnce_lenghts.json
+1 b/‎demo/losses_over_models_and_sequnce_lenghts.json
+1
diff --git a/‎demo/mm_losses_for_different_sequence_lengths.png
73 KB b/‎demo/mm_losses_for_different_sequence_lengths.png
73 KB
diff --git a/‎demo/mpjpe_comparison.json
+1 b/‎demo/mpjpe_comparison.json
+1
diff --git a/‎demo/mpjpe_comparison.png
55.4 KB b/‎demo/mpjpe_comparison.png
55.4 KB
diff --git a/‎mp_transformer/datasets/toy_dataset.py
-6 b/‎mp_transformer/datasets/toy_dataset.py
-6
@@ -2,7 +2,7 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -17,17 +17,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "/data/daniel/git/mp-transformer\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "current_dir = Path.cwd().parts[-1]\n",
     "if current_dir == \"demo\":\n",
@@ -37,98 +29,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.\n",
-      "\u001b[34m\u001b[1mwandb\u001b[0m: Currently logged in as: \u001b[33mdaniel-a\u001b[0m (\u001b[33mtcs-mr\u001b[0m). Use \u001b[1m`wandb login --relogin`\u001b[0m to force relogin\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "wandb version 0.15.10 is available!  To upgrade, please run:\n",
-       " $ pip install wandb --upgrade"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/html": [
-       "Tracking run with wandb version 0.15.4"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/html": [
-       "Run data is saved locally in <code>/data/daniel/git/mp-transformer/wandb/run-20230914_181329-xlh6vk92</code>"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/html": [
-       "Syncing run <strong><a href='https://wandb.ai/tcs-mr/mp-transformer/runs/xlh6vk92' target=\"_blank\">peach-cloud-545</a></strong> to <a href='https://wandb.ai/tcs-mr/mp-transformer' target=\"_blank\">Weights & Biases</a> (<a href='https://wandb.me/run' target=\"_blank\">docs</a>)<br/>"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/html": [
-       " View project at <a href='https://wandb.ai/tcs-mr/mp-transformer' target=\"_blank\">https://wandb.ai/tcs-mr/mp-transformer</a>"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/html": [
-       " View run at <a href='https://wandb.ai/tcs-mr/mp-transformer/runs/xlh6vk92' target=\"_blank\">https://wandb.ai/tcs-mr/mp-transformer/runs/xlh6vk92</a>"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "\u001b[34m\u001b[1mwandb\u001b[0m:   1 of 1 files downloaded.  \n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "run = wandb.init(project=\"mp-transformer\")\n",
     "artifact = run.use_artifact(\"tcs-mr/mp-transformer/model:v300\", type='model')\n",
@@ -137,63 +40,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "./artifacts/model:v300\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "print(artifact_dir)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "Waiting for W&B process to finish... <strong style=\"color:green\">(success).</strong>"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/html": [
-       " View run <strong style=\"color:#cdcd00\">peach-cloud-545</strong> at: <a href='https://wandb.ai/tcs-mr/mp-transformer/runs/xlh6vk92' target=\"_blank\">https://wandb.ai/tcs-mr/mp-transformer/runs/xlh6vk92</a><br/>Synced 6 W&B file(s), 0 media file(s), 0 artifact file(s) and 0 other file(s)"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/html": [
-       "Find logs at: <code>./wandb/run-20230914_181329-xlh6vk92/logs</code>"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    }
-   ],
+   "outputs": [],
    "source": [
     "CONFIG[\"hidden_dim\"] = 40\n",
     "CONFIG[\"latent_dim\"] = 48\n",
@@ -208,17 +66,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Video saved to tmp/comp_vid.mp4\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "item = val_dataset[-1]\n",
     "# item = val_dataset[64]\n",
@@ -229,26 +79,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "\n",
-       "<video width=\"320\" height=\"240\" controls>\n",
-       "  <source src=\"../tmp/comp_vid.mp4\" type=\"video/mp4\">\n",
-       "</video>\n"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "execution_count": 7,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
+   "outputs": [],
    "source": [
     "\n",
     "HTML(\"\"\"\n",
@@ -260,53 +93,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "poses range: [3.5189839309168747e-06, 0.9999984502792358]\n",
-      "mus range: [-1.7213106155395508, 1.4266711473464966]\n",
-      "average mu: -0.047322604805231094\n",
-      "logvars range: [-8.529964447021484, -5.8591179847717285]\n",
-      "median logvar: -7.437717914581299\n",
-      "gt_latents range: [-1.848239541053772, 2.237262487411499]\n",
-      "average gt_latents: 0.24795043468475342\n",
-      "random_latents range: [-1.7329806089401245, 1.4522238969802856]\n",
-      "average random_latents: -0.05122515186667442\n",
-      "Video saved to tmp/fill_vid.mp4\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "item = val_dataset[50]\n",
     "save_side_by_side_video(item, model, from_idx=1, to_idx=4, path=\"tmp/fill_vid.mp4\")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "\n",
-       "<video width=\"320\" height=\"240\" controls>\n",
-       "  <source src=\"../tmp/fill_vid.mp4\" type=\"video/mp4\">\n",
-       "</video>\n"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "execution_count": 9,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
+   "outputs": [],
    "source": [
     "\n",
     "\n",
@@ -319,52 +118,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 10,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "poses range: [3.5189839309168747e-06, 0.9999984502792358]\n",
-      "mus range: [-1.487624168395996, 1.8445534706115723]\n",
-      "average mu: 0.04888433218002319\n",
-      "logvars range: [-8.518484115600586, -5.8925089836120605]\n",
-      "median logvar: -7.370262622833252\n",
-      "gt_latents range: [-1.948813796043396, 2.2732694149017334]\n",
-      "average gt_latents: 0.24087952077388763\n",
-      "random_latents range: [-1.4572112560272217, 1.8878892660140991]\n",
-      "average random_latents: 0.04571348428726196\n",
-      "Video saved to tmp/gen_vid.mp4\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "save_side_by_side_video(item, model, from_idx=0, path=\"tmp/gen_vid.mp4\")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 11,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "\n",
-       "<video width=\"320\" height=\"240\" controls>\n",
-       "  <source src=\"../tmp/gen_vid.mp4\" type=\"video/mp4\">\n",
-       "</video>\n"
-      ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
-      ]
-     },
-     "execution_count": 11,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
+   "outputs": [],
    "source": [
     "\n",
     "\n",
 
@@ -0,0 +1 @@
+{"model": [0.12564842402935028, 0.08892914652824402, 0.0831979289650917, 0.08228670805692673, 0.08564914762973785, 0.0953526571393013, 0.1093117892742157, 0.13006433844566345, 0.15024712681770325, 0.17235219478607178, 0.19508112967014313, 0.21641355752944946, 0.23918820917606354, 0.2606200873851776, 0.27891215682029724, 0.29907020926475525, 0.3144414722919464, 0.33412039279937744, 0.3491173982620239, 0.36269068717956543], "model_single_layer_transformer": [0.13918371498584747, 0.09241282939910889, 0.08359085023403168, 0.08277571201324463, 0.08699499070644379, 0.09778112918138504, 0.11320507526397705, 0.13444054126739502, 0.155262291431427, 0.1772998869419098, 0.20199641585350037, 0.22535252571105957, 0.24829532206058502, 0.26870790123939514, 0.28866785764694214, 0.3094658851623535, 0.3262939751148224, 0.3449738025665283, 0.3587801158428192, 0.3760082721710205], "model_vae": [0.30333247780799866, 0.3200998306274414, 0.33794063329696655, 0.3640925884246826, 0.3904769718647003, 0.4185958206653595, 0.44002050161361694, 0.46187642216682434, 0.4782748222351074, 0.49203750491142273, 0.5079672932624817, 0.519733726978302, 0.5377718806266785, 0.541067361831665, 0.5547375679016113, 0.5591103434562683, 0.5664754509925842, 0.5756450891494751, 0.5771839618682861, 0.5854555368423462], "model_vae_single_layer_transformer": [0.3151271939277649, 0.31420376896858215, 0.3264966309070587, 0.35072073340415955, 0.3787328600883484, 0.40926486253738403, 0.4301280379295349, 0.4536152184009552, 0.4696636199951172, 0.4861705005168915, 0.5050753355026245, 0.5159381031990051, 0.5327478051185608, 0.5394688844680786, 0.5467861890792847, 0.5526284575462341, 0.5601837635040283, 0.5701719522476196, 0.5759778022766113, 0.5826566815376282]}
@@ -0,0 +1 @@
+{"model": [21.98292350769043, 14.340300559997559, 13.43407917022705, 13.281380653381348, 13.68807315826416, 14.619558334350586, 16.02347755432129, 18.08142852783203, 20.648395538330078, 23.337923049926758, 26.42051887512207, 29.621652603149414, 33.34819412231445, 37.707115173339844, 41.067047119140625, 45.00002670288086, 48.33279800415039, 52.669677734375, 55.95282745361328, 58.46841812133789], "model_single_layer_transformer": [21.327821731567383, 16.639490127563477, 14.898528099060059, 14.581068992614746, 14.713642120361328, 15.887846946716309, 17.2874813079834, 19.435869216918945, 22.553186416625977, 25.458030700683594, 29.034015655517578, 32.70307540893555, 36.36600112915039, 40.38428497314453, 45.23580551147461, 48.895408630371094, 52.23849868774414, 55.964927673339844, 59.8380012512207, 62.868343353271484], "model_vae": [39.20149230957031, 52.6158332824707, 55.64812088012695, 59.33192443847656, 63.002384185791016, 68.69374084472656, 72.3512954711914, 76.72998046875, 80.79139709472656, 85.02607727050781, 86.35516357421875, 91.21097564697266, 94.64981842041016, 95.75718688964844, 99.6708755493164, 100.07467651367188, 102.95051574707031, 105.49016571044922, 103.9454345703125, 105.8687973022461], "model_vae_single_layer_transformer": [53.5693359375, 50.3300666809082, 51.67551803588867, 56.25404739379883, 61.61893844604492, 67.36402893066406, 72.91018676757812, 77.97484588623047, 82.93614196777344, 87.12987518310547, 90.387939453125, 94.40081024169922, 97.01863861083984, 99.4786605834961, 102.1368637084961, 102.08549499511719, 104.48709106445312, 106.8950424194336, 107.47530364990234, 109.40076446533203]}
@@ -152,10 +152,4 @@ def _get_segment(self, idx):
             images = torch.stack(images)
             ret["images"] = images
 
-        # Check for sudden jumps in the values of the poses tensor
-        diff = poses[1:] - poses[:-1]
-        max_jump = 0.25
-        if torch.any(torch.abs(diff) > max_jump):
-            print(f"{diff.abs().max()=} at {idx=}")
-
         return ret
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	+{"model": [0.12564842402935028, 0.08892914652824402, 0.0831979289650917, 0.08228670805692673, 0.08564914762973785, 0.0953526571393013, 0.1093117892742157, 0.13006433844566345, 0.15024712681770325, 0.17235219478607178, 0.19508112967014313, 0.21641355752944946, 0.23918820917606354, 0.2606200873851776, 0.27891215682029724, 0.29907020926475525, 0.3144414722919464, 0.33412039279937744, 0.3491173982620239, 0.36269068717956543], "model_single_layer_transformer": [0.13918371498584747, 0.09241282939910889, 0.08359085023403168, 0.08277571201324463, 0.08699499070644379, 0.09778112918138504, 0.11320507526397705, 0.13444054126739502, 0.155262291431427, 0.1772998869419098, 0.20199641585350037, 0.22535252571105957, 0.24829532206058502, 0.26870790123939514, 0.28866785764694214, 0.3094658851623535, 0.3262939751148224, 0.3449738025665283, 0.3587801158428192, 0.3760082721710205], "model_vae": [0.30333247780799866, 0.3200998306274414, 0.33794063329696655, 0.3640925884246826, 0.3904769718647003, 0.4185958206653595, 0.44002050161361694, 0.46187642216682434, 0.4782748222351074, 0.49203750491142273, 0.5079672932624817, 0.519733726978302, 0.5377718806266785, 0.541067361831665, 0.5547375679016113, 0.5591103434562683, 0.5664754509925842, 0.5756450891494751, 0.5771839618682861, 0.5854555368423462], "model_vae_single_layer_transformer": [0.3151271939277649, 0.31420376896858215, 0.3264966309070587, 0.35072073340415955, 0.3787328600883484, 0.40926486253738403, 0.4301280379295349, 0.4536152184009552, 0.4696636199951172, 0.4861705005168915, 0.5050753355026245, 0.5159381031990051, 0.5327478051185608, 0.5394688844680786, 0.5467861890792847, 0.5526284575462341, 0.5601837635040283, 0.5701719522476196, 0.5759778022766113, 0.5826566815376282]}
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	+{"model": [21.98292350769043, 14.340300559997559, 13.43407917022705, 13.281380653381348, 13.68807315826416, 14.619558334350586, 16.02347755432129, 18.08142852783203, 20.648395538330078, 23.337923049926758, 26.42051887512207, 29.621652603149414, 33.34819412231445, 37.707115173339844, 41.067047119140625, 45.00002670288086, 48.33279800415039, 52.669677734375, 55.95282745361328, 58.46841812133789], "model_single_layer_transformer": [21.327821731567383, 16.639490127563477, 14.898528099060059, 14.581068992614746, 14.713642120361328, 15.887846946716309, 17.2874813079834, 19.435869216918945, 22.553186416625977, 25.458030700683594, 29.034015655517578, 32.70307540893555, 36.36600112915039, 40.38428497314453, 45.23580551147461, 48.895408630371094, 52.23849868774414, 55.964927673339844, 59.8380012512207, 62.868343353271484], "model_vae": [39.20149230957031, 52.6158332824707, 55.64812088012695, 59.33192443847656, 63.002384185791016, 68.69374084472656, 72.3512954711914, 76.72998046875, 80.79139709472656, 85.02607727050781, 86.35516357421875, 91.21097564697266, 94.64981842041016, 95.75718688964844, 99.6708755493164, 100.07467651367188, 102.95051574707031, 105.49016571044922, 103.9454345703125, 105.8687973022461], "model_vae_single_layer_transformer": [53.5693359375, 50.3300666809082, 51.67551803588867, 56.25404739379883, 61.61893844604492, 67.36402893066406, 72.91018676757812, 77.97484588623047, 82.93614196777344, 87.12987518310547, 90.387939453125, 94.40081024169922, 97.01863861083984, 99.4786605834961, 102.1368637084961, 102.08549499511719, 104.48709106445312, 106.8950424194336, 107.47530364990234, 109.40076446533203]}