example/gluon/lipnet/utils/run_preprocess.ipynb - mxnet - Git at Google

 {
  "cells": [
   {
    "cell_type": "code",
    "execution_count": 1,
    "metadata": {
     "scrolled": true
    },
    "outputs": [],
    "source": [
     "from download_data import multi_p_run, put_worker, _worker, download_mp4, download_align"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
     "## TEST"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": 2,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
       "[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34]\n",
       "5\n",
       "35 >> [[0, 7], [7, 14], [14, 21], [21, 28], [28, 35]]\n",
       "[{'succ': {0, 1, 2, 3, 4, 5, 6}, 'fail': set()}, {'succ': {7, 8, 9, 10, 11, 12, 13}, 'fail': set()}, {'succ': {14, 15, 16, 17, 18, 19, 20}, 'fail': set()}, {'succ': {21, 22, 23, 24, 25, 26, 27}, 'fail': set()}, {'succ': {32, 33, 34, 28, 29, 30, 31}, 'fail': set()}]\n"
      ]
     }
    ],
    "source": [
     "res = multi_p_run(35, put_worker, _worker, 5)\n",
     "print (res)"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
     "## Download Data"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
     "## download the align data, then remove leftover .tar archives and Thumbs.db\n",
     "import os\n",
     "os.makedirs('./datasets', exist_ok=True)\n",
     "#os.system('rm -rf ./datasets/*')\n",
     "\n",
     "res = multi_p_run(35, put_worker, download_align, 9)\n",
     "print (res)\n",
     "\n",
     "os.system('rm -f datasets/*.tar && rm -f datasets/align/Thumbs.db')"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
     "res = multi_p_run(35, put_worker, download_mp4, 9)\n",
     "print (res)\n",
     "\n",
     "os.system('rm -f datasets/*.zip && rm -f datasets/*/Thumbs.db')"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
     "## download only the 22nd directory\n",
     "#download_data.py(22, 22)"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
     "## Preprocess Data"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": 3,
    "metadata": {},
    "outputs": [],
    "source": [
     "from preprocess_data import preprocess, find_files, Video"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": 4,
    "metadata": {
     "scrolled": true
    },
    "outputs": [
     {
      "data": {
       "text/plain": [
        "0"
       ]
      },
      "execution_count": 4,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
     "import os\n",
     "os.makedirs('./TARGET', exist_ok=True)\n",
     "os.system('rm -rf ./TARGET/*')"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
       "[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34]\n",
       "9\n",
       "35 >> [[0, 4], [4, 8], [8, 12], [12, 16], [16, 20], [20, 24], [24, 28], [28, 32], [32, 35]]\n",
       "Processing: datasets/s1/prwq3s.mpg\n",
       "Processing: datasets/s4/lrix7n.mpg\n",
       "Processing: datasets/s8/pgbyza.mpg\n",
       "Processing: datasets/s12/brik7n.mpg\n",
       "Processing: datasets/s16/sgit7p.mpg\n",
       "Processing: datasets/s20/lrbp8a.mpg\n",
       "Processing: datasets/s24/sbik8a.mpg\n",
       "Processing: datasets/s28/srwf8a.mpg\n",
       "Processing: datasets/s32/pbbm1n.mpg\n",
       "Processing: datasets/s12/sbbaza.mpg\n",
       "Processing: datasets/s28/lbit7n.mpg\n",
       "Processing: datasets/s32/pbwm7p.mpg\n",
       "Processing: datasets/s8/bril2s.mpg\n",
       "Processing: datasets/s20/bway7n.mpg\n",
       "Processing: datasets/s1/pbib8p.mpg\n",
       "Processing: datasets/s16/lwaj7n.mpg\n",
       "Processing: datasets/s24/bwwl6a.mpg\n",
       "Processing: datasets/s4/bbwf7n.mpg\n"
      ]
     }
    ],
    "source": [
     "res = multi_p_run(35, put_worker, preprocess, 9)"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": []
   }
  ],
  "metadata": {
   "kernelspec": {
    "display_name": "Python 3",
    "language": "python",
    "name": "python3"
   },
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
     "version": 3
    },
    "file_extension": ".py",
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
    "version": "3.6.6"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 2
 }
	{
	"cells": [
	{
	"cell_type": "code",
	"execution_count": 1,
	"metadata": {
	"scrolled": true
	},
	"outputs": [],
	"source": [
	"from download_data import multi_p_run, put_worker, _worker, download_mp4, download_align"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"## TEST"
	]
	},
	{
	"cell_type": "code",
	"execution_count": 2,
	"metadata": {},
	"outputs": [
	{
	"name": "stdout",
	"output_type": "stream",
	"text": [
	"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34]\n",
	"5\n",
	"35 >> [[0, 7], [7, 14], [14, 21], [21, 28], [28, 35]]\n",
	"[{'succ': {0, 1, 2, 3, 4, 5, 6}, 'fail': set()}, {'succ': {7, 8, 9, 10, 11, 12, 13}, 'fail': set()}, {'succ': {14, 15, 16, 17, 18, 19, 20}, 'fail': set()}, {'succ': {21, 22, 23, 24, 25, 26, 27}, 'fail': set()}, {'succ': {32, 33, 34, 28, 29, 30, 31}, 'fail': set()}]\n"
	]
	}
	],
	"source": [
	"res = multi_p_run(35, put_worker, _worker, 5)\n",
	"print (res)"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"## Download Data"
	]
	},
	{
	"cell_type": "code",
	"execution_count": null,
	"metadata": {},
	"outputs": [],
	"source": [
	"## download the align data, then remove leftover .tar archives and Thumbs.db\n",
	"import os\n",
	"os.makedirs('./datasets', exist_ok=True)\n",
	"#os.system('rm -rf ./datasets/*')\n",
	"\n",
	"res = multi_p_run(35, put_worker, download_align, 9)\n",
	"print (res)\n",
	"\n",
	"os.system('rm -f datasets/*.tar && rm -f datasets/align/Thumbs.db')"
	]
	},
	{
	"cell_type": "code",
	"execution_count": null,
	"metadata": {},
	"outputs": [],
	"source": [
	"res = multi_p_run(35, put_worker, download_mp4, 9)\n",
	"print (res)\n",
	"\n",
	"os.system('rm -f datasets/*.zip && rm -f datasets/*/Thumbs.db')"
	]
	},
	{
	"cell_type": "code",
	"execution_count": null,
	"metadata": {},
	"outputs": [],
	"source": [
	"## download only the 22nd directory\n",
	"#download_data.py(22, 22)"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"## Preprocess Data"
	]
	},
	{
	"cell_type": "code",
	"execution_count": 3,
	"metadata": {},
	"outputs": [],
	"source": [
	"from preprocess_data import preprocess, find_files, Video"
	]
	},
	{
	"cell_type": "code",
	"execution_count": 4,
	"metadata": {
	"scrolled": true
	},
	"outputs": [
	{
	"data": {
	"text/plain": [
	"0"
	]
	},
	"execution_count": 4,
	"metadata": {},
	"output_type": "execute_result"
	}
	],
	"source": [
	"import os\n",
	"os.makedirs('./TARGET', exist_ok=True)\n",
	"os.system('rm -rf ./TARGET/*')"
	]
	},
	{
	"cell_type": "code",
	"execution_count": null,
	"metadata": {},
	"outputs": [
	{
	"name": "stdout",
	"output_type": "stream",
	"text": [
	"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34]\n",
	"9\n",
	"35 >> [[0, 4], [4, 8], [8, 12], [12, 16], [16, 20], [20, 24], [24, 28], [28, 32], [32, 35]]\n",
	"Processing: datasets/s1/prwq3s.mpg\n",
	"Processing: datasets/s4/lrix7n.mpg\n",
	"Processing: datasets/s8/pgbyza.mpg\n",
	"Processing: datasets/s12/brik7n.mpg\n",
	"Processing: datasets/s16/sgit7p.mpg\n",
	"Processing: datasets/s20/lrbp8a.mpg\n",
	"Processing: datasets/s24/sbik8a.mpg\n",
	"Processing: datasets/s28/srwf8a.mpg\n",
	"Processing: datasets/s32/pbbm1n.mpg\n",
	"Processing: datasets/s12/sbbaza.mpg\n",
	"Processing: datasets/s28/lbit7n.mpg\n",
	"Processing: datasets/s32/pbwm7p.mpg\n",
	"Processing: datasets/s8/bril2s.mpg\n",
	"Processing: datasets/s20/bway7n.mpg\n",
	"Processing: datasets/s1/pbib8p.mpg\n",
	"Processing: datasets/s16/lwaj7n.mpg\n",
	"Processing: datasets/s24/bwwl6a.mpg\n",
	"Processing: datasets/s4/bbwf7n.mpg\n"
	]
	}
	],
	"source": [
	"res = multi_p_run(35, put_worker, preprocess, 9)"
	]
	},
	{
	"cell_type": "code",
	"execution_count": null,
	"metadata": {},
	"outputs": [],
	"source": []
	}
	],
	"metadata": {
	"kernelspec": {
	"display_name": "Python 3",
	"language": "python",
	"name": "python3"
	},
	"language_info": {
	"codemirror_mode": {
	"name": "ipython",
	"version": 3
	},
	"file_extension": ".py",
	"mimetype": "text/x-python",
	"name": "python",
	"nbconvert_exporter": "python",
	"pygments_lexer": "ipython3",
	"version": "3.6.6"
	}
	},
	"nbformat": 4,
	"nbformat_minor": 2
	}