"]}, "execution_count": 6, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd ls -l"]}, {"cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "
\n", " \n", " \n", " | \n", " | \n", " attributes | \n", " code | \n", " alias | \n", " folder | \n", " size | \n", " unit | \n", " name | \n", " isdir | \n", "
\n", " \n", " \n", " \n", " -rw-rw-r-- | \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 1043 | \n", " Jul | \n", " 14 | \n", " 23:40 | \n", " centrer_reduire.pig | \n", " False | \n", "
\n", " \n", " -rw-r--r-- | \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 2 | \n", " Jul | \n", " 15 | \n", " 00:22 | \n", " diff_cluster | \n", " False | \n", "
\n", " \n", " -rw-rw-r-- | \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " Sep | \n", " 27 | \n", " 00:21 | \n", " dummy | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 290 | \n", " Jul | \n", " 14 | \n", " 23:48 | \n", " init_random.pig | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 1654 | \n", " Jul | \n", " 15 | \n", " 00:20 | \n", " iteration_complete.pig | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 235 | \n", " Jul | \n", " 14 | \n", " 23:37 | \n", " nb_obervations.pig | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 1778 | \n", " Jul | \n", " 14 | \n", " 23:57 | \n", " pig_1436911046432.log | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 4570 | \n", " Jul | \n", " 15 | \n", " 00:45 | \n", " pig_1436913856496.log | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 4570 | \n", " Jul | \n", " 15 | \n", " 23:52 | \n", " pig_1436997076356.log | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 574 | \n", " Jul | \n", " 15 | \n", " 23:51 | \n", " post_traitement.pig | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 659 | \n", " Sep | \n", " 27 | \n", " 00:21 | \n", " pystream.pig | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 382 | \n", " Sep | \n", " 27 | \n", " 00:21 | \n", " pystream.py | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 26186 | \n", " Jul | \n", " 15 | \n", " 23:52 | \n", " redirection.err | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " Jul | \n", " 15 | \n", " 23:51 | \n", " redirection.out | \n", " False | \n", "
\n", " \n", " 1 | \n", " xavierdupre | \n", " xavierdupre | \n", " 3400818 | \n", " Jul | \n", " 15 | \n", " 23:48 | \n", " Skin_NonSkin.txt | \n", " False | \n", "
\n", " \n", "
\n", "
"], "text/plain": [" attributes code alias folder size unit \\\n", "-rw-rw-r-- 1 xavierdupre xavierdupre 1043 Jul 14 23:40 \n", "-rw-r--r-- 1 xavierdupre xavierdupre 2 Jul 15 00:22 \n", "-rw-rw-r-- 1 xavierdupre xavierdupre 0 Sep 27 00:21 \n", " 1 xavierdupre xavierdupre 290 Jul 14 23:48 \n", " 1 xavierdupre xavierdupre 1654 Jul 15 00:20 \n", " 1 xavierdupre xavierdupre 235 Jul 14 23:37 \n", " 1 xavierdupre xavierdupre 1778 Jul 14 23:57 \n", " 1 xavierdupre xavierdupre 4570 Jul 15 00:45 \n", " 1 xavierdupre xavierdupre 4570 Jul 15 23:52 \n", " 1 xavierdupre xavierdupre 574 Jul 15 23:51 \n", " 1 xavierdupre xavierdupre 659 Sep 27 00:21 \n", " 1 xavierdupre xavierdupre 382 Sep 27 00:21 \n", " 1 xavierdupre xavierdupre 26186 Jul 15 23:52 \n", " 1 xavierdupre xavierdupre 0 Jul 15 23:51 \n", " 1 xavierdupre xavierdupre 3400818 Jul 15 23:48 \n", "\n", " name isdir \n", "-rw-rw-r-- 1 centrer_reduire.pig False \n", "-rw-r--r-- 1 diff_cluster False \n", "-rw-rw-r-- 1 dummy False \n", " 1 init_random.pig False \n", " 1 iteration_complete.pig False \n", " 1 nb_obervations.pig False \n", " 1 pig_1436911046432.log False \n", " 1 pig_1436913856496.log False \n", " 1 pig_1436997076356.log False \n", " 1 post_traitement.pig False \n", " 1 pystream.pig False \n", " 1 pystream.py False \n", " 1 redirection.err False \n", " 1 redirection.out False \n", " 1 Skin_NonSkin.txt False "]}, "execution_count": 7, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_ls ."]}, {"cell_type": "markdown", "metadata": {}, "source": ["We check the content on the cluster:"]}, {"cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "Found 33 items\n", "drwx------ - xavierdupre xavierdupre 0 2015-09-27 02:00 .Trash\n", "drwx------ - xavierdupre xavierdupre 0 2015-09-27 00:22 .staging\n", "-rw-r--r-- 3 xavierdupre xavierdupre 132727 2014-11-16 02:37 ConfLongDemo_JSI.small.example.txt\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-16 02:38 ConfLongDemo_JSI.small.example2.walking.txt\n", "-rw-r--r-- 3 xavierdupre xavierdupre 3400818 2015-07-14 23:35 Skin_NonSkin.txt\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:22 diff_cluster\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:44 donnees_normalisees\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:43 ecartstypes\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:49 init_random\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:41 moyennes\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:38 nb_obervations\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:05 output_iter1\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:22 output_iter10\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:07 output_iter2\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:09 output_iter3\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:11 output_iter4\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:13 output_iter5\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:15 output_iter6\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:17 output_iter7\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:18 output_iter8\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:20 output_iter9\n", "-rw-r--r-- 3 xavierdupre xavierdupre 461444 2014-11-20 01:33 paris.2014-11-11_22-00-18.331391.txt\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 22:03 python_info.txt\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 22:07 python_info2.txt\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-12-03 22:55 random\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-20 23:43 unitest2\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-09-27 00:23 unittest\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2015-09-27 00:22 unittest2\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-20 01:53 velib_1hjs\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-21 01:17 velib_py\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 21:34 velib_py_results\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 21:51 velib_py_results_3days\n", "drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-21 11:08 velib_several_days\n", "\n", "
"], "text/plain": [""]}, "execution_count": 8, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd hdfs dfs -ls"]}, {"cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "
\n", " \n", " \n", " | \n", " attributes | \n", " code | \n", " alias | \n", " folder | \n", " size | \n", " date | \n", " time | \n", " name | \n", " isdir | \n", "
\n", " \n", " \n", " \n", " 0 | \n", " drwx------ | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-09-27 | \n", " 02:00 | \n", " .Trash | \n", " True | \n", "
\n", " \n", " 1 | \n", " drwx------ | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-09-27 | \n", " 00:22 | \n", " .staging | \n", " True | \n", "
\n", " \n", " 2 | \n", " -rw-r--r-- | \n", " 3 | \n", " xavierdupre | \n", " xavierdupre | \n", " 132727 | \n", " 2014-11-16 | \n", " 02:37 | \n", " ConfLongDemo_JSI.small.example.txt | \n", " False | \n", "
\n", " \n", " 3 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-16 | \n", " 02:38 | \n", " ConfLongDemo_JSI.small.example2.walking.txt | \n", " True | \n", "
\n", " \n", " 4 | \n", " -rw-r--r-- | \n", " 3 | \n", " xavierdupre | \n", " xavierdupre | \n", " 3400818 | \n", " 2015-07-14 | \n", " 23:35 | \n", " Skin_NonSkin.txt | \n", " False | \n", "
\n", " \n", " 5 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:22 | \n", " diff_cluster | \n", " True | \n", "
\n", " \n", " 6 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-14 | \n", " 23:44 | \n", " donnees_normalisees | \n", " True | \n", "
\n", " \n", " 7 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-14 | \n", " 23:43 | \n", " ecartstypes | \n", " True | \n", "
\n", " \n", " 8 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-14 | \n", " 23:49 | \n", " init_random | \n", " True | \n", "
\n", " \n", " 9 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-14 | \n", " 23:41 | \n", " moyennes | \n", " True | \n", "
\n", " \n", " 10 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-14 | \n", " 23:38 | \n", " nb_obervations | \n", " True | \n", "
\n", " \n", " 11 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:05 | \n", " output_iter1 | \n", " True | \n", "
\n", " \n", " 12 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:22 | \n", " output_iter10 | \n", " True | \n", "
\n", " \n", " 13 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:07 | \n", " output_iter2 | \n", " True | \n", "
\n", " \n", " 14 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:09 | \n", " output_iter3 | \n", " True | \n", "
\n", " \n", " 15 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:11 | \n", " output_iter4 | \n", " True | \n", "
\n", " \n", " 16 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:13 | \n", " output_iter5 | \n", " True | \n", "
\n", " \n", " 17 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:15 | \n", " output_iter6 | \n", " True | \n", "
\n", " \n", " 18 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:17 | \n", " output_iter7 | \n", " True | \n", "
\n", " \n", " 19 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:18 | \n", " output_iter8 | \n", " True | \n", "
\n", " \n", " 20 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-07-15 | \n", " 00:20 | \n", " output_iter9 | \n", " True | \n", "
\n", " \n", " 21 | \n", " -rw-r--r-- | \n", " 3 | \n", " xavierdupre | \n", " xavierdupre | \n", " 461444 | \n", " 2014-11-20 | \n", " 01:33 | \n", " paris.2014-11-11_22-00-18.331391.txt | \n", " False | \n", "
\n", " \n", " 22 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-23 | \n", " 22:03 | \n", " python_info.txt | \n", " True | \n", "
\n", " \n", " 23 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-23 | \n", " 22:07 | \n", " python_info2.txt | \n", " True | \n", "
\n", " \n", " 24 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-12-03 | \n", " 22:55 | \n", " random | \n", " True | \n", "
\n", " \n", " 25 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-20 | \n", " 23:43 | \n", " unitest2 | \n", " True | \n", "
\n", " \n", " 26 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-09-27 | \n", " 00:23 | \n", " unittest | \n", " True | \n", "
\n", " \n", " 27 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-09-27 | \n", " 00:22 | \n", " unittest2 | \n", " True | \n", "
\n", " \n", " 28 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-20 | \n", " 01:53 | \n", " velib_1hjs | \n", " True | \n", "
\n", " \n", " 29 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-21 | \n", " 01:17 | \n", " velib_py | \n", " True | \n", "
\n", " \n", " 30 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-23 | \n", " 21:34 | \n", " velib_py_results | \n", " True | \n", "
\n", " \n", " 31 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-23 | \n", " 21:51 | \n", " velib_py_results_3days | \n", " True | \n", "
\n", " \n", " 32 | \n", " drwxr-xr-x | \n", " - | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2014-11-21 | \n", " 11:08 | \n", " velib_several_days | \n", " True | \n", "
\n", " \n", "
\n", "
"], "text/plain": [" attributes code alias folder size date time \\\n", "0 drwx------ - xavierdupre xavierdupre 0 2015-09-27 02:00 \n", "1 drwx------ - xavierdupre xavierdupre 0 2015-09-27 00:22 \n", "2 -rw-r--r-- 3 xavierdupre xavierdupre 132727 2014-11-16 02:37 \n", "3 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-16 02:38 \n", "4 -rw-r--r-- 3 xavierdupre xavierdupre 3400818 2015-07-14 23:35 \n", "5 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:22 \n", "6 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:44 \n", "7 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:43 \n", "8 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:49 \n", "9 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:41 \n", "10 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-14 23:38 \n", "11 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:05 \n", "12 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:22 \n", "13 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:07 \n", "14 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:09 \n", "15 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:11 \n", "16 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:13 \n", "17 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:15 \n", "18 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:17 \n", "19 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:18 \n", "20 drwxr-xr-x - xavierdupre xavierdupre 0 2015-07-15 00:20 \n", "21 -rw-r--r-- 3 xavierdupre xavierdupre 461444 2014-11-20 01:33 \n", "22 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 22:03 \n", "23 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 22:07 \n", "24 drwxr-xr-x - xavierdupre xavierdupre 0 2014-12-03 22:55 \n", "25 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-20 23:43 \n", "26 drwxr-xr-x - xavierdupre xavierdupre 0 2015-09-27 00:23 \n", "27 drwxr-xr-x - xavierdupre xavierdupre 0 2015-09-27 00:22 \n", "28 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-20 01:53 \n", "29 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-21 01:17 \n", "30 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 21:34 \n", "31 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-23 21:51 \n", "32 drwxr-xr-x - xavierdupre xavierdupre 0 2014-11-21 11:08 \n", "\n", " name isdir \n", "0 .Trash True \n", "1 .staging True \n", "2 ConfLongDemo_JSI.small.example.txt False \n", "3 ConfLongDemo_JSI.small.example2.walking.txt True \n", "4 Skin_NonSkin.txt False \n", "5 diff_cluster True \n", "6 donnees_normalisees True \n", "7 ecartstypes True \n", "8 init_random True \n", "9 moyennes True \n", "10 nb_obervations True \n", "11 output_iter1 True \n", "12 output_iter10 True \n", "13 output_iter2 True \n", "14 output_iter3 True \n", "15 output_iter4 True \n", "16 output_iter5 True \n", "17 output_iter6 True \n", "18 output_iter7 True \n", "19 output_iter8 True \n", "20 output_iter9 True \n", "21 paris.2014-11-11_22-00-18.331391.txt False \n", "22 python_info.txt True \n", "23 python_info2.txt True \n", "24 random True \n", "25 unitest2 True \n", "26 unittest True \n", "27 unittest2 True \n", "28 velib_1hjs True \n", "29 velib_py True \n", "30 velib_py_results True \n", "31 velib_py_results_3days True \n", "32 velib_several_days True "]}, "execution_count": 9, "metadata": {}, "output_type": "execute_result"}], "source": ["%dfs_ls ."]}, {"cell_type": "markdown", "metadata": {}, "source": ["We upload the file on the bridge (we should zip it first, it would reduce the uploading time)."]}, {"cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [{"data": {"text/plain": ["'ConfLongDemo_JSI.txt'"]}, "execution_count": 10, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_up ConfLongDemo_JSI.txt ConfLongDemo_JSI.txt"]}, {"cell_type": "markdown", "metadata": {}, "source": ["We check it got there:"]}, {"cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "ConfLongDemo_JSI.txt\n", "\n", "
"], "text/plain": [""]}, "execution_count": 11, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd ls Conf*JSI.txt"]}, {"cell_type": "markdown", "metadata": {}, "source": ["We put it on the cluster:"]}, {"cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "\n", "
"], "text/plain": [""]}, "execution_count": 12, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd hdfs dfs -put ConfLongDemo_JSI.txt ConfLongDemo_JSI.txt"]}, {"cell_type": "markdown", "metadata": {}, "source": ["We check it was put on the cluster:"]}, {"cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "Found 1 items\n", "-rw-r--r-- 3 xavierdupre xavierdupre 21546346 2015-09-27 11:33 ConfLongDemo_JSI.txt\n", "\n", "
"], "text/plain": [""]}, "execution_count": 13, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd hdfs dfs -ls Conf*JSI.txt"]}, {"cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "
\n", " \n", " \n", " | \n", " attributes | \n", " code | \n", " alias | \n", " folder | \n", " size | \n", " date | \n", " time | \n", " name | \n", " isdir | \n", "
\n", " \n", " \n", " \n", " 0 | \n", " -rw-r--r-- | \n", " 3 | \n", " xavierdupre | \n", " xavierdupre | \n", " 21546346 | \n", " 2015-09-27 | \n", " 11:33 | \n", " ConfLongDemo_JSI.txt | \n", " False | \n", "
\n", " \n", "
\n", "
"], "text/plain": [" attributes code alias folder size date time \\\n", "0 -rw-r--r-- 3 xavierdupre xavierdupre 21546346 2015-09-27 11:33 \n", "\n", " name isdir \n", "0 ConfLongDemo_JSI.txt False "]}, "execution_count": 14, "metadata": {}, "output_type": "execute_result"}], "source": ["dfs_ls Conf*JSI.txt"]}, {"cell_type": "markdown", "metadata": {}, "source": ["We create a simple PIG program:"]}, {"cell_type": "code", "execution_count": 14, "metadata": {"collapsed": true}, "outputs": [], "source": ["%%PIG filter_example.pig\n", "\n", "myinput = LOAD 'ConfLongDemo_JSI.txt' USING PigStorage(',') AS\n", " (index:long, sequence, tag, timestamp:long, dateformat, x:double,y:double, z:double, activity) ;\n", "filt = FILTER myinput BY activity == 'walking' ;\n", "STORE filt INTO 'ConfLongDemo_JSI.walking.txt' USING PigStorage() ;"]}, {"cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "\n", "
"], "text/plain": [""]}, "execution_count": 16, "metadata": {}, "output_type": "execute_result"}], "source": ["%pig_submit filter_example.pig -r=filter_example.redirect"]}, {"cell_type": "markdown", "metadata": {}, "source": ["We check the redirected files were created:"]}, {"cell_type": "code", "execution_count": 16, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "filter_example.redirect.err\n", "filter_example.redirect.out\n", "\n", "
"], "text/plain": [""]}, "execution_count": 17, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd ls f*redirect*"]}, {"cell_type": "markdown", "metadata": {}, "source": ["We check the tail on a regular basis to see the job running (some other commands can be used to monitor jobs, ``%remote_cmd mapred --help``)."]}, {"cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "Spillable Memory Manager spill count : 0\n", "Total bags proactively spilled: 0\n", "Total records proactively spilled: 0\n", "\n", "Job DAG:\n", "job_1435583503337_0055\n", "\n", "\n", "2015-09-27 11:38:56,436 [main] WARN org.apache.pig.backend.hadoop.executionengine.mapReduceLayer.MapReduceLauncher - Encountered Warning ACCESSING_NON_EXISTENT_FIELD 164860 time(s).\n", "2015-09-27 11:38:56,436 [main] INFO org.apache.pig.backend.hadoop.executionengine.mapReduceLayer.MapReduceLauncher - Success!\n", "\n", "
"], "text/plain": [""]}, "execution_count": 18, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd tail filter_example.redirect.err"]}, {"cell_type": "code", "execution_count": 18, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "Found 2 items\n", "-rw-r--r-- 3 xavierdupre xavierdupre 0 2015-09-27 11:38 ConfLongDemo_JSI.walking.txt/_SUCCESS\n", "-rw-r--r-- 3 xavierdupre xavierdupre 0 2015-09-27 11:38 ConfLongDemo_JSI.walking.txt/part-m-00000\n", "\n", "
"], "text/plain": [""]}, "execution_count": 19, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_cmd hdfs dfs -ls Conf*JSI.walking.txt"]}, {"cell_type": "code", "execution_count": 19, "metadata": {}, "outputs": [{"data": {"text/html": ["\n", "
\n", " \n", " \n", " | \n", " attributes | \n", " code | \n", " alias | \n", " folder | \n", " size | \n", " date | \n", " time | \n", " name | \n", " isdir | \n", "
\n", " \n", " \n", " \n", " 0 | \n", " -rw-r--r-- | \n", " 3 | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-09-27 | \n", " 11:38 | \n", " ConfLongDemo_JSI.walking.txt/_SUCCESS | \n", " False | \n", "
\n", " \n", " 1 | \n", " -rw-r--r-- | \n", " 3 | \n", " xavierdupre | \n", " xavierdupre | \n", " 0 | \n", " 2015-09-27 | \n", " 11:38 | \n", " ConfLongDemo_JSI.walking.txt/part-m-00000 | \n", " False | \n", "
\n", " \n", "
\n", "
"], "text/plain": [" attributes code alias folder size date time \\\n", "0 -rw-r--r-- 3 xavierdupre xavierdupre 0 2015-09-27 11:38 \n", "1 -rw-r--r-- 3 xavierdupre xavierdupre 0 2015-09-27 11:38 \n", "\n", " name isdir \n", "0 ConfLongDemo_JSI.walking.txt/_SUCCESS False \n", "1 ConfLongDemo_JSI.walking.txt/part-m-00000 False "]}, "execution_count": 20, "metadata": {}, "output_type": "execute_result"}], "source": ["%dfs_ls Conf*JSI.walking.txt"]}, {"cell_type": "markdown", "metadata": {}, "source": ["After that, the stream has to downloaded to the bridge and then to the local machine with ``%remote_down``. We finally close the connection."]}, {"cell_type": "code", "execution_count": 20, "metadata": {}, "outputs": [{"data": {"text/plain": ["True"]}, "execution_count": 21, "metadata": {}, "output_type": "execute_result"}], "source": ["%remote_close"]}, {"cell_type": "markdown", "metadata": {}, "source": ["**END**"]}, {"cell_type": "code", "execution_count": 21, "metadata": {"collapsed": true}, "outputs": [], "source": []}], "metadata": {"kernelspec": {"display_name": "Python 3", "language": "python", "name": "python3"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.1"}}, "nbformat": 4, "nbformat_minor": 2}