Workflow10collectionpath00hdfspath00homepath00summarypath00hadoopjobjar00summarySTDERRSTDOUTHadoopStreamingFindDuplicatescollectionpath0hdfspath0homepath0summarypath0hadoopjobjar0outputfile_summary00STDERR00STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.4net.sf.taverna.t2.activities.externaltool.ExternalToolActivity D0A4CDEB-DD10-4A8E-A49C-8871003083D8 localhost_2 <?xml version="1.0" encoding="UTF-8"?> <sshInvocation><sshNode><host>127.0.0.1</host><port>22</port><directory>/tmp/</directory><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand><copyCommand>/bin/cp %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</copyCommand></sshNode></sshInvocation> 0cd8cdd1-2602-44e6-8817-bfd0bb37050a jobname=find_duplicates #exec 3<inputhomepath #exec 4<inputhdfspath #exec 5<inputcollectionpath #exec 6<outputdir #while read -r homepath<&3; read -r hdfspath<&4; read -r collectionpath<&5; read -r outputfolder<&6 #do # outrefsummary="$outputfolder/benchmark_result_list.csv" # echo "matchbox findduplicates --input-home-path=\"$homepath\" --input-hdfs-path=\"$hdfspath\" --input-collection-path=\"$collectionpath\" --summary=\"$outrefsummary\"" >> $jobname # echo $outrefsummary >> outputfile_summary #done #outrefsummary="%%summarypath%%/benchmark_result_list.csv" #echo "%%homepath%%" #echo $outrefsummary #echo "matchbox findduplicates --input-home-path=\"%%homepath%%\" --input-hdfs-path=\"%%hdfspath%%\" --input-collection-path=\"%%collectionpath%%\" --summary=\"$outrefsummary\"" >> $jobname #echo $outrefsummary >> outputfile_summary #read -r homepath<&3; read -r hdfspath<&4; read -r collectionpath<&5; read -r outputfolder<&6 ##outrefsummary="$outputfolder/benchmark_result_list.csv" ##echo "homepath=$homepath" ##echo "hdfspath=$hdfspath" ##echo "collectionpath=$collectionpath" ##echo "outrefsummary=$outrefsummary" #echo "matchboxspec findduplicates --input-home-path=\"$homepath\" --input-hdfs-path=\"$hdfspath\" --input-collection-path=\"$collectionpath\" --summary=\"$outrefsummary\"" >> $jobname ##echo $outrefsummary >> outputfile_summary outrefsummary="%%summarypath%%/benchmark_result_list.csv" echo "homepath=%%homepath%%" echo "hdfspath=%%hdfspath%%" echo "collectionpath=%%collectionpath%%" echo "outrefsummary=$outrefsummary" #echo "matchboxspec findduplicates --input-home-path=\"$homepath\" --input-hdfs-path=\"$hdfspath\" --input-collection-path=\"$collectionpath\" --summary=\"$outrefsummary\"" >> $jobname echo $outrefsummary >> outputfile_summary cd /home/training/rg-scenario/ #./PythonMatchboxWF.sh $homepath $hdfspath $collectionpath ./PythonMatchboxWF.sh %%homepath%% %%hdfspath%% %%collectionpath%% #hadoop jar hadoopjob.jar -j $jobname -i $jobname -r toolspecs if [ $? -ne 0 ]; then echo -n > outputfile_summary fi 1200 1800 collectionpath hdfspath homepath summarypath summarypath summarypath false false false UTF-8 false false false hdfspath hdfspath false false false UTF-8 false false false hadoopjobjar hadoopjob.jar true false true UTF-8 false false false homepath homepath false false false UTF-8 false false false collectionpath collectionpath false false false UTF-8 false false false outputfile_summary outputfile_summary false false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.4net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.4net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.4net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.4net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.4net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHadoopStreamingFindDuplicatescollectionpathcollectionpathHadoopStreamingFindDuplicateshdfspathhdfspathHadoopStreamingFindDuplicateshomepathhomepathHadoopStreamingFindDuplicatessummarypathsummarypathHadoopStreamingFindDuplicateshadoopjobjarhadoopjobjarsummaryHadoopStreamingFindDuplicatesoutputfile_summarySTDERRHadoopStreamingFindDuplicatesSTDERRSTDOUTHadoopStreamingFindDuplicatesSTDOUT 823a6c9b-d6dd-4d47-8b32-35a653cbda3c 2013-07-26 02:06:13.980 UTC 54c65d76-4a84-45a4-b622-c7cd948d01dd 2013-07-25 18:48:08.174 UTC be363ae9-f05f-45d8-a5d5-f1d5a25e3e57 2013-09-28 23:04:11.59 UTC fbeeb473-1488-4f69-a537-8f5f760d306b 2013-07-02 08:57:49.543 UTC babeeda0-ca71-4f03-aa3e-37087b09a8a1 2013-09-28 22:08:51.331 UTC 438b2314-e479-4b8b-8cde-c0adcc18e1b8 2013-07-25 20:42:45.403 UTC 4eece3e9-4003-42e2-9623-fd98032f8941 2013-07-25 19:42:55.617 UTC b9c069ba-9800-4b1a-8eab-db75f754df8e 2013-07-25 15:46:42.368 UTC 9a3cbb29-10e2-4608-8bc8-057506baac54 2013-07-26 01:22:27.9 UTC 7f3fcfac-6f00-4d90-99a5-de631b20a50a 2013-07-25 18:54:15.227 UTC 2aa82e1f-d8e2-4efc-8740-812b3517c238 2013-07-26 01:58:02.5 UTC 146b80b3-b39e-42a2-81b6-0dd12f75c53a 2013-07-25 14:28:50.829 UTC c96f5181-bea8-45d0-a82a-56c84a3759a1 2013-09-29 00:26:22.337 UTC fae3c555-d677-435b-8981-665e9a87344d 2013-07-29 14:32:34.246 UTC a2321add-0429-492b-848d-5563c7a3dbca 2013-07-29 14:59:04.355 UTC 81cceed2-0a7b-47ac-99a2-b09205b0cf8c 2013-07-25 20:04:15.52 UTC 7b1876fa-940c-4ee8-b28d-4d08f91bfe0a 2013-07-29 14:21:03.743 UTC 76717a15-daa7-4971-b3b0-3f11b9a1378a 2013-07-02 17:21:03.550 UTC bb1ccdad-56a4-4403-b86f-426efd858888 2013-09-28 22:54:34.708 UTC 3d10764c-0db6-4bee-b9b2-d78830ee75e1 2013-07-26 01:39:38.342 UTC 84b3f5c8-7468-4453-a53a-40a27f3eb257 2013-07-02 16:50:32.647 UTC fde78648-e9fa-4581-a680-1917a704b592 2013-07-25 23:38:33.717 UTC 631430fd-a52b-4873-a046-9c1028c34752 2013-07-30 11:47:54.535 UTC ad38ee00-1d99-40ce-a076-90f5fbb23d9c 2013-07-29 14:34:08.84 UTC 4978f124-986b-48f7-a149-a44a3e29af31 2013-07-03 07:43:36.194 UTC 80adfd3a-60da-44a5-b8a5-9eff229a8ef5 2013-07-29 15:18:44.267 UTC e20dc475-4896-4145-81bb-558a699e2d51 2013-07-04 09:35:43.261 UTC ab165169-3d79-436f-b987-a3c0db4907e3 2013-09-29 01:24:21.945 UTC 166ca883-d482-4e7f-aea7-d09cf9f64ee9 2013-09-28 22:51:59.339 UTC 712733d8-88eb-4bd3-9ef8-0ab3e4285c2c 2013-07-02 09:59:54.623 UTC ad19eac9-df30-4c45-a9df-0b9f05e722b5 2013-05-07 14:43:56.511 UTC dcc5f297-5656-4656-804a-aa5c6c5cd78f 2013-06-18 12:01:50.974 UTC a6943d89-90b9-4430-a058-1f4ab49fa9f7 2013-09-28 23:47:50.446 UTC 1fa7e3e2-354d-4ffb-87f8-b15086894b4c 2013-09-28 22:24:41.653 UTC c365f659-1dda-4790-bced-ec22a14a8c37 2013-06-18 14:33:46.771 UTC c2882223-aca4-4999-b91e-a7953d2b0170 2013-07-02 07:36:49.322 UTC fd18d43f-9215-4516-b647-b5e517fbd6b0 2013-09-28 23:01:45.662 UTC 210f8096-6edb-4804-89dc-89de3526caf1 2013-07-25 19:33:30.33 UTC cd49841f-b6c4-4866-9462-8a896bdde5b9 2013-09-28 23:45:26.588 UTC 238308d1-54d8-41a9-b73c-f9cedf5c92e4 2013-07-26 09:34:58.50 UTC dba65df0-2c73-499c-8e02-d2b6f6f3a181 2013-07-25 19:11:55.869 UTC 349b34e8-10f9-42e7-ac84-6a5b2bf386f0 2013-07-30 11:48:14.211 UTC a5839299-1e38-4a22-94f8-7fc54003d602 2013-07-03 06:43:22.348 UTC d0f69eef-d10f-483d-b797-ec206de5f2e5 2013-07-25 20:15:33.57 UTC 84ef82ec-9321-49c9-8df8-34b990cd37f8 2013-07-03 08:22:36.221 UTC e61bb578-a05f-47c3-8f65-c1e5ffd9b9cd 2013-07-03 05:52:49.929 UTC 627a9609-749b-469f-884e-3198a1eb8574 2013-07-03 07:56:15.159 UTC 350e60e3-82cf-437e-b424-ffdcc92e6d51 2013-07-25 20:28:44.285 UTC dedb04f2-1334-423a-9c40-acbf4a7631b8 2013-07-05 14:38:39.604 UTC 1dbf4ca8-61d5-48dd-b675-22bcf049f22b 2013-07-25 15:03:19.147 UTC b3179b3f-f275-49a7-a5fa-c5b88ccbd818 2013-07-03 07:13:14.366 UTC b274e7ee-6ecf-4a66-be0f-0d4ea66228b0 2013-07-03 06:01:56.905 UTC 7331cf52-b780-4606-94af-91237676090a 2013-09-28 23:59:21.93 UTC 4584f232-d82c-4b61-96f6-c0b94d092226 2013-09-29 00:46:02.667 UTC 9a33ed0f-8fb2-4c22-9f64-dc897cc6c441 2013-07-05 14:11:32.856 UTC ff456058-8f51-4d4b-971c-145fac1c02ac 2013-07-05 14:24:39.504 UTC 84a583f8-3000-4b79-9a7a-c81423b5134d 2013-07-02 13:00:11.976 UTC 0e80c109-bcb5-4cb2-8e17-2a225c70dc4f 2013-07-29 14:45:08.764 UTC 1c668765-6405-4aca-a17b-4e6eaeb1f9b1 2013-07-02 16:22:09.32 UTC 208a7d9f-ed19-4dff-94d6-80f0152d3d69 2013-07-25 16:32:50.531 UTC a00cf8dc-e945-4cd9-9332-5c5dac66dd25 2013-07-30 12:04:24.847 UTC 70a5444f-5480-4ee8-a3ca-3f58f969be56 2013-07-17 14:34:39.427 UTC 0a6dc7d2-481d-4469-ad6a-675809437614 2013-08-08 09:24:23.61 UTC c84f6e42-2a5b-4578-838e-c397a5a43173 2013-07-25 20:56:19.378 UTC bdadad1a-8c25-4fbb-a5cc-326c2fc9fcec 2013-06-21 15:30:32.773 UTC 97283512-9f5c-4657-98e4-1ad65dfd1958 2013-05-07 16:01:05.778 UTC 5d49217d-33e2-4a25-a503-e93bc9ba8e60 2013-07-04 08:35:53.351 UTC e1112ebb-2973-4d46-af19-7e67ddf8209a 2013-07-25 14:38:14.209 UTC 1ac2b974-7388-4852-a36d-538f94c5266f 2013-07-02 10:03:46.617 UTC af979f13-ce24-4ee3-ae82-f0c72d5c4cd1 2013-07-03 06:56:23.591 UTC fea00aab-b702-4326-9f46-1c236051563b 2013-07-25 15:35:21.764 UTC e72796f7-a41a-4eab-9ab4-cb166ad26d7a 2013-09-29 01:41:28.950 UTC afbaf39c-b573-4dee-8e70-a019afc7852c 2013-07-02 12:36:11.728 UTC 0b3465bb-738f-4d01-848e-f1ed6defee1e 2013-07-25 20:07:31.36 UTC 5d300d73-b237-450e-8958-1352b8baf96d 2013-09-28 22:49:05.620 UTC 4ddf9253-4c0d-48f7-9442-1f876f0d7477 2013-07-30 12:48:20.170 UTC 85c1f94a-9f65-41e4-8df9-a7f64bd5640e 2013-09-29 01:03:24.363 UTC 3c7aa164-0b40-48c1-aa43-966679652054 2013-09-28 23:46:36.862 UTC fb79d22e-4889-4279-8b9d-5a91354db65f 2013-07-25 19:22:43.767 UTC f32b4855-c180-40bc-9244-a4982d6d750b 2013-07-05 14:41:55.489 UTC 12312700-0d25-4046-b213-259919dcb099 2013-07-02 12:44:45.763 UTC e5deaaec-06fe-4523-81d7-e4f57bc2bd6a 2013-09-28 23:31:12.425 UTC 5eebebf4-347d-48d7-acde-c53078764c6c 2013-07-26 02:51:09.229 UTC f4ba29f9-a125-4af1-8c63-f121bb7bccb4 2013-07-25 21:54:36.793 UTC 91683717-814b-4ede-92c3-b9c98dcebb47 2013-09-29 00:41:49.635 UTC 2bc2b3c4-475f-404f-8d81-37e1523d1e5c 2013-07-02 07:08:04.989 UTC 76dcd12c-6060-41d1-8088-f1c7ce54bcb8 2013-07-25 15:08:20.891 UTC 4ac49f48-e794-4a99-84ef-82361fbf5e6d 2013-07-30 12:12:44.450 UTC 89619c67-b7d4-4cfd-82b9-297636427994 2013-06-18 12:10:22.484 UTC 01523dcc-ab27-455a-aa08-443e12eaedd3 2013-07-03 08:11:18.698 UTC 3be35927-b3f6-457e-8d73-28a08b063268 2013-07-30 12:59:50.807 UTC 5333dac3-b0a5-4c11-ac34-50f861fe102c 2013-07-30 12:23:14.585 UTC e2f5a9f6-4d2a-4c28-bf3d-19c4603ece53 2013-09-28 23:08:27.859 UTC