Data_explorationfileName00 '/path/to/dataset' 2017-01-18 10:02:22.14 UTC Path to the dataset that will be processed. It is important to give such path surrounded by single quotes. 2017-01-18 10:02:14.662 UTC hasHeader00 If the given dataset includes a header row, this condition must be indicated writing --header like in the example. Otherwise, just leave it empty. 2017-01-18 10:03:04.977 UTC --header 2017-01-18 10:03:10.111 UTC lastAction0loadDatasetfileName0hasHeader0net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> b8d947e9-8d10-459a-8b63-3e10b06648f5 python loadDataset.py %%fileName%% %%hasHeader%% 1200 1800 fileName hasHeader loadDataset.py true false false UTF-8 false import pandas, argparse # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' TMP_HEADER_FILE = '/home/brayan/Taverna/tmpHeader' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Main program parser = argparse.ArgumentParser(description = 'This module preloads the dataset in auxiliare files for the execution.') parser.add_argument('filename', help = 'Name of the file to be loaded') parser.add_argument('--header', help = 'If indicated, the file has a header row', action = 'store_true') fileName = parser.parse_args().filename header = parser.parse_args().header # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Data read if header: dataset = pandas.read_csv(fileName) else: dataset = pandas.read_csv(fileName, header = None) dataset.columns = map(str, range(dataset.shape[1])) # New header of ints as str dataset = dataset.apply(pandas.to_numeric, errors = 'coerce') dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False) with open(TMP_HEADER_FILE, 'w') as headerFile: headerFile.write(','.join(dataset.columns)) fileName fileName false false false UTF-8 false false false hasHeader hasHeader false false false UTF-8 false false false false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemainLooplastAction00net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Loop <activity xmlns="http://taverna.sf.net/2008/xml/t2flow"><raven><group>net.sf.taverna.t2.activities</group><artifact>beanshell-activity</artifact><version>1.5</version></raven><class>net.sf.taverna.t2.activities.beanshell.BeanshellActivity</class><inputMap /><outputMap /><configBean encoding="xstream"><net.sf.taverna.t2.activities.beanshell.BeanshellActivityConfigurationBean xmlns=""> <inputs> <net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityInputPortDefinitionBean> <name>lastAction</name> <depth>0</depth> <translatedElementType>java.lang.String</translatedElementType> <allowsLiteralValues>true</allowsLiteralValues> </net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityInputPortDefinitionBean> </inputs> <outputs> <net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityOutputPortDefinitionBean> <name>loop</name> <depth>0</depth> <granularDepth>0</granularDepth> </net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityOutputPortDefinitionBean> </outputs> <classLoaderSharing>workflow</classLoaderSharing> <localDependencies /> <artifactDependencies /> <script>loop = "" + ! lastAction.equals("Quit"); if ("true".matches(loop)) { Thread.sleep(500); }</script> <dependencies /> </net.sf.taverna.t2.activities.beanshell.BeanshellActivityConfigurationBean></configBean><annotations /></activity> true net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedeleteTmpnet.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> f9659a22-2a34-4fbe-a01a-b503291d0d53 python deleteTmp.py 1200 1800 deleteTmp.py true false false UTF-8 false import os # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' TMP_HEADER_FILE = '/home/brayan/Taverna/tmpHeader' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Main program try: os.remove(TMP_DATASET_FILE) os.remove(TMP_HEADER_FILE) except OSError: pass false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeloadDatasetfileNamefileNameloadDatasethasHeaderhasHeaderlastActionmainLooplastAction Data exploration 2017-01-18 09:58:41.114 UTC a08194b1-8776-4586-8dea-43e250e05a67 2017-01-18 14:32:59.738 UTC 750c66ac-6c0d-4550-9c5a-804c0b599657 2017-01-17 14:27:46.422 UTC 8fc5c71c-42fb-4689-bf3b-3822894134f2 2017-01-18 10:50:10.5 UTC c20805f5-3774-46ef-ad6a-021df3173359 2017-01-18 10:50:41.554 UTC 4e4a6eaa-d59b-46ae-8d29-7b13f8ba93c0 2017-01-17 11:00:10.327 UTC 5b8f3dbb-13af-4d5a-ac68-a50731814c1b 2017-01-17 14:39:15.97 UTC 23b648fb-e3f4-4a32-9630-fe0a708280ca 2017-01-18 14:40:47.958 UTC 1a1d166d-4acb-4342-96a6-82e477b8dff3 2017-01-18 10:00:52.240 UTC 33a670e3-1d84-4400-aa69-9cd92dc57a87 2017-01-18 14:44:32.531 UTC 08f8b9d7-a5b9-49db-8c6c-0d426ab0e6e3 2017-01-18 11:25:19.334 UTC d962dccd-7e97-450b-b188-5be2fa60d2ba 2017-01-18 11:10:57.837 UTC 2fcd1019-ea0e-400d-9bb6-2a256f6d45da 2017-01-17 14:33:30.263 UTC ee8f829d-e2e7-4ba3-a549-5abd06714128 2017-01-18 10:32:59.129 UTC dd178ad6-80a0-4a75-bf07-cd93689953c6 2017-01-18 11:04:41.697 UTC fa5e3094-b81b-4737-93dc-6993b3129387 2017-01-18 14:55:00.275 UTC 9ed03c73-0c1c-45ce-8c27-59d1c6c3c92a 2017-01-18 15:06:38.545 UTC f07e2fd6-5627-4396-9513-8abe038b9ac6 2017-01-17 11:42:28.948 UTC 182219e2-0aec-44a4-8ed0-6ce720904e30 2017-01-17 14:49:30.981 UTC d21fd703-84a8-4448-a7f0-7deee5bca364 2017-01-18 10:37:54.364 UTC 603042f0-dd99-43e7-b26f-40e37aeda228 2017-01-18 15:12:51.359 UTC 31b5ba93-76bb-4b3f-a69f-05dc353b58b1 2017-01-17 11:19:05.961 UTC 54679c07-7a47-4627-ab1a-a4719cc1b798 2017-01-17 11:15:36.33 UTC 46a10f58-d0f1-4231-a2ce-dab7b38f90bf 2017-01-18 10:47:18.645 UTC a877d377-0492-4abe-b04c-ed69277c8b71 2017-01-18 11:26:36.726 UTC 212188ff-ee6f-4000-8f78-136480fa1be3 2017-01-18 14:41:39.271 UTC b4c10c24-7212-43a9-ad85-ed94f1771f26 2017-01-18 10:59:36.906 UTC 7650d310-4872-49fe-a1e9-fc44d4514e68 2017-01-17 11:40:05.159 UTC fd4794e6-d400-4b95-a08c-225f482fa3b7 2017-01-17 12:51:05.993 UTC 769d154d-823d-41f1-a924-697c9485b348 2017-01-18 14:40:34.776 UTC 9ebdb8b0-367c-4c42-9469-74ba2750267b 2017-01-17 14:36:03.735 UTC be9d7dcd-e9da-4e4b-9d1e-05b828d0221c 2017-01-17 14:23:40.766 UTC 7a933706-41a5-429f-9a4a-54a26cf8d547 2017-01-18 11:14:57.364 UTC 270ecfae-3364-4166-9736-6f159c6306d8 2017-01-18 14:51:27.161 UTC 3a96a913-379d-4bc5-be8f-6003a5b4ad18 2017-01-17 15:16:31.869 UTC 6333fe59-9a12-4491-b06e-bcddaae7e762 2017-01-18 14:50:08.878 UTC f19ea17a-6c83-405a-9e65-c46738f428cd 2017-01-17 14:41:20.769 UTC 8d785c1c-1207-4137-9be0-36be21063d58 2017-01-18 15:08:45.966 UTC 1ad93dd3-1f29-42c2-be90-2db9af258630 2017-01-18 10:03:12.439 UTC d625b610-4e94-4528-a784-8255e9209939 2017-01-17 15:00:32.298 UTC b0a168ed-116b-4937-8789-a12ffb23fcb1 2017-01-18 11:25:29.539 UTC This workflows allows one to explore and process a given dataset file. These are the list of possible actions: - Visualization (Histogram, Scatter plot) - Normalization (Feature scaling, Standardization) - Column drop - Deal with missing values (Use mean as a replace, Drop samples) - Cast to numeric labels - Save the processed file 2017-01-18 10:00:50.413 UTC c9e10585-125d-4f5e-8039-81b5d21a6303 2017-01-17 11:43:13.302 UTC 5d371e08-4635-4476-a34f-e3dfc7d342a2 2017-01-17 14:55:44.865 UTC 7073f46f-db3c-4a1e-8bb0-27771c48a5e2 2017-01-19 11:32:22.525 UTC 52496cad-e0dd-438a-b851-109b9fa18e9a 2017-01-18 11:03:45.227 UTC fc199911-453d-40a1-8716-820de3369259 2017-01-18 11:25:44.227 UTC c7157685-da0a-42d0-a56e-d65d0d8cfeb1 2017-01-17 14:22:37.937 UTC 37c89f41-15c3-43b3-b3c0-4233edbaeee0 2017-01-18 14:47:01.466 UTC 3066d118-9a67-4834-ba12-cd7115980d4a 2017-01-17 14:51:17.575 UTC abc67d94-5cbf-4a88-b138-38fee66509f2 2017-01-17 11:17:20.340 UTC ed310273-8908-48b2-8d1a-37dcc9a53f0d 2017-01-18 10:50:04.603 UTC Brayan Stiven Zapata Impatá 2017-01-18 09:58:37.467 UTC 60326ead-05e2-4d87-a48c-4fec527a8524 2017-01-18 11:01:24.418 UTC 00e8a9d4-3a90-4af8-9bf5-f4d2e7dd0028 2017-01-17 15:02:42.186 UTC 763e56a8-6a8f-4434-a087-9ec1ce7f9706 2017-01-18 11:25:31.115 UTC 847bac2f-c371-4520-9582-a474125d3a04 2017-01-17 14:26:48.406 UTC fd544e0b-c391-4240-a7c0-9754461d309c 2017-01-18 11:29:09.486 UTC a5a57b61-d206-4d48-9cb8-11695b26175b 2017-01-17 11:01:35.239 UTC f8623af3-42ec-4669-9c22-b520e53c4c33 2017-01-18 10:45:45.658 UTC 7965768d-92db-4a3a-8d61-85c560f67b46 2017-01-18 11:27:40.561 UTC 5f6d717f-b374-4489-b7e8-ac917c40565d 2017-01-18 15:18:40.21 UTC 78fa0bdc-5c5a-457c-9d59-41779648b354 2017-01-18 15:09:38.732 UTC d8ef593e-e91f-4c7f-865c-f3b9870a2843 2017-01-18 10:45:15.970 UTC d13bee50-d0b2-4294-bbbc-79bfe3de39a7 2017-01-18 11:13:25.868 UTC d12de995-37a8-4c03-a3b4-eaede95b607d 2017-01-18 11:27:14.688 UTC 3e1af8b1-eca0-4bf3-b937-afdd2379c0dd 2017-01-17 14:45:52.753 UTC 662bd6e5-72f9-4e46-9fc4-190260389dbd 2017-01-17 13:23:29.67 UTC 778583c2-5f8b-4a0a-a776-70ffa37c4f6a 2017-01-17 14:31:48.376 UTC 4f04f52d-640e-43fe-895f-896195f166de 2017-01-17 12:52:44.280 UTC 16f8903a-9585-404a-b48d-926ad89db725 2017-01-18 11:18:27.716 UTC 24e8a898-59c9-47fc-92bc-ec428bd76fc7 2017-01-17 12:03:05.972 UTC 7ce88652-73fa-422a-bd82-2cef9166ed36 2017-01-18 11:21:54.852 UTC 48fe90af-f4ef-4adb-8524-4423b48efc82 2017-01-18 11:04:06.972 UTC 129c2ac5-d69c-4f8b-9dc4-5c4092b0c2bf 2017-01-17 11:25:48.52 UTC 8bceeea7-2c69-4c79-90a0-0f8d79a23b62 2017-01-18 15:05:09.114 UTC 4160f2b6-361d-49df-a342-9dac63bcfffc 2017-01-17 11:51:16.520 UTC 5927a373-ec5e-469e-9075-823c0db51e13 2017-01-18 14:56:49.823 UTC 79d242b4-cf87-4595-b83f-84a7e12e6b73 2017-01-17 14:43:20.27 UTC b9720331-27f7-40fd-9459-7793f0674a87 2017-01-17 12:59:34.288 UTC d2d43be7-cb8a-40c7-bf80-37306068cda2 2017-01-17 10:58:00.842 UTC 5a3fa5c7-6279-4276-8baf-d79bbd2e95e6 2017-01-18 15:10:05.813 UTC d2525c96-01b8-4e71-9cb6-eee422ec0939 2017-01-18 11:06:26.957 UTC 9fbbc6dc-3866-4293-8710-161df68c64e9 2017-01-17 12:45:07.39 UTC 0aa6afe2-3e8e-44ff-b532-dd3c41f65b60 2017-01-18 14:39:42.40 UTC 2c39ca07-1b57-4209-a830-4f47dae6095c 2017-01-18 11:15:47.792 UTC acb11776-3830-4a02-9e11-df134122fef7 2017-01-18 14:53:29.684 UTC f1214adc-f25e-4df4-a834-cf02dfb49c85 2017-01-18 11:28:17.907 UTC 9f6578b3-8913-4295-8758-5d08cc4cb41e 2017-01-18 11:03:21.451 UTC 797b8e8e-8d9b-4482-8545-b73c1d1466f8 2017-01-18 10:43:19.449 UTC 4e83404a-ef5a-454b-8d10-363158f2e4c1 2017-01-18 15:19:02.877 UTC f1cad094-807b-453a-bdb0-e96093b4a698 2017-01-18 10:38:56.825 UTC 7d79cc09-2d21-4a6e-af3d-cc30751d2322 2017-01-18 11:08:45.404 UTC 08479ded-4dd9-4f04-83bc-ab8ffa2667e9 2017-01-17 11:14:44.208 UTC 467f5c53-36b4-4bff-8111-18d9ce8db694 2017-01-18 14:45:32.17 UTC 14621cec-d958-4196-b185-fe2a2c73982a 2017-01-18 15:01:32.656 UTC baccf983-da11-447a-9712-e15c07f6b9f6 2017-01-17 15:01:53.609 UTC a64c5fc0-ca90-43d2-9ccb-10a1ad2bdf05 2017-01-18 11:02:47.107 UTC ab3c4b0e-1550-4b4f-9085-de2007f848ef 2017-01-17 15:19:22.964 UTC 6d278d6a-5c56-4392-ad24-e69c28f7cc24 2017-01-18 10:56:17.650 UTC c58912bf-fcc4-43fc-9bd4-988efe28bf59 2017-01-17 12:55:48.432 UTC 8a032e6f-f44d-4e91-8ae4-0c3b9d73a848 2017-01-17 13:29:05.819 UTC beaf1545-9f7c-41d7-b0fd-aaed080d6609 2017-01-18 10:43:55.82 UTC edd58035-4796-4ee7-8d8b-3818e42360c2 2017-01-18 14:50:37.377 UTC 56dfbcf0-0743-46bb-a3a7-f1173a859666 2017-01-17 12:47:11.15 UTC 8d6d5dd2-3a69-41a7-ac9e-db5d6fd4e372 2017-01-17 12:46:09.335 UTC 2ebb2c1f-7880-4e7f-8120-bc86c9805c61 2017-01-17 12:40:02.247 UTC c621ad59-3ef1-4106-ac92-1177f3d6161d 2017-01-17 11:17:52.426 UTC 14a1b2f1-2560-49ef-afbe-36c8da8a75a4 2017-01-17 11:48:21.52 UTC 95130d18-98a9-451d-b115-9d68d0840d36 2017-01-17 13:01:56.568 UTC 5d0648e7-caa5-4c17-a5a8-055780f8264b 2017-01-18 14:38:55.452 UTC 6241d0ae-f0ae-43d0-9c28-c69fd02719d5 2017-01-18 15:07:57.388 UTC 3d2a83dc-4972-4330-85dc-72dbdbcb243d 2017-01-18 11:26:34.624 UTC 533aeb3c-1a31-451c-8d66-ebc1c0f8c4c8 2017-01-17 11:07:03.664 UTC 41f1c906-26b4-4e0b-9efc-39157dc5999e 2017-01-17 14:54:44.153 UTC fa5e5e9c-5909-4dc7-9f92-d8157cd94093 2017-01-18 10:47:48.522 UTC 8e7fc9d0-21fb-472a-820b-8f52aa3caaa2 2017-01-17 14:33:54.425 UTC replacereplaceMissinMeanFlags00replaceMissingMeanSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> b4b78e6e-7765-4bfc-ad88-d6d6963a3696 python replaceMissingWithMean.py 1200 1800 replaceMissingWithMean.py true false false UTF-8 false import pandas # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Missing values processing dataset = pandas.read_csv(TMP_DATASET_FILE) dataset.fillna(dataset.mean(), inplace = True) dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False) print 'Dataset processed correctly!' false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Replacement by mean values output information net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageConcatenate_two_stringsoutputTelltitletitlevalueConcatenate_two_stringsstring1replaceMissingMeanSTDERRConcatenate_two_stringsstring2replaceMissingMeanSTDOUT 9d5df8a4-b5c5-443a-a2a4-d069c6a3e8f4 2017-01-18 11:25:10.44 UTC 01433a41-e4a2-489d-aaa3-6184984deda2 2017-01-17 13:22:49.505 UTC 593ffd29-f947-40f9-afca-011d97ca85d1 2017-01-18 10:47:32.361 UTC fd9118ac-5531-4faa-abd5-2567a526c364 2017-01-17 13:22:40.208 UTC da01e85c-67a8-4d24-b717-f48dc6f9d3f6 2017-01-18 14:41:36.138 UTC f43744da-e1f5-498c-a35e-aafae63e95b6 2017-01-18 10:47:39.329 UTC replace 2017-01-17 13:22:37.159 UTC 32aa66f0-4b84-496a-bb8b-2ccc8f0a29ee 2017-01-18 11:25:13.749 UTC ba481226-9f8a-4c04-b93c-f720204d3c65 2017-01-18 11:03:12.53 UTC mainLooplastAction0actionOptionsvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Plot histogram,Plot scatter,Normalize data by feature scaling,Normalize data by standardization,Drop feature,Replace missing values with feature mean,Drop samples with missing values,Convert to numeric labels,Save to new file,Quit net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokecheckActionAction0plotHistogramFlags11plotScatterFlags11normFeatureFlags11normStandardFlags11dropFeatureFlags11replaceMissingMeanFlags11replaceMissingDropFlags11labelsToNumFlags11saveFlags11 This service checks if the condition is "true" and if so outputs a value in the pass_flags list and leaves the fail_flags empty. If the condition is not true then the service outputs a value in the fail_flags list and leaves the pass_flags empty. 2011-11-15 09:59:22.100 UTC net.sf.taverna.t2.activitiesbeanshell-activity1.5net.sf.taverna.t2.activities.beanshell.BeanshellActivity Action 0 text/plain java.lang.String true plotHistogramFlags 1 1 plotScatterFlags 1 1 normFeatureFlags 1 1 normStandardFlags 1 1 dropFeatureFlags 1 1 replaceMissingMeanFlags 1 1 replaceMissingDropFlags 1 1 labelsToNumFlags 1 1 saveFlags 1 1 workflow net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Loop net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedropFeaturedropFeatureFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedropMissingValuesreplaceMissingDropFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelabelsNumlabelsToNumFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Select an action to perform over the dataset: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokenormFeatureScalingnormFeatureFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokenormStandardnormStandardFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotHistogramplotHistogramFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotScatterplotScatterFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesplitActionsToListregex0string0split11net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string 0 'text/plain' java.lang.String true regex 0 'text/plain' java.lang.String true split 1 l('text/plain') 1 workflow org.embl.ebi.escience.scuflworkers.java.SplitByRegex net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokeregexvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity , net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokereplaceMissingMeanreplaceMissinMeanFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesaveFilesaveFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesplitHeaderToListstring0regex0split11net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string 0 'text/plain' java.lang.String true regex 0 'text/plain' java.lang.String true split 1 l('text/plain') 1 workflow org.embl.ebi.escience.scuflworkers.java.SplitByRegex net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokereadHeaderFilefileurl0filecontents00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity fileurl 0 'text/plain' java.lang.String true encoding 0 'text/plain' java.lang.String true filecontents 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.io.TextFileReader net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeheaderSeparatorvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity , net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeheaderFilevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity /home/brayan/Taverna/tmpHeader net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectActionvalueList1message0title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity valueList 1 l('text/plain') java.lang.String true message 0 'text/plain' java.lang.String true title 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.SelectWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedescribeDatasetSTDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 554a5d5d-ca88-496b-add2-6e905c8b79ba python describeDataset.py 1200 1800 describeDataset.py true false false UTF-8 false import pandas TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' dataset = pandas.read_csv(TMP_DATASET_FILE) print dataset.describe() false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokecomposeMessagestring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat UserNameHere 2017-01-18 11:18:16.222 UTC net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Data exloration and processing net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokecheckActionActionselectActionanswerdropFeaturedropFeatureFlagscheckActiondropFeatureFlagsdropFeatureheaderListsplitHeaderToListsplitdropMissingValuesreplaceMissingDropFlagscheckActionreplaceMissingDropFlagslabelsNumlabelsToNumFlagscheckActionlabelsToNumFlagslabelsNumheaderListsplitHeaderToListsplitnormFeatureScalingnormFeatureFlagscheckActionnormFeatureFlagsnormStandardnormStandardFlagscheckActionnormStandardFlagsplotHistogramplotHistogramFlagscheckActionplotHistogramFlagsplotHistogramheaderListsplitHeaderToListsplitplotScatterplotScatterFlagscheckActionplotScatterFlagsplotScatterheaderListsplitHeaderToListsplitsplitActionsToListregexregexvaluesplitActionsToListstringactionOptionsvaluereplaceMissingMeanreplaceMissinMeanFlagscheckActionreplaceMissingMeanFlagssaveFilesaveFlagscheckActionsaveFlagssplitHeaderToListstringreadHeaderFilefilecontentssplitHeaderToListregexheaderSeparatorvaluereadHeaderFilefileurlheaderFilevalueselectActionvalueListsplitActionsToListsplitselectActionmessagecomposeMessageoutputselectActiontitletitlevaluecomposeMessagestring1describeDatasetSTDOUTcomposeMessagestring2messagevaluelastActionselectActionanswer 43e71d15-64ee-455f-a942-ec7d376eb5f3 2017-01-17 15:12:11.201 UTC 7adb8f4b-59bc-487c-bd1c-de0b783a74be 2017-01-18 11:17:55.92 UTC dcd71717-0429-4337-a923-2da00b80aa82 2017-01-18 11:27:13.853 UTC 0be853bd-34c2-4a00-b0bd-1dd7232eccc1 2017-01-18 14:40:32.333 UTC 7fe3f88f-e8fb-4c9d-9923-46b86b7f5902 2017-01-18 11:21:48.141 UTC ccf2a5af-d0bc-4c21-b98c-7fae41cb93ef 2017-01-18 11:28:17.88 UTC c1ca3818-eb32-4a81-883b-9a66e5896c45 2017-01-18 11:13:23.148 UTC 8936335e-49b4-415a-8bf3-057116984b2e 2017-01-18 11:08:37.894 UTC af026ae8-7dbf-47a0-ab97-86e86e54c5cb 2017-01-18 15:07:56.230 UTC This workflow asks for an action and the calls the nested workflow that performs the desired operation over the dataset. 2017-01-18 10:50:35.629 UTC mainLoop 2017-01-17 14:57:17.562 UTC 13f4303c-d79a-4844-97a6-d082848300d4 2017-01-18 11:27:37.692 UTC 3208a966-12cb-4ba0-b182-8f93a176b157 2017-01-18 14:56:43.676 UTC Brayan Stiven Zapata Impatá 2017-01-18 10:50:03.112 UTC 87319bbc-be04-41bf-a0ca-83d10ebe0410 2017-01-18 10:35:32.666 UTC 98dd5e32-c8bc-4093-a9db-41c8d7ac27ad 2017-01-17 15:13:24.833 UTC d1b1200f-be93-4c0e-ab3c-0e1d5e4fd653 2017-01-18 15:10:04.526 UTC 548fd807-1f6a-422d-add3-b94f2b0e39b5 2017-01-18 14:53:26.449 UTC f79182e9-f75e-43f0-a2c6-c5a97726ab4e 2017-01-18 15:09:37.618 UTC 94b1b2e4-45a7-4e3a-9559-bad4b3f5a215 2017-01-18 14:41:36.875 UTC b20f18f7-590f-4448-933c-c65633987cc7 2017-01-18 11:02:45.52 UTC 963a5560-4653-4853-8fda-6cdd447a3885 2017-01-18 14:38:49.962 UTC d3f74f75-8031-4d5b-8e05-2c4175797b2b 2017-01-18 11:04:32.786 UTC f09efb08-88d4-4838-a225-62d180e2a77a 2017-01-18 11:03:40.18 UTC 2f23c46b-44bc-4df4-8846-bbedacc01115 2017-01-18 11:10:55.227 UTC ecbc62e7-d69f-4f78-9af3-7c340ddbb1d2 2017-01-18 10:45:12.353 UTC 218d78c2-a9e9-42df-83c5-be291e21de17 2017-01-18 10:42:03.241 UTC b4256eee-ea8f-4a36-8cfa-1f871d457fa3 2017-01-18 10:37:50.978 UTC 52ca9dee-1bf1-42c5-b070-532835fc3b1d 2017-01-18 10:38:54.521 UTC 7261f66f-1e90-4c4c-9407-88ca2c210142 2017-01-18 11:01:22.170 UTC 5cd04d78-2109-4240-a4f9-7dda49694c0a 2017-01-18 14:51:24.92 UTC f1371e2f-b440-47f8-bba8-97d38df76be4 2017-01-18 11:25:28.580 UTC f9c65e42-6687-467a-b588-ef045ef0e878 2017-01-18 11:24:06.429 UTC 64eba6e5-96ee-4a2c-9a02-ae730efe056b 2017-01-18 11:25:42.7 UTC 76283317-94ad-4b76-b9bc-9b82bb511fee 2017-01-17 15:15:57.234 UTC 9336f07e-3118-48b1-99cd-ba0440b200d0 2017-01-18 14:50:34.921 UTC d454118b-cfcf-47cf-9f7f-04557331c670 2017-01-18 11:24:42.468 UTC 7eb375be-7450-4055-be8c-ef5bcc0bdf95 2017-01-18 11:29:08.664 UTC 136ecad1-c9d8-4f57-8144-2f95e05acbb5 2017-01-18 14:39:39.968 UTC 3447dd75-0f1e-4d69-ab46-416821a75cdc 2017-01-18 14:45:29.579 UTC db275682-9457-48ef-995d-a2ec6c2ed275 2017-01-17 15:10:42.379 UTC bc615334-b710-41e8-98ba-361ec5d9286c 2017-01-18 14:44:29.562 UTC 9b47e994-7e93-4cce-91aa-4ba33af1159c 2017-01-18 14:50:06.432 UTC 5e27aac4-4bff-4b1f-afa0-5b0e1143ce04 2017-01-17 14:57:47.765 UTC 14f27c8d-656e-467f-bc1f-ed93aed7827c 2017-01-18 10:59:26.235 UTC ddb2ba2a-5341-4130-bb8d-5f76f6e67fb7 2017-01-17 15:01:42.320 UTC 75609912-e68b-4a72-b9a8-2ed8515d6d60 2017-01-18 15:00:35.581 UTC 30924e00-a896-460d-8dc2-a795b8107dbb 2017-01-18 10:32:53.150 UTC 02cd9059-62da-4f34-be25-794fb4a59dff 2017-01-18 15:08:45.34 UTC 56014400-b738-4414-ae4f-da6bacb5e0e5 2017-01-17 15:00:00.409 UTC 4217e0e5-4a46-4b42-a4d1-8cd826d5dc6e 2017-01-18 14:46:59.56 UTC 7f341262-2cd7-4dd6-a6d7-658f360632d4 2017-01-18 10:50:36.628 UTC 227278ab-b092-42bc-a752-22cbb1d7a043 2017-01-18 11:04:04.747 UTC 49ef9fe4-d73f-4dcc-ae66-ace94fccd866 2017-01-18 10:47:09.994 UTC 51d0067a-4c80-48dc-a3cf-7e01fda9db22 2017-01-18 11:18:17.668 UTC 676c7ec5-558e-4f0d-8774-410c6bc3ad5c 2017-01-18 15:12:50.86 UTC 201a7bb0-b88e-4ee3-8648-bd9f24e59a96 2017-01-18 10:43:49.603 UTC 4b0df6bd-b684-4541-8b0b-208ca7a024e3 2017-01-18 10:41:38.945 UTC 9ae75c76-bc3b-43a2-baed-f57c2c0fec1c 2017-01-18 11:03:19.196 UTC f403048c-1a1e-486a-8a46-de08a2bcdbf0 2017-01-18 14:54:57.846 UTC 3c30038f-69db-43ff-a474-ee695da17b7d 2017-01-18 10:41:26.145 UTC 186b20d5-d02d-4c9d-8e73-179a30199b2c 2017-01-18 11:06:12.267 UTC 8f1e8ce6-8c80-4a1c-9714-ddc429e011b8 2017-01-18 11:26:32.206 UTC 42b45e89-eed6-417d-8a2c-635232986034 2017-01-18 11:25:17.444 UTC 593a6b18-81c0-4616-a5f2-3adf26160840 2017-01-18 15:05:05.965 UTC 0f6170c3-7831-44c1-a90c-1afa81502636 2017-01-18 10:45:41.385 UTC 111791e3-22ad-490b-95ae-e10be5d0fb35 2017-01-18 15:06:37.591 UTC f63a5fb2-f6cf-4123-a23f-7d0d7f970211 2017-01-18 10:43:15.468 UTC 10bf596d-7b3a-4dcf-ac63-3436c553cd74 2017-01-18 10:49:37.545 UTC dbad82d1-eaf0-4289-bafe-528e670c9393 2017-01-18 10:49:45.914 UTC fcf46500-f944-48c0-88e3-5325998e24d6 2017-01-18 10:47:44.593 UTC 537a4e04-ea88-4a64-bee1-3753dbdcb2ee 2017-01-18 10:50:07.434 UTC dropFeaturedropFeatureFlags00headerList11dropFeaturecolumn0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 9916a27a-c60a-424a-9568-7cc121db4807 python dropFeature.py %%column%% 1200 1800 column dropFeature.py true false false UTF-8 false import pandas, argparse # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' TMP_HEADER_FILE = '/home/brayan/Taverna/tmpHeader' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Column drop parser = argparse.ArgumentParser(description = 'This programdrops a column of the processed dataset.') parser.add_argument('column', help = 'Name of the column to be dropped') droppedColumn = parser.parse_args().column dataset = pandas.read_csv(TMP_DATASET_FILE) dataset = dataset.drop([droppedColumn], axis = 1) dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False) with open(TMP_HEADER_FILE, 'w') as headerFile: headerFile.write(','.join(dataset.columns)) print 'Dataset processed correctly!' column column false false false UTF-8 false false false false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Select the column that will be dropped: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectDropColumnmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity valueList 1 l('text/plain') java.lang.String true message 0 'text/plain' java.lang.String true title 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.SelectWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Drop column net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedropFeaturecolumnselectDropColumnanswerTellmessageConcatenate_two_stringsoutputTelltitletitleGeneralvalueselectDropColumnmessagemessagevalueselectDropColumnvalueListheaderListselectDropColumntitletitleGeneralvalueConcatenate_two_stringsstring1dropFeatureSTDERRConcatenate_two_stringsstring2dropFeatureSTDOUT 1f1f5256-e419-4572-80e4-47092fbb9e1b 2017-01-18 10:36:23.577 UTC 650dee82-df91-4323-b39f-8e98e92696b4 2017-01-18 10:37:02.163 UTC ddc7c835-4677-42f7-be0d-18c8703d7d92 2017-01-17 13:00:35.848 UTC c8c07c2f-935d-4c38-b10d-76a3b0a435f3 2017-01-18 11:28:13.197 UTC 5af6d39e-6791-4a13-ad35-b6ff5c61090a 2017-01-18 14:53:26.371 UTC dropFeature 2017-01-17 12:59:00.212 UTC cd49b1d4-f20d-488b-83fc-12a5fa740fd7 2017-01-18 11:02:29.650 UTC f6b365b0-8afd-4fe6-bc77-7509c9f16622 2017-01-18 10:34:49.898 UTC f0088e7a-e01b-4076-bfd0-063f4f60dc4d 2017-01-17 15:08:56.996 UTC b8527a97-9de3-406e-99b3-8b20c5d0e4a5 2017-01-18 10:41:14.649 UTC d1c885b1-9368-453a-93d9-8773fdaf1321 2017-01-18 15:10:02.797 UTC e08e0621-7f1d-4e08-9dd7-f96e0f3fc69f 2017-01-17 15:08:26.132 UTC a3d33cd4-bf20-47f8-985c-4421ba91c844 2017-01-17 13:01:42.0 UTC fb33b2cb-8324-4fc7-9f29-7f13837f2c43 2017-01-18 10:35:09.897 UTC 58527f47-cf10-4ad9-8061-97ca917bbe90 2017-01-17 12:59:21.512 UTC 9b5b1d3f-365b-4516-84a0-f3fbe40434b4 2017-01-17 12:59:10.757 UTC plotScatterplotScatterFlags00headerList11plotScattercolumnX0columnY0columnObj0STDERR00STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 178d1624-9188-45eb-80b5-71852fcce2ee python plotScatter.py %%columnX%% %%columnY%% %%columnObj%% 1200 1800 columnObj columnX columnY plotScatter.py true false false UTF-8 false import pandas, argparse import matplotlib.pyplot as pyplot # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Plotting parser = argparse.ArgumentParser(description = 'This program plots a scatter given the colums for the X and Y axis. Dots are coloured by the value of the third column.') parser.add_argument('columnX', help = 'Name of the column to be plotted as the X axis') parser.add_argument('columnY', help = 'Name of the column to be plotted as the Y axis') parser.add_argument('columnObj', help = 'Name of the column to be plotted') selectedXColumn = parser.parse_args().columnX selectedYColumn = parser.parse_args().columnY objColumn = parser.parse_args().columnObj dataset = pandas.read_csv(TMP_DATASET_FILE) try: dataset.plot(kind = 'scatter', x = selectedXColumn, y = selectedYColumn, c = objColumn, s = 50) pyplot.xlabel(selectedXColumn) pyplot.ylabel(selectedYColumn) pyplot.title(selectedXColumn + ' - ' + selectedYColumn) pyplot.grid(True) pyplot.show() except Exception as e: print 'Unexpected error:', str(e) print 'Dataset processed correctly!' columnObj columnObj false false false UTF-8 false false false columnX columnX false false false UTF-8 false false false columnY columnY false false false UTF-8 false false false false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemessageForXvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Select the column for the X axis: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemessageForYvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Select the column for the Y axis: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemessageForObjvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Select the objective column: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectXmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity valueList 1 l('text/plain') java.lang.String true message 0 'text/plain' java.lang.String true title 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.SelectWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectYmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity valueList 1 l('text/plain') java.lang.String true message 0 'text/plain' java.lang.String true title 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.SelectWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectObjmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity valueList 1 l('text/plain') java.lang.String true message 0 'text/plain' java.lang.String true title 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.SelectWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Scatter plot output information net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Scatter plot net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotScattercolumnXselectXanswerplotScattercolumnYselectYanswerplotScattercolumnObjselectObjanswerselectXmessagemessageForXvalueselectXvalueListheaderListselectXtitletitleGeneralvalueselectYmessagemessageForYvalueselectYvalueListheaderListselectYtitletitleGeneralvalueselectObjmessagemessageForObjvalueselectObjvalueListheaderListselectObjtitletitleGeneralvalueTellmessageConcatenate_two_stringsoutputTelltitletitlevalueConcatenate_two_stringsstring1plotScatterSTDERRConcatenate_two_stringsstring2plotScatterSTDOUT ba8a6ed4-8916-44f6-8dda-87c7a423ac38 2017-01-17 11:39:52.554 UTC 96d7b727-20d3-4035-a2e1-88a40c3d101a 2017-01-17 11:07:00.664 UTC 885325a8-026d-4d46-ae5e-52fb6a86f93a 2017-01-18 14:50:04.363 UTC 0ca77df8-57b6-413c-8313-e7583b19149c 2017-01-18 15:12:46.847 UTC 265dc3a1-997f-4593-9fbd-bbf2fc0b0d4d 2017-01-18 15:09:36.189 UTC plotScatter 2017-01-17 12:01:21.265 UTC 9a1156de-defa-4313-a290-0cd61f0ee3b6 2017-01-17 11:51:12.22 UTC 93ff1fe6-1dcc-4bcd-9253-0d326fbcc850 2017-01-17 11:39:43.154 UTC 739bb821-b0a0-4e41-943a-855ae90e741c 2017-01-18 11:27:32.84 UTC 631844da-a909-4fdc-a184-7a54d68e690b 2017-01-17 10:57:13.506 UTC a37d084f-4839-407f-8c62-ffbf8c264559 2017-01-18 11:21:18.684 UTC 22503c9f-1a01-45d8-be86-87f2693da327 2017-01-17 12:00:46.28 UTC 7b5136fa-05ac-4488-9f5a-a4163d09605f 2017-01-17 11:07:29.192 UTC 429d9268-b459-41b5-96af-25d13ea1d877 2017-01-17 11:30:52.545 UTC 1cde77e4-b082-4179-becf-be09ea8782ad 2017-01-17 11:36:13.474 UTC 2966558f-03e3-4728-beba-1a8070d22ffe 2017-01-17 12:01:25.133 UTC dfadf90a-c6d7-43f4-a635-fbd4875eea43 2017-01-17 11:59:25.87 UTC e2e07e17-a405-41ba-86f7-d08380350797 2017-01-17 11:14:04.908 UTC 33f8d35f-6ff9-4655-a901-3183183cc6b5 2017-01-17 11:25:25.281 UTC 68d2c0e4-8f02-4a3d-827f-e76cfc811e62 2017-01-18 11:10:51.419 UTC 246cd909-630f-475f-8d26-0108cc38cad7 2017-01-17 11:19:02.258 UTC 231a410b-a2db-4387-ab9e-dc3aa6072753 2017-01-18 10:41:37.515 UTC 1fdcb14b-a2ce-45e7-a740-2c94a284a7da 2017-01-18 11:21:45.684 UTC 4f919c6c-0388-47b2-ba21-dc549e0ac041 2017-01-18 10:37:44.137 UTC 903878da-fc1a-4a67-a970-da9a630e7cd1 2017-01-18 11:10:24.99 UTC e6cfe743-f358-43e6-8a59-b67820816976 2017-01-17 10:57:24.719 UTC labelsNumlabelsToNumFlags00headerList11labelsToNumcolumn0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 157dce46-5f13-4299-b2ce-29fdf6c89d0d python labelsToNum.py %%column%% 1200 1800 column labelsToNum.py true false false UTF-8 false import pandas, argparse # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Missing values processing parser = argparse.ArgumentParser(description = 'This program sets the given column to a numerical order.') parser.add_argument('column', help = 'Name of the column to be processed') classColumn = parser.parse_args().column dataset = pandas.read_csv(TMP_DATASET_FILE) classes = dataset[classColumn].unique() for i in range(len(classes)): dataset.loc[dataset[classColumn] == classes[i], classColumn] = i dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False) print 'Dataset processed correctly!' column column false false false UTF-8 false false false false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Select the labels column: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectLabelsColumnmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity valueList 1 l('text/plain') java.lang.String true message 0 'text/plain' java.lang.String true title 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.SelectWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Labels to numeric value net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelabelsToNumcolumnselectLabelsColumnanswerselectLabelsColumnmessagemessagevalueselectLabelsColumnvalueListheaderListselectLabelsColumntitletitleGeneralvalueTellmessageConcatenate_two_stringsoutputTelltitletitleGeneralvalueConcatenate_two_stringsstring1labelsToNumSTDERRConcatenate_two_stringsstring2labelsToNumSTDOUT 2fa0a274-f248-4d5a-868c-7fad8de8c5a8 2017-01-18 11:01:18.307 UTC 88c2dd97-1662-40e3-a801-5f95bb736aef 2017-01-18 11:29:03.820 UTC edc1b9fe-1fae-48f3-928e-fbd971ab03ce 2017-01-18 15:08:43.44 UTC bc1795cd-b0a7-4e83-aaa7-3b3afb2e4e2b 2017-01-18 10:32:01.288 UTC 05ce6586-ac88-451c-9952-30cd685c08b9 2017-01-17 14:32:14.379 UTC 56dea0e1-188b-478b-928d-557cb30d4fb6 2017-01-18 10:36:47.211 UTC 2b7f2f9b-eddd-49c8-b779-4312b3bb09a3 2017-01-18 10:41:53.685 UTC d57ef759-0f08-4da0-9aef-e3563aa62e6d 2017-01-18 11:01:12.83 UTC 3337b65b-4592-44df-94d6-84758174b7a7 2017-01-18 10:36:10.234 UTC 839eb079-7141-4167-83ba-cac1f28e4c1a 2017-01-18 11:00:57.10 UTC labelsNum 2017-01-17 14:32:09.207 UTC 7597cf85-5d3a-4e3c-9aea-b82e2f628bcb 2017-01-18 14:54:56.531 UTC 8aae29ee-a039-4483-b155-5b94e608d3ca 2017-01-17 14:33:14.320 UTC f40f983c-bd31-47d1-846a-8d331227e880 2017-01-18 10:32:31.184 UTC dropMissingValuesreplaceMissingDropFlags00dropMissingSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> c0caab14-007a-46e8-b732-7051cb2daf25 python replaceMissingWithDrop.py 1200 1800 replaceMissingWithDrop.py true false false UTF-8 false import pandas # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Missing values processing dataset = pandas.read_csv(TMP_DATASET_FILE) dataset.dropna(inplace = True) dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False) print 'Dataset processed correctly!' false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Replacement output information net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageConcatenate_two_stringsoutputTelltitletitlevalueConcatenate_two_stringsstring1dropMissingSTDERRConcatenate_two_stringsstring2dropMissingSTDOUT 03f38345-3979-4768-a1eb-dcaaa103111e 2017-01-17 14:26:30.574 UTC 4015f12b-eebf-4df3-8046-44fbdd62ab56 2017-01-18 10:45:32.699 UTC 65c07b74-eaec-47b4-8338-923758f29863 2017-01-18 11:23:20.446 UTC a13584a1-7010-48fa-afd3-8da26c3f1c93 2017-01-18 10:45:39.250 UTC d8977f5f-17f8-460b-94ef-dd6675742e0e 2017-01-18 11:23:24.344 UTC 7eafd153-e83c-4c18-9c3b-2e8329577389 2017-01-18 14:45:26.242 UTC dropMissingValues 2017-01-17 14:26:27.427 UTC 5bd326ab-f282-4cc3-ad27-0871aca1d8f7 2017-01-18 11:03:38.179 UTC fda57315-4759-4d5b-8b86-e08878b4fdd2 2017-01-17 14:26:42.721 UTC normFeatureScalingnormFeatureFlags00normFeatureSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 89f039e5-78fb-4a05-a2d0-bd33e14a34f4 python featureScaling.py 1200 1800 featureScaling.py true false false UTF-8 false import pandas # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Normalization dataset = pandas.read_csv(TMP_DATASET_FILE) processedDataset = (dataset - dataset.min()) / (dataset.max() - dataset.min()) processedDataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False) print 'Dataset processed correctly!' false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Feature scaling output information net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageConcatenate_two_stringsoutputTelltitletitlevalueConcatenate_two_stringsstring1normFeatureSTDERRConcatenate_two_stringsstring2normFeatureSTDOUT 7b05ab89-4989-412f-966c-7148962526ba 2017-01-18 14:39:39.66 UTC 5532d37b-47a2-4dd1-a6ef-482e4adacdc1 2017-01-17 12:49:30.711 UTC 5d81a6a5-96e5-4348-a3e2-a93d9bf14b52 2017-01-18 11:04:01.266 UTC b4762844-5551-44bb-a3af-42f62adfae8f 2017-01-18 11:25:39.364 UTC normFeatureScaling 2017-01-17 12:39:06.855 UTC 0014a9dc-fba3-45b9-a857-4374392623e4 2017-01-17 12:39:17.588 UTC 4e8b3e6f-bac6-4b34-81d3-1e183d840e78 2017-01-17 12:51:03.775 UTC 07a77734-9b25-44f2-97b1-039f26a1ab03 2017-01-18 14:38:39.602 UTC 1e71953c-5074-473f-a3ba-8de399709cdd 2017-01-17 12:39:27.838 UTC e3e08062-3114-4f9e-9d32-aacacce73527 2017-01-18 10:45:03.49 UTC 733db518-e38f-4666-80c0-a761368c7bb8 2017-01-18 10:45:09.740 UTC 75fb1e3e-187a-4e0d-8046-335493529c7b 2017-01-18 11:24:05.236 UTC normStandardnormStandardFlags00normStandardizationSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> ee9902b7-c136-459b-bf66-ff482acb3c4d python standardization.py 1200 1800 standardization.py true false false UTF-8 false import pandas # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Normalization dataset = pandas.read_csv(TMP_DATASET_FILE) processedDataset = (dataset - dataset.mean()) / dataset.std() processedDataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False) print 'Dataset processed correctly!' false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Standardization output information net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageConcatenate_two_stringsoutputTelltitletitlevalueConcatenate_two_stringsstring1normStandardizationSTDERRConcatenate_two_stringsstring2normStandardizationSTDOUT 2d617b74-9c66-4c91-9263-4b9a451138b6 2017-01-18 11:25:25.612 UTC f5dc05d1-42d7-46b2-b7eb-b14a148b5b2f 2017-01-18 11:24:36.900 UTC 3b78dfcd-1927-4774-b718-30bfe437e1e6 2017-01-17 12:42:03.166 UTC 60e73cbe-cac7-450f-8dbf-cc8ecd43deee 2017-01-17 12:41:53.633 UTC 241dd1aa-043b-4887-9209-aab78027c9be 2017-01-17 12:50:24.159 UTC 0a8a428f-8e89-4873-8349-57227b005558 2017-01-17 12:52:41.815 UTC 3e1037af-cb7f-43d3-9ac7-b76132c8b89b 2017-01-18 14:40:30.298 UTC normStandard 2017-01-17 12:41:49.651 UTC ea165dfd-aa0f-4815-a57d-58141e9e80a0 2017-01-18 10:43:44.778 UTC 89e49c6e-5121-4ee3-b84a-4bc31f0cde71 2017-01-18 11:04:28.71 UTC saveFilesaveFlags00saveNewFilefileName0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 369f8a7e-1a82-47c4-9895-eba935357d87 python saveNewFile.py %%fileName%% 1200 1800 fileName saveNewFile.py true false false UTF-8 false import pandas, argparse # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' NEW_FILE_PATH = '/home/brayan/Taverna/' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Main program parser = argparse.ArgumentParser(description = 'This program saves the loaded dataset in a new file.') parser.add_argument('fileName', help = 'Name of the new file') fileName = parser.parse_args().fileName dataset = pandas.read_csv(TMP_DATASET_FILE) dataset.to_csv(NEW_FILE_PATH + fileName, encoding = 'utf-8', index = False) print 'Dataset saved correctly at', NEW_FILE_PATH fileName fileName false false false UTF-8 false false false false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Write the new file's name: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokefirstQuotestring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokefirstQuoteSignvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity ' net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelastQuotestring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelastQuoteSignvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity ' net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeaskFileNamemessage0title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.AskWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Save new file net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesaveNewFilefileNamelastQuoteoutputfirstQuotestring1firstQuoteSignvaluefirstQuotestring2askFileNameanswerlastQuotestring1firstQuoteoutputlastQuotestring2lastQuoteSignvalueaskFileNamemessagemessagevalueaskFileNametitletitleGeneralvalueTellmessageConcatenate_two_stringsoutputTelltitletitleGeneralvalueConcatenate_two_stringsstring1saveNewFileSTDERRConcatenate_two_stringsstring2saveNewFileSTDOUT saveFile 2017-01-17 14:39:32.908 UTC 20005879-cca7-40bb-8296-224fe1ce4c9c 2017-01-17 14:45:45.516 UTC 9630aca9-43e9-4888-afe1-e6984e241289 2017-01-18 11:26:28.573 UTC 270f7858-4166-45cd-94e9-bc418c77d842 2017-01-18 10:47:03.666 UTC 52bb89cb-58cb-4794-8bc4-13de81530d94 2017-01-18 11:05:43.731 UTC ef01b1c4-38ef-4871-b69e-22c2a7bd9ea5 2017-01-18 15:07:40.957 UTC ccd9137a-b699-4728-8847-6e9155570862 2017-01-18 11:06:03.614 UTC 4e2c183e-0534-4bdc-b680-8fb2cca43cf5 2017-01-17 14:43:13.296 UTC d897f094-4533-4b5b-ad9d-1ed88cd5d763 2017-01-17 14:49:10.797 UTC 17dacc60-8137-4673-a297-8458c623f2ca 2017-01-18 10:46:21.393 UTC 5e6a198b-89aa-4de9-8b48-0dda9960b24d 2017-01-18 10:46:56.113 UTC ea48b3d5-f20c-4bbd-b309-a241c4fccd78 2017-01-18 10:46:12.314 UTC 66c543ae-f336-4c5e-89d3-9a8faebe2e5c 2017-01-18 14:44:26.811 UTC 0f571c4a-0efb-474e-90d2-752d2c63472d 2017-01-17 14:41:11.107 UTC a92cd78e-8782-4ac3-b2db-aa7a21257ffc 2017-01-17 14:39:37.456 UTC a7ae23b7-966f-4a92-b12b-16e161f021f0 2017-01-17 14:51:01.780 UTC f24d51f1-a4ca-4e8c-9812-2b9bc3cab1f7 2017-01-18 14:51:23.987 UTC 59609eb9-5546-4cbb-915f-fbf63c5a82e5 2017-01-18 11:26:23.958 UTC e4fe1ffd-e747-49f3-920f-906bb5a7325b 2017-01-18 14:44:13.395 UTC plotHistogramplotHistogramFlags00headerList11plotHistogramcolumn0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local_3 <?xml version="1.0" encoding="UTF-8"?> <localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 178d1624-9188-45eb-80b5-71852fcce2ee python plotHistogram.py %%column%% 1200 1800 column plotHistogram.py true false false UTF-8 false import pandas, argparse import matplotlib.pyplot as pyplot # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Constant definition TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset' # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - # Plotting parser = argparse.ArgumentParser(description = 'This program plots the histogram of the given column') parser.add_argument('column', help = 'Name of the column to be plotted') selectedColumn = parser.parse_args().column dataset = pandas.read_csv(TMP_DATASET_FILE) try: dataset[selectedColumn].dropna().plot(kind = 'hist', xticks = dataset[selectedColumn].dropna().unique(), bins = dataset[selectedColumn].dropna().unique().size) pyplot.xlabel(selectedColumn) pyplot.title(selectedColumn + ' distribution') pyplot.grid(True) pyplot.show() except Exception as e: print 'Unexpected error:', str(e) print 'Dataset processed correctly!' column column false false false UTF-8 false false false false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Select the column that will be plotted: net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTelltitle0message0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity title 0 'text/plain' java.lang.String true message 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.TellWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectColumnmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity valueList 1 l('text/plain') java.lang.String true message 0 'text/plain' java.lang.String true title 0 'text/plain' java.lang.String true answer 0 'text/plain' 0 workflow net.sourceforge.taverna.scuflworkers.ui.SelectWorker net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Histogram output information net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity string1 0 'text/plain' java.lang.String true string2 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringConcat net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleColumnvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity Histogram column selector net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotHistogramcolumnselectColumnanswerTelltitletitlevalueTellmessageConcatenate_two_stringsoutputselectColumnmessagemessagevalueselectColumnvalueListheaderListselectColumntitletitleColumnvalueConcatenate_two_stringsstring1plotHistogramSTDERRConcatenate_two_stringsstring2plotHistogramSTDOUT dacfdbbf-8ac1-4941-b0fc-a83d7d2d4888 2017-01-18 14:50:34.251 UTC 8bcd45de-5031-428f-9fc6-e03797fdec03 2017-01-18 10:43:12.737 UTC e6cfe743-f358-43e6-8a59-b67820816976 2017-01-17 10:57:24.719 UTC 33f8d35f-6ff9-4655-a901-3183183cc6b5 2017-01-17 11:25:25.281 UTC 1c368b09-ee2e-4b31-a918-2a91f174e66c 2017-01-18 10:38:15.730 UTC b55c48b2-ed13-4c7a-ab15-7b6ea7b2391f 2017-01-18 15:06:35.544 UTC 7b5136fa-05ac-4488-9f5a-a4163d09605f 2017-01-17 11:07:29.192 UTC 2944cb50-5e54-44cb-b60c-05e5324e2735 2017-01-18 10:38:42.265 UTC 9f7989b8-6a3e-45d3-8920-c9cfa420947d 2017-01-18 11:08:34.557 UTC plotHistogram 2017-01-17 10:56:45.598 UTC 96d7b727-20d3-4035-a2e1-88a40c3d101a 2017-01-17 11:07:00.664 UTC 9a1156de-defa-4313-a290-0cd61f0ee3b6 2017-01-17 11:51:12.22 UTC e2e07e17-a405-41ba-86f7-d08380350797 2017-01-17 11:14:04.908 UTC ba8a6ed4-8916-44f6-8dda-87c7a423ac38 2017-01-17 11:39:52.554 UTC 8496a21f-666d-4a1e-96ea-3d1bf0453c7b 2017-01-18 11:13:18.507 UTC 7b6e59c8-6428-4595-b328-cb8d0fa1bcb7 2017-01-18 10:42:59.529 UTC 1cde77e4-b082-4179-becf-be09ea8782ad 2017-01-17 11:36:13.474 UTC 0adcfe92-b0b4-48ca-82c0-58bda0b63ea7 2017-01-18 11:08:26.467 UTC 8adbe06e-bfe1-45d4-829f-2c2f4bd9401b 2017-01-18 10:38:03.587 UTC 631844da-a909-4fdc-a184-7a54d68e690b 2017-01-17 10:57:13.506 UTC 429d9268-b459-41b5-96af-25d13ea1d877 2017-01-17 11:30:52.545 UTC 93ff1fe6-1dcc-4bcd-9253-0d326fbcc850 2017-01-17 11:39:43.154 UTC 246cd909-630f-475f-8d26-0108cc38cad7 2017-01-17 11:19:02.258 UTC e79d65e4-fc91-4ae5-9ed3-5d2024377313 2017-01-18 11:13:13.534 UTC 5cb20341-91c7-4e5c-a565-007915db8b38 2017-01-18 14:46:58.971 UTC 21579554-7044-4d9c-8633-79ba218f9c25 2017-01-18 11:27:07.30 UTC