Data_explorationfileName00
'/path/to/dataset'
2017-01-18 10:02:22.14 UTC
Path to the dataset file that will be processed. The path must be enclosed in single quotes.
2017-01-18 10:02:14.662 UTC
hasHeader00
If the dataset includes a header row, indicate it by writing --header, as in the example. Otherwise, leave this input empty.
2017-01-18 10:03:04.977 UTC
--header
2017-01-18 10:03:10.111 UTC
lastAction0loadDatasetfileName0hasHeader0net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
b8d947e9-8d10-459a-8b63-3e10b06648f5
python loadDataset.py %%fileName%% %%hasHeader%%
1200
1800
fileName
hasHeader
loadDataset.py
true
false
false
UTF-8
false
import pandas, argparse
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
# Files written by this script: a CSV copy of the dataset and its column names.
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
TMP_HEADER_FILE = '/home/brayan/Taverna/tmpHeader'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Main program
# Command line: one positional dataset path plus an optional --header flag.
parser = argparse.ArgumentParser(description = 'This module preloads the dataset in auxiliare files for the execution.')
parser.add_argument('filename', help = 'Name of the file to be loaded')
parser.add_argument('--header', help = 'If indicated, the file has a header row', action = 'store_true')
# NOTE(review): parse_args() is called twice; both calls parse the same command line.
fileName = parser.parse_args().filename
header = parser.parse_args().header
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Data read
# NOTE(review): leading indentation is missing in this copy of the script, so which of
# the statements after "else:" belong to that branch cannot be confirmed from here.
if header:
# With --header, the file is read with pandas' default header handling.
dataset = pandas.read_csv(fileName)
else:
# Without --header, header = None makes pandas treat every row as data.
dataset = pandas.read_csv(fileName, header = None)
dataset.columns = map(str, range(dataset.shape[1])) # New header of ints as str
# Run pandas.to_numeric over the columns; errors = 'coerce' turns unparseable values into NaN.
dataset = dataset.apply(pandas.to_numeric, errors = 'coerce')
# Write the dataset (without the index column) and the comma-joined column names.
dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False)
with open(TMP_HEADER_FILE, 'w') as headerFile:
headerFile.write(','.join(dataset.columns))
fileName
fileName
false
false
false
UTF-8
false
false
false
hasHeader
hasHeader
false
false
false
UTF-8
false
false
false
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemainLooplastAction00net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Loop
<activity xmlns="http://taverna.sf.net/2008/xml/t2flow"><raven><group>net.sf.taverna.t2.activities</group><artifact>beanshell-activity</artifact><version>1.5</version></raven><class>net.sf.taverna.t2.activities.beanshell.BeanshellActivity</class><inputMap /><outputMap /><configBean encoding="xstream"><net.sf.taverna.t2.activities.beanshell.BeanshellActivityConfigurationBean xmlns="">
<inputs>
<net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityInputPortDefinitionBean>
<name>lastAction</name>
<depth>0</depth>
<translatedElementType>java.lang.String</translatedElementType>
<allowsLiteralValues>true</allowsLiteralValues>
</net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityInputPortDefinitionBean>
</inputs>
<outputs>
<net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityOutputPortDefinitionBean>
<name>loop</name>
<depth>0</depth>
<granularDepth>0</granularDepth>
</net.sf.taverna.t2.workflowmodel.processor.activity.config.ActivityOutputPortDefinitionBean>
</outputs>
<classLoaderSharing>workflow</classLoaderSharing>
<localDependencies />
<artifactDependencies />
<script>loop = "" + ! lastAction.equals("Quit"); // text form of the negated comparison of lastAction with Quit
if ("true".matches(loop)) { // loop is used as the regex here, so this holds only when loop is the text true
Thread.sleep(500); // pause for 500 ms in that case
}</script>
<dependencies />
</net.sf.taverna.t2.activities.beanshell.BeanshellActivityConfigurationBean></configBean><annotations /></activity>
true
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedeleteTmpnet.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
f9659a22-2a34-4fbe-a01a-b503291d0d53
python deleteTmp.py
1200
1800
deleteTmp.py
true
false
false
UTF-8
false
import os
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
# Temporary files to delete.
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
TMP_HEADER_FILE = '/home/brayan/Taverna/tmpHeader'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Main program
# Each file is removed in its own try block: a failure on one file (for example
# because it does not exist) must not prevent the removal of the other one.
for tmpFile in (TMP_DATASET_FILE, TMP_HEADER_FILE):
    try:
        os.remove(tmpFile)
    except OSError:
        # Best-effort cleanup: a file that cannot be removed is ignored.
        pass
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeloadDatasetfileNameloadDatasethasHeaderlastAction
Data exploration
2017-01-18 09:58:41.114 UTC
a08194b1-8776-4586-8dea-43e250e05a67
2017-01-18 14:32:59.738 UTC
750c66ac-6c0d-4550-9c5a-804c0b599657
2017-01-17 14:27:46.422 UTC
8fc5c71c-42fb-4689-bf3b-3822894134f2
2017-01-18 10:50:10.5 UTC
c20805f5-3774-46ef-ad6a-021df3173359
2017-01-18 10:50:41.554 UTC
4e4a6eaa-d59b-46ae-8d29-7b13f8ba93c0
2017-01-17 11:00:10.327 UTC
5b8f3dbb-13af-4d5a-ac68-a50731814c1b
2017-01-17 14:39:15.97 UTC
23b648fb-e3f4-4a32-9630-fe0a708280ca
2017-01-18 14:40:47.958 UTC
1a1d166d-4acb-4342-96a6-82e477b8dff3
2017-01-18 10:00:52.240 UTC
33a670e3-1d84-4400-aa69-9cd92dc57a87
2017-01-18 14:44:32.531 UTC
08f8b9d7-a5b9-49db-8c6c-0d426ab0e6e3
2017-01-18 11:25:19.334 UTC
d962dccd-7e97-450b-b188-5be2fa60d2ba
2017-01-18 11:10:57.837 UTC
2fcd1019-ea0e-400d-9bb6-2a256f6d45da
2017-01-17 14:33:30.263 UTC
ee8f829d-e2e7-4ba3-a549-5abd06714128
2017-01-18 10:32:59.129 UTC
dd178ad6-80a0-4a75-bf07-cd93689953c6
2017-01-18 11:04:41.697 UTC
fa5e3094-b81b-4737-93dc-6993b3129387
2017-01-18 14:55:00.275 UTC
9ed03c73-0c1c-45ce-8c27-59d1c6c3c92a
2017-01-18 15:06:38.545 UTC
f07e2fd6-5627-4396-9513-8abe038b9ac6
2017-01-17 11:42:28.948 UTC
182219e2-0aec-44a4-8ed0-6ce720904e30
2017-01-17 14:49:30.981 UTC
d21fd703-84a8-4448-a7f0-7deee5bca364
2017-01-18 10:37:54.364 UTC
603042f0-dd99-43e7-b26f-40e37aeda228
2017-01-18 15:12:51.359 UTC
31b5ba93-76bb-4b3f-a69f-05dc353b58b1
2017-01-17 11:19:05.961 UTC
54679c07-7a47-4627-ab1a-a4719cc1b798
2017-01-17 11:15:36.33 UTC
46a10f58-d0f1-4231-a2ce-dab7b38f90bf
2017-01-18 10:47:18.645 UTC
a877d377-0492-4abe-b04c-ed69277c8b71
2017-01-18 11:26:36.726 UTC
212188ff-ee6f-4000-8f78-136480fa1be3
2017-01-18 14:41:39.271 UTC
b4c10c24-7212-43a9-ad85-ed94f1771f26
2017-01-18 10:59:36.906 UTC
7650d310-4872-49fe-a1e9-fc44d4514e68
2017-01-17 11:40:05.159 UTC
fd4794e6-d400-4b95-a08c-225f482fa3b7
2017-01-17 12:51:05.993 UTC
769d154d-823d-41f1-a924-697c9485b348
2017-01-18 14:40:34.776 UTC
9ebdb8b0-367c-4c42-9469-74ba2750267b
2017-01-17 14:36:03.735 UTC
be9d7dcd-e9da-4e4b-9d1e-05b828d0221c
2017-01-17 14:23:40.766 UTC
7a933706-41a5-429f-9a4a-54a26cf8d547
2017-01-18 11:14:57.364 UTC
270ecfae-3364-4166-9736-6f159c6306d8
2017-01-18 14:51:27.161 UTC
3a96a913-379d-4bc5-be8f-6003a5b4ad18
2017-01-17 15:16:31.869 UTC
6333fe59-9a12-4491-b06e-bcddaae7e762
2017-01-18 14:50:08.878 UTC
f19ea17a-6c83-405a-9e65-c46738f428cd
2017-01-17 14:41:20.769 UTC
8d785c1c-1207-4137-9be0-36be21063d58
2017-01-18 15:08:45.966 UTC
1ad93dd3-1f29-42c2-be90-2db9af258630
2017-01-18 10:03:12.439 UTC
d625b610-4e94-4528-a784-8255e9209939
2017-01-17 15:00:32.298 UTC
b0a168ed-116b-4937-8789-a12ffb23fcb1
2017-01-18 11:25:29.539 UTC
This workflow allows one to explore and process a given dataset file. The possible actions are:
- Visualization (Histogram, Scatter plot)
- Normalization (Feature scaling, Standardization)
- Column drop
- Deal with missing values (Use mean as a replace, Drop samples)
- Cast to numeric labels
- Save the processed file
2017-01-18 10:00:50.413 UTC
c9e10585-125d-4f5e-8039-81b5d21a6303
2017-01-17 11:43:13.302 UTC
5d371e08-4635-4476-a34f-e3dfc7d342a2
2017-01-17 14:55:44.865 UTC
7073f46f-db3c-4a1e-8bb0-27771c48a5e2
2017-01-19 11:32:22.525 UTC
52496cad-e0dd-438a-b851-109b9fa18e9a
2017-01-18 11:03:45.227 UTC
fc199911-453d-40a1-8716-820de3369259
2017-01-18 11:25:44.227 UTC
c7157685-da0a-42d0-a56e-d65d0d8cfeb1
2017-01-17 14:22:37.937 UTC
37c89f41-15c3-43b3-b3c0-4233edbaeee0
2017-01-18 14:47:01.466 UTC
3066d118-9a67-4834-ba12-cd7115980d4a
2017-01-17 14:51:17.575 UTC
abc67d94-5cbf-4a88-b138-38fee66509f2
2017-01-17 11:17:20.340 UTC
ed310273-8908-48b2-8d1a-37dcc9a53f0d
2017-01-18 10:50:04.603 UTC
Brayan Stiven Zapata Impatá
2017-01-18 09:58:37.467 UTC
60326ead-05e2-4d87-a48c-4fec527a8524
2017-01-18 11:01:24.418 UTC
00e8a9d4-3a90-4af8-9bf5-f4d2e7dd0028
2017-01-17 15:02:42.186 UTC
763e56a8-6a8f-4434-a087-9ec1ce7f9706
2017-01-18 11:25:31.115 UTC
847bac2f-c371-4520-9582-a474125d3a04
2017-01-17 14:26:48.406 UTC
fd544e0b-c391-4240-a7c0-9754461d309c
2017-01-18 11:29:09.486 UTC
a5a57b61-d206-4d48-9cb8-11695b26175b
2017-01-17 11:01:35.239 UTC
f8623af3-42ec-4669-9c22-b520e53c4c33
2017-01-18 10:45:45.658 UTC
7965768d-92db-4a3a-8d61-85c560f67b46
2017-01-18 11:27:40.561 UTC
5f6d717f-b374-4489-b7e8-ac917c40565d
2017-01-18 15:18:40.21 UTC
78fa0bdc-5c5a-457c-9d59-41779648b354
2017-01-18 15:09:38.732 UTC
d8ef593e-e91f-4c7f-865c-f3b9870a2843
2017-01-18 10:45:15.970 UTC
d13bee50-d0b2-4294-bbbc-79bfe3de39a7
2017-01-18 11:13:25.868 UTC
d12de995-37a8-4c03-a3b4-eaede95b607d
2017-01-18 11:27:14.688 UTC
3e1af8b1-eca0-4bf3-b937-afdd2379c0dd
2017-01-17 14:45:52.753 UTC
662bd6e5-72f9-4e46-9fc4-190260389dbd
2017-01-17 13:23:29.67 UTC
778583c2-5f8b-4a0a-a776-70ffa37c4f6a
2017-01-17 14:31:48.376 UTC
4f04f52d-640e-43fe-895f-896195f166de
2017-01-17 12:52:44.280 UTC
16f8903a-9585-404a-b48d-926ad89db725
2017-01-18 11:18:27.716 UTC
24e8a898-59c9-47fc-92bc-ec428bd76fc7
2017-01-17 12:03:05.972 UTC
7ce88652-73fa-422a-bd82-2cef9166ed36
2017-01-18 11:21:54.852 UTC
48fe90af-f4ef-4adb-8524-4423b48efc82
2017-01-18 11:04:06.972 UTC
129c2ac5-d69c-4f8b-9dc4-5c4092b0c2bf
2017-01-17 11:25:48.52 UTC
8bceeea7-2c69-4c79-90a0-0f8d79a23b62
2017-01-18 15:05:09.114 UTC
4160f2b6-361d-49df-a342-9dac63bcfffc
2017-01-17 11:51:16.520 UTC
5927a373-ec5e-469e-9075-823c0db51e13
2017-01-18 14:56:49.823 UTC
79d242b4-cf87-4595-b83f-84a7e12e6b73
2017-01-17 14:43:20.27 UTC
b9720331-27f7-40fd-9459-7793f0674a87
2017-01-17 12:59:34.288 UTC
d2d43be7-cb8a-40c7-bf80-37306068cda2
2017-01-17 10:58:00.842 UTC
5a3fa5c7-6279-4276-8baf-d79bbd2e95e6
2017-01-18 15:10:05.813 UTC
d2525c96-01b8-4e71-9cb6-eee422ec0939
2017-01-18 11:06:26.957 UTC
9fbbc6dc-3866-4293-8710-161df68c64e9
2017-01-17 12:45:07.39 UTC
0aa6afe2-3e8e-44ff-b532-dd3c41f65b60
2017-01-18 14:39:42.40 UTC
2c39ca07-1b57-4209-a830-4f47dae6095c
2017-01-18 11:15:47.792 UTC
acb11776-3830-4a02-9e11-df134122fef7
2017-01-18 14:53:29.684 UTC
f1214adc-f25e-4df4-a834-cf02dfb49c85
2017-01-18 11:28:17.907 UTC
9f6578b3-8913-4295-8758-5d08cc4cb41e
2017-01-18 11:03:21.451 UTC
797b8e8e-8d9b-4482-8545-b73c1d1466f8
2017-01-18 10:43:19.449 UTC
4e83404a-ef5a-454b-8d10-363158f2e4c1
2017-01-18 15:19:02.877 UTC
f1cad094-807b-453a-bdb0-e96093b4a698
2017-01-18 10:38:56.825 UTC
7d79cc09-2d21-4a6e-af3d-cc30751d2322
2017-01-18 11:08:45.404 UTC
08479ded-4dd9-4f04-83bc-ab8ffa2667e9
2017-01-17 11:14:44.208 UTC
467f5c53-36b4-4bff-8111-18d9ce8db694
2017-01-18 14:45:32.17 UTC
14621cec-d958-4196-b185-fe2a2c73982a
2017-01-18 15:01:32.656 UTC
baccf983-da11-447a-9712-e15c07f6b9f6
2017-01-17 15:01:53.609 UTC
a64c5fc0-ca90-43d2-9ccb-10a1ad2bdf05
2017-01-18 11:02:47.107 UTC
ab3c4b0e-1550-4b4f-9085-de2007f848ef
2017-01-17 15:19:22.964 UTC
6d278d6a-5c56-4392-ad24-e69c28f7cc24
2017-01-18 10:56:17.650 UTC
c58912bf-fcc4-43fc-9bd4-988efe28bf59
2017-01-17 12:55:48.432 UTC
8a032e6f-f44d-4e91-8ae4-0c3b9d73a848
2017-01-17 13:29:05.819 UTC
beaf1545-9f7c-41d7-b0fd-aaed080d6609
2017-01-18 10:43:55.82 UTC
edd58035-4796-4ee7-8d8b-3818e42360c2
2017-01-18 14:50:37.377 UTC
56dfbcf0-0743-46bb-a3a7-f1173a859666
2017-01-17 12:47:11.15 UTC
8d6d5dd2-3a69-41a7-ac9e-db5d6fd4e372
2017-01-17 12:46:09.335 UTC
2ebb2c1f-7880-4e7f-8120-bc86c9805c61
2017-01-17 12:40:02.247 UTC
c621ad59-3ef1-4106-ac92-1177f3d6161d
2017-01-17 11:17:52.426 UTC
14a1b2f1-2560-49ef-afbe-36c8da8a75a4
2017-01-17 11:48:21.52 UTC
95130d18-98a9-451d-b115-9d68d0840d36
2017-01-17 13:01:56.568 UTC
5d0648e7-caa5-4c17-a5a8-055780f8264b
2017-01-18 14:38:55.452 UTC
6241d0ae-f0ae-43d0-9c28-c69fd02719d5
2017-01-18 15:07:57.388 UTC
3d2a83dc-4972-4330-85dc-72dbdbcb243d
2017-01-18 11:26:34.624 UTC
533aeb3c-1a31-451c-8d66-ebc1c0f8c4c8
2017-01-17 11:07:03.664 UTC
41f1c906-26b4-4e0b-9efc-39157dc5999e
2017-01-17 14:54:44.153 UTC
fa5e5e9c-5909-4dc7-9f92-d8157cd94093
2017-01-18 10:47:48.522 UTC
8e7fc9d0-21fb-472a-820b-8f52aa3caaa2
2017-01-17 14:33:54.425 UTC
replacereplaceMissinMeanFlags00replaceMissingMeanSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
b4b78e6e-7765-4bfc-ad88-d6d6963a3696
python replaceMissingWithMean.py
1200
1800
replaceMissingWithMean.py
true
false
false
UTF-8
false
import pandas
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
# Dataset file that is read, processed and overwritten in place.
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Missing values processing
dataset = pandas.read_csv(TMP_DATASET_FILE)
# Fill every missing value with the mean of its column. numeric_only = True restricts
# the means to numeric columns, so a non-numeric column does not raise on recent
# pandas releases; such columns are simply left unfilled.
dataset.fillna(dataset.mean(numeric_only = True), inplace = True)
dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False)
# Parenthesised single-argument form prints the same text under Python 2 and Python 3.
print('Dataset processed correctly!')
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Replacement by mean values output information
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageTelltitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
9d5df8a4-b5c5-443a-a2a4-d069c6a3e8f4
2017-01-18 11:25:10.44 UTC
01433a41-e4a2-489d-aaa3-6184984deda2
2017-01-17 13:22:49.505 UTC
593ffd29-f947-40f9-afca-011d97ca85d1
2017-01-18 10:47:32.361 UTC
fd9118ac-5531-4faa-abd5-2567a526c364
2017-01-17 13:22:40.208 UTC
da01e85c-67a8-4d24-b717-f48dc6f9d3f6
2017-01-18 14:41:36.138 UTC
f43744da-e1f5-498c-a35e-aafae63e95b6
2017-01-18 10:47:39.329 UTC
replace
2017-01-17 13:22:37.159 UTC
32aa66f0-4b84-496a-bb8b-2ccc8f0a29ee
2017-01-18 11:25:13.749 UTC
ba481226-9f8a-4c04-b93c-f720204d3c65
2017-01-18 11:03:12.53 UTC
mainLooplastAction0actionOptionsvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Plot histogram,Plot scatter,Normalize data by feature scaling,Normalize data by standardization,Drop feature,Replace missing values with feature mean,Drop samples with missing values,Convert to numeric labels,Save to new file,Quit
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokecheckActionAction0plotHistogramFlags11plotScatterFlags11normFeatureFlags11normStandardFlags11dropFeatureFlags11replaceMissingMeanFlags11replaceMissingDropFlags11labelsToNumFlags11saveFlags11
This service checks if the condition is "true" and if so outputs a value in the pass_flags list and
leaves the fail_flags empty. If the condition is not true then the service outputs a value in the
fail_flags list and leaves the pass_flags empty.
2011-11-15 09:59:22.100 UTC
net.sf.taverna.t2.activitiesbeanshell-activity1.5net.sf.taverna.t2.activities.beanshell.BeanshellActivity
Action
0
text/plain
java.lang.String
true
plotHistogramFlags
1
1
plotScatterFlags
1
1
normFeatureFlags
1
1
normStandardFlags
1
1
dropFeatureFlags
1
1
replaceMissingMeanFlags
1
1
replaceMissingDropFlags
1
1
labelsToNumFlags
1
1
saveFlags
1
1
workflow
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Loop
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedropFeaturedropFeatureFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedropMissingValuesreplaceMissingDropFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelabelsNumlabelsToNumFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Select an action to perform over the dataset:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokenormFeatureScalingnormFeatureFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokenormStandardnormStandardFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotHistogramplotHistogramFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotScatterplotScatterFlags0headerList1net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesplitActionsToListregex0string0split11net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string
0
'text/plain'
java.lang.String
true
regex
0
'text/plain'
java.lang.String
true
split
1
l('text/plain')
1
workflow
org.embl.ebi.escience.scuflworkers.java.SplitByRegex
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokeregexvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
,
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokereplaceMissingMeanreplaceMissinMeanFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesaveFilesaveFlags0net.sf.taverna.t2.activitiesdataflow-activity1.5net.sf.taverna.t2.activities.dataflow.DataflowActivitynet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesplitHeaderToListstring0regex0split11net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string
0
'text/plain'
java.lang.String
true
regex
0
'text/plain'
java.lang.String
true
split
1
l('text/plain')
1
workflow
org.embl.ebi.escience.scuflworkers.java.SplitByRegex
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokereadHeaderFilefileurl0filecontents00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
fileurl
0
'text/plain'
java.lang.String
true
encoding
0
'text/plain'
java.lang.String
true
filecontents
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.io.TextFileReader
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeheaderSeparatorvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
,
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeheaderFilevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
/home/brayan/Taverna/tmpHeader
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectActionvalueList1message0title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
valueList
1
l('text/plain')
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
title
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.SelectWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedescribeDatasetSTDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
554a5d5d-ca88-496b-add2-6e905c8b79ba
python describeDataset.py
1200
1800
describeDataset.py
true
false
false
UTF-8
false
import pandas
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
# Working copy of the dataset; the other scripts of this workflow (e.g.
# dropFeature.py) read and rewrite the same file.
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Dataset description
# Prints the summary produced by DataFrame.describe() on standard output.
dataset = pandas.read_csv(TMP_DATASET_FILE)
# Parenthesised single-argument print: same output under Python 2 and Python 3.
print(dataset.describe())
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokecomposeMessagestring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
UserNameHere
2017-01-18 11:18:16.222 UTC
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Data exploration and processing
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokecheckActionActiondropFeaturedropFeatureFlagsdropFeatureheaderListdropMissingValuesreplaceMissingDropFlagslabelsNumlabelsToNumFlagslabelsNumheaderListnormFeatureScalingnormFeatureFlagsnormStandardnormStandardFlagsplotHistogramplotHistogramFlagsplotHistogramheaderListplotScatterplotScatterFlagsplotScatterheaderListsplitActionsToListregexsplitActionsToListstringreplaceMissingMeanreplaceMissinMeanFlagssaveFilesaveFlagssplitHeaderToListstringsplitHeaderToListregexreadHeaderFilefileurlselectActionvalueListselectActionmessageselectActiontitlecomposeMessagestring1composeMessagestring2lastAction
43e71d15-64ee-455f-a942-ec7d376eb5f3
2017-01-17 15:12:11.201 UTC
7adb8f4b-59bc-487c-bd1c-de0b783a74be
2017-01-18 11:17:55.92 UTC
dcd71717-0429-4337-a923-2da00b80aa82
2017-01-18 11:27:13.853 UTC
0be853bd-34c2-4a00-b0bd-1dd7232eccc1
2017-01-18 14:40:32.333 UTC
7fe3f88f-e8fb-4c9d-9923-46b86b7f5902
2017-01-18 11:21:48.141 UTC
ccf2a5af-d0bc-4c21-b98c-7fae41cb93ef
2017-01-18 11:28:17.88 UTC
c1ca3818-eb32-4a81-883b-9a66e5896c45
2017-01-18 11:13:23.148 UTC
8936335e-49b4-415a-8bf3-057116984b2e
2017-01-18 11:08:37.894 UTC
af026ae8-7dbf-47a0-ab97-86e86e54c5cb
2017-01-18 15:07:56.230 UTC
This workflow asks for an action and then calls the nested workflow that performs the desired operation over the dataset.
2017-01-18 10:50:35.629 UTC
mainLoop
2017-01-17 14:57:17.562 UTC
13f4303c-d79a-4844-97a6-d082848300d4
2017-01-18 11:27:37.692 UTC
3208a966-12cb-4ba0-b182-8f93a176b157
2017-01-18 14:56:43.676 UTC
Brayan Stiven Zapata Impatá
2017-01-18 10:50:03.112 UTC
87319bbc-be04-41bf-a0ca-83d10ebe0410
2017-01-18 10:35:32.666 UTC
98dd5e32-c8bc-4093-a9db-41c8d7ac27ad
2017-01-17 15:13:24.833 UTC
d1b1200f-be93-4c0e-ab3c-0e1d5e4fd653
2017-01-18 15:10:04.526 UTC
548fd807-1f6a-422d-add3-b94f2b0e39b5
2017-01-18 14:53:26.449 UTC
f79182e9-f75e-43f0-a2c6-c5a97726ab4e
2017-01-18 15:09:37.618 UTC
94b1b2e4-45a7-4e3a-9559-bad4b3f5a215
2017-01-18 14:41:36.875 UTC
b20f18f7-590f-4448-933c-c65633987cc7
2017-01-18 11:02:45.52 UTC
963a5560-4653-4853-8fda-6cdd447a3885
2017-01-18 14:38:49.962 UTC
d3f74f75-8031-4d5b-8e05-2c4175797b2b
2017-01-18 11:04:32.786 UTC
f09efb08-88d4-4838-a225-62d180e2a77a
2017-01-18 11:03:40.18 UTC
2f23c46b-44bc-4df4-8846-bbedacc01115
2017-01-18 11:10:55.227 UTC
ecbc62e7-d69f-4f78-9af3-7c340ddbb1d2
2017-01-18 10:45:12.353 UTC
218d78c2-a9e9-42df-83c5-be291e21de17
2017-01-18 10:42:03.241 UTC
b4256eee-ea8f-4a36-8cfa-1f871d457fa3
2017-01-18 10:37:50.978 UTC
52ca9dee-1bf1-42c5-b070-532835fc3b1d
2017-01-18 10:38:54.521 UTC
7261f66f-1e90-4c4c-9407-88ca2c210142
2017-01-18 11:01:22.170 UTC
5cd04d78-2109-4240-a4f9-7dda49694c0a
2017-01-18 14:51:24.92 UTC
f1371e2f-b440-47f8-bba8-97d38df76be4
2017-01-18 11:25:28.580 UTC
f9c65e42-6687-467a-b588-ef045ef0e878
2017-01-18 11:24:06.429 UTC
64eba6e5-96ee-4a2c-9a02-ae730efe056b
2017-01-18 11:25:42.7 UTC
76283317-94ad-4b76-b9bc-9b82bb511fee
2017-01-17 15:15:57.234 UTC
9336f07e-3118-48b1-99cd-ba0440b200d0
2017-01-18 14:50:34.921 UTC
d454118b-cfcf-47cf-9f7f-04557331c670
2017-01-18 11:24:42.468 UTC
7eb375be-7450-4055-be8c-ef5bcc0bdf95
2017-01-18 11:29:08.664 UTC
136ecad1-c9d8-4f57-8144-2f95e05acbb5
2017-01-18 14:39:39.968 UTC
3447dd75-0f1e-4d69-ab46-416821a75cdc
2017-01-18 14:45:29.579 UTC
db275682-9457-48ef-995d-a2ec6c2ed275
2017-01-17 15:10:42.379 UTC
bc615334-b710-41e8-98ba-361ec5d9286c
2017-01-18 14:44:29.562 UTC
9b47e994-7e93-4cce-91aa-4ba33af1159c
2017-01-18 14:50:06.432 UTC
5e27aac4-4bff-4b1f-afa0-5b0e1143ce04
2017-01-17 14:57:47.765 UTC
14f27c8d-656e-467f-bc1f-ed93aed7827c
2017-01-18 10:59:26.235 UTC
ddb2ba2a-5341-4130-bb8d-5f76f6e67fb7
2017-01-17 15:01:42.320 UTC
75609912-e68b-4a72-b9a8-2ed8515d6d60
2017-01-18 15:00:35.581 UTC
30924e00-a896-460d-8dc2-a795b8107dbb
2017-01-18 10:32:53.150 UTC
02cd9059-62da-4f34-be25-794fb4a59dff
2017-01-18 15:08:45.34 UTC
56014400-b738-4414-ae4f-da6bacb5e0e5
2017-01-17 15:00:00.409 UTC
4217e0e5-4a46-4b42-a4d1-8cd826d5dc6e
2017-01-18 14:46:59.56 UTC
7f341262-2cd7-4dd6-a6d7-658f360632d4
2017-01-18 10:50:36.628 UTC
227278ab-b092-42bc-a752-22cbb1d7a043
2017-01-18 11:04:04.747 UTC
49ef9fe4-d73f-4dcc-ae66-ace94fccd866
2017-01-18 10:47:09.994 UTC
51d0067a-4c80-48dc-a3cf-7e01fda9db22
2017-01-18 11:18:17.668 UTC
676c7ec5-558e-4f0d-8774-410c6bc3ad5c
2017-01-18 15:12:50.86 UTC
201a7bb0-b88e-4ee3-8648-bd9f24e59a96
2017-01-18 10:43:49.603 UTC
4b0df6bd-b684-4541-8b0b-208ca7a024e3
2017-01-18 10:41:38.945 UTC
9ae75c76-bc3b-43a2-baed-f57c2c0fec1c
2017-01-18 11:03:19.196 UTC
f403048c-1a1e-486a-8a46-de08a2bcdbf0
2017-01-18 14:54:57.846 UTC
3c30038f-69db-43ff-a474-ee695da17b7d
2017-01-18 10:41:26.145 UTC
186b20d5-d02d-4c9d-8e73-179a30199b2c
2017-01-18 11:06:12.267 UTC
8f1e8ce6-8c80-4a1c-9714-ddc429e011b8
2017-01-18 11:26:32.206 UTC
42b45e89-eed6-417d-8a2c-635232986034
2017-01-18 11:25:17.444 UTC
593a6b18-81c0-4616-a5f2-3adf26160840
2017-01-18 15:05:05.965 UTC
0f6170c3-7831-44c1-a90c-1afa81502636
2017-01-18 10:45:41.385 UTC
111791e3-22ad-490b-95ae-e10be5d0fb35
2017-01-18 15:06:37.591 UTC
f63a5fb2-f6cf-4123-a23f-7d0d7f970211
2017-01-18 10:43:15.468 UTC
10bf596d-7b3a-4dcf-ac63-3436c553cd74
2017-01-18 10:49:37.545 UTC
dbad82d1-eaf0-4289-bafe-528e670c9393
2017-01-18 10:49:45.914 UTC
fcf46500-f944-48c0-88e3-5325998e24d6
2017-01-18 10:47:44.593 UTC
537a4e04-ea88-4a64-bee1-3753dbdcb2ee
2017-01-18 10:50:07.434 UTC
dropFeaturedropFeatureFlags00headerList11dropFeaturecolumn0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
9916a27a-c60a-424a-9568-7cc121db4807
python dropFeature.py %%column%%
1200
1800
column
dropFeature.py
true
false
false
UTF-8
false
import pandas, argparse
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
TMP_HEADER_FILE = '/home/brayan/Taverna/tmpHeader'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Column drop
# Removes the column named on the command line from the working dataset, then
# rewrites the dataset file and the comma-separated header file so that both
# reflect the remaining columns.
parser = argparse.ArgumentParser(description = 'This program drops a column of the processed dataset.')
parser.add_argument('column', help = 'Name of the column to be dropped')
droppedColumn = parser.parse_args().column
dataset = pandas.read_csv(TMP_DATASET_FILE)
if droppedColumn not in dataset.columns:
    # Fail with a readable usage error (non-zero exit) instead of a raw
    # pandas traceback; the files on disk are left untouched.
    parser.error('Column not found in the dataset: ' + droppedColumn)
dataset = dataset.drop([droppedColumn], axis = 1)
dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False)
with open(TMP_HEADER_FILE, 'w') as headerFile:
    headerFile.write(','.join(dataset.columns))
# Parenthesised single-argument print: same output under Python 2 and Python 3.
print('Dataset processed correctly!')
column
column
false
false
false
UTF-8
false
false
false
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Select the column that will be dropped:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectDropColumnmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
valueList
1
l('text/plain')
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
title
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.SelectWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Drop column
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokedropFeaturecolumnTellmessageTelltitleselectDropColumnmessageselectDropColumnvalueListselectDropColumntitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
1f1f5256-e419-4572-80e4-47092fbb9e1b
2017-01-18 10:36:23.577 UTC
650dee82-df91-4323-b39f-8e98e92696b4
2017-01-18 10:37:02.163 UTC
ddc7c835-4677-42f7-be0d-18c8703d7d92
2017-01-17 13:00:35.848 UTC
c8c07c2f-935d-4c38-b10d-76a3b0a435f3
2017-01-18 11:28:13.197 UTC
5af6d39e-6791-4a13-ad35-b6ff5c61090a
2017-01-18 14:53:26.371 UTC
dropFeature
2017-01-17 12:59:00.212 UTC
cd49b1d4-f20d-488b-83fc-12a5fa740fd7
2017-01-18 11:02:29.650 UTC
f6b365b0-8afd-4fe6-bc77-7509c9f16622
2017-01-18 10:34:49.898 UTC
f0088e7a-e01b-4076-bfd0-063f4f60dc4d
2017-01-17 15:08:56.996 UTC
b8527a97-9de3-406e-99b3-8b20c5d0e4a5
2017-01-18 10:41:14.649 UTC
d1c885b1-9368-453a-93d9-8773fdaf1321
2017-01-18 15:10:02.797 UTC
e08e0621-7f1d-4e08-9dd7-f96e0f3fc69f
2017-01-17 15:08:26.132 UTC
a3d33cd4-bf20-47f8-985c-4421ba91c844
2017-01-17 13:01:42.0 UTC
fb33b2cb-8324-4fc7-9f29-7f13837f2c43
2017-01-18 10:35:09.897 UTC
58527f47-cf10-4ad9-8061-97ca917bbe90
2017-01-17 12:59:21.512 UTC
9b5b1d3f-365b-4516-84a0-f3fbe40434b4
2017-01-17 12:59:10.757 UTC
plotScatterplotScatterFlags00headerList11plotScattercolumnX0columnY0columnObj0STDERR00STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
178d1624-9188-45eb-80b5-71852fcce2ee
python plotScatter.py %%columnX%% %%columnY%% %%columnObj%%
1200
1800
columnObj
columnX
columnY
plotScatter.py
true
false
false
UTF-8
false
import pandas, argparse
import matplotlib.pyplot as pyplot
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Plotting
# Draws a scatter plot of two columns of the working dataset, colouring each
# dot by the value of a third column, and shows it in a window.
parser = argparse.ArgumentParser(description = 'This program plots a scatter given the columns for the X and Y axis. Dots are coloured by the value of the third column.')
parser.add_argument('columnX', help = 'Name of the column to be plotted as the X axis')
parser.add_argument('columnY', help = 'Name of the column to be plotted as the Y axis')
parser.add_argument('columnObj', help = 'Name of the column to be plotted')
# Parse the command line once and reuse the result.
arguments = parser.parse_args()
selectedXColumn = arguments.columnX
selectedYColumn = arguments.columnY
objColumn = arguments.columnObj
dataset = pandas.read_csv(TMP_DATASET_FILE)
try:
    dataset.plot(kind = 'scatter',
                 x = selectedXColumn,
                 y = selectedYColumn,
                 c = objColumn,
                 s = 50)
    pyplot.xlabel(selectedXColumn)
    pyplot.ylabel(selectedYColumn)
    pyplot.title(selectedXColumn + ' - ' + selectedYColumn)
    pyplot.grid(True)
    pyplot.show()
except Exception as e:
    # Best effort: report the problem on standard output and exit normally,
    # so the workflow can display the message to the user.
    print('Unexpected error: ' + str(e))
else:
    # Only claim success when plotting raised no error.
    print('Dataset processed correctly!')
columnObj
columnObj
false
false
false
UTF-8
false
false
false
columnX
columnX
false
false
false
UTF-8
false
false
false
columnY
columnY
false
false
false
UTF-8
false
false
false
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemessageForXvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Select the column for the X axis:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemessageForYvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Select the column for the Y axis:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokemessageForObjvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Select the objective column:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectXmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
valueList
1
l('text/plain')
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
title
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.SelectWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectYmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
valueList
1
l('text/plain')
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
title
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.SelectWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectObjmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
valueList
1
l('text/plain')
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
title
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.SelectWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Scatter plot output information
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Scatter plot
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotScattercolumnXplotScattercolumnYplotScattercolumnObjselectXmessageselectXvalueListselectXtitleselectYmessageselectYvalueListselectYtitleselectObjmessageselectObjvalueListselectObjtitleTellmessageTelltitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
ba8a6ed4-8916-44f6-8dda-87c7a423ac38
2017-01-17 11:39:52.554 UTC
96d7b727-20d3-4035-a2e1-88a40c3d101a
2017-01-17 11:07:00.664 UTC
885325a8-026d-4d46-ae5e-52fb6a86f93a
2017-01-18 14:50:04.363 UTC
0ca77df8-57b6-413c-8313-e7583b19149c
2017-01-18 15:12:46.847 UTC
265dc3a1-997f-4593-9fbd-bbf2fc0b0d4d
2017-01-18 15:09:36.189 UTC
plotScatter
2017-01-17 12:01:21.265 UTC
9a1156de-defa-4313-a290-0cd61f0ee3b6
2017-01-17 11:51:12.22 UTC
93ff1fe6-1dcc-4bcd-9253-0d326fbcc850
2017-01-17 11:39:43.154 UTC
739bb821-b0a0-4e41-943a-855ae90e741c
2017-01-18 11:27:32.84 UTC
631844da-a909-4fdc-a184-7a54d68e690b
2017-01-17 10:57:13.506 UTC
a37d084f-4839-407f-8c62-ffbf8c264559
2017-01-18 11:21:18.684 UTC
22503c9f-1a01-45d8-be86-87f2693da327
2017-01-17 12:00:46.28 UTC
7b5136fa-05ac-4488-9f5a-a4163d09605f
2017-01-17 11:07:29.192 UTC
429d9268-b459-41b5-96af-25d13ea1d877
2017-01-17 11:30:52.545 UTC
1cde77e4-b082-4179-becf-be09ea8782ad
2017-01-17 11:36:13.474 UTC
2966558f-03e3-4728-beba-1a8070d22ffe
2017-01-17 12:01:25.133 UTC
dfadf90a-c6d7-43f4-a635-fbd4875eea43
2017-01-17 11:59:25.87 UTC
e2e07e17-a405-41ba-86f7-d08380350797
2017-01-17 11:14:04.908 UTC
33f8d35f-6ff9-4655-a901-3183183cc6b5
2017-01-17 11:25:25.281 UTC
68d2c0e4-8f02-4a3d-827f-e76cfc811e62
2017-01-18 11:10:51.419 UTC
246cd909-630f-475f-8d26-0108cc38cad7
2017-01-17 11:19:02.258 UTC
231a410b-a2db-4387-ab9e-dc3aa6072753
2017-01-18 10:41:37.515 UTC
1fdcb14b-a2ce-45e7-a740-2c94a284a7da
2017-01-18 11:21:45.684 UTC
4f919c6c-0388-47b2-ba21-dc549e0ac041
2017-01-18 10:37:44.137 UTC
903878da-fc1a-4a67-a970-da9a630e7cd1
2017-01-18 11:10:24.99 UTC
e6cfe743-f358-43e6-8a59-b67820816976
2017-01-17 10:57:24.719 UTC
labelsNumlabelsToNumFlags00headerList11labelsToNumcolumn0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
157dce46-5f13-4299-b2ce-29fdf6c89d0d
python labelsToNum.py %%column%%
1200
1800
column
labelsToNum.py
true
false
false
UTF-8
false
import pandas, argparse
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Label encoding
# Replaces every distinct value of the given column by an integer code (0, 1, 2, ...),
# numbered in order of first appearance, and writes the dataset back to TMP_DATASET_FILE.
parser = argparse.ArgumentParser(description = 'This program sets the given column to a numerical order.')
parser.add_argument('column', help = 'Name of the column to be processed')
classColumn = parser.parse_args().column
dataset = pandas.read_csv(TMP_DATASET_FILE)
# Missing values are left out of the code table so they stay missing after the mapping.
classes = dataset[classColumn].dropna().unique()
codeByLabel = dict((label, code) for code, label in enumerate(classes))
# Map every row in a single pass from its ORIGINAL value. Rewriting the column in place
# label by label would re-match rows that were already converted whenever the labels
# are themselves small integers (e.g. labels [1, 0] would all end up as 1).
dataset[classColumn] = dataset[classColumn].map(codeByLabel)
dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False)
# Single-argument call form prints the same text under Python 2 and Python 3.
print('Dataset processed correctly!')
column
column
false
false
false
UTF-8
false
false
false
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Select the labels column:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectLabelsColumnmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
valueList
1
l('text/plain')
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
title
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.SelectWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Labels to numeric value
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelabelsToNumcolumnselectLabelsColumnmessageselectLabelsColumnvalueListselectLabelsColumntitleTellmessageTelltitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
2fa0a274-f248-4d5a-868c-7fad8de8c5a8
2017-01-18 11:01:18.307 UTC
88c2dd97-1662-40e3-a801-5f95bb736aef
2017-01-18 11:29:03.820 UTC
edc1b9fe-1fae-48f3-928e-fbd971ab03ce
2017-01-18 15:08:43.44 UTC
bc1795cd-b0a7-4e83-aaa7-3b3afb2e4e2b
2017-01-18 10:32:01.288 UTC
05ce6586-ac88-451c-9952-30cd685c08b9
2017-01-17 14:32:14.379 UTC
56dea0e1-188b-478b-928d-557cb30d4fb6
2017-01-18 10:36:47.211 UTC
2b7f2f9b-eddd-49c8-b779-4312b3bb09a3
2017-01-18 10:41:53.685 UTC
d57ef759-0f08-4da0-9aef-e3563aa62e6d
2017-01-18 11:01:12.83 UTC
3337b65b-4592-44df-94d6-84758174b7a7
2017-01-18 10:36:10.234 UTC
839eb079-7141-4167-83ba-cac1f28e4c1a
2017-01-18 11:00:57.10 UTC
labelsNum
2017-01-17 14:32:09.207 UTC
7597cf85-5d3a-4e3c-9aea-b82e2f628bcb
2017-01-18 14:54:56.531 UTC
8aae29ee-a039-4483-b155-5b94e608d3ca
2017-01-17 14:33:14.320 UTC
f40f983c-bd31-47d1-846a-8d331227e880
2017-01-18 10:32:31.184 UTC
dropMissingValuesreplaceMissingDropFlags00dropMissingSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
c0caab14-007a-46e8-b732-7051cb2daf25
python replaceMissingWithDrop.py
1200
1800
replaceMissingWithDrop.py
true
false
false
UTF-8
false
import pandas
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Missing values processing
# Removes every row that contains at least one missing value and overwrites
# TMP_DATASET_FILE with the remaining rows.
dataset = pandas.read_csv(TMP_DATASET_FILE)
dataset = dataset.dropna()
dataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False)
# Single-argument call form prints the same text under Python 2 and Python 3.
print('Dataset processed correctly!')
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Replacement output information
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageTelltitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
03f38345-3979-4768-a1eb-dcaaa103111e
2017-01-17 14:26:30.574 UTC
4015f12b-eebf-4df3-8046-44fbdd62ab56
2017-01-18 10:45:32.699 UTC
65c07b74-eaec-47b4-8338-923758f29863
2017-01-18 11:23:20.446 UTC
a13584a1-7010-48fa-afd3-8da26c3f1c93
2017-01-18 10:45:39.250 UTC
d8977f5f-17f8-460b-94ef-dd6675742e0e
2017-01-18 11:23:24.344 UTC
7eafd153-e83c-4c18-9c3b-2e8329577389
2017-01-18 14:45:26.242 UTC
dropMissingValues
2017-01-17 14:26:27.427 UTC
5bd326ab-f282-4cc3-ad27-0871aca1d8f7
2017-01-18 11:03:38.179 UTC
fda57315-4759-4d5b-8b86-e08878b4fdd2
2017-01-17 14:26:42.721 UTC
normFeatureScalingnormFeatureFlags00normFeatureSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
89f039e5-78fb-4a05-a2d0-bd33e14a34f4
python featureScaling.py
1200
1800
featureScaling.py
true
false
false
UTF-8
false
import pandas
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Normalization
# Min-max scaling: every numeric column is rescaled to the [0, 1] interval with
# (x - min) / (max - min). The result overwrites TMP_DATASET_FILE.
dataset = pandas.read_csv(TMP_DATASET_FILE)
processedDataset = dataset.copy()
# Only numeric columns can be scaled; text columns are written back untouched
# instead of making the subtraction fail.
numericColumns = dataset.select_dtypes(include = ['number']).columns
if len(numericColumns) > 0:
    numericData = dataset[numericColumns]
    minimums = numericData.min()
    ranges = numericData.max() - minimums
    # A constant column has max == min; dividing by 1 instead of 0 maps it to 0
    # rather than filling it with NaN.
    ranges = ranges.replace(0, 1)
    processedDataset[numericColumns] = (numericData - minimums) / ranges
processedDataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False)
# Single-argument call form prints the same text under Python 2 and Python 3.
print('Dataset processed correctly!')
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Feature scaling output information
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageTelltitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
7b05ab89-4989-412f-966c-7148962526ba
2017-01-18 14:39:39.66 UTC
5532d37b-47a2-4dd1-a6ef-482e4adacdc1
2017-01-17 12:49:30.711 UTC
5d81a6a5-96e5-4348-a3e2-a93d9bf14b52
2017-01-18 11:04:01.266 UTC
b4762844-5551-44bb-a3af-42f62adfae8f
2017-01-18 11:25:39.364 UTC
normFeatureScaling
2017-01-17 12:39:06.855 UTC
0014a9dc-fba3-45b9-a857-4374392623e4
2017-01-17 12:39:17.588 UTC
4e8b3e6f-bac6-4b34-81d3-1e183d840e78
2017-01-17 12:51:03.775 UTC
07a77734-9b25-44f2-97b1-039f26a1ab03
2017-01-18 14:38:39.602 UTC
1e71953c-5074-473f-a3ba-8de399709cdd
2017-01-17 12:39:27.838 UTC
e3e08062-3114-4f9e-9d32-aacacce73527
2017-01-18 10:45:03.49 UTC
733db518-e38f-4666-80c0-a761368c7bb8
2017-01-18 10:45:09.740 UTC
75fb1e3e-187a-4e0d-8046-335493529c7b
2017-01-18 11:24:05.236 UTC
normStandardnormStandardFlags00normStandardizationSTDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
ee9902b7-c136-459b-bf66-ff482acb3c4d
python standardization.py
1200
1800
standardization.py
true
false
false
UTF-8
false
import pandas
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Normalization
# Standardization (z-score): every numeric column is transformed with
# (x - mean) / std. The result overwrites TMP_DATASET_FILE.
dataset = pandas.read_csv(TMP_DATASET_FILE)
processedDataset = dataset.copy()
# Only numeric columns can be standardized; text columns are written back untouched
# instead of making the arithmetic fail.
numericColumns = dataset.select_dtypes(include = ['number']).columns
if len(numericColumns) > 0:
    numericData = dataset[numericColumns]
    deviations = numericData.std()
    # A constant column has std == 0; dividing by 1 instead of 0 maps it to 0
    # rather than filling it with NaN.
    deviations = deviations.replace(0, 1)
    processedDataset[numericColumns] = (numericData - numericData.mean()) / deviations
processedDataset.to_csv(TMP_DATASET_FILE, encoding = 'utf-8', index = False)
# Single-argument call form prints the same text under Python 2 and Python 3.
print('Dataset processed correctly!')
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Standardization output information
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessageTelltitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
2d617b74-9c66-4c91-9263-4b9a451138b6
2017-01-18 11:25:25.612 UTC
f5dc05d1-42d7-46b2-b7eb-b14a148b5b2f
2017-01-18 11:24:36.900 UTC
3b78dfcd-1927-4774-b718-30bfe437e1e6
2017-01-17 12:42:03.166 UTC
60e73cbe-cac7-450f-8dbf-cc8ecd43deee
2017-01-17 12:41:53.633 UTC
241dd1aa-043b-4887-9209-aab78027c9be
2017-01-17 12:50:24.159 UTC
0a8a428f-8e89-4873-8349-57227b005558
2017-01-17 12:52:41.815 UTC
3e1037af-cb7f-43d3-9ac7-b76132c8b89b
2017-01-18 14:40:30.298 UTC
normStandard
2017-01-17 12:41:49.651 UTC
ea165dfd-aa0f-4815-a57d-58141e9e80a0
2017-01-18 10:43:44.778 UTC
89e49c6e-5121-4ee3-b84a-4bc31f0cde71
2017-01-18 11:04:28.71 UTC
saveFilesaveFlags00saveNewFilefileName0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
369f8a7e-1a82-47c4-9895-eba935357d87
python saveNewFile.py %%fileName%%
1200
1800
fileName
saveNewFile.py
true
false
false
UTF-8
false
import pandas, argparse
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
NEW_FILE_PATH = '/home/brayan/Taverna/'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Main program
# Copies the working dataset stored in TMP_DATASET_FILE to a new CSV file named
# by the user inside NEW_FILE_PATH.
parser = argparse.ArgumentParser(description = 'This program saves the loaded dataset in a new file.')
parser.add_argument('fileName', help = 'Name of the new file')
fileName = parser.parse_args().fileName
# An empty name would make the target path the directory itself and fail deep inside
# to_csv; stop early with a usage error instead.
if not fileName.strip():
    parser.error('the name of the new file cannot be empty')
dataset = pandas.read_csv(TMP_DATASET_FILE)
dataset.to_csv(NEW_FILE_PATH + fileName, encoding = 'utf-8', index = False)
# Concatenated single-argument form prints the same text under Python 2 and Python 3.
print('Dataset saved correctly at ' + NEW_FILE_PATH)
fileName
fileName
false
false
false
UTF-8
false
false
false
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Write the new file's name:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokefirstQuotestring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokefirstQuoteSignvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
'
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelastQuotestring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokelastQuoteSignvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
'
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeaskFileNamemessage0title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.AskWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTellmessage0title0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleGeneralvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Save new file
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokesaveNewFilefileNamefirstQuotestring1firstQuotestring2lastQuotestring1lastQuotestring2askFileNamemessageaskFileNametitleTellmessageTelltitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
saveFile
2017-01-17 14:39:32.908 UTC
20005879-cca7-40bb-8296-224fe1ce4c9c
2017-01-17 14:45:45.516 UTC
9630aca9-43e9-4888-afe1-e6984e241289
2017-01-18 11:26:28.573 UTC
270f7858-4166-45cd-94e9-bc418c77d842
2017-01-18 10:47:03.666 UTC
52bb89cb-58cb-4794-8bc4-13de81530d94
2017-01-18 11:05:43.731 UTC
ef01b1c4-38ef-4871-b69e-22c2a7bd9ea5
2017-01-18 15:07:40.957 UTC
ccd9137a-b699-4728-8847-6e9155570862
2017-01-18 11:06:03.614 UTC
4e2c183e-0534-4bdc-b680-8fb2cca43cf5
2017-01-17 14:43:13.296 UTC
d897f094-4533-4b5b-ad9d-1ed88cd5d763
2017-01-17 14:49:10.797 UTC
17dacc60-8137-4673-a297-8458c623f2ca
2017-01-18 10:46:21.393 UTC
5e6a198b-89aa-4de9-8b48-0dda9960b24d
2017-01-18 10:46:56.113 UTC
ea48b3d5-f20c-4bbd-b309-a241c4fccd78
2017-01-18 10:46:12.314 UTC
66c543ae-f336-4c5e-89d3-9a8faebe2e5c
2017-01-18 14:44:26.811 UTC
0f571c4a-0efb-474e-90d2-752d2c63472d
2017-01-17 14:41:11.107 UTC
a92cd78e-8782-4ac3-b2db-aa7a21257ffc
2017-01-17 14:39:37.456 UTC
a7ae23b7-966f-4a92-b12b-16e161f021f0
2017-01-17 14:51:01.780 UTC
f24d51f1-a4ca-4e8c-9812-2b9bc3cab1f7
2017-01-18 14:51:23.987 UTC
59609eb9-5546-4cbb-915f-fbf63c5a82e5
2017-01-18 11:26:23.958 UTC
e4fe1ffd-e747-49f3-920f-906bb5a7325b
2017-01-18 14:44:13.395 UTC
plotHistogramplotHistogramFlags00headerList11plotHistogramcolumn0STDOUT00STDERR00net.sf.taverna.t2.activitiesexternal-tool-activity1.5net.sf.taverna.t2.activities.externaltool.ExternalToolActivity
789663B8-DA91-428A-9F7D-B3F3DA185FD4
default local_3
<?xml version="1.0" encoding="UTF-8"?>
<localInvocation><directory>/home/brayan/Taverna/sessions</directory><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation>
178d1624-9188-45eb-80b5-71852fcce2ee
python plotHistogram.py %%column%%
1200
1800
column
plotHistogram.py
true
false
false
UTF-8
false
import pandas, argparse
import matplotlib.pyplot as pyplot
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Constant definition
# CSV file the dataset is read from (presumably produced by loadDataset.py - TODO confirm).
TMP_DATASET_FILE = '/home/brayan/Taverna/tmpDataset'
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Plotting
# Usage: python plotHistogram.py COLUMN
# Reads TMP_DATASET_FILE, draws a histogram of the non-missing values of COLUMN and
# reports the outcome on standard output.
parser = argparse.ArgumentParser(description = 'This program plots the histogram of the given column')
parser.add_argument('column', help = 'Name of the column to be plotted')
selectedColumn = parser.parse_args().column
dataset = pandas.read_csv(TMP_DATASET_FILE)
try:
    # Drop missing values once and reuse the result for the plot, the ticks and the bin count.
    columnValues = dataset[selectedColumn].dropna()
    distinctValues = columnValues.unique()
    # One tick and one bin per distinct value of the column.
    columnValues.plot(kind = 'hist',
                      xticks = distinctValues,
                      bins = distinctValues.size)
    pyplot.xlabel(selectedColumn)
    pyplot.title(selectedColumn + ' distribution')
    pyplot.grid(True)
    pyplot.show()
except Exception as e:
    # Best-effort reporting: any failure (unknown column, non-numeric data, ...) is printed
    # instead of raised. Single-argument print() emits the same text on Python 2 and 3.
    print('Unexpected error: ' + str(e))
else:
    # Only claim success when plotting did not fail.
    print('Dataset processed correctly!')
column
column
false
false
false
UTF-8
false
false
false
false
true
true
0
false
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemessagevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Select the column that will be plotted:
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeTelltitle0message0net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
title
0
'text/plain'
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.TellWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeselectColumnmessage0valueList1title0answer00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
valueList
1
l('text/plain')
java.lang.String
true
message
0
'text/plain'
java.lang.String
true
title
0
'text/plain'
java.lang.String
true
answer
0
'text/plain'
0
workflow
net.sourceforge.taverna.scuflworkers.ui.SelectWorker
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invoketitlevalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Histogram output information
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeConcatenate_two_stringsstring10string20output00net.sf.taverna.t2.activitieslocalworker-activity1.5net.sf.taverna.t2.activities.localworker.LocalworkerActivity
string1
0
'text/plain'
java.lang.String
true
string2
0
'text/plain'
java.lang.String
true
output
0
'text/plain'
0
workflow
org.embl.ebi.escience.scuflworkers.java.StringConcat
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvoketitleColumnvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.5net.sf.taverna.t2.activities.stringconstant.StringConstantActivity
Histogram column selector
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize
1
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry
1.0
1000
5000
0
net.sf.taverna.t2.coreworkflowmodel-impl1.5net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeplotHistogramcolumnTelltitleTellmessageselectColumnmessageselectColumnvalueListselectColumntitleConcatenate_two_stringsstring1Concatenate_two_stringsstring2
dacfdbbf-8ac1-4941-b0fc-a83d7d2d4888
2017-01-18 14:50:34.251 UTC
8bcd45de-5031-428f-9fc6-e03797fdec03
2017-01-18 10:43:12.737 UTC
e6cfe743-f358-43e6-8a59-b67820816976
2017-01-17 10:57:24.719 UTC
33f8d35f-6ff9-4655-a901-3183183cc6b5
2017-01-17 11:25:25.281 UTC
1c368b09-ee2e-4b31-a918-2a91f174e66c
2017-01-18 10:38:15.730 UTC
b55c48b2-ed13-4c7a-ab15-7b6ea7b2391f
2017-01-18 15:06:35.544 UTC
7b5136fa-05ac-4488-9f5a-a4163d09605f
2017-01-17 11:07:29.192 UTC
2944cb50-5e54-44cb-b60c-05e5324e2735
2017-01-18 10:38:42.265 UTC
9f7989b8-6a3e-45d3-8920-c9cfa420947d
2017-01-18 11:08:34.557 UTC
plotHistogram
2017-01-17 10:56:45.598 UTC
96d7b727-20d3-4035-a2e1-88a40c3d101a
2017-01-17 11:07:00.664 UTC
9a1156de-defa-4313-a290-0cd61f0ee3b6
2017-01-17 11:51:12.22 UTC
e2e07e17-a405-41ba-86f7-d08380350797
2017-01-17 11:14:04.908 UTC
ba8a6ed4-8916-44f6-8dda-87c7a423ac38
2017-01-17 11:39:52.554 UTC
8496a21f-666d-4a1e-96ea-3d1bf0453c7b
2017-01-18 11:13:18.507 UTC
7b6e59c8-6428-4595-b328-cb8d0fa1bcb7
2017-01-18 10:42:59.529 UTC
1cde77e4-b082-4179-becf-be09ea8782ad
2017-01-17 11:36:13.474 UTC
0adcfe92-b0b4-48ca-82c0-58bda0b63ea7
2017-01-18 11:08:26.467 UTC
8adbe06e-bfe1-45d4-829f-2c2f4bd9401b
2017-01-18 10:38:03.587 UTC
631844da-a909-4fdc-a184-7a54d68e690b
2017-01-17 10:57:13.506 UTC
429d9268-b459-41b5-96af-25d13ea1d877
2017-01-17 11:30:52.545 UTC
93ff1fe6-1dcc-4bcd-9253-0d326fbcc850
2017-01-17 11:39:43.154 UTC
246cd909-630f-475f-8d26-0108cc38cad7
2017-01-17 11:19:02.258 UTC
e79d65e4-fc91-4ae5-9ed3-5d2024377313
2017-01-18 11:13:13.534 UTC
5cb20341-91c7-4e5c-a565-007915db8b38
2017-01-18 14:46:58.971 UTC
21579554-7044-4d9c-8633-79ba218f9c25
2017-01-18 11:27:07.30 UTC