Hadoop_hOCR_parserhadoop_job_name_prefix00 Hadoop job name prefix for 2012-08-12 21:48:14.164 CEST taverna_hocr_parser_with_exiftool 2012-08-09 17:53:12.346 CEST rootpath00 /home/onbscs/testdata/abo/samples/verysmall/ 2012-08-09 17:53:25.1 CEST OutHadoopHocrAvBlockWidthMapReducehdfs_input_dir0hadoop_job_name_prefix0STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> c78b0d9f-4d5f-4828-b2e7-ce9b502b4d12 /usr/bin/hadoop jar /home/onbscs/scape-dev/scape/tb-lsdr-hocrparser/target/tb-lsdr-hocrparser-0.1-SNAPSHOT-jar-with-dependencies.jar eu.scape_project.tb.lsdr.hocrparser.HocrParser -d %%hdfs_input_dir%% -n %%hadoop_job_name_prefix%%_hocrparser 1200 1800 hadoop_job_name_prefix hdfs_input_dir hadoop_job_name_prefix hadoop_job_name_prefix false false false UTF-8 false false false hdfs_input_dir hdfs_input_dir false false false UTF-8 false false false false true false 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHadoopSequenceFileCreatorhadoop_job_name_prefix0hdfs_input_path0STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 17838d9c-ef94-4aa7-8673-6f0b717aa4c0 /usr/bin/hadoop jar /home/onbscs/scape-dev/scape/tb-lsdr-seqfilecreator/target/tb-lsdr-seqfileutility-0.1-SNAPSHOT-jar-with-dependencies.jar -m -p %%hdfs_input_path%% -c NONE -n %%hadoop_job_name_prefix%%_seqfilecreation 1200 1800 hadoop_job_name_prefix hdfs_input_path hdfs_input_path hdfs_input_path false false false UTF-8 false false false hadoop_job_name_prefix hadoop_job_name_prefix false false false UTF-8 false false false false true false 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHtmlPathCreatorrootpath0extfilter0STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 27b6c918-d0e3-46f7-8f35-cf5c72a9791e MILLIS=`date +%s%N | cut -b1-13` PATHID=%%extfilter%% TMPDIR=${MILLIS}${PATHID} mkdir /tmp/${TMPDIR}/ find -L %%rootpath%% -regex .*.%%extfilter%% -type f -print > /tmp/${TMPDIR}/absolutepaths.txt && \ hadoop fs -put /tmp/${TMPDIR}/absolutepaths.txt /user/onbscs/output/${TMPDIR}/absolutepaths.txt && \ echo -n /user/onbscs/output/${TMPDIR}/ 1200 1800 extfilter rootpath rootpath rootpath false false false UTF-8 false false false extfilter extfilter false false false UTF-8 false false false false true false 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeJp2PathCreatorrootpath0extfilter0STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> 27b6c918-d0e3-46f7-8f35-cf5c72a9791e MILLIS=`date +%s%N | cut -b1-13` PATHID=%%extfilter%% TMPDIR=${MILLIS}${PATHID} mkdir /tmp/${TMPDIR}/ find -L %%rootpath%% -regex .*.%%extfilter%% -type f -print > /tmp/${TMPDIR}/absolutepaths.txt && \ hadoop fs -put /tmp/${TMPDIR}/absolutepaths.txt /user/onbscs/output/${TMPDIR}/absolutepaths.txt && \ echo -n /user/onbscs/output/${TMPDIR}/ 1200 1800 extfilter rootpath rootpath rootpath false false false UTF-8 false false false extfilter extfilter false false false UTF-8 false false false false true false 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokehtml_extensionvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.3net.sf.taverna.t2.activities.stringconstant.StringConstantActivity html net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokejp2_extensionvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.3net.sf.taverna.t2.activities.stringconstant.StringConstantActivity jp2 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHadoopStreamingExiftoolReadhdfs_input_dir0hadoop_job_name_prefix0STDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> f67de292-9ef0-404e-9184-a4902fc7ac3b #!/bin/bash # Bash script using Hadoop's streaming API to read metadata from images that are listed # with absolute file paths in a text file available in the hdfs input directory. #! Hadoop home directory HADOOP_HOME=/usr/lib/hadoop-0.20 #! the streaming jar location HADOOP_STREAMING_JAR=$HADOOP_HOME/contrib/streaming/hadoop-streaming-0.20.2-cdh3u3.jar #! Identifier MILLIS=`date +%s%N | cut -b1-13` SUFFIX=xft IDENTIFIER=${MILLIS}${SUFFIX} #! input (hdfs location) IN=%%hdfs_input_dir%% #! output (hdfs location) OUT=/user/onbscs/output/${IDENTIFIER} #! Mapper script #! The mapper script will be stored in a temporary executable file, it executes exiftool #! and filters the image width value using 'sed'. The key is Barcode-number/Page-number. #! For example, in this string: #! Z119585409/00000778:2258 #! the image width for book Z119585409 page 778 is 2258. MAPPER="while read filepath ; do export HKEY; HKEY=\`echo -n \$filepath | sed 's/.*+//;s/abo\///g;s/\.jp2//g'\`; export HVAL; HVAL=\`exiftool -d %Y-%m-%d_%H-%M-%S \$filepath | grep 'Image Width' | sed s/[^0-9]*//g\`; echo \"\${HKEY}\\t\${HVAL}\"; done" #! temporary mapper script MAPFILE="/tmp/map${IDENTIFIER}.sh" #! write mapper script to temporary file and make it executable `echo ${MAPPER} > $MAPFILE && chmod +x $MAPFILE` #! job name defined as job options OPTS='-D mapred.job.name=%%hadoop_job_name_prefix%%_exiftool' #! Hadoop command #! standard out of the hadoop job is redirected to a temporary log file `hadoop jar $HADOOP_STREAMING_JAR $OPTS -mapper "$MAPFILE" -input $IN -output $OUT` >/tmp/%%hadoop_job_name_prefix%%_${IDENTIFIER}.log 2>&1 #! hdfs output path to stdout echo -n $OUT 1200 1800 hadoop_job_name_prefix hdfs_input_dir hadoop_job_name_prefix hadoop_job_name_prefix false false false UTF-8 false false false hdfs_input_dir hdfs_input_dir false false false UTF-8 false false false false true false 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHiveLoadExifDatahdfs_result_file0net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> fbee1ccb-8a7f-4fcb-8a9f-ce362a58a810 #/usr/bin/hadoop fs -cat %%hdfs_result_file%%/part-r-00000 TABLENAME=exif_data `/usr/local/java/hive-0.8.1/bin/hive -e "CREATE TABLE ${TABLENAME} (identifier STRING, width INT) ROW FORMAT DELIMITED FIELDS TERMINATED BY '\t';"` >>/tmp/hivelog_${TABLENAME}.log 2>&1 `/usr/local/java/hive-0.8.1/bin/hive -e "LOAD DATA INPATH '%%hdfs_result_file%%/' OVERWRITE INTO TABLE ${TABLENAME};"` >>/tmp/hivelog_${TABLENAME}.log 2>&1 echo -n ${TABLENAME} 1200 1800 hdfs_result_file hdfs_result_file hdfs_result_file false false false UTF-8 false false false false true false 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHiveLoadHocrDatahdfs_result_file0net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> fbee1ccb-8a7f-4fcb-8a9f-ce362a58a810 #/usr/bin/hadoop fs -cat %%hdfs_result_file%%/part-r-00000 TABLENAME=hocr_data `/usr/local/java/hive-0.8.1/bin/hive -e "CREATE TABLE ${TABLENAME} (identifier STRING, width INT) ROW FORMAT DELIMITED FIELDS TERMINATED BY '\t';"` >>/tmp/hivelog_${TABLENAME}.log 2>&1 `/usr/local/java/hive-0.8.1/bin/hive -e "LOAD DATA INPATH '%%hdfs_result_file%%/' OVERWRITE INTO TABLE ${TABLENAME};"` >>/tmp/hivelog_${TABLENAME}.log 2>&1 echo -n ${TABLENAME} 1200 1800 hdfs_result_file hdfs_result_file hdfs_result_file false false false UTF-8 false false false false true false 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHiveSelectSTDOUT00net.sf.taverna.t2.activitiesexternal-tool-activity1.3net.sf.taverna.t2.activities.externaltool.ExternalToolActivity 789663B8-DA91-428A-9F7D-B3F3DA185FD4 default local <?xml version="1.0" encoding="UTF-8"?> <localInvocation><shellPrefix>/bin/sh -c</shellPrefix><linkCommand>/bin/ln -s %%PATH_TO_ORIGINAL%% %%TARGET_NAME%%</linkCommand></localInvocation> ad3726a2-f32c-4d4d-a528-529398a625bb /usr/local/java/hive-0.8.1/bin/hive -e "select hocr_data.identifier,hocr_data.width,exif_data.width from hocr_data inner join exif_data on hocr_data.identifier=exif_data.identifier;" 1200 1800 false true true 0 false net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 1000 5000 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3net.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeHadoopHocrAvBlockWidthMapReducehdfs_input_dirHadoopSequenceFileCreatorSTDOUTHadoopHocrAvBlockWidthMapReducehadoop_job_name_prefixhadoop_job_name_prefixHadoopSequenceFileCreatorhadoop_job_name_prefixhadoop_job_name_prefixHadoopSequenceFileCreatorhdfs_input_pathHtmlPathCreatorSTDOUTHtmlPathCreatorrootpathrootpathHtmlPathCreatorextfilterhtml_extensionvalueJp2PathCreatorrootpathrootpathJp2PathCreatorextfilterjp2_extensionvalueHadoopStreamingExiftoolReadhdfs_input_dirJp2PathCreatorSTDOUTHadoopStreamingExiftoolReadhadoop_job_name_prefixhadoop_job_name_prefixHiveLoadExifDatahdfs_result_fileHadoopStreamingExiftoolReadSTDOUTHiveLoadHocrDatahdfs_result_fileHadoopHocrAvBlockWidthMapReduceSTDOUTOutHiveSelectSTDOUT 19b64e80-7f4b-4790-9628-c6ea255be89c 2012-08-06 17:24:59.183 CEST 00783411-21c3-4af2-8c7b-4138520b1da3 2012-08-11 17:48:17.650 CEST e20e50c6-1d96-4ad0-b4e1-bce397d0c613 2012-08-09 17:53:25.172 CEST 5ec6ae87-f4fd-440b-8227-ae2e2d35db6e 2012-08-06 14:43:00.860 CEST 4ff0f0a6-227d-4499-944b-521609c4d015 2012-08-10 15:26:48.595 CEST 928d3974-52b2-4ccf-b6c7-e45da13297cc 2012-08-09 14:08:20.11 CEST afe7d48f-7a66-4cdf-bfed-26bd875f0ad5 2012-08-09 14:47:40.140 CEST c3200eed-d32c-408d-a6bc-be79d8c515f6 2012-08-06 17:05:06.329 CEST 2c24767a-76ea-4069-83fc-8b9ef7edb3c6 2012-08-09 17:23:40.62 CEST 81507e8e-2e6a-4cc0-8887-73267d37bf0f 2012-08-11 10:08:35.413 CEST 1eb6e96e-ccda-4f8f-b60e-c0210ffb9bf5 2012-08-11 17:48:49.978 CEST 227bd895-0a70-4ea5-b644-5df589282e96 2012-08-11 18:00:34.232 CEST ceffc2b6-c8db-40ae-8912-6a7d7f135591 2012-08-09 14:36:00.516 CEST ed182d5b-9c95-4a19-b6cb-c3da4e3d484c 2012-08-11 08:40:16.63 CEST b9ea9564-6525-4542-8bf9-df1906b4ac34 2012-08-09 17:52:03.434 CEST c0ddc45d-6040-4df4-9431-648174cf8951 2012-08-11 10:11:33.18 CEST 0e485ba2-8058-4193-abd1-15d304629bfb 2012-08-11 19:32:09.305 CEST 6c03c57c-2ffc-4583-b5f3-e3564ef40c46 2012-08-10 15:30:05.764 CEST 0cfc6ccf-84c6-4962-afdc-0832c804af37 2012-08-06 15:21:28.581 CEST ba145c17-4263-493b-a844-0701538902d4 2012-08-06 14:38:46.807 CEST c2c24124-b5f3-4680-9f98-e0eb2d1e92ca 2012-08-06 14:23:22.451 CEST 9b94270e-a4d8-441a-b4aa-0214a8f413b7 2012-08-06 14:40:52.367 CEST b1a99001-0a44-41f8-8843-f0344887df93 2012-08-06 16:55:19.393 CEST aab6b952-ac05-49ce-8a11-e88b5229edb2 2012-08-06 15:53:28.680 CEST e74bf437-1675-469c-b07c-575463491785 2012-08-11 10:04:46.928 CEST cb572561-fac5-4c3f-9798-3603a1bd3c30 2012-08-10 14:32:40.870 CEST ba31f000-400a-4f12-8d3c-4f9eb6b4116b 2012-08-01 18:00:41.530 CEST c9f9efef-d495-48d9-b7ce-2f7ac43761ff 2012-08-10 14:35:01.787 CEST 36c1ee60-26c4-4ed4-b60a-d33459ddb64d 2012-08-12 21:50:34.536 CEST 594b6663-5259-4875-8730-1778bc68bd41 2012-08-01 18:01:29.34 CEST d02984d8-5493-4a2c-92fe-49b4da5f5f6d 2012-08-06 17:20:43.714 CEST e9fb096c-1069-47d8-8dbd-618042344f26 2012-08-10 21:18:02.624 CEST 6b846eac-4e8f-4c94-a292-ef0c0c3b4806 2012-08-10 15:29:23.898 CEST bfd29632-3c33-4d96-a7dc-ac0051cbcb7a 2012-08-12 21:49:36.521 CEST 0c8854b0-0e27-4be5-baee-cbc36422e703 2012-08-09 18:00:56.220 CEST 5f36f31f-9022-4982-bebf-9d6c3025af91 2012-08-14 10:06:56.945 CEST ef7567b3-96ad-4174-a3a4-e4178765fbcf 2012-08-06 17:39:53.989 CEST e8802b88-1d08-43bd-b3a4-123fd6ffdf98 2012-08-11 08:28:35.557 CEST 8e5507cc-0b4e-4dcc-bece-c1e79c7654a5 2012-08-10 21:09:08.998 CEST 409c7fab-7b4b-401b-9d6c-d1d94128ef6f 2012-08-09 14:47:09.909 CEST 2bfab0ea-ef2e-4f2e-bed6-c10fbe537678 2012-08-06 16:15:58.243 CEST edefb9d5-db04-483e-b929-d991e5641913 2012-08-11 19:03:34.485 CEST 1128a255-2b2f-4b1a-b277-050e337c6a03 2012-08-06 17:47:12.743 CEST b9905c1b-c86f-4115-b2cd-9bdea5a4388b 2012-08-10 21:19:17.391 CEST 0fdf4eec-a4dd-4b32-9c05-aa7b8715a938 2012-08-11 12:14:00.175 CEST 07998f05-609d-400d-88a0-8bbc2c660dd2 2012-08-01 15:13:42.332 CEST 4a040203-1a83-4459-aa76-ce1d3c668c40 2012-08-06 17:30:59.373 CEST 7839ac77-1a73-4194-b4c5-bb97aefbd64a 2012-08-11 12:13:05.460 CEST d5aad4cc-227f-49b7-a5c3-7c1801471bd1 2012-08-11 20:49:51.132 CEST Hadoop hOCR parser 2012-08-01 17:41:06.747 CEST 4c20df2b-a6a7-4aa4-9afe-7955f53200de 2012-08-06 14:31:26.889 CEST e0b7076b-4c54-484a-ae50-ae3cc36158bd 2012-08-01 17:41:38.868 CEST b57f7264-3e4b-41bb-9016-32ec5d65b183 2012-08-06 14:41:58.669 CEST 1bfb9edd-0227-43a4-9730-237a571ba289 2012-08-06 17:46:32.160 CEST Sven Schlarb 2012-08-01 17:41:11.547 CEST ae8503bb-2163-43aa-ac70-33ace9b6aa5f 2012-08-09 14:46:53.214 CEST c72f9122-21b6-4fb3-9350-03942dc38fec 2012-08-01 18:16:43.314 CEST 5e3d2777-7ee3-4e2c-b400-e9a3386af290 2012-08-10 21:20:05.71 CEST