ExtractScientificTermsphenotype_abstracts00 2010-01-28 11:40:34.439 GMT application/octet-stream 2010-01-28 11:40:34.439 GMT phenotype_terms text/plain 2010-01-28 11:40:34.439 GMT Encode_byte_to_base64bytes0base6400net.sf.taverna.t2.activitieslocalworker-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.localworker.LocalworkerActivity bytes 0 'application/octet-stream' [B true base64 0 'text/plain' 0 workflow commons-codec commons-codec 1.3 1635363350 commons-codec:commons-codec:1.3 org.embl.ebi.escience.scuflworkers.java.EncodeBase64 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemerge_strings_2stringlist1concatenated00net.sf.taverna.t2.activitieslocalworker-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.localworker.LocalworkerActivity stringlist 1 l('text/plain') java.lang.String true seperator 0 'text/plain' java.lang.String true concatenated 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringListMerge net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 
net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokeregexvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.stringconstant.StringConstantActivity \n net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokexpathvalue00net.sf.taverna.t2.activitiesstringconstant-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.stringconstant.StringConstantActivity /*[local-name(.)='generateTerminologyResponse']/*[local-name(.)='return'] net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokeextract_abstractsinput0output_search00output00net.sf.taverna.t2.activitiesbeanshell-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.beanshell.BeanshellActivity input 0 'text/plain' java.lang.String true output 0 'text/plain' 0 output_search 0 'text/plain' 0 workflow 
net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemerge_search_and_termsterms0search_term0output00net.sf.taverna.t2.activitiesbeanshell-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.beanshell.BeanshellActivity terms 0 'text/plain' java.lang.String true search_term 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokeextract_Termsxml-text0xpath0nodelistAsXML11nodelist11net.sf.taverna.t2.activitieslocalworker-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.localworker.LocalworkerActivity xpath 0 'text/plain' java.lang.String true xml-text 0 'text/xml' java.lang.String true nodelist 1 l('text/plain') 1 nodelistAsXML 1 l('text/plain') 1 workflow dom4j dom4j 1.6 716010169 dom4j:dom4j:1.6 net.sourceforge.taverna.scuflworkers.xml.XPathTextWorker 
net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokemerge_stringsstringlist1concatenated00net.sf.taverna.t2.activitieslocalworker-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.localworker.LocalworkerActivity stringlist 1 l('text/plain') java.lang.String true seperator 0 'text/plain' java.lang.String true concatenated 0 'text/plain' 0 workflow org.embl.ebi.escience.scuflworkers.java.StringListMerge net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokeremove_Nullsinput0output00net.sf.taverna.t2.activitiesbeanshell-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.beanshell.BeanshellActivity input 0 'text/plain' java.lang.String true output 0 'text/plain' 0 workflow net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 
net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeRemove_duplicate_stringsstringlist1strippedlist11net.sf.taverna.t2.activitieslocalworker-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.localworker.LocalworkerActivity stringlist 1 l('text/plain') java.lang.String true strippedlist 1 l('text/plain') 1 workflow org.embl.ebi.escience.scuflworkers.java.StringStripDuplicates net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeparametersXMLtexts1output00net.sf.taverna.t2.activitieswsdl-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.wsdl.xmlsplitter.XMLInputSplitterActivity applicationCode 0 'text/plain' java.lang.String true texts 1 l('text/plain') java.lang.String true maxNumberOfTerms 0 'text/plain' java.lang.String true output 0 'text/xml' 0 <s:extensions xmlns:s="http://org.embl.ebi.escience/xscufl/0.1alpha"><s:complextype optional="false" unbounded="false" typename="generateTerminology" name="parameters" 
qname="{http://server.gopubmedTermGenerationService.biotec.tud.de}generateTerminology"><s:elements><s:basetype optional="true" unbounded="false" typename="string" name="applicationCode" qname="{http://server.gopubmedTermGenerationService.biotec.tud.de}&gt;generateTerminology&gt;applicationCode" /><s:arraytype optional="true" unbounded="true" wrapped="false" typename="string" name="texts" qname="{http://server.gopubmedTermGenerationService.biotec.tud.de}&gt;generateTerminology&gt;texts"><s:elementtype><s:basetype optional="false" unbounded="false" typename="string" name="" qname="{http://www.w3.org/2001/XMLSchema}string" /></s:elementtype></s:arraytype><s:basetype optional="true" unbounded="false" typename="int" name="maxNumberOfTerms" qname="{http://server.gopubmedTermGenerationService.biotec.tud.de}&gt;generateTerminology&gt;maxNumberOfTerms" /></s:elements></s:complextype></s:extensions> net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokesplit_by_regexregex0string0split11net.sf.taverna.t2.activitieslocalworker-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.localworker.LocalworkerActivity string 0 'text/plain' java.lang.String true regex 0 'text/plain' java.lang.String true split 1 l('text/plain') 1 workflow org.embl.ebi.escience.scuflworkers.java.SplitByRegex net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 
net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokegenerateTerminologyparameters0parameters00attachmentList11net.sf.taverna.t2.activitieswsdl-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.wsdl.WSDLActivity http://gopubmed4.biotec.tu-dresden.de/GoPubMedTermGenerationService/services/GoPubMedTermGeneration?wsdl generateTerminology net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Invokeclean_textfile_direct_data0output00report00net.sf.taverna.t2.activitiessoaplab-activity1.3-SNAPSHOTnet.sf.taverna.t2.activities.soaplab.SoaplabActivity http://phoebus.cs.man.ac.uk:1977/axis/services/text_mining.clean_text 0 1.0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Parallelize 1 
net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.ErrorBouncenet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Failovernet.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.Retry 1.0 0 0 0 net.sf.taverna.t2.coreworkflowmodel-impl1.3-SNAPSHOTnet.sf.taverna.t2.workflowmodel.processor.dispatch.layers.InvokeEncode_byte_to_base64bytesphenotype_abstractsmerge_strings_2stringlistmerge_stringsconcatenatedextract_abstractsinputclean_textoutputmerge_search_and_termstermsmerge_strings_2concatenatedmerge_search_and_termssearch_termextract_abstractsoutput_searchextract_Termsxml-textgenerateTerminologyparametersextract_Termsxpathxpathvaluemerge_stringsstringlistRemove_duplicate_stringsstrippedlistremove_Nullsinputmerge_search_and_termsoutputRemove_duplicate_stringsstringlistextract_TermsnodelistparametersXMLtextssplit_by_regexsplitsplit_by_regexregexregexvaluesplit_by_regexstringextract_abstractsoutputgenerateTerminologyparametersparametersXMLoutputclean_textfile_direct_dataEncode_byte_to_base64base64phenotype_termsremove_Nullsoutput Extract Scientific Terms 2010-01-28 11:40:34.898 GMT 28f539d5-327d-4fbd-964c-f3de64e5203a 2010-12-08 11:16:40.955 GMT This workflow takes in a document containing text and removes any non-ASCII characters. The cleaned text is then sent to a service in Dresden to extract all scientific terms. These terms represent a profile for the input document. Any null values are also removed. 2010-01-28 11:40:34.898 GMT Paul Fisher 2010-01-28 11:40:34.898 GMT