<?xml version = "1.0" encoding = "UTF-8"?>
<serviceDescriptions  xmlns="pd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="pd /C:/Documents and Settings/ytanoh/My Documents/TAVERNA/taverna-1.4-old/plugins/pedro/services/model/common.xsd">
	<serviceDescription >
		<serviceName>siggen</serviceName>
		<organisation >
			<organisationName>European Bioinformatics Institute</organisationName>
			<organisationDescriptionText>http://www.ebi.ac.uk/</organisationDescriptionText>
			<organisationKey>EBI</organisationKey>
		</organisation>

		<locationURL>http://www.ebi.ac.uk/soaplab/emboss4/services/protein_3d_structure.siggen</locationURL>
		<interfaceWSDL>http://www.ebi.ac.uk/soaplab/emboss4/services/protein_3d_structure.siggen?wsdl</interfaceWSDL>
		<serviceDescriptionText>Generates a sparse protein signature from an alignment. Detailed info about this operation can be found at the following link: http://liv.bmc.uu.se/cgi-bin/emboss/help/siggen</serviceDescriptionText>
		<operations >
			<serviceOperation >
				<operationName>siggen</operationName>
				<operationSpec>&lt;s:soaplabwsdl xmlns:s=&quot;http://org.embl.ebi.escience/xscufl/0.1alpha&quot;&gt;http://www.ebi.ac.uk/soaplab/emboss4/services/protein_3d_structure.siggen&lt;/s:soaplabwsdl&gt;</operationSpec>
				<operationDescriptionText>Generates a sparse protein signature from an alignment. Detailed info about this operation can be found at the following link: http://liv.bmc.uu.se/cgi-bin/emboss/help/siggen</operationDescriptionText>
				<operationInputs >
					<parameter >
						<parameterName>algpath</parameterName>
						<parameterDescription>DAF files (domain alignment files). A &apos;domain alignment file&apos; contains a sequence alignment of domains belonging to the same SCOP or CATH family (or other node in the structural hierarchies). The file is in DAF format (CLUSTAL-like) and is annotated with domain family classification information. This is a mandatory parameter. </parameterDescription>
						<defaultValue>./</defaultValue>
						<transportDataType>IDL:omg.org/DsLSRAnalysis/StringList:1.0</transportDataType>
					</parameter>

					<parameter >
						<parameterName>mode</parameterName>
						<parameterDescription>Specifies the mode of signature generation. There are 3 modes for signatures generatation: (1) Use positions specified in alignment file. The alignment file must contain a line beginning with the text &apos;Positions&apos; for each line of the alignment.
(2) Use a scoring method. The alignment is scored and the signature of a specified sparsity is sampled from high scoring positions.
(3): Generate a randomised signature. A signature of a specified sparsity is sampled at random from the alignment. This is an optional parameter. The default is 1</parameterDescription>
						<defaultValue>1</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>wsiz</parameterName>
						<parameterDescription>Type: long. Specifies the window size. When a signature is aligned to a protein sequence, the permissible gaps between two signature positions is determined by the empirical gaps and the window size. This is an optional parameter. The default is 0</parameterDescription>
						<defaultValue>0</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>conoption</parameterName>
						<parameterDescription>Specifies the structure-based scoring scheme. SIGGEN provides 2 structure-based scoring schemes(plus a combination method) that are used to score the input alignment. This is an optional parameter. The allowed values for this parameter are: 
1(Number)|
2(Conservation)|
3(Number and conservation)|
4(None (structural data available))|
5(None (no structural data available))|
The default is 5</parameterDescription>
						<defaultValue>5</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>conpath</parameterName>
						<parameterDescription>CON files (contact files). A &apos;contact file&apos; contains contact data for a protein or a domain from SCOP or CATH, in the CON format(EMBL-like). The contacts may be intra-chain residue-residue,inter-chain residue-residue or residue-ligand. This is a mandatory parameter. </parameterDescription>
						<defaultValue>./</defaultValue>
						<transportDataType>byte[][]</transportDataType>
					</parameter>

					<parameter >
						<parameterName>cpdbpath</parameterName>
						<parameterDescription>CCF files(clean coordinate files). A &apos;clean cordinate file&apos;contains protein coordinate and derived data for a single PDB file(&apos;protein clean coordinate file&apos;) or a single domain from SCOP or CATH (&apos;domain clean coordinate file&apos;), in CCF format (EMBL-like). The files, generated by using PDBPARSE (PDB files) or DOMAINER(domains), contain &apos;cleaned-up&apos; data that is self-consistent and error-corrected. Records for residue solvent accessibility and secondary structure are added to the file by using PDBPLUS. This is a mandatory parameter. </parameterDescription>
						<defaultValue>./</defaultValue>
						<transportDataType>byte[][]</transportDataType>
					</parameter>

					<parameter >
						<parameterName>seqoption</parameterName>
						<parameterDescription>This option specifies the sequence-based scoring scheme. SIGGEN provides 2 sequence-based scoring schemes that are used to score the input alignment. This is an optional parameter. The allowed values for this parameter are: 1(Substitution matrix)| 
2(Residue class)|
3(None)|. 
The default is 3</parameterDescription>
						<defaultValue>3</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>datafile_direct_data</parameterName>
						<parameterDescription>Substitution matrix to use. The substitution matrix is used by the sequence-based scoring schemes. This is an optional parameter the default is &apos;EBLOSUM62&apos;. The parameters &apos;datafile_direct_data&apos; and &apos;datafile_url&apos; are mutually exclusive.  </parameterDescription>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>datafile_url</parameterName>
						<parameterDescription>URL of substitution matrix to use. The substitution matrix is used by the sequence-based scoring schemes. This is an optional parameter the default is &apos;EBLOSUM62&apos;. The parameters &apos;datafile_direct_data&apos; and &apos;datafile_url&apos; are mutually exclusive.  </parameterDescription>
						<defaultValue>EBLOSUM62</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>sparsity</parameterName>
						<parameterDescription>This option specifies the % sparsity of signature. The signature sparsity is a user-defined parameter that determines how many residues the final signature will contain, for example, if the average sequence length of the proteins in the alignment is 250 residues, then a signature of sparsity 10% (default value) will contain 25 key residues or signature positions, that correspond to the top 25% highest scoring alignment positions. This is an optional parameter.</parameterDescription>
						<defaultValue>10</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>filtercon</parameterName>
						<parameterDescription>Type: boolean(Yes/No).This option specifies whether to disregard positions forming few contacts only during the selection of signature positions. This is an optional parameter. The default is &apos;No&apos;.</parameterDescription>
						<defaultValue>N</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>conthresh</parameterName>
						<parameterDescription>This option specifies the threshold contact number. This controls the selection of key positions for the structure-based scoring scheme (number of contacts).
This is an optional parameter. The default is 10.</parameterDescription>
						<defaultValue>10</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>filterpsim</parameterName>
						<parameterDescription>Type: boolean (true/false). Disregard alignment sites that were not aligned satisfactorily. This is an optional parameter. The default is &apos;true&apos;. </parameterDescription>
						<defaultValue>true</defaultValue>
						<transportDataType>String</transportDataType>
					</parameter>

				</operationInputs>

				<operationOutputs >
					<parameter >
						<parameterName>report</parameterName>
						<parameterDescription>A general report for the underlying analysis job.</parameterDescription>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>detailed_status</parameterName>
						<parameterDescription>The exit code of the underlying analysis job, 0 means the job returned normally.</parameterDescription>
						<transportDataType>String</transportDataType>
					</parameter>

					<parameter >
						<parameterName>sigoutdir</parameterName>
						<parameterDescription>Returns a signature report. A &apos;signature report&apos; contains a sparse sequence signature suitable for use with the SIGSCAN and SIGGEN services. </parameterDescription>
						<semanticType>http://www.mygrid.org.uk/ontology#structural_alignment_report</semanticType>
						<transportDataType>byte[][]</transportDataType>
					</parameter>

				</operationOutputs>

				<operationTask>http://www.mygrid.org.uk/ontology#predicting</operationTask>
			</serviceOperation>

		</operations>

		<serviceType>Soaplab service</serviceType>
	</serviceDescription>

</serviceDescriptions>
