<?xml version="1.0" encoding="UTF-8" ?>
<?xml-stylesheet type="text/xsl" href="https://webservices.cls.ru.nl/ucto/static/interface.xsl"?>
<clam xmlns:xlink="http://www.w3.org/1999/xlink" version="3.2.10" id="ucto" name="Ucto Webservice" user="anonymous" baseurl="https://webservices.cls.ru.nl/ucto" interfaceoptions="centercover,coverheight100" authentication="oauth,basic">
    <!-- Descriptive metadata for the service: description, version, authors, affiliation,
         contact e-mail, project URL, cover image URL and licence. -->
    <description>Ucto is a unicode-compliant tokeniser. It takes input in the form of one or more untokenised texts, and subsequently tokenises them. Several languages are supported, but the software is extensible to other languages.</description>
    <version>2.5.2</version>
    <author>Maarten van Gompel, Ko van der Sloot</author>
    <affiliation>Centre for Language and Speech Technology, Radboud University and KNAW Humanities Cluster</affiliation>
    <email>lamasoftware@science.ru.nl</email>
    <url>https://languagemachines.github.io/ucto</url>
    <coverurl>https://languagemachines.github.io/ucto/style/icon.png</coverurl>
    <license>GNU General Public License v3</license>
    <!-- Custom HTML fragment (a data processing notice), wrapped in CDATA so the embedded
         markup needs no escaping.
         NOTE(review): the paragraph's class list "alert alert-info" assumes Bootstrap-style
         alert classes in the interface stylesheet; confirm. -->
    <customhtml>
    <![CDATA[
    <p class="alert alert-info"><strong>Data processing notice:</strong> All data you upload to this service and data obtained using this service will remain yours and is accessible only by you and our technical staff. Your data will not be shared with third parties and not be used for any purpose other than this service's operation. You can remove your projects at any time and are encouraged to do so, which will remove your data from our servers permanently. We can not guarantee any long-term storage of your data so you are recommended to download the results and store it yourself immediately; projects on the server will be automatically deleted after 30 days. Despite our security precautions, we do discourage use of this service for highly confidential material as there is no encryption on the storage. Last, we also collect some statistics on the frequency of use of this service, when shared this will always be anonymised.</p>
    ]]>
    </customhtml>
    <!-- The two file formats that the templates in <profiles> refer to through their
         format="..." attribute: plain text and FoLiA XML. -->
    <formats>
        <format id="PlainTextFormat"
                name="Plain Text Format"
                mimetype="text/plain" />
        <format id="FoLiAXMLFormat"
                name="FoLiA XML"
                mimetype="text/xml" />
    </formats>
    <profiles>
            
        <profile>
         <!-- Input side of the profile: one template, "untokinput", for plain-text documents
              (extension txt), declared with optional="no", unique="no" and acceptarchive="no".
              Per-file parameters: a static encoding (utf-8), a language choice marked required
              (twelve choices), and free-text document ID and author fields.
              Four converters are offered: PDF, MS Word, Latin-1 and Latin-9. -->
         <input>
            <InputTemplate id="untokinput"
                           format="PlainTextFormat"
                           label="Text document"
                           mimetype="text/plain"
                           extension="txt"
                           optional="no"
                           unique="no"
                           acceptarchive="no">
                <StaticParameter id="encoding"
                                 name="Encoding"
                                 description="The character encoding of the file"
                                 value="utf-8" />
                <ChoiceParameter id="language"
                                 name="Language"
                                 description="The language this text is in"
                                 required="1">
                    <choice id="eng">English</choice>
                    <choice id="nld">Dutch</choice>
                    <choice id="nld-twitter">Dutch on Twitter</choice>
                    <choice id="fra">French</choice>
                    <choice id="deu">German</choice>
                    <choice id="ita">Italian</choice>
                    <choice id="fry">Frisian</choice>
                    <choice id="swe">Swedish</choice>
                    <choice id="rus">Russian</choice>
                    <choice id="spa">Spanish</choice>
                    <choice id="por">Portuguese</choice>
                    <choice id="tur">Turkish</choice>
                </ChoiceParameter>
                <StringParameter id="documentid"
                                 name="Document ID"
                                 description="Enter a unique identifier for this document (no spaces). Needed only for XML output, will be auto-generated if not specified." />
                <StringParameter id="author"
                                 name="Author"
                                 description="The author of the document (optional)" />
                <converter id="pdfconv">Convert from PDF Document</converter>
                <converter id="mswordconv">Convert from MS Word Document</converter>
                <converter id="latin1">Convert from Latin-1 (iso-8859-1)</converter>
                <converter id="latin9">Convert from Latin-9 (iso-8859-15)</converter>
            </InputTemplate>
         </input>
         <!-- Output side of the profile.
              The outer conditions choose the tokenised-output template from the global parameters:
                xml is True           : "foliatokoutput" (FoLiA XML, extension xml), with a FLAT viewer
                else verbose is True  : "vtokoutput" (plain text, extension vtok)
                else                  : "tokoutput" (plain text, extension tok)
              All three name "untokinput" as their parent.
              Inside the plain-text templates, further conditions add a meta field with value "yes"
              for each of lowercase / uppercase (and, for "tokoutput", sentenceperline) that is True.
              "vtokoutput" carries no sentenceperline condition: in the parameters section, verbose
              and sentenceperline list each other under forbid, so (assuming forbid is enforced as
              mutual exclusion) that condition could never hold in the verbose branch.
              "errorlog" is declared outside the conditions, with the fixed filename error.log. -->
         <output>
             <parametercondition>
                 <if>
                     <equals parameter="xml">True</equals>
                 </if>
                 <then>
                     <OutputTemplate id="foliatokoutput" format="FoLiAXMLFormat" label="Tokenised Text Document (FoLiA XML)" mimetype="text/xml" extension="xml" parent="untokinput" unique="no">
                         <meta id="tokenisation">ucto</meta>
                         <viewer id="flatviewer" name="Open in FLAT" type="FLATViewer" mimetype="text/html" more="false" allowdefault="false" />
                     </OutputTemplate>
                 </then>
                 <else>
                     <parametercondition>
                         <if>
                             <equals parameter="verbose">True</equals>
                         </if>
                         <then>
                             <OutputTemplate id="vtokoutput" format="PlainTextFormat" label="Verbosely Tokenised Text Document" mimetype="text/plain" extension="vtok" parent="untokinput" unique="no">
                                 <parametercondition>
                                     <if>
                                         <equals parameter="lowercase">True</equals>
                                     </if>
                                     <then>
                                         <meta id="lowercase">yes</meta>
                                     </then>
                                 </parametercondition>
                                 <parametercondition>
                                     <if>
                                         <equals parameter="uppercase">True</equals>
                                     </if>
                                     <then>
                                         <meta id="uppercase">yes</meta>
                                     </then>
                                 </parametercondition>
                             </OutputTemplate>
                         </then>
                         <else>
                             <OutputTemplate id="tokoutput" format="PlainTextFormat" label="Tokenised Text Document" mimetype="text/plain" extension="tok" parent="untokinput" unique="no">
                                 <parametercondition>
                                     <if>
                                         <equals parameter="sentenceperline">True</equals>
                                     </if>
                                     <then>
                                         <meta id="sentenceperline">yes</meta>
                                     </then>
                                 </parametercondition>
                                 <parametercondition>
                                     <if>
                                         <equals parameter="lowercase">True</equals>
                                     </if>
                                     <then>
                                         <meta id="lowercase">yes</meta>
                                     </then>
                                 </parametercondition>
                                 <parametercondition>
                                     <if>
                                         <equals parameter="uppercase">True</equals>
                                     </if>
                                     <then>
                                         <meta id="uppercase">yes</meta>
                                     </then>
                                 </parametercondition>
                             </OutputTemplate>
                         </else>
                     </parametercondition>
                 </else>
             </parametercondition>
             <OutputTemplate id="errorlog" format="PlainTextFormat" label="Log file with (standard) error output" mimetype="text/plain" filename="error.log" unique="yes">
                 <meta id="encoding">utf-8</meta>
             </OutputTemplate>
         </output>
        </profile>

    </profiles>
    <!-- Global parameters, in a single group "Tokenisation options": five boolean options.
         "xml" carries value="True". The other four each carry a flag attribute (-V, -n, -l, -u)
         and a forbid attribute naming the option ids they are declared incompatible with;
         every one of them lists "xml". These ids are the ones tested by the parameter
         conditions in the profile's output section. -->
    <parameters>
        <parametergroup name="Tokenisation options">
            <BooleanParameter id="xml"
                              name="FoLiA XML Output"
                              description="Output FoLiA XML"
                              value="True" />
            <BooleanParameter id="verbose"
                              name="Verbose tokeniser output"
                              description="Outputs token types per token, one token per line"
                              flag="-V"
                              forbid="sentenceperline,xml" />
            <BooleanParameter id="sentenceperline"
                              name="Sentence per line"
                              description="Output each sentence on a single line. Does not work in verbose or XML mode."
                              flag="-n"
                              forbid="verbose,xml" />
            <BooleanParameter id="lowercase"
                              name="Lowercase"
                              description="Convert text to lowercase"
                              flag="-l"
                              forbid="uppercase,xml" />
            <BooleanParameter id="uppercase"
                              name="Uppercase"
                              description="Convert text to uppercase"
                              flag="-u"
                              forbid="lowercase,xml" />
        </parametergroup>
    </parameters>
    <!-- No input sources are declared; the element is present but empty. -->
    <inputsources />
</clam>