Blacklab AutoSearch Corpus Search

<?xml version="1.0" encoding="UTF-8"?>
<cmd:CMD xmlns:cmd="http://www.clarin.eu/cmd/1"
         xmlns:cmdp="http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1342181139640"
         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
         CMDVersion="1.2"
         xsi:schemaLocation="http://www.clarin.eu/cmd/1 https://infra.clarin.eu/CMDI/1.x/xsd/cmd-envelop.xsd http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1342181139640 https://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/1.1/profiles/clarin.eu:cr1:p_1342181139640/1.2/xsd">
   <!-- Record header: who created this metadata record and when, the CMDI profile
        it follows (same profile ID as the cmdp namespace on the root element),
        and the display name of the collection it is listed under. -->
   <cmd:Header>
      <cmd:MdCreator>BobBoelhouwer</cmd:MdCreator>
      <cmd:MdCreationDate>2016-07-17</cmd:MdCreationDate>
      <cmd:MdProfile>clarin.eu:cr1:p_1342181139640</cmd:MdProfile>
      <cmd:MdCollectionDisplayName>CLARIN Netherlands</cmd:MdCollectionDisplayName>
   </cmd:Header>
   <!-- Resource section: two proxies that both resolve through the same handle,
        followed by empty journal-file and resource-relation lists. -->
   <cmd:Resources>
      <cmd:ResourceProxyList>
         <!-- Primary resource, typed as text/html. -->
         <cmd:ResourceProxy id="resource">
            <cmd:ResourceType mimetype="text/html">Resource</cmd:ResourceType>
            <cmd:ResourceRef>http://hdl.handle.net/10032/5389ce7fdf3ce8afcb58e95fd4ee4461</cmd:ResourceRef>
         </cmd:ResourceProxy>
         <!-- Landing page; uses the same handle as the proxy above. -->
         <cmd:ResourceProxy id="landingpage">
            <cmd:ResourceType>LandingPage</cmd:ResourceType>
            <cmd:ResourceRef>http://hdl.handle.net/10032/5389ce7fdf3ce8afcb58e95fd4ee4461</cmd:ResourceRef>
         </cmd:ResourceProxy>
      </cmd:ResourceProxyList>
      <!-- Nothing recorded for journal files or resource relations. -->
      <cmd:JournalFileProxyList/>
      <cmd:ResourceRelationList/>
   </cmd:Resources>
   <cmd:Components>
      <cmdp:ClarinSoftwareDescription>
         <!-- General description of the tool: identity and version, release status,
              the national projects it is listed under, country, and an abstract. -->
         <cmdp:GeneralInfo>
            <cmdp:name xml:lang="eng">AutoSearch</cmdp:name>
            <cmdp:title xml:lang="eng">Blacklab AutoSearch Corpus Search</cmdp:title>
            <cmdp:version>1.0.14</cmdp:version>
            <cmdp:publicationYear>2013</cmdp:publicationYear>
            <cmdp:url>http://hdl.handle.net/10032/5389ce7fdf3ce8afcb58e95fd4ee4461</cmdp:url>
            <cmdp:CLARINCentre>Dutch Language Institute</cmdp:CLARINCentre>
            <cmdp:OriginalSource>http://portal.clarin.nl/node/4222</cmdp:OriginalSource>
            <!-- The version number here repeats the one given directly under GeneralInfo. -->
            <cmdp:ReleaseStatus>
               <cmdp:LifeCycleStatus>published</cmdp:LifeCycleStatus>
               <cmdp:lastUpdate>2015-01-01</cmdp:lastUpdate>
               <cmdp:version>1.0.14</cmdp:version>
            </cmdp:ReleaseStatus>
            <!-- Two NWO-funded projects; both list the same contact person. -->
            <cmdp:NationalProjects>
               <cmdp:Project>
                  <cmdp:name>CLARIN-NL</cmdp:name>
                  <cmdp:title>CLARIN in the Netherlands</cmdp:title>
                  <cmdp:id>184.021.003</cmdp:id>
                  <cmdp:funder>NWO</cmdp:funder>
                  <cmdp:url>http://www.clarin.nl</cmdp:url>
                  <cmdp:Contact>
                     <cmdp:Person>Jan Odijk</cmdp:Person>
                     <cmdp:Role>National Coordinator</cmdp:Role>
                     <cmdp:Address>Utrecht, the Netherlands</cmdp:Address>
                     <cmdp:Email>j.odijk@uu.nl</cmdp:Email>
                     <cmdp:Department>UiL-OTS</cmdp:Department>
                     <cmdp:Organisation>Utrecht University</cmdp:Organisation>
                  </cmdp:Contact>
                  <cmdp:Duration>
                     <cmdp:StartYear>2009</cmdp:StartYear>
                     <cmdp:CompletionYear>2015</cmdp:CompletionYear>
                  </cmdp:Duration>
               </cmdp:Project>
               <cmdp:Project>
                  <cmdp:name>CLARIAH-CORE</cmdp:name>
                  <cmdp:title>Common Lab Research Infrastructure for the Arts and the Humanities</cmdp:title>
                  <cmdp:id>184.033.101</cmdp:id>
                  <cmdp:funder>NWO</cmdp:funder>
                  <cmdp:url>http://www.clariah.nl</cmdp:url>
                  <cmdp:Contact>
                     <cmdp:Person>Jan Odijk</cmdp:Person>
                     <cmdp:Role>National Coordinator</cmdp:Role>
                     <cmdp:Address>Utrecht, the Netherlands</cmdp:Address>
                     <cmdp:Email>j.odijk@uu.nl</cmdp:Email>
                     <cmdp:Department>UiL-OTS</cmdp:Department>
                     <cmdp:Organisation>Utrecht University</cmdp:Organisation>
                  </cmdp:Contact>
                  <cmdp:Duration>
                     <cmdp:StartYear>2015</cmdp:StartYear>
                     <cmdp:CompletionYear>2018</cmdp:CompletionYear>
                  </cmdp:Duration>
               </cmdp:Project>
            </cmdp:NationalProjects>
            <cmdp:Country>
               <cmdp:CountryName>Netherlands</cmdp:CountryName>
               <cmdp:CountryCoding>NL</cmdp:CountryCoding>
            </cmdp:Country>
            <!-- Abstract. The inner Description holds the text and is kept on a single
                 line so that no indentation whitespace ends up inside the value. -->
            <cmdp:Description>
               <cmdp:Description>This demonstrator allows users to define one or more corpora and upload data for the corpora, after which the corpora will be made automatically searchable in a private workspace. Users can upload text data annotated with lemma + part of speech tags in TEI or FoLiA format, either as a single XML file or as an archive (zip or tar.gz) containing several XML files. Corpus size is limited to begin with (25 MB limit per uploaded file; 500,000 token limit for an entire corpus), but these limits may be increased at a later point in time. The search application is powered by the INL BlackLab corpus search engine. The search interface is the same as the one used in for example the Corpus of Contemporary Dutch / Corpus Hedendaags Nederlands.</cmdp:Description>
            </cmdp:Description>
         </cmdp:GeneralInfo>
         <!-- What the tool is for: category, tasks, research phase and domain,
              linguistic subject areas, and language/century dependence. -->
         <cmdp:SoftwareFunction>
            <cmdp:toolCategory>written language tool</cmdp:toolCategory>
            <cmdp:ToolTasks>
               <cmdp:toolTask>corpus browsing</cmdp:toolTask>
               <cmdp:toolTask>corpus searching</cmdp:toolTask>
               <cmdp:toolTask>corpus processing</cmdp:toolTask>
            </cmdp:ToolTasks>
            <cmdp:ResearchPhases>
               <cmdp:ResearchPhase>Browsing and Searching</cmdp:ResearchPhase>
            </cmdp:ResearchPhases>
            <cmdp:ResearchDomains>
               <cmdp:researchDomain>Linguistics</cmdp:researchDomain>
            </cmdp:ResearchDomains>
            <!-- Four subject areas follow; each carries an empty Description. -->
            <cmdp:LinguisticsSubject>
               <cmdp:linguisticsSubject>computational linguistics</cmdp:linguisticsSubject>
               <cmdp:Description>
                  <cmdp:Description/>
               </cmdp:Description>
            </cmdp:LinguisticsSubject>
            <cmdp:LinguisticsSubject>
               <cmdp:linguisticsSubject>general linguistics</cmdp:linguisticsSubject>
               <cmdp:Description>
                  <cmdp:Description/>
               </cmdp:Description>
            </cmdp:LinguisticsSubject>
            <cmdp:LinguisticsSubject>
               <cmdp:linguisticsSubject>lexicology</cmdp:linguisticsSubject>
               <cmdp:Description>
                  <cmdp:Description/>
               </cmdp:Description>
            </cmdp:LinguisticsSubject>
            <cmdp:LinguisticsSubject>
               <cmdp:linguisticsSubject>text and corpus linguistics</cmdp:linguisticsSubject>
               <cmdp:Description>
                  <cmdp:Description/>
               </cmdp:Description>
            </cmdp:LinguisticsSubject>
            <!-- The tool is recorded as neither language- nor century-dependent. -->
            <cmdp:LanguageVariety>
               <cmdp:languageDependent>no</cmdp:languageDependent>
               <cmdp:Centuries>
                  <cmdp:centuryDependent>no</cmdp:centuryDependent>
               </cmdp:Centuries>
            </cmdp:LanguageVariety>
         </cmdp:SoftwareFunction>
         <!-- How the tool is delivered: distribution medium, the two interfaces it
              exposes (web application and web service), and its input and output. -->
         <cmdp:SoftwareImplementation>
            <cmdp:distributionMedium>Online available</cmdp:distributionMedium>
            <cmdp:UserInterface>
               <cmdp:interfaceType>graphical user interface</cmdp:interfaceType>
               <cmdp:applicationType>web application</cmdp:applicationType>
            </cmdp:UserInterface>
            <cmdp:UserInterface>
               <cmdp:interfaceType>other</cmdp:interfaceType>
               <cmdp:applicationType>web service</cmdp:applicationType>
            </cmdp:UserInterface>
            <cmdp:Input>
               <cmdp:inputType>text</cmdp:inputType>
            </cmdp:Input>
            <!-- Text output, listed as two kinds of output resource. -->
            <cmdp:Output>
               <cmdp:outputType>text</cmdp:outputType>
               <cmdp:outputResource>corpus statistics</cmdp:outputResource>
               <cmdp:outputResource>corpus fragments</cmdp:outputResource>
            </cmdp:Output>
         </cmdp:SoftwareImplementation>
         <!-- Access conditions: catalogue link, licence terms with a zero-EUR price,
              and the service-desk contact with the organisation name in Dutch and English. -->
         <cmdp:Access>
            <cmdp:catalogueLink>https://portal.clarin.inl.nl</cmdp:catalogueLink>
            <cmdp:ResourceLicense>
               <cmdp:license>other</cmdp:license>
               <cmdp:distributionType>academic</cmdp:distributionType>
               <cmdp:availability>Free, accessible through CLARIN Institutional login</cmdp:availability>
               <cmdp:url>https://portal.clarin.inl.nl/autocorp/</cmdp:url>
               <cmdp:Price>
                  <cmdp:amount>0</cmdp:amount>
                  <cmdp:ISO4217>
                     <cmdp:iso-4217-currency>EUR</cmdp:iso-4217-currency>
                  </cmdp:ISO4217>
               </cmdp:Price>
            </cmdp:ResourceLicense>
            <cmdp:Contact>
               <cmdp:Email>servicedesk@ivdnt.org</cmdp:Email>
               <cmdp:Organisation xml:lang="nld">Instituut voor de Nederlandse Taal</cmdp:Organisation>
               <cmdp:Organisation xml:lang="eng">Institute for the Dutch Language</cmdp:Organisation>
               <cmdp:Url>http://www.ivdnt.org/</cmdp:Url>
            </cmdp:Contact>
         </cmdp:Access>
         <!-- Documentation for the tool: one English-language user manual (PDF)
              and one screenshot. -->
         <cmdp:ResourceDocumentation>
            <cmdp:Documentation>
               <cmdp:title>AutoSearch demo: a brief overview</cmdp:title>
               <cmdp:documentationTarget>user</cmdp:documentationTarget>
               <cmdp:url>https://portal.clarin.inl.nl/autocorp/doc/AutoSearch-manual.pdf</cmdp:url>
               <cmdp:ISO639>
                  <cmdp:iso-639-3-code>eng</cmdp:iso-639-3-code>
               </cmdp:ISO639>
            </cmdp:Documentation>
            <cmdp:Pictures>
               <!-- Keep the URL on the same line as its tags: whitespace inside a text
                    element is delivered to consumers as part of the value, so a
                    pretty-printed URL arrives wrapped in newlines and indentation. -->
               <cmdp:picture height="400" type="other" width="800">http://dev.clarin.nl/sites/default/files/corpora.png</cmdp:picture>
            </cmdp:Pictures>
         </cmdp:ResourceDocumentation>
         <!-- Development provenance: the project under which the tool was built and
              the organisation credited as its creator. -->
         <cmdp:SoftwareDevelopment>
            <!-- NOTE(review): url and Duration are empty and Email holds "-", which
                 looks like a placeholder rather than a real address. Left unchanged
                 because the profile may require these elements to be present;
                 confirm against the profile schema before removing or filling them. -->
            <cmdp:Project>
               <cmdp:name>AutoSearch</cmdp:name>
               <cmdp:title>Blacklab AutoSearch Corpus Search</cmdp:title>
               <cmdp:funder>Clarin.nl</cmdp:funder>
               <cmdp:url/>
               <cmdp:Contact>
                  <cmdp:Email>-</cmdp:Email>
               </cmdp:Contact>
               <cmdp:Duration/>
            </cmdp:Project>
            <cmdp:Creator>
               <cmdp:Role>creator</cmdp:Role>
               <cmdp:Contact>
                  <cmdp:Email>servicedesk@ivdnt.org</cmdp:Email>
                  <!-- Organisation name in English and Dutch, language-tagged the same
                       way as the Organisation entries under Access/Contact. -->
                  <cmdp:Organisation xml:lang="eng">Institute of Dutch Lexicology</cmdp:Organisation>
                  <cmdp:Organisation xml:lang="nld">Instituut voor Nederlandse Lexicologie</cmdp:Organisation>
                  <cmdp:Url>http://www.ivdnt.org</cmdp:Url>
               </cmdp:Contact>
            </cmdp:Creator>
         </cmdp:SoftwareDevelopment>
         <!-- Technical details. NOTE(review): the implementation language is left
              empty and its version is the literal text "unknown"; both look like
              placeholders. Confirm whether real values can be supplied. -->
         <cmdp:TechnicalInfo>
            <cmdp:ImplementationLanguage>
               <cmdp:implementationLanguage/>
               <cmdp:version>unknown</cmdp:version>
            </cmdp:ImplementationLanguage>
         </cmdp:TechnicalInfo>
      </cmdp:ClarinSoftwareDescription>
   </cmd:Components>
</cmd:CMD>
Organisation:
  • Institute for the Dutch Language
  • Utrecht University
  • Instituut voor de Nederlandse Taal
  • Institute of Dutch Lexicology
  • Instituut voor Nederlandse Lexicologie

Resources:

Resource

text/html