<?xml version="1.0" ?><?xml-stylesheet type='text/xsl' href='/cmdixsl/templates.xsl'?><cmd:CMD xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:cmd="http://www.clarin.eu/cmd/1" xmlns:cmdp="http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1527668176122" CMDVersion="1.2" xsi:schemaLocation="http://www.clarin.eu/cmd/1 https://infra.clarin.eu/CMDI/1.x/xsd/cmd-envelop.xsd http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1527668176122 https://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/1.x/profiles/clarin.eu:cr1:p_1527668176122/xsd">
<!-- Record-level metadata: creator, creation date, persistent self link, profile id and collection name. -->
<cmd:Header>
  <cmd:MdCreator>Marco Passarotti</cmd:MdCreator>
  <cmd:MdCreationDate>2012-11-07</cmd:MdCreationDate>
  <cmd:MdSelfLink>https://doi.org/10.57754/FDAT.0955m-hk887</cmd:MdSelfLink>
  <!-- Same profile identifier that ends the namespace bound to the cmdp prefix on the root element. -->
  <cmd:MdProfile>clarin.eu:cr1:p_1527668176122</cmd:MdProfile>
  <cmd:MdCollectionDisplayName>Tübingen Archive of Language Resources (TALAR)</cmd:MdCollectionDisplayName>
</cmd:Header>
<!-- Resource section: one landing page proxy plus one proxy per distributed file. -->
<cmd:Resources>
  <cmd:ResourceProxyList>
    <!-- NOTE(review): all three proxies carry the same DOI as ResourceRef; confirm whether
         the two file proxies should point at file-specific download locations instead. -->
    <cmd:ResourceProxy id="LandingPage-11858-00-1778-0000-0008-C024-C">
      <cmd:ResourceType mimetype="application/xml">LandingPage</cmd:ResourceType>
      <cmd:ResourceRef>https://doi.org/10.57754/FDAT.0955m-hk887</cmd:ResourceRef>
    </cmd:ResourceProxy>
    <!-- Described in ResourceProxyListInfo as the file IT-TB.conll. -->
    <cmd:ResourceProxy id="IT-TBconlltxt">
      <cmd:ResourceType mimetype="text/plain">Resource</cmd:ResourceType>
      <cmd:ResourceRef>https://doi.org/10.57754/FDAT.0955m-hk887</cmd:ResourceRef>
    </cmd:ResourceProxy>
    <!-- Described in ResourceProxyListInfo as the file update-2020.tar.gz, i.e. a gzip-compressed
         archive, so the media type is application/gzip rather than text/plain. -->
    <cmd:ResourceProxy id="update-2020targz">
      <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
      <cmd:ResourceRef>https://doi.org/10.57754/FDAT.0955m-hk887</cmd:ResourceRef>
    </cmd:ResourceProxy>
  </cmd:ResourceProxyList>
  <!-- The journal file proxy below is present but its reference carries no value. -->
  <cmd:JournalFileProxyList>
    <cmd:JournalFileProxy>
      <cmd:JournalFileRef/>
    </cmd:JournalFileProxy>
  </cmd:JournalFileProxyList>
  <cmd:ResourceRelationList> </cmd:ResourceRelationList>
</cmd:Resources>
<!-- Collection membership list; the single IsPartOf entry is present but carries no value. -->
<cmd:IsPartOfList>
  <cmd:IsPartOf/>
</cmd:IsPartOfList>
<cmd:Components>
<cmdp:TextCorpusProfile>
<!-- General descriptive metadata: naming, classification, owner, location, description, keywords and modality. -->
<cmdp:GeneralInfo>
  <cmdp:ResourceName xml:lang="en">Index Thomisticus Treebank</cmdp:ResourceName>
  <cmdp:ResourceTitle xml:lang="en">Index Thomisticus Treebank</cmdp:ResourceTitle>
  <cmdp:ResourceClass>Corpus</cmdp:ResourceClass>
  <cmdp:LifeCycleStatus>development</cmdp:LifeCycleStatus>
  <cmdp:StartYear>2006</cmdp:StartYear>
  <cmdp:TimeCoverage xml:lang="en">Lifespan of Thomas Aquinas (1225-1274)</cmdp:TimeCoverage>
  <cmdp:LegalOwner xml:lang="it">Centro Interdisciplinare di Ricerche per la Computerizzazione dei Segni dell’Espressione (CIRCSE)</cmdp:LegalOwner>
  <cmdp:Genre>historical corpus</cmdp:Genre>
  <cmdp:Genre>Treebank</cmdp:Genre>
  <cmdp:Genre>Syntactically annotated Corpus</cmdp:Genre>
  <cmdp:FieldOfResearch/>
  <cmdp:Location>
    <!-- Continuation lines of the address stay flush left: indentation would become part of the text value. -->
    <cmdp:Address>Università Cattolica del Sacro Cuore
c/o Istituto di Glottologia
Franciscanum Building, II floor, rooms 209-210
Largo Gemelli, 1
20123 Milan
ITALY</cmdp:Address>
    <cmdp:Country>
      <cmdp:CountryName xml:lang="en">Italy</cmdp:CountryName>
      <cmdp:CountryCoding>IT</cmdp:CountryCoding>
    </cmdp:Country>
  </cmdp:Location>
  <cmdp:Descriptions>
    <!-- Multi-line text value; line breaks are part of the content and are kept as they are. -->
    <cmdp:Description xml:lang="en">The Index Thomisticus Treebank is the syntactically annotated subset of the Index Thomisticus corpus.
The Index Thomisticus corpus features the opera omnia by Thomas Aquinas in Latin, for a total of around 11 million words.
The Index Thomisticus Treebank is a dependency-based treebank, whose annotation style resembles that of the Prague Dependency Treebank of Czech</cmdp:Description>
  </cmdp:Descriptions>
  <cmdp:tags>
    <cmdp:tag xml:lang="en">treebank</cmdp:tag>
    <cmdp:tag xml:lang="en">Latin</cmdp:tag>
    <cmdp:tag xml:lang="en">written language</cmdp:tag>
  </cmdp:tags>
  <cmdp:ModalityInfo>
    <cmdp:Modalities>written</cmdp:Modalities>
  </cmdp:ModalityInfo>
</cmdp:GeneralInfo>
<!-- Project that produced the resource: name, identifier, web site, hosting institution and start year. -->
<cmdp:Project>
  <cmdp:ProjectName xml:lang="en">Index Thomisticus Treebank</cmdp:ProjectName>
  <cmdp:ProjectTitle xml:lang="en">Index Thomisticus Treebank</cmdp:ProjectTitle>
  <cmdp:ProjectID>IT-TB</cmdp:ProjectID>
  <cmdp:Url targetLang="en">http://itreebank.marginalia.it/</cmdp:Url>
  <!-- Funder is present but no funding agency is recorded. -->
  <cmdp:Funder>
    <cmdp:fundingAgency/>
  </cmdp:Funder>
  <cmdp:Institution>
    <cmdp:Department xml:lang="it">Centro Interdisciplinare di Ricerche per la Computerizzazione dei Segni dell’Espressione (CIRCSE)</cmdp:Department>
    <cmdp:Url>http://centridiricerca.unicatt.it/circse</cmdp:Url>
    <cmdp:Organisation>
      <cmdp:name xml:lang="en">Università Cattolica del Sacro Cuore, Milan (Italy)</cmdp:name>
      <cmdp:AuthoritativeIDs>
        <cmdp:AuthoritativeID>
          <!-- The identifier is a viaf.org URI, so the issuing authority is VIAF (it was labelled ORCID). -->
          <cmdp:id>https://viaf.org/viaf/123731682</cmdp:id>
          <cmdp:issuingAuthority>VIAF</cmdp:issuingAuthority>
        </cmdp:AuthoritativeID>
      </cmdp:AuthoritativeIDs>
    </cmdp:Organisation>
    <cmdp:Descriptions>
      <cmdp:Description/>
    </cmdp:Descriptions>
  </cmdp:Institution>
  <cmdp:Duration>
    <cmdp:StartYear>2006</cmdp:StartYear>
  </cmdp:Duration>
</cmdp:Project>
<cmdp:Publications>
<!-- Publication: project paper by McGillivray, Passarotti and Ruffolo. -->
<cmdp:Publication>
  <cmdp:PublicationTitle xml:lang="en">The Index Thomisticus Treebank Project: Annotation, Parsing and Valency Lexicon</cmdp:PublicationTitle>
  <cmdp:resolvablePID>https://www.atala.org/sites/default/files/TAL-2009-50-2-04-McGillivray.pdf</cmdp:resolvablePID>
  <cmdp:Author>
    <cmdp:firstName>Barbara</cmdp:firstName>
    <cmdp:lastName>McGillivray</cmdp:lastName>
    <cmdp:AuthoritativeIDs>
      <cmdp:AuthoritativeID>
        <cmdp:id>https://orcid.org/0000-0003-3426-8200</cmdp:id>
        <cmdp:issuingAuthority>ORCID</cmdp:issuingAuthority>
      </cmdp:AuthoritativeID>
    </cmdp:AuthoritativeIDs>
  </cmdp:Author>
  <!-- No authoritative identifier is recorded for this author. -->
  <cmdp:Author>
    <cmdp:firstName>Marco</cmdp:firstName>
    <cmdp:lastName>Passarotti</cmdp:lastName>
  </cmdp:Author>
  <cmdp:Author>
    <cmdp:firstName>Paolo</cmdp:firstName>
    <cmdp:lastName>Ruffolo</cmdp:lastName>
    <cmdp:AuthoritativeIDs>
      <cmdp:AuthoritativeID>
        <cmdp:id>https://orcid.org/0000-0002-9120-0846</cmdp:id>
        <cmdp:issuingAuthority>ORCID</cmdp:issuingAuthority>
      </cmdp:AuthoritativeID>
    </cmdp:AuthoritativeIDs>
  </cmdp:Author>
  <cmdp:Descriptions>
    <cmdp:Description xml:lang="en">Project overview</cmdp:Description>
  </cmdp:Descriptions>
</cmdp:Publication>
<!-- Publication: annotation guidelines by Bamman, Passarotti, Crane and Raynaud. -->
<cmdp:Publication>
  <cmdp:PublicationTitle xml:lang="en">Guidelines for the Syntactic Annotation of Latin Treebanks</cmdp:PublicationTitle>
  <cmdp:resolvablePID>http://static.perseus.tufts.edu/docs/guidelines.pdf</cmdp:resolvablePID>
  <!-- The first two authors are listed without authoritative identifiers. -->
  <cmdp:Author>
    <cmdp:firstName>David</cmdp:firstName>
    <cmdp:lastName>Bamman</cmdp:lastName>
  </cmdp:Author>
  <cmdp:Author>
    <cmdp:firstName>Marco</cmdp:firstName>
    <cmdp:lastName>Passarotti</cmdp:lastName>
  </cmdp:Author>
  <cmdp:Author>
    <cmdp:firstName>Gregory</cmdp:firstName>
    <cmdp:lastName>Crane</cmdp:lastName>
    <cmdp:AuthoritativeIDs>
      <cmdp:AuthoritativeID>
        <cmdp:id>https://orcid.org/0000-0001-6847-2811</cmdp:id>
        <cmdp:issuingAuthority>ORCID</cmdp:issuingAuthority>
      </cmdp:AuthoritativeID>
    </cmdp:AuthoritativeIDs>
  </cmdp:Author>
  <cmdp:Author>
    <cmdp:firstName>Savina</cmdp:firstName>
    <cmdp:lastName>Raynaud</cmdp:lastName>
    <cmdp:AuthoritativeIDs>
      <cmdp:AuthoritativeID>
        <cmdp:id>https://orcid.org/0000-0002-8054-1733</cmdp:id>
        <cmdp:issuingAuthority>ORCID</cmdp:issuingAuthority>
      </cmdp:AuthoritativeID>
    </cmdp:AuthoritativeIDs>
  </cmdp:Author>
  <cmdp:Descriptions>
    <cmdp:Description xml:lang="en">Project overview</cmdp:Description>
  </cmdp:Descriptions>
</cmdp:Publication>
<!-- Publication: LREC 2008 paper by Bamman, Passarotti, Busa and Crane. -->
<cmdp:Publication>
  <cmdp:PublicationTitle xml:lang="en">The annotation guidelines of the Latin Dependency Treebank and Index Thomisticus Treebank. The treatment of some specific syntactic constructions in Latin</cmdp:PublicationTitle>
  <cmdp:resolvablePID>http://www.lrec-conf.org/proceedings/lrec2008/pdf/25_paper.pdf</cmdp:resolvablePID>
  <!-- The first three authors are listed without authoritative identifiers. -->
  <cmdp:Author>
    <cmdp:firstName>David</cmdp:firstName>
    <cmdp:lastName>Bamman</cmdp:lastName>
  </cmdp:Author>
  <cmdp:Author>
    <cmdp:firstName>Marco</cmdp:firstName>
    <cmdp:lastName>Passarotti</cmdp:lastName>
  </cmdp:Author>
  <cmdp:Author>
    <cmdp:firstName>Roberto</cmdp:firstName>
    <cmdp:lastName>Busa</cmdp:lastName>
  </cmdp:Author>
  <cmdp:Author>
    <cmdp:firstName>Gregory</cmdp:firstName>
    <cmdp:lastName>Crane</cmdp:lastName>
    <cmdp:AuthoritativeIDs>
      <cmdp:AuthoritativeID>
        <cmdp:id>https://orcid.org/0000-0001-6847-2811</cmdp:id>
        <cmdp:issuingAuthority>ORCID</cmdp:issuingAuthority>
      </cmdp:AuthoritativeID>
    </cmdp:AuthoritativeIDs>
  </cmdp:Author>
  <cmdp:Descriptions>
    <cmdp:Description xml:lang="en">Project overview</cmdp:Description>
  </cmdp:Descriptions>
</cmdp:Publication>
<!-- Publication: single-author paper by Passarotti, referenced through a handle. -->
<cmdp:Publication>
  <cmdp:PublicationTitle xml:lang="en">Leaving Behind the Less-Resourced Status. The Case of Latin through the Experience of the Index Thomisticus Treebank</cmdp:PublicationTitle>
  <cmdp:resolvablePID>http://hdl.handle.net/10807/1407</cmdp:resolvablePID>
  <cmdp:Author>
    <cmdp:firstName>Marco</cmdp:firstName>
    <cmdp:lastName>Passarotti</cmdp:lastName>
  </cmdp:Author>
  <cmdp:Descriptions>
    <cmdp:Description xml:lang="en">Project overview</cmdp:Description>
  </cmdp:Descriptions>
</cmdp:Publication>
</cmdp:Publications>
<!-- How the resource was created: topic, creators, annotation set-up and tools, and the source material. -->
<cmdp:Creation>
  <cmdp:Topic xml:lang="en">Syntactic analysis of a subset of the Index Thomisticus corpus, using a dependency-based annotation style similar to that of the Prague Dependency Treebank of Czech</cmdp:Topic>
  <cmdp:Creators>
    <cmdp:Person>
      <cmdp:firstName>Marco</cmdp:firstName>
      <cmdp:lastName>Passarotti</cmdp:lastName>
      <cmdp:role>Project leader</cmdp:role>
    </cmdp:Person>
    <cmdp:Descriptions>
      <cmdp:Description/>
    </cmdp:Descriptions>
  </cmdp:Creators>
  <cmdp:Annotation>
    <cmdp:AnnotationMode xml:lang="en">Machine assisted</cmdp:AnnotationMode>
    <cmdp:AnnotationStandoff xml:lang="en">Yes</cmdp:AnnotationStandoff>
    <cmdp:AnnotationFormat xml:lang="en">Prague Dependency Treebank format (analytical layer)</cmdp:AnnotationFormat>
    <cmdp:SegmentationUnits>
      <cmdp:SegmentationUnit>grammatical sentence</cmdp:SegmentationUnit>
      <cmdp:SegmentationUnit>lexeme</cmdp:SegmentationUnit>
      <cmdp:SegmentationUnit>other</cmdp:SegmentationUnit>
    </cmdp:SegmentationUnits>
    <cmdp:AnnotationTypes>
      <!-- One annotation type entry covering three annotation levels that share a mode and a tagset. -->
      <cmdp:AnnotationType>
        <cmdp:AnnotationLevelType xml:lang="en">lemmatization</cmdp:AnnotationLevelType>
        <cmdp:AnnotationLevelType xml:lang="en">morphological analysis</cmdp:AnnotationLevelType>
        <cmdp:AnnotationLevelType xml:lang="en">surface syntax annotation</cmdp:AnnotationLevelType>
        <cmdp:AnnotationMode xml:lang="en">semi automatic</cmdp:AnnotationMode>
        <cmdp:TagsetInfo>
          <cmdp:Tagset xml:lang="en">Index Thomisticus Treebank morphological and syntactic tagset</cmdp:Tagset>
        </cmdp:TagsetInfo>
      </cmdp:AnnotationType>
    </cmdp:AnnotationTypes>
    <!-- Annotation tools; only the TrEd entry records a version. -->
    <cmdp:AnnotationToolInfo>
      <cmdp:AnnotationTool xml:lang="en">TrEd</cmdp:AnnotationTool>
      <cmdp:ToolType xml:lang="en">tree editor</cmdp:ToolType>
      <cmdp:Version xml:lang="en">2.0</cmdp:Version>
      <cmdp:Url>http://ufal.mff.cuni.cz/tred/</cmdp:Url>
    </cmdp:AnnotationToolInfo>
    <cmdp:AnnotationToolInfo>
      <cmdp:AnnotationTool xml:lang="en">DeSR</cmdp:AnnotationTool>
      <cmdp:ToolType xml:lang="en">data-driven dependency parser</cmdp:ToolType>
      <cmdp:Version/>
      <cmdp:Url>https://sites.google.com/site/desrparser/</cmdp:Url>
    </cmdp:AnnotationToolInfo>
    <cmdp:AnnotationToolInfo>
      <cmdp:AnnotationTool xml:lang="en">MaltParser</cmdp:AnnotationTool>
      <cmdp:ToolType xml:lang="en">data-driven dependency parser</cmdp:ToolType>
      <cmdp:Version/>
      <cmdp:Url>http://www.maltparser.org/</cmdp:Url>
    </cmdp:AnnotationToolInfo>
    <cmdp:AnnotationToolInfo>
      <cmdp:AnnotationTool xml:lang="en">Hunpos</cmdp:AnnotationTool>
      <cmdp:ToolType xml:lang="en">HMM tagger</cmdp:ToolType>
      <cmdp:Version/>
      <cmdp:Url>http://code.google.com/p/hunpos/</cmdp:Url>
    </cmdp:AnnotationToolInfo>
  </cmdp:Annotation>
  <cmdp:Source>
    <cmdp:OriginalSource xml:lang="la">Index Thomisticus corpus</cmdp:OriginalSource>
    <cmdp:SourceType xml:lang="en">Corpus</cmdp:SourceType>
    <cmdp:MediaFiles>
      <!-- Media file entry with no values filled in apart from the two Unknown markers. -->
      <cmdp:MediaFile>
        <cmdp:CatalogueLink/>
        <cmdp:Type>Unknown</cmdp:Type>
        <cmdp:Quality>Unknown</cmdp:Quality>
        <cmdp:RecordingConditions/>
        <cmdp:Position>
          <cmdp:PositionType/>
          <cmdp:StartPosition/>
          <cmdp:EndPosition/>
        </cmdp:Position>
        <cmdp:Access>
          <cmdp:Contact>
            <cmdp:email/>
            <cmdp:role/>
            <cmdp:Address>
              <cmdp:street/>
              <cmdp:ZIPCode/>
              <cmdp:city/>
            </cmdp:Address>
          </cmdp:Contact>
        </cmdp:Access>
      </cmdp:MediaFile>
    </cmdp:MediaFiles>
  </cmdp:Source>
  <cmdp:Descriptions>
    <!-- Multi-line text value; continuation lines stay flush left so the content is unchanged. -->
    <cmdp:Description xml:lang="en">Syntactic annotation of excerpts from three works of Thomas Aquinas:
(1) Scriptum super Sententiis Magistri Petri Lombardi,
(2) Summa contra Gentiles,
(3) Summa Theologiae </cmdp:Description>
  </cmdp:Descriptions>
</cmdp:Creation>
<!-- Corpus-specific context: corpus type, validation flag, subject language and size figures. -->
<cmdp:TextCorpusContext>
  <cmdp:CorpusType>treebank</cmdp:CorpusType>
  <cmdp:TemporalClassification>historical</cmdp:TemporalClassification>
  <cmdp:Descriptions>
    <!-- Multi-line text value; continuation lines stay flush left so the content is unchanged. -->
    <cmdp:Description xml:lang="en">Dependency-based annotation of excerpts from three works of Thomas Aquinas:
(1) Scriptum super Sententiis Magistri Petri Lombardi,
(2) Summa contra Gentiles,
(3) Summa Theologiae </cmdp:Description>
  </cmdp:Descriptions>
  <cmdp:ValidationGrp>
    <cmdp:Validation>false</cmdp:Validation>
  </cmdp:ValidationGrp>
  <cmdp:SubjectLanguages>
    <cmdp:NumberOfLanguages>1</cmdp:NumberOfLanguages>
    <!-- The single language is flagged as dominant, source and target at the same time. -->
    <cmdp:SubjectLanguage>
      <cmdp:DominantLanguage>true</cmdp:DominantLanguage>
      <cmdp:SourceLanguage>true</cmdp:SourceLanguage>
      <cmdp:TargetLanguage>true</cmdp:TargetLanguage>
      <cmdp:Language>
        <cmdp:LanguageName xml:lang="en">Latin</cmdp:LanguageName>
        <cmdp:ISO639>
          <cmdp:iso-639-3-code>lat</cmdp:iso-639-3-code>
        </cmdp:ISO639>
      </cmdp:Language>
      <cmdp:Descriptions>
        <cmdp:Description xml:lang="en">13th century Church Latin</cmdp:Description>
      </cmdp:Descriptions>
    </cmdp:SubjectLanguage>
  </cmdp:SubjectLanguages>
  <!-- The same resource measured in three units: bytes, sentences and tokens. -->
  <cmdp:TypeSpecificSizeInfo>
    <!-- NOTE(review): this byte figure is far larger than the two per-file sizes recorded under
         ResourceProxyListInfo (7023634 and 3937465); confirm which data it refers to. -->
    <cmdp:TypeSpecificSize>
      <cmdp:Size>462142803</cmdp:Size>
      <cmdp:SizeUnit>byte</cmdp:SizeUnit>
    </cmdp:TypeSpecificSize>
    <cmdp:TypeSpecificSize>
      <cmdp:Size>26831</cmdp:Size>
      <cmdp:SizeUnit>sentences</cmdp:SizeUnit>
    </cmdp:TypeSpecificSize>
    <cmdp:TypeSpecificSize>
      <cmdp:Size>447306</cmdp:Size>
      <cmdp:SizeUnit>tokens</cmdp:SizeUnit>
    </cmdp:TypeSpecificSize>
  </cmdp:TypeSpecificSizeInfo>
</cmdp:TextCorpusContext>
<!-- Access conditions: availability, licence, contact person and the tool named for working with the data. -->
<cmdp:Access>
  <cmdp:Availability xml:lang="en">Free for academic use</cmdp:Availability>
  <cmdp:DistributionMedium xml:lang="en">Digital file</cmdp:DistributionMedium>
  <cmdp:Price xml:lang="en">0</cmdp:Price>
  <cmdp:Licence>CC BY-NC-SA 3.0</cmdp:Licence>
  <cmdp:Contact>
    <cmdp:firstname>Dr. Marco</cmdp:firstname>
    <cmdp:lastname>Passarotti</cmdp:lastname>
    <cmdp:email>marco.passarotti@unicatt.it</cmdp:email>
    <cmdp:telephoneNumber>+39-02-72342380</cmdp:telephoneNumber>
    <cmdp:role>Head of project</cmdp:role>
    <cmdp:Address>
      <cmdp:street>Largo Gemelli, 1</cmdp:street>
      <cmdp:ZIPCode>20123</cmdp:ZIPCode>
      <cmdp:city>Milan, Italy</cmdp:city>
    </cmdp:Address>
  </cmdp:Contact>
  <!-- Same tool, type, version and URL as the TrEd entry listed among the annotation tools. -->
  <cmdp:DeploymentToolInfo>
    <cmdp:DeploymentTool xml:lang="en">TrEd</cmdp:DeploymentTool>
    <cmdp:ToolType xml:lang="en">tree editor</cmdp:ToolType>
    <cmdp:Version xml:lang="en">2.0</cmdp:Version>
    <cmdp:Url>http://ufal.mff.cuni.cz/tred/</cmdp:Url>
  </cmdp:DeploymentToolInfo>
</cmdp:Access>
<!-- Per-file details (file name, size in bytes, checksums) for the file proxies declared in cmd:Resources.
     Each entry is linked to its proxy through the ref attribute in the CMD envelope namespace; the
     cmd prefix bound on the root element is used rather than re-declaring that namespace per element. -->
<cmdp:ResourceProxyListInfo>
  <cmdp:ResourceProxyInfo cmd:ref="IT-TBconlltxt">
    <cmdp:ResProxItemName/>
    <cmdp:ResProxFileName>IT-TB.conll</cmdp:ResProxFileName>
    <cmdp:SizeInfo>
      <cmdp:TotalSize>
        <!-- Size is written without surrounding whitespace so that consumers which do not trim read a clean number. -->
        <cmdp:Size>7023634</cmdp:Size>
        <cmdp:SizeUnit>B</cmdp:SizeUnit>
      </cmdp:TotalSize>
    </cmdp:SizeInfo>
    <cmdp:Checksums>
      <cmdp:md5>48d1ba3cbb900771c1290c288e383429</cmdp:md5>
      <cmdp:sha1>42c2e92a88de6bbe149a445a82a256176216e21a</cmdp:sha1>
      <cmdp:sha256>febeaa5a628406eea7e70079c07f39293d9ab6cf6205eeb6dc6d74ec3a38660f</cmdp:sha256>
    </cmdp:Checksums>
  </cmdp:ResourceProxyInfo>
  <cmdp:ResourceProxyInfo cmd:ref="update-2020targz">
    <cmdp:ResProxItemName/>
    <cmdp:ResProxFileName>update-2020.tar.gz</cmdp:ResProxFileName>
    <cmdp:SizeInfo>
      <cmdp:TotalSize>
        <cmdp:Size>3937465</cmdp:Size>
        <cmdp:SizeUnit>B</cmdp:SizeUnit>
      </cmdp:TotalSize>
    </cmdp:SizeInfo>
    <cmdp:Checksums>
      <cmdp:md5>3843441b2a798765063b651665b968e2</cmdp:md5>
      <cmdp:sha1>e3601369ff96ec7a88a0227ee10e43dd49d9e6b0</cmdp:sha1>
      <cmdp:sha256>4e813f5566a27cdc1d63631c8ba0d00e86b9b86b8cb23e3fe9663aae7ac13b5d</cmdp:sha256>
    </cmdp:Checksums>
  </cmdp:ResourceProxyInfo>
</cmdp:ResourceProxyListInfo>
</cmdp:TextCorpusProfile>
</cmd:Components>
</cmd:CMD>