<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
<cmd:CMD xmlns:cmd="http://www.clarin.eu/cmd/1"
        xmlns:cmdp="http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1527668176047"
        xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        CMDVersion="1.2"
        xsi:schemaLocation="http://www.clarin.eu/cmd/1 https://infra.clarin.eu/CMDI/1.x/xsd/cmd-envelop.xsd http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1527668176047 https://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/1.x/profiles/clarin.eu:cr1:p_1527668176047/xsd">

    <!-- Record header: names the generating tool, the creation date, the record's
         own handle, the profile in use, and the collection display name. -->
    <cmd:Header>
        <cmd:MdCreator>SAW Leipzig CMDI Creator 3.0</cmd:MdCreator>
        <cmd:MdCreationDate>2022-05-04</cmd:MdCreationDate>
        <!-- Same handle as cmdp:Id in the Components section, here with the hdl: prefix. -->
        <cmd:MdSelfLink>hdl:11022/0000-0007-D396-1</cmd:MdSelfLink>
        <!-- Same profile ID as in the root element's cmdp namespace URI and xsi:schemaLocation. -->
        <cmd:MdProfile>clarin.eu:cr1:p_1527668176047</cmd:MdProfile>
        <cmd:MdCollectionDisplayName>Leipzig Corpora Collection</cmd:MdCollectionDisplayName>
    </cmd:Header>

    <!-- Resource section: lists every external resource attached to this record.
         All proxy ids share the stem "saw-1102200000007D3961-" plus a role suffix. -->
    <cmd:Resources>
        <cmd:ResourceProxyList>
            <!-- Landing page of the corpus in the repository. -->
            <cmd:ResourceProxy id="saw-1102200000007D3961-landingpage">
                <cmd:ResourceType mimetype="text/html">LandingPage</cmd:ResourceType>
                <cmd:ResourceRef>https://repo.data.saw-leipzig.de/resources?identifier=lcc/corpora/1102200000007D3961</cmd:ResourceRef>
            </cmd:ResourceProxy>

            <!-- Three entries typed SearchPage (all declared as text/html). -->
            <cmd:ResourceProxy id="saw-1102200000007D3961-searchpage">
                <cmd:ResourceType mimetype="text/html">SearchPage</cmd:ResourceType>
                <cmd:ResourceRef>https://dict.wortschatz-leipzig.de/de?corpusId=xho_community_2019</cmd:ResourceRef>
            </cmd:ResourceProxy>
            <cmd:ResourceProxy id="saw-1102200000007D3961-rest">
                <cmd:ResourceType mimetype="text/html">SearchPage</cmd:ResourceType>
                <cmd:ResourceRef>https://api.wortschatz-leipzig.de/ws</cmd:ResourceRef>
            </cmd:ResourceProxy>
            <cmd:ResourceProxy id="saw-1102200000007D3961-nse">
                <cmd:ResourceType mimetype="text/html">SearchPage</cmd:ResourceType>
                <cmd:ResourceRef>https://text.wortschatz-leipzig.de/#dashboard?corpname=xho_community_2019</cmd:ResourceRef>
            </cmd:ResourceProxy>

            <!-- Search service endpoint, declared with mimetype application/sru+xml. -->
            <cmd:ResourceProxy id="saw-1102200000007D3961-searchservice">
                <cmd:ResourceType mimetype="application/sru+xml">SearchService</cmd:ResourceType>
                <cmd:ResourceRef>https://fcs.data.saw-leipzig.de/lcc</cmd:ResourceRef>
            </cmd:ResourceProxy>

            <!-- Entries typed Resource: the files, words and conllu paths of the corpus. -->
            <cmd:ResourceProxy id="saw-1102200000007D3961-files">
                <cmd:ResourceType mimetype="application/zstd">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://repo.data.saw-leipzig.de/resources?identifier=lcc/corpora/1102200000007D3961/files</cmd:ResourceRef>
            </cmd:ResourceProxy>
            <cmd:ResourceProxy id="saw-1102200000007D3961-words">
                <cmd:ResourceType mimetype="text/tab-separated-values">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://repo.data.saw-leipzig.de/resources?identifier=lcc/corpora/1102200000007D3961/words</cmd:ResourceRef>
            </cmd:ResourceProxy>
            <cmd:ResourceProxy id="saw-1102200000007D3961-conllu">
                <cmd:ResourceType mimetype="application/zstd">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://repo.data.saw-leipzig.de/resources?identifier=lcc/corpora/1102200000007D3961/conllu</cmd:ResourceRef>
            </cmd:ResourceProxy>
        </cmd:ResourceProxyList>
        <!-- No journal files and no resource relations are recorded for this corpus. -->
        <cmd:JournalFileProxyList/>
        <cmd:ResourceRelationList/>
    </cmd:Resources>

    <!-- Profile payload: the descriptive metadata of the corpus itself. -->
    <cmd:Components>
        <cmdp:LCC_CorpusProfile ProfileId="clarin.eu:cr1:p_1527668176047">
            <cmdp:LCC_Corpus cmd:ComponentId="clarin.eu:cr1:c_1527668176044">
                <!-- Same handle as cmd:MdSelfLink in the Header, without the hdl: prefix. -->
                <cmdp:Id>11022/0000-0007-D396-1</cmdp:Id>
                <cmdp:Name>Xhosa community corpus from 2019 (xho_community_2019)</cmdp:Name>
                <!-- The descriptions (en, de) carry an escaped br tag and a literal newline as part
                     of their text value; do not re-wrap or re-indent the continuation lines. -->
                <cmdp:Description xml:lang="en">Xhosa community corpus based on material from 2019 created in the project &quot;Deutscher Wortschatz&quot; or &quot;Leipzig Corpora Collection&quot;.
&lt;br&gt;The project regularly collects and processes available documents from the Internet (typically in an annual cycle) and other sources. The results are corpora and corpora-based dictionaries for more than 250 languages, which provide statistical information about almost each word, example sentences and links to related words. Because of the huge amount of used text material containing several million sentences, information about almost every word can be provided. The service ranks among the most comprehensive information systems about the German language and provides the largest freely available amounts of data for many other languages.</cmdp:Description>
                <cmdp:Description xml:lang="de">Xhosa Community-Korpus basierend auf Texten von 2019 erstellt im Rahmen des Projektes &quot;Deutscher Wortschatz&quot; bzw. &quot;Wortschatz Leipzig&quot;.
&lt;br&gt;Das Projekt sammelt regelmäßig (meist jährlich) frei verfügbare Dokumente im Internet und aus anderen Quellen und bereitet diese auf. Das Ergebnis sind Korpora und korpusbasierte Wörterbücher für über 250 Sprachen, in denen zu jedem Wort statistische Angaben, Beispielsätze und Links zu verwandten Wörtern verfügbar sind. Das Angebot zählt zu den umfangreichsten Informationssystemen zur deutschen Sprache und stellt für viele weitere Sprachen die jeweils größten frei verfügbaren Datenmengen bereit.</cmdp:Description>
                <cmdp:Version>1.0</cmdp:Version>
                <cmdp:ResponsibleOrganisation>Saxon Academy of Sciences and Humanities in Leipzig</cmdp:ResponsibleOrganisation>
                <cmdp:Contacts>
                    <cmdp:Contact>
                        <cmdp:Person>CLARIN Center Leipzig Staff</cmdp:Person>
                        <cmdp:Role>Technical contact</cmdp:Role>
                        <cmdp:Email>clarin@saw-leipzig.de</cmdp:Email>
                        <cmdp:Organisation>Saxon Academy of Sciences and Humanities in Leipzig</cmdp:Organisation>
                        <cmdp:Url>https://repo.data.saw-leipzig.de</cmdp:Url>
                    </cmdp:Contact>
                </cmdp:Contacts>
                <!-- Types lists a resource category plus the two mimetypes that the
                     Resource-typed proxies in cmd:Resources declare. -->
                <cmdp:Types>
                    <cmdp:Type>Written corpus</cmdp:Type>
                    <cmdp:Type>text/tab-separated-values</cmdp:Type>
                    <cmdp:Type>application/zstd</cmdp:Type>
                </cmdp:Types>
                <cmdp:Genres>
                    <cmdp:Genre>community text</cmdp:Genre>
                </cmdp:Genres>
                <cmdp:Annotations>
                    <cmdp:Annotation>tokenized text</cmdp:Annotation>
                    <cmdp:Annotation>word cooccurrences</cmdp:Annotation>
                </cmdp:Annotations>
                <cmdp:TextKeywords>
                    <cmdp:TextKeyword>Xhosa</cmdp:TextKeyword>
                    <cmdp:TextKeyword>community</cmdp:TextKeyword>
                    <cmdp:TextKeyword>Corpus</cmdp:TextKeyword>
                </cmdp:TextKeywords>
                <cmdp:Language>
                    <cmdp:LanguageName>Xhosa</cmdp:LanguageName>
                    <cmdp:ISO639>
                        <cmdp:iso-639-3-code>xho</cmdp:iso-639-3-code>
                    </cmdp:ISO639>
                </cmdp:Language>
                <cmdp:License>
                    <cmdp:DistributionType>public</cmdp:DistributionType>
                    <cmdp:LicenseName>CC BY-NC</cmdp:LicenseName>
                    <cmdp:LicenseURL>https://creativecommons.org/licenses/by-nc/4.0/</cmdp:LicenseURL>
                </cmdp:License>
                <cmdp:TimeCoverage>
                    <cmdp:TimeCoverageBegin>2009-04-02</cmdp:TimeCoverageBegin>
                    <cmdp:TimeCoverageEnd>2019-03-28</cmdp:TimeCoverageEnd>
                </cmdp:TimeCoverage>
                <!-- Corpus size stated in three units: sentences, tokens and types. -->
                <cmdp:Size>
                    <cmdp:TotalSize>
                        <cmdp:Number>63387</cmdp:Number>
                        <cmdp:SizeUnit>number of sentences</cmdp:SizeUnit>
                    </cmdp:TotalSize>
                    <cmdp:TotalSize>
                        <cmdp:Number>805022</cmdp:Number>
                        <cmdp:SizeUnit>number of tokens</cmdp:SizeUnit>
                    </cmdp:TotalSize>
                    <cmdp:TotalSize>
                        <cmdp:Number>172484</cmdp:Number>
                        <cmdp:SizeUnit>number of types</cmdp:SizeUnit>
                    </cmdp:TotalSize>
                </cmdp:Size>
            </cmdp:LCC_Corpus>
        </cmdp:LCC_CorpusProfile>
    </cmd:Components>
</cmd:CMD>