<OAI-PMH xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://www.openarchives.org/OAI/2.0/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/          http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
  <responseDate>2026-04-23T18:25:41.419Z</responseDate>
  <request verb="GetRecord">https://www.nb.no/sprakbanken/oai</request>
  <GetRecord>
    <record>
      <header>
        <identifier>oai:nb.no:sbr-70</identifier>
        <datestamp/>
      </header>
      <metadata>
        <cmd:CMD xmlns:cmd="http://www.clarin.eu/cmd/1" xmlns="http://www.clarin.eu/cmd/" xmlns:cmdp="http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1407745711925" CMDVersion="1.2" xsi:schemaLocation="http://www.clarin.eu/cmd/1 https://infra.clarin.eu/CMDI/1.x/xsd/cmd-envelop.xsd http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1407745711925 https://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/1.1/profiles/clarin.eu:cr1:p_1407745711925/1.2/xsd">
          <cmd:Header>
            <cmd:MdCreator>Arne Martinus Lindstad</cmd:MdCreator>
            <cmd:MdCreationDate>2021-10-30</cmd:MdCreationDate>
            <cmd:MdSelfLink>https://www.nb.no/sprakbanken/oai?verb=GetRecord&amp;identifier=oai:nb.no:sbr-70&amp;metadataPrefix=cmdi</cmd:MdSelfLink>
            <cmd:MdProfile>clarin.eu:cr1:p_1407745711925</cmd:MdProfile>
            <cmd:MdCollectionDisplayName>Språkbanken NB</cmd:MdCollectionDisplayName>
          </cmd:Header>
          <cmd:Resources>
            <cmd:ResourceProxyList>
              <cmd:ResourceProxy id="ngram_avis1_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-digavis-unigram.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_avis2_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-digavis-bigram.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_avis3_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-digavis-trigram.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_bok1_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-digibok-unigram.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_bok2_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-digibok-bigram.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_bok3_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-digibok-trigram.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_avis_meta_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-metadata-digavis.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_bok_meta_2021">
                <cmd:ResourceType mimetype="application/gzip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-metadata-digibok.csv.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_totals_2021">
                <cmd:ResourceType mimetype="application/json">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-totals.json</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_readme_eng_2021">
                <cmd:ResourceType mimetype="text/markdown">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-README-eng.md</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_readme_nob_2021">
                <cmd:ResourceType mimetype="text/markdown">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/ngram-2021-README-nob.md</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="ngram_doc_2021">
                <cmd:ResourceType mimetype="application/pdf">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/ngram/ngram_2021/2021_NBngram.pdf</cmd:ResourceRef>
              </cmd:ResourceProxy>
            </cmd:ResourceProxyList>
            <cmd:JournalFileProxyList/>
            <cmd:ResourceRelationList/>
          </cmd:Resources>
          <cmd:IsPartOfList/>
          <cmd:Components>
            <cmdp:corpusProfile>
              <cmdp:resourceCommonInfo>
                <cmdp:resourceType>corpus</cmdp:resourceType>
                <cmdp:identificationInfo>
                  <cmdp:resourceName xml:lang="nb">N-grammer fra NBdigital 2021</cmdp:resourceName>
                  <cmdp:resourceName xml:lang="en">N-grams from NBdigital 2021</cmdp:resourceName>
                  <cmdp:description xml:lang="nb">Dette korpuset inneholder n-grammer – unigrammer, bigrammer og trigrammer – fra alle bøker og aviser som var blitt digitalisert ved Nasjonalbiblioteket per juli 2021. N-grammene er laget på basis av et materiale bestående av om lag 580.000 bøker og 3.400.000 aviser, til sammen ca. 122 milliarder "tokens" (ord og tegnsetting). N-grammene finnes på CSV-format (UTF-8-kodert).

Kolonnene i CSV-filene med n-grammer er som følger:
- first - det første ordet i n-grammet (i uni-, bi- og trigrammer)
- second - det andre ordet i n-grammet (i bi- og trigrammer)
- third - det tredje ordet i n-grammet (i trigrammer)
- lang - språkkode for n-grammet (gjelder kun bøker, avisene har ingen språkklassifikasjon per nå)
- freq - den totale frekvensen for n-grammet i samlingen av bøker eller aviser
- json - et dictionary med råfrekvens per år

totals.json inneholder totalfrekvenser innenfor årganger i bok- og aviskorpuset. Med disse kan man lett regne ut relativfrekvenser for sammenlikning på tvers av år som i NB N-gram.

metadata-digibok.csv og metadata-digavis.csv inneholder enkle metadata for alle bøkene og avisene som inngår i bok- og aviskorpuset. Hvis du er interessert i mer utførlige metadata, henviser vi til Oria eller NBs APIer under https://api.nb.no/.

Se dokumentasjonsfilene for mer informasjon.</cmdp:description>
                  <cmdp:description xml:lang="en">This resource contains n-grams - i.e. unigrams, bigrams and trigrams - from all books and newspapers that had been digitized at the National Library of Norway up to July 2021. The n-grams have been extracted from material consisting of approximately 580,000 books and 3,400,000 newspapers, amounting to a total of approximately 122 billion tokens (words and punctuation). The n-grams are offered as CSV files (UTF-8-encoded).

Columns in the n-gram CSV files:
- first - the first word (in uni-, bi- and trigrams)
- second - the second word (in bi- and trigrams)
- third - the third word (in trigrams)
- lang - the language of the n-gram (applies only to books; newspapers have no language classification as of now)
- freq - the total frequency of the n-gram in the collection of books or newspapers
- json - a dictionary with raw frequency for each year

totals.json contains aggregated frequencies per year in the book and newspaper corpora. Using these numbers, relative frequencies can be calculated in order to compare frequencies over time as in NB N-gram.

metadata-digibok.csv and metadata-digavis.csv contain simple metadata for the books and newspapers. If you need more extensive metadata, you could use Oria or the APIs at https://api.nb.no/.

See the documentation files for further information.</cmdp:description>
                  <cmdp:resourceShortName xml:lang="nb">NBngram2021</cmdp:resourceShortName>
                  <cmdp:resourceShortName xml:lang="en">NBngram2021</cmdp:resourceShortName>
                  <cmdp:url cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-70/</cmdp:url>
                  <cmdp:PID cmd:description="handle">hdl:21.11146/70</cmdp:PID>
                  <cmdp:identifier>sbr-70</cmdp:identifier>
                </cmdp:identificationInfo>
                <cmdp:distributionInfo>
                  <cmdp:licenceInfo>
                    <cmdp:userCategory>Public</cmdp:userCategory>
                    <cmdp:distributionAccessMedium>downloadable</cmdp:distributionAccessMedium>
                    <cmdp:downloadLocation cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-70/</cmdp:downloadLocation>
                    <cmdp:licence>
                      <cmdp:licenceFamily>Creative Commons (CC)</cmdp:licenceFamily>
                      <cmdp:licenceName>Creative_Commons-ZERO (CC-ZERO)</cmdp:licenceName>
                      <cmdp:licenceURL>https://creativecommons.org/publicdomain/zero/1.0/</cmdp:licenceURL>
                    </cmdp:licence>
                    <cmdp:licensor>
                      <cmdp:actorInfo>
                        <cmdp:actorType>organization</cmdp:actorType>
                        <cmdp:role xml:lang="en">Licensor</cmdp:role>
                        <cmdp:organizationInfo>
                          <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                          <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                          <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                          <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                          <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                          <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                        </cmdp:organizationInfo>
                        <cmdp:communicationInfo>
                          <cmdp:email>sprakbanken@nb.no</cmdp:email>
                          <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                          <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                          <cmdp:zipCode>0203</cmdp:zipCode>
                          <cmdp:city>Oslo</cmdp:city>
                          <cmdp:region>Oslo</cmdp:region>
                          <cmdp:country>Norway</cmdp:country>
                        </cmdp:communicationInfo>
                      </cmdp:actorInfo>
                    </cmdp:licensor>
                  </cmdp:licenceInfo>
                </cmdp:distributionInfo>
                <cmdp:contact>
                  <cmdp:actorInfo>
                    <cmdp:actorType>organization</cmdp:actorType>
                    <cmdp:role xml:lang="en">Contact</cmdp:role>
                    <cmdp:organizationInfo>
                      <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                      <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                      <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                      <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                      <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                      <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                    </cmdp:organizationInfo>
                    <cmdp:communicationInfo>
                      <cmdp:email>sprakbanken@nb.no</cmdp:email>
                      <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                      <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                      <cmdp:zipCode>0203</cmdp:zipCode>
                      <cmdp:city>Oslo</cmdp:city>
                      <cmdp:region>Oslo</cmdp:region>
                      <cmdp:country>Norway</cmdp:country>
                    </cmdp:communicationInfo>
                  </cmdp:actorInfo>
                </cmdp:contact>
                <cmdp:metadataInfo>
                  <cmdp:metadataCreationDate>2021-10-29</cmdp:metadataCreationDate>
                  <cmdp:metadataLanguageName>English</cmdp:metadataLanguageName>
                  <cmdp:metadataLanguageId>en</cmdp:metadataLanguageId>
                  <cmdp:metadataLastDateUpdated>2023-08-08</cmdp:metadataLastDateUpdated>
                  <cmdp:metadataCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Metadata Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Lindstad</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Arne Martinus</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                      <cmdp:communicationInfo>
                        <cmdp:email>sprakbanken@nb.no</cmdp:email>
                        <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                        <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                        <cmdp:zipCode>0203</cmdp:zipCode>
                        <cmdp:city>Oslo</cmdp:city>
                        <cmdp:region>Oslo</cmdp:region>
                        <cmdp:country>Norway</cmdp:country>
                      </cmdp:communicationInfo>
                    </cmdp:actorInfo>
                  </cmdp:metadataCreator>
                </cmdp:metadataInfo>
                <cmdp:versionInfo>
                  <cmdp:version>2021</cmdp:version>
                  <cmdp:lastDateUpdated>2021-10-28</cmdp:lastDateUpdated>
                </cmdp:versionInfo>
                <cmdp:resourceDocumentationInfo>
                  <cmdp:documentationUnstructured>
                    <cmdp:role>documentation</cmdp:role>
                    <cmdp:documentUnstructured>Documentation files in English and Norwegian. Metadata files accompanying the data.</cmdp:documentUnstructured>
                  </cmdp:documentationUnstructured>
                </cmdp:resourceDocumentationInfo>
                <cmdp:resourceCreationInfo>
                  <cmdp:creationStartDate>2021-06-01</cmdp:creationStartDate>
                  <cmdp:creationEndDate>2021-10-28</cmdp:creationEndDate>
                  <cmdp:resourceCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Resource Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Birkenes</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Magnus Breder</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                      <cmdp:communicationInfo>
                        <cmdp:email>sprakbanken@nb.no</cmdp:email>
                        <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                        <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                        <cmdp:zipCode>0203</cmdp:zipCode>
                        <cmdp:city>Oslo</cmdp:city>
                        <cmdp:region>Oslo</cmdp:region>
                        <cmdp:country>Norway</cmdp:country>
                      </cmdp:communicationInfo>
                    </cmdp:actorInfo>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Resource Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Johnsen</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Lars</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                      <cmdp:communicationInfo>
                        <cmdp:email>sprakbanken@nb.no</cmdp:email>
                        <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                        <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                        <cmdp:zipCode>0203</cmdp:zipCode>
                        <cmdp:city>Oslo</cmdp:city>
                        <cmdp:region>Oslo</cmdp:region>
                        <cmdp:country>Norway</cmdp:country>
                      </cmdp:communicationInfo>
                    </cmdp:actorInfo>
                  </cmdp:resourceCreator>
                </cmdp:resourceCreationInfo>
              </cmdp:resourceCommonInfo>
              <cmdp:corpusInfo>
                <cmdp:corpusType>Ngram Corpus</cmdp:corpusType>
                <cmdp:corpusPartInfo>
                  <cmdp:mediaType>textNgram</cmdp:mediaType>
                  <cmdp:corpusTextNgramInfo>
                    <cmdp:ngramInfo>
                      <cmdp:baseItem>word</cmdp:baseItem>
                      <cmdp:order>3</cmdp:order>
                    </cmdp:ngramInfo>
                    <cmdp:textFormatInfo>
                      <cmdp:mimeType>text/csv</cmdp:mimeType>
                      <cmdp:sizePerTextFormat>
                        <cmdp:sizeInfo>
                          <cmdp:size>8</cmdp:size>
                          <cmdp:sizeUnit>files</cmdp:sizeUnit>
                        </cmdp:sizeInfo>
                        <cmdp:sizeInfo>
                          <cmdp:size>42.1</cmdp:size>
                          <cmdp:sizeUnit>gb</cmdp:sizeUnit>
                        </cmdp:sizeInfo>
                        <cmdp:sizeInfo>
                          <cmdp:size>121834422207</cmdp:size>
                          <cmdp:sizeUnit>tokens</cmdp:sizeUnit>
                        </cmdp:sizeInfo>
                      </cmdp:sizePerTextFormat>
                    </cmdp:textFormatInfo>
                    <cmdp:textFormatInfo>
                      <cmdp:mimeType>application/json</cmdp:mimeType>
                      <cmdp:sizePerTextFormat>
                        <cmdp:sizeInfo>
                          <cmdp:size>1</cmdp:size>
                          <cmdp:sizeUnit>files</cmdp:sizeUnit>
                        </cmdp:sizeInfo>
                        <cmdp:sizeInfo>
                          <cmdp:size>18</cmdp:size>
                          <cmdp:sizeUnit>kb</cmdp:sizeUnit>
                        </cmdp:sizeInfo>
                      </cmdp:sizePerTextFormat>
                    </cmdp:textFormatInfo>
                    <cmdp:characterEncodingInfo>
                      <cmdp:characterEncoding>UTF-8</cmdp:characterEncoding>
                    </cmdp:characterEncodingInfo>
                  </cmdp:corpusTextNgramInfo>
                </cmdp:corpusPartInfo>
                <cmdp:corpusPartGeneralInfo>
                  <cmdp:lingualityInfo>
                    <cmdp:lingualityType>multilingual</cmdp:lingualityType>
                    <cmdp:multilingualityType>other</cmdp:multilingualityType>
                    <cmdp:multilingualityTypeDetails>Independent text in several languages</cmdp:multilingualityTypeDetails>
                  </cmdp:lingualityInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>nb</cmdp:languageId>
                    <cmdp:languageName>Norwegian Bokmål</cmdp:languageName>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>nn</cmdp:languageId>
                    <cmdp:languageName>Norwegian Nynorsk</cmdp:languageName>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>se</cmdp:languageId>
                    <cmdp:languageName>Northern Sami</cmdp:languageName>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>sma</cmdp:languageId>
                    <cmdp:languageName>Southern Sami</cmdp:languageName>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>smj</cmdp:languageId>
                    <cmdp:languageName>Lule Sami</cmdp:languageName>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>fkv</cmdp:languageId>
                    <cmdp:languageName>Kven</cmdp:languageName>
                  </cmdp:languageInfo>
                  <cmdp:modalityInfo>
                    <cmdp:modalityType>writtenLanguage</cmdp:modalityType>
                    <cmdp:modalityTypeDetails>Text from digitized books and newspapers.</cmdp:modalityTypeDetails>
                    <cmdp:sizePerModality>
                      <cmdp:sizeInfo>
                        <cmdp:size>121834422207</cmdp:size>
                        <cmdp:sizeUnit>tokens</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>3980000</cmdp:size>
                        <cmdp:sizeUnit>texts</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerModality>
                  </cmdp:modalityInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>121834422207</cmdp:size>
                    <cmdp:sizeUnit>tokens</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>3980000</cmdp:size>
                    <cmdp:sizeUnit>texts</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:timeCoverageInfo>
                    <cmdp:timeCoverage>1800-2021</cmdp:timeCoverage>
                  </cmdp:timeCoverageInfo>
                </cmdp:corpusPartGeneralInfo>
              </cmdp:corpusInfo>
            </cmdp:corpusProfile>
          </cmd:Components>
        </cmd:CMD>
      </metadata>
    </record>
  </GetRecord>
</OAI-PMH>