<OAI-PMH xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://www.openarchives.org/OAI/2.0/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/          http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
  <responseDate>2026-04-04T21:49:28.334Z</responseDate>
  <request verb="GetRecord">https://www.nb.no/sprakbanken/oai</request>
  <GetRecord>
    <record>
      <header>
        <identifier>oai:nb.no:sbr-4</identifier>
        <datestamp/>
      </header>
      <metadata>
        <cmd:CMD xmlns:cmd="http://www.clarin.eu/cmd/1" xmlns="http://www.clarin.eu/cmd/" xmlns:cmdp="http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1407745711925" CMDVersion="1.2" xsi:schemaLocation="http://www.clarin.eu/cmd/1 https://infra.clarin.eu/CMDI/1.x/xsd/cmd-envelop.xsd http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1407745711925 https://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/1.1/profiles/clarin.eu:cr1:p_1407745711925/1.2/xsd">
          <cmd:Header>
            <cmd:MdCreator>Arne Martinus Lindstad</cmd:MdCreator>
            <cmd:MdCreationDate>2021-06-18</cmd:MdCreationDate>
            <cmd:MdSelfLink>https://www.nb.no/sprakbanken/oai?verb=GetRecord&amp;identifier=oai:nb.no:sbr-4&amp;metadataPrefix=cmdi</cmd:MdSelfLink>
            <cmd:MdProfile>clarin.eu:cr1:p_1407745711925</cmd:MdProfile>
            <cmd:MdCollectionDisplayName>Språkbanken NB</cmd:MdCollectionDisplayName>
          </cmd:Header>
          <cmd:Resources>
            <cmd:ResourceProxyList>
              <cmd:ResourceProxy id="nnc_1998_2011">
                <cmd:ResourceType mimetype="application/zip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/norsk_aviskorpus.zip</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2012">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2012.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2013">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2013.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2014">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2014.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2015">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2015.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2016">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2016.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2017">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2017.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2018">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2018.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_2019">
                <cmd:ResourceType mimetype="application/tar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/nak_2019.tar</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nno_tok">
                <cmd:ResourceType mimetype="application/zip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/norsk_aviskorpus_nno_tok.zip</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nob_tok">
                <cmd:ResourceType mimetype="application/zip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/norsk_aviskorpus_nob_tok.zip</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_doc_1998_2011">
                <cmd:ResourceType mimetype="application/pdf">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/dok/nak_1998_2011.pdf</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="nnc_doc_2012_2019">
                <cmd:ResourceType mimetype="application/pdf">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/dok/nak_2012_2019.pdf</cmd:ResourceRef>
              </cmd:ResourceProxy>
            </cmd:ResourceProxyList>
            <cmd:JournalFileProxyList/>
            <cmd:ResourceRelationList>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
            </cmd:ResourceRelationList>
          </cmd:Resources>
          <cmd:IsPartOfList/>
          <cmd:Components>
            <cmdp:corpusProfile>
              <cmdp:resourceCommonInfo>
                <cmdp:resourceType>corpus</cmdp:resourceType>
                <cmdp:identificationInfo>
                  <cmdp:resourceName xml:lang="nb">Norsk aviskorpus</cmdp:resourceName>
                  <cmdp:resourceName xml:lang="en">Norwegian Newspaper Corpus</cmdp:resourceName>
                  <cmdp:description xml:lang="nb">Norsk aviskorpus var et prosjekt ved Universitetet i Bergen der man trålet nyhetsnettsteder etter nyhetsartikler.

Denne versjonen av Norsk aviskorpus består av tekst fra perioden 1998 til og med 2019. Korpuset inneholder om lag 1,68 milliarder ord for bokmål og 68 millioner ord for nynorsk.

Det finnes også en forenklet versjon av korpuset for tekstene fra perioden 1998-2011. Her er alle setningsdubletter fjernet, og setningene er sortert alfabetisk. Setningene er separert med s-tagger.

Tekstene fra 1998-2011 er samlet i en felles nedlastbar fil, ellers foreligger dataene som en fil per år. Se dokumentasjonsfilene for en beskrivelse av innholdet og filformater.</cmdp:description>
                  <cmdp:description xml:lang="en">The Norwegian Newspaper Corpus was a project at the University of Bergen where news websites were crawled for news articles.

This version of The Norwegian Newspaper Corpus consists of text from 1998 to 2019. The corpus contains approximately 1.68 billion words for Norwegian Bokmål, and about 68 million words for Norwegian Nynorsk.

There is also a simplified version of the corpus available (1998-2011), where duplicate sentences have been removed and the sentences are ordered alphabetically.

The texts from 1998-2011 are collected in a single downloadable file, otherwise the data are structured as one file per year. See the documentation files for a description of the content and file formats.</cmdp:description>
                  <cmdp:url cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-4/</cmdp:url>
                  <cmdp:PID cmd:description="hdl">hdl:21.11146/4</cmdp:PID>
                  <cmdp:identifier>sbr-4</cmdp:identifier>
                </cmdp:identificationInfo>
                <cmdp:distributionInfo>
                  <cmdp:licenceInfo>
                    <cmdp:userCategory>Public</cmdp:userCategory>
                    <cmdp:distributionAccessMedium>downloadable</cmdp:distributionAccessMedium>
                    <cmdp:downloadLocation cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-4/</cmdp:downloadLocation>
                    <cmdp:attributionText xml:lang="en">We hereby credit the individual publishers for making their texts available for language technology purposes. The copyright of the texts in this corpus remains with the individual publisher.</cmdp:attributionText>
                    <cmdp:licence>
                      <cmdp:licenceFamily>Creative Commons (CC)</cmdp:licenceFamily>
                      <cmdp:licenceName>Creative_Commons-BY-NC (CC-BY-NC)</cmdp:licenceName>
                      <cmdp:licenceURL>https://creativecommons.org/licenses/by-nc/4.0/</cmdp:licenceURL>
                      <cmdp:conditionsOfUse>BY</cmdp:conditionsOfUse>
                      <cmdp:conditionsOfUse>NC</cmdp:conditionsOfUse>
                      <cmdp:conditionsOfUse>*</cmdp:conditionsOfUse>
                      <cmdp:nonStandardConditionsOfUse>* NORED * No redistribution. The licence is motivated by the need to block the possibility of third parties redistributing the original texts for commercial purposes. Note that machine learned models, extracted lexicons, embeddings, and similar resources that are created on the basis of The Norwegian Newspaper Corpus are not considered to contain the original data and so can be freely used also for commercial purposes despite the non-commercial condition.</cmdp:nonStandardConditionsOfUse>
                    </cmdp:licence>
                    <cmdp:licensor>
                      <cmdp:actorInfo>
                        <cmdp:actorType>organization</cmdp:actorType>
                        <cmdp:role xml:lang="en">Licensor</cmdp:role>
                        <cmdp:organizationInfo>
                          <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                          <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                          <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                          <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                          <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                          <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                        </cmdp:organizationInfo>
                        <cmdp:communicationInfo>
                          <cmdp:email>sprakbanken@nb.no</cmdp:email>
                          <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                          <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                          <cmdp:zipCode>0203</cmdp:zipCode>
                          <cmdp:city>Oslo</cmdp:city>
                          <cmdp:region>Oslo</cmdp:region>
                          <cmdp:country>Norway</cmdp:country>
                        </cmdp:communicationInfo>
                      </cmdp:actorInfo>
                    </cmdp:licensor>
                    <cmdp:distributionRightsHolder>
                      <cmdp:actorInfo>
                        <cmdp:actorType>organization</cmdp:actorType>
                        <cmdp:role>Distribution Rights Holder</cmdp:role>
                        <cmdp:organizationInfo>
                          <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                          <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                          <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                          <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                          <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                          <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                        </cmdp:organizationInfo>
                        <cmdp:communicationInfo>
                          <cmdp:email>sprakbanken@nb.no</cmdp:email>
                          <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                          <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                          <cmdp:zipCode>0203</cmdp:zipCode>
                          <cmdp:city>Oslo</cmdp:city>
                          <cmdp:region>Oslo</cmdp:region>
                          <cmdp:country>Norway</cmdp:country>
                        </cmdp:communicationInfo>
                      </cmdp:actorInfo>
                    </cmdp:distributionRightsHolder>
                  </cmdp:licenceInfo>
                </cmdp:distributionInfo>
                <cmdp:contact>
                  <cmdp:actorInfo>
                    <cmdp:actorType>organization</cmdp:actorType>
                    <cmdp:role xml:lang="en">Contact</cmdp:role>
                    <cmdp:organizationInfo>
                      <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                      <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                      <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                      <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                      <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                      <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                    </cmdp:organizationInfo>
                    <cmdp:communicationInfo>
                      <cmdp:email>sprakbanken@nb.no</cmdp:email>
                      <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                      <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                      <cmdp:zipCode>0203</cmdp:zipCode>
                      <cmdp:city>Oslo</cmdp:city>
                      <cmdp:region>Oslo</cmdp:region>
                      <cmdp:country>Norway</cmdp:country>
                    </cmdp:communicationInfo>
                  </cmdp:actorInfo>
                </cmdp:contact>
                <cmdp:metadataInfo>
                  <cmdp:metadataCreationDate>2016-02-04</cmdp:metadataCreationDate>
                  <cmdp:metadataLanguageName>English</cmdp:metadataLanguageName>
                  <cmdp:metadataLanguageId>en</cmdp:metadataLanguageId>
                  <cmdp:metadataLastDateUpdated>2023-06-22</cmdp:metadataLastDateUpdated>
                  <cmdp:metadataCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Metadata Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Birkenes</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Magnus Breder</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                    </cmdp:actorInfo>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Metadata Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Lindstad</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Arne Martinus</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                    </cmdp:actorInfo>
                  </cmdp:metadataCreator>
                </cmdp:metadataInfo>
                <cmdp:versionInfo>
                  <cmdp:version>2020</cmdp:version>
                  <cmdp:revision>Texts from 2015-2019 added to the corpus</cmdp:revision>
                  <cmdp:lastDateUpdated>2020-04-20</cmdp:lastDateUpdated>
                </cmdp:versionInfo>
                <cmdp:validationInfo>
                  <cmdp:validated>false</cmdp:validated>
                </cmdp:validationInfo>
                <cmdp:resourceDocumentationInfo>
                  <cmdp:documentationUnstructured>
                    <cmdp:role>documentation</cmdp:role>
                    <cmdp:documentUnstructured>Documentation files describing the content, structure and file formats of the resource.</cmdp:documentUnstructured>
                  </cmdp:documentationUnstructured>
                </cmdp:resourceDocumentationInfo>
                <cmdp:resourceCreationInfo>
                  <cmdp:creationStartDate>1998-01-01</cmdp:creationStartDate>
                  <cmdp:creationEndDate>2020-04-20</cmdp:creationEndDate>
                  <cmdp:resourceCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Resource Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Hofland</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Knut</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="nb">Universitetet i Bergen</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="en">University of Bergen</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="nb">UiB</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="en">UiB</cmdp:organizationShortName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                    </cmdp:actorInfo>
                  </cmdp:resourceCreator>
                </cmdp:resourceCreationInfo>
              </cmdp:resourceCommonInfo>
              <cmdp:corpusInfo>
                <cmdp:corpusType>Written Corpus</cmdp:corpusType>
                <cmdp:corpusPartInfo>
                  <cmdp:mediaType>text</cmdp:mediaType>
                </cmdp:corpusPartInfo>
                <cmdp:corpusPartGeneralInfo>
                  <cmdp:lingualityInfo>
                    <cmdp:lingualityType>bilingual</cmdp:lingualityType>
                    <cmdp:multilingualityType>multilingualSingleText</cmdp:multilingualityType>
                    <cmdp:multilingualityTypeDetails>News text in Norwegian Bokmål and Norwegian Nynorsk</cmdp:multilingualityTypeDetails>
                  </cmdp:lingualityInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>nb</cmdp:languageId>
                    <cmdp:languageName>Norwegian Bokmål</cmdp:languageName>
                    <cmdp:sizePerLanguage>
                      <cmdp:sizeInfo>
                        <cmdp:size>1680000000</cmdp:size>
                        <cmdp:sizeUnit>words</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerLanguage>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>nn</cmdp:languageId>
                    <cmdp:languageName>Norwegian Nynorsk</cmdp:languageName>
                    <cmdp:sizePerLanguage>
                      <cmdp:sizeInfo>
                        <cmdp:size>68000000</cmdp:size>
                        <cmdp:sizeUnit>words</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerLanguage>
                  </cmdp:languageInfo>
                  <cmdp:modalityInfo>
                    <cmdp:modalityType>writtenLanguage</cmdp:modalityType>
                  </cmdp:modalityInfo>
                  <cmdp:timeCoverageInfo>
                    <cmdp:timeCoverage>1998-2019</cmdp:timeCoverage>
                  </cmdp:timeCoverageInfo>
                  <cmdp:creationInfo>
                    <cmdp:creationMode>mixed</cmdp:creationMode>
                    <cmdp:creationModeDetails>Crawling news websites, with post-processing.</cmdp:creationModeDetails>
                  </cmdp:creationInfo>
                </cmdp:corpusPartGeneralInfo>
              </cmdp:corpusInfo>
            </cmdp:corpusProfile>
          </cmd:Components>
        </cmd:CMD>
      </metadata>
    </record>
  </GetRecord>
</OAI-PMH>