<OAI-PMH xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://www.openarchives.org/OAI/2.0/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/          http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
  <responseDate>2026-04-24T06:14:10.032Z</responseDate>
  <request verb="GetRecord">https://www.nb.no/sprakbanken/oai</request>
  <GetRecord>
    <record>
      <header>
        <identifier>oai:nb.no:sbr-68</identifier>
        <datestamp/>
      </header>
      <metadata>
        <cmd:CMD xmlns:cmd="http://www.clarin.eu/cmd/1" xmlns="http://www.clarin.eu/cmd/" xmlns:cmdp="http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1407745711925" CMDVersion="1.2" xsi:schemaLocation="http://www.clarin.eu/cmd/1 https://infra.clarin.eu/CMDI/1.x/xsd/cmd-envelop.xsd http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1407745711925 https://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/1.1/profiles/clarin.eu:cr1:p_1407745711925/1.2/xsd">
          <cmd:Header>
            <cmd:MdCreator>Arne Martinus Lindstad</cmd:MdCreator>
            <cmd:MdCreationDate>2021-10-01</cmd:MdCreationDate>
            <cmd:MdSelfLink>https://www.nb.no/sprakbanken/oai?verb=GetRecord&amp;identifier=oai:nb.no:sbr-68&amp;metadataPrefix=cmdi</cmd:MdSelfLink>
            <cmd:MdProfile>clarin.eu:cr1:p_1407745711925</cmd:MdProfile>
            <cmd:MdCollectionDisplayName>Språkbanken NB</cmd:MdCollectionDisplayName>
          </cmd:Header>
          <cmd:Resources>
            <cmd:ResourceProxyList>
              <cmd:ResourceProxy id="offweb">
                <cmd:ResourceType mimetype="application/zip">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/tekst/20180402_offweb.zip</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="offweb_doc">
                <cmd:ResourceType mimetype="application/pdf">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/dok/20180402_offweb.pdf</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="offweb_report">
                <cmd:ResourceType mimetype="application/pdf">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/dok/20180402_report.pdf</cmd:ResourceRef>
              </cmd:ResourceProxy>
            </cmd:ResourceProxyList>
            <cmd:JournalFileProxyList/>
            <cmd:ResourceRelationList>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
            </cmd:ResourceRelationList>
          </cmd:Resources>
          <cmd:IsPartOfList/>
          <cmd:Components>
            <cmdp:corpusProfile>
              <cmdp:resourceCommonInfo>
                <cmdp:resourceType>corpus</cmdp:resourceType>
                <cmdp:identificationInfo>
                  <cmdp:resourceName xml:lang="en">Norwegian-English Parallel Corpus from Public Web Sites</cmdp:resourceName>
                  <cmdp:resourceName xml:lang="nn">Norsk-engelsk parallellkorpus frå offentlege nettstadar</cmdp:resourceName>
                  <cmdp:description xml:lang="en">This is a sentence-aligned parallel corpus built from the public web sites www.nav.no, www.nyinorge.no and skatteetaten.no. These web sites provide information in both Norwegian Bokmål and Nynorsk, and parts of this are translated into English. The material is split into two corpora, one for Norwegian Bokmål-English, and one for Norwegian Nynorsk-English. Only sentences with a corresponding translation are included in the corpora.

The corpora were made by Paul Meurer and Andrew Salway at the University of Bergen for the Language Bank. See the attached report for a description of how this was done.

The corpora are also available at the Clarino Bergen Centre's corpus management and analysis system Corpuscle (https://clarino.uib.no/korpuskel/).</cmdp:description>
                  <cmdp:description xml:lang="nn">Dette er eit parallellkorpus laga med utgangspunkt i tekster frå dei offentlege nettstadane www.nav.no, www.nyinorge.no og skatteetaten.no. Desse nettstadane publiserer informasjon på både bokmål og nynorsk, og delar av dette vert omsett til engelsk. Materialet er delt i to korpus, eitt for bokmål-engelsk, og eitt for nynorsk-engelsk. Berre material med ei tilsvarande engelsk omsetjing er inkludert i korpusa.

Korpusa vart laga for Språkbanken av Paul Meurer og Andrew Salway ved Universitetet i Bergen. Rapporten for korleis dei gjekk fram ligg ved korpuset.

Korpusa er òg tilgjengelege i korpushandsamingssystemet Korpuskel ved Clarino Bergen Centre (https://clarino.uib.no/korpuskel/).</cmdp:description>
                  <cmdp:url cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-68/</cmdp:url>
                  <cmdp:PID cmd:description="handle">hdl:21.11146/68</cmdp:PID>
                  <cmdp:identifier>sbr-68</cmdp:identifier>
                </cmdp:identificationInfo>
                <cmdp:distributionInfo>
                  <cmdp:licenceInfo>
                    <cmdp:userCategory>Public</cmdp:userCategory>
                    <cmdp:distributionAccessMedium>downloadable</cmdp:distributionAccessMedium>
                    <cmdp:downloadLocation cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-68/</cmdp:downloadLocation>
                    <cmdp:licence>
                      <cmdp:licenceFamily>Creative Commons (CC)</cmdp:licenceFamily>
                      <cmdp:licenceName>Creative_Commons-BY (CC-BY)</cmdp:licenceName>
                      <cmdp:licenceURL>https://creativecommons.org/licenses/by/4.0/</cmdp:licenceURL>
                      <cmdp:conditionsOfUse>BY</cmdp:conditionsOfUse>
                    </cmdp:licence>
                    <cmdp:licensor>
                      <cmdp:actorInfo>
                        <cmdp:actorType>organization</cmdp:actorType>
                        <cmdp:role xml:lang="en">Licensor</cmdp:role>
                        <cmdp:organizationInfo>
                          <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                          <cmdp:organizationName xml:lang="nn">Nasjonalbiblioteket</cmdp:organizationName>
                          <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                          <cmdp:organizationShortName xml:lang="nn">NB</cmdp:organizationShortName>
                          <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          <cmdp:departmentName xml:lang="nn">Språkbanken</cmdp:departmentName>
                        </cmdp:organizationInfo>
                        <cmdp:communicationInfo>
                          <cmdp:email>sprakbanken@nb.no</cmdp:email>
                          <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                          <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                          <cmdp:zipCode>0203</cmdp:zipCode>
                          <cmdp:city>Oslo</cmdp:city>
                          <cmdp:region>Oslo</cmdp:region>
                          <cmdp:country>Norway</cmdp:country>
                        </cmdp:communicationInfo>
                      </cmdp:actorInfo>
                    </cmdp:licensor>
                    <cmdp:distributionRightsHolder>
                      <cmdp:actorInfo>
                        <cmdp:actorType>organization</cmdp:actorType>
                        <cmdp:role xml:lang="en">Distribution Rights Holder</cmdp:role>
                        <cmdp:organizationInfo>
                          <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                          <cmdp:organizationName xml:lang="nn">Nasjonalbiblioteket</cmdp:organizationName>
                          <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                          <cmdp:organizationShortName xml:lang="nn">NB</cmdp:organizationShortName>
                          <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          <cmdp:departmentName xml:lang="nn">Språkbanken</cmdp:departmentName>
                        </cmdp:organizationInfo>
                        <cmdp:communicationInfo>
                          <cmdp:email>sprakbanken@nb.no</cmdp:email>
                          <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                          <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                          <cmdp:zipCode>0203</cmdp:zipCode>
                          <cmdp:city>Oslo</cmdp:city>
                          <cmdp:region>Oslo</cmdp:region>
                          <cmdp:country>Norway</cmdp:country>
                        </cmdp:communicationInfo>
                      </cmdp:actorInfo>
                    </cmdp:distributionRightsHolder>
                  </cmdp:licenceInfo>
                </cmdp:distributionInfo>
                <cmdp:contact>
                  <cmdp:actorInfo>
                    <cmdp:actorType>organization</cmdp:actorType>
                    <cmdp:role xml:lang="en">Contact</cmdp:role>
                    <cmdp:organizationInfo>
                      <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                      <cmdp:organizationName xml:lang="nn">Nasjonalbiblioteket</cmdp:organizationName>
                      <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                      <cmdp:organizationShortName xml:lang="nn">NB</cmdp:organizationShortName>
                      <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                      <cmdp:departmentName xml:lang="nn">Språkbanken</cmdp:departmentName>
                    </cmdp:organizationInfo>
                    <cmdp:communicationInfo>
                      <cmdp:email>sprakbanken@nb.no</cmdp:email>
                      <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                      <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                      <cmdp:zipCode>0203</cmdp:zipCode>
                      <cmdp:city>Oslo</cmdp:city>
                      <cmdp:region>Oslo</cmdp:region>
                      <cmdp:country>Norway</cmdp:country>
                    </cmdp:communicationInfo>
                  </cmdp:actorInfo>
                </cmdp:contact>
                <cmdp:metadataInfo>
                  <cmdp:metadataCreationDate>2021-10-01</cmdp:metadataCreationDate>
                  <cmdp:metadataLanguageName>English</cmdp:metadataLanguageName>
                  <cmdp:metadataLanguageId>en</cmdp:metadataLanguageId>
                  <cmdp:metadataLastDateUpdated>2023-08-08</cmdp:metadataLastDateUpdated>
                  <cmdp:metadataCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Metadata Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nn">Lindstad</cmdp:surname>
                        <cmdp:givenName xml:lang="nn">Arne Martinus</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="nn">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="nn">NB</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="nn">Språkbanken</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                      <cmdp:communicationInfo>
                        <cmdp:email>sprakbanken@nb.no</cmdp:email>
                        <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                        <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                        <cmdp:zipCode>0203</cmdp:zipCode>
                        <cmdp:city>Oslo</cmdp:city>
                        <cmdp:region>Oslo</cmdp:region>
                        <cmdp:country>Norway</cmdp:country>
                      </cmdp:communicationInfo>
                    </cmdp:actorInfo>
                  </cmdp:metadataCreator>
                </cmdp:metadataInfo>
                <cmdp:versionInfo>
                  <cmdp:version>1</cmdp:version>
                  <cmdp:lastDateUpdated>2018-04-02</cmdp:lastDateUpdated>
                </cmdp:versionInfo>
                <cmdp:validationInfo>
                  <cmdp:validated>true</cmdp:validated>
                  <cmdp:validationType>formal</cmdp:validationType>
                  <cmdp:validationMode>automatic</cmdp:validationMode>
                  <cmdp:validationExtent>full</cmdp:validationExtent>
                </cmdp:validationInfo>
                <cmdp:resourceDocumentationInfo>
                  <cmdp:documentationUnstructured>
                    <cmdp:role>documentation</cmdp:role>
                    <cmdp:documentUnstructured>https://www.nb.no/sbfil/dok/20180402_report.pdf</cmdp:documentUnstructured>
                  </cmdp:documentationUnstructured>
                  <cmdp:documentationUnstructured>
                    <cmdp:role>documentation</cmdp:role>
                    <cmdp:documentUnstructured>https://www.nb.no/sbfil/dok/20180402_offweb.pdf</cmdp:documentUnstructured>
                  </cmdp:documentationUnstructured>
                </cmdp:resourceDocumentationInfo>
                <cmdp:resourceCreationInfo>
                  <cmdp:creationEndDate>2018-04-02</cmdp:creationEndDate>
                  <cmdp:resourceCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>organization</cmdp:actorType>
                      <cmdp:organizationInfo>
                        <cmdp:organizationName xml:lang="en">University of Bergen</cmdp:organizationName>
                        <cmdp:organizationName xml:lang="nn">Universitetet i Bergen</cmdp:organizationName>
                        <cmdp:organizationShortName xml:lang="en">UiB</cmdp:organizationShortName>
                        <cmdp:organizationShortName xml:lang="nn">UiB</cmdp:organizationShortName>
                        <cmdp:departmentName xml:lang="en">Department of Linguistic, Literary and Aesthetic Studies</cmdp:departmentName>
                        <cmdp:departmentName xml:lang="nn">Institutt for lingvistiske, litterære og estetiske studium</cmdp:departmentName>
                      </cmdp:organizationInfo>
                    </cmdp:actorInfo>
                  </cmdp:resourceCreator>
                </cmdp:resourceCreationInfo>
              </cmdp:resourceCommonInfo>
              <cmdp:corpusInfo>
                <cmdp:corpusType>Written Corpus</cmdp:corpusType>
                <cmdp:corpusPartInfo>
                  <cmdp:mediaType>text</cmdp:mediaType>
                  <cmdp:corpusTextInfo>
                    <cmdp:textFormatInfo>
                      <cmdp:mimeType>application/xml</cmdp:mimeType>
                    </cmdp:textFormatInfo>
                  </cmdp:corpusTextInfo>
                </cmdp:corpusPartInfo>
                <cmdp:corpusPartGeneralInfo>
                  <cmdp:lingualityInfo>
                    <cmdp:lingualityType>bilingual</cmdp:lingualityType>
                    <cmdp:multilingualityType>parallel</cmdp:multilingualityType>
                    <cmdp:multilingualityTypeDetails>Parallelized text from public service web sites</cmdp:multilingualityTypeDetails>
                  </cmdp:lingualityInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>nn</cmdp:languageId>
                    <cmdp:languageName>Norwegian Nynorsk</cmdp:languageName>
                    <cmdp:sizePerLanguage>
                      <cmdp:sizeInfo>
                        <cmdp:size>289722</cmdp:size>
                        <cmdp:sizeUnit>tokens</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>21056</cmdp:size>
                        <cmdp:sizeUnit>sentences</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerLanguage>
                    <cmdp:languageVarietyInfo>
                      <cmdp:languageVarietyType>other</cmdp:languageVarietyType>
                      <cmdp:languageVarietyName>Formal written language</cmdp:languageVarietyName>
                    </cmdp:languageVarietyInfo>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>en</cmdp:languageId>
                    <cmdp:languageName>English</cmdp:languageName>
                    <cmdp:sizePerLanguage>
                      <cmdp:sizeInfo>
                        <cmdp:size>353837</cmdp:size>
                        <cmdp:sizeUnit>tokens</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>20998</cmdp:size>
                        <cmdp:sizeUnit>sentences</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerLanguage>
                    <cmdp:languageVarietyInfo>
                      <cmdp:languageVarietyType>other</cmdp:languageVarietyType>
                      <cmdp:languageVarietyName>Formal written language, translated from Norwegian Nynorsk</cmdp:languageVarietyName>
                    </cmdp:languageVarietyInfo>
                  </cmdp:languageInfo>
                  <cmdp:modalityInfo>
                    <cmdp:modalityType>writtenLanguage</cmdp:modalityType>
                  </cmdp:modalityInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>2</cmdp:size>
                    <cmdp:sizeUnit>files</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>5.29</cmdp:size>
                    <cmdp:sizeUnit>mb</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:annotationInfo>
                    <cmdp:annotationType>other</cmdp:annotationType>
                    <cmdp:segmentationLevel>sentence</cmdp:segmentationLevel>
                    <cmdp:annotationMode>automatic</cmdp:annotationMode>
                    <cmdp:annotationModeDetails>https://www.nb.no/sbfil/dok/20180402_report.pdf</cmdp:annotationModeDetails>
                  </cmdp:annotationInfo>
                  <cmdp:creationInfo>
                    <cmdp:creationMode>automatic</cmdp:creationMode>
                    <cmdp:creationModeDetails>https://www.nb.no/sbfil/dok/20180402_report.pdf</cmdp:creationModeDetails>
                  </cmdp:creationInfo>
                </cmdp:corpusPartGeneralInfo>
                <cmdp:corpusPartGeneralInfo>
                  <cmdp:lingualityInfo>
                    <cmdp:lingualityType>bilingual</cmdp:lingualityType>
                    <cmdp:multilingualityType>parallel</cmdp:multilingualityType>
                    <cmdp:multilingualityTypeDetails>Parallelized text from public service web sites</cmdp:multilingualityTypeDetails>
                  </cmdp:lingualityInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>nb</cmdp:languageId>
                    <cmdp:languageName>Norwegian Bokmål</cmdp:languageName>
                    <cmdp:sizePerLanguage>
                      <cmdp:sizeInfo>
                        <cmdp:size>359401</cmdp:size>
                        <cmdp:sizeUnit>tokens</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>26771</cmdp:size>
                        <cmdp:sizeUnit>sentences</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerLanguage>
                    <cmdp:languageVarietyInfo>
                      <cmdp:languageVarietyType>other</cmdp:languageVarietyType>
                      <cmdp:languageVarietyName>Formal written language</cmdp:languageVarietyName>
                    </cmdp:languageVarietyInfo>
                  </cmdp:languageInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>en</cmdp:languageId>
                    <cmdp:languageName>English</cmdp:languageName>
                    <cmdp:sizePerLanguage>
                      <cmdp:sizeInfo>
                        <cmdp:size>448717</cmdp:size>
                        <cmdp:sizeUnit>tokens</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>26693</cmdp:size>
                        <cmdp:sizeUnit>sentences</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerLanguage>
                    <cmdp:languageVarietyInfo>
                      <cmdp:languageVarietyType>other</cmdp:languageVarietyType>
                      <cmdp:languageVarietyName>Formal written language, translated from Norwegian Bokmål</cmdp:languageVarietyName>
                    </cmdp:languageVarietyInfo>
                  </cmdp:languageInfo>
                  <cmdp:modalityInfo>
                    <cmdp:modalityType>writtenLanguage</cmdp:modalityType>
                  </cmdp:modalityInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>3</cmdp:size>
                    <cmdp:sizeUnit>files</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>6.71</cmdp:size>
                    <cmdp:sizeUnit>mb</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:annotationInfo>
                    <cmdp:annotationType>other</cmdp:annotationType>
                    <cmdp:segmentationLevel>sentence</cmdp:segmentationLevel>
                    <cmdp:annotationMode>automatic</cmdp:annotationMode>
                    <cmdp:annotationModeDetails>https://www.nb.no/sbfil/dok/20180402_report.pdf</cmdp:annotationModeDetails>
                  </cmdp:annotationInfo>
                  <cmdp:creationInfo>
                    <cmdp:creationMode>automatic</cmdp:creationMode>
                    <cmdp:creationModeDetails>https://www.nb.no/sbfil/dok/20180402_report.pdf</cmdp:creationModeDetails>
                  </cmdp:creationInfo>
                </cmdp:corpusPartGeneralInfo>
              </cmdp:corpusInfo>
            </cmdp:corpusProfile>
          </cmd:Components>
        </cmd:CMD>
      </metadata>
    </record>
  </GetRecord>
</OAI-PMH>