<OAI-PMH xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://www.openarchives.org/OAI/2.0/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/          http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
  <responseDate>2026-04-24T19:07:47.406Z</responseDate>
  <request verb="GetRecord">https://www.nb.no/sprakbanken/oai</request>
  <GetRecord>
    <record>
      <header>
        <identifier>oai:nb.no:sbr-23</identifier>
        <datestamp/>
      </header>
      <metadata>
        <cmd:CMD xmlns:cmd="http://www.clarin.eu/cmd/1" xmlns="http://www.clarin.eu/cmd/" xmlns:cmdp="http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1548239945780" CMDVersion="1.2" xsi:schemaLocation="http://www.clarin.eu/cmd/1 https://infra.clarin.eu/CMDI/1.x/xsd/cmd-envelop.xsd http://www.clarin.eu/cmd/1/profiles/clarin.eu:cr1:p_1548239945780 https://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/1.1/profiles/clarin.eu:cr1:p_1548239945780/1.2/xsd">
          <cmd:Header>
            <cmd:MdCreator>Arne Martinus Lindstad</cmd:MdCreator>
            <cmd:MdCreationDate>2021-07-05</cmd:MdCreationDate>
            <cmd:MdSelfLink>https://www.nb.no/sprakbanken/oai?verb=GetRecord&amp;identifier=oai:nb.no:sbr-23&amp;metadataPrefix=cmdi</cmd:MdSelfLink>
            <cmd:MdProfile>clarin.eu:cr1:p_1548239945780</cmd:MdProfile>
            <cmd:MdCollectionDisplayName>Språkbanken NB</cmd:MdCollectionDisplayName>
          </cmd:Header>
          <cmd:Resources>
            <cmd:ResourceProxyList>
              <cmd:ResourceProxy id="sbr23_lex">
                <cmd:ResourceType mimetype="application/x-gtar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/leksikalske_databaser/leksikon/no.leksikon.tar.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="sbr23_tool">
                <cmd:ResourceType mimetype="application/x-gtar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/leksikalske_databaser/verktoy/nor.leksikalsk.verktoy.tar.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="sbr23_trans">
                <cmd:ResourceType mimetype="application/x-gtar">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/leksikalske_databaser/trans_konv/nor.trans-konv.tar.gz</cmd:ResourceRef>
              </cmd:ResourceProxy>
              <cmd:ResourceProxy id="sbr23_doc">
                <cmd:ResourceType mimetype="application/pdf">Resource</cmd:ResourceType>
                <cmd:ResourceRef>https://www.nb.no/sbfil/dok/nst_leksdat_no.pdf</cmd:ResourceRef>
              </cmd:ResourceProxy>
            </cmd:ResourceProxyList>
            <cmd:JournalFileProxyList/>
            <cmd:ResourceRelationList>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
              <cmd:ResourceRelation>
                <cmd:RelationType>describes</cmd:RelationType>
                <cmd:Resource>
                  <cmd:Role>
                    <cmd:Resource>
                      <cmd:Role/>
                    </cmd:Resource>
                  </cmd:Role>
                </cmd:Resource>
              </cmd:ResourceRelation>
            </cmd:ResourceRelationList>
          </cmd:Resources>
          <cmd:IsPartOfList/>
          <cmd:Components>
            <cmdp:lexicalProfileRev1>
              <cmdp:resourceCommonInfo>
                <cmdp:resourceType>lexicalConceptualResource</cmdp:resourceType>
                <cmdp:identificationInfo>
                  <cmdp:resourceName xml:lang="en">NST Pronunciation Lexicon for Norwegian Bokmål</cmdp:resourceName>
                  <cmdp:resourceName xml:lang="nb">NST uttaleleksikon for bokmål</cmdp:resourceName>
                  <cmdp:description xml:lang="en">This pronunciation lexicon for Norwegian Bokmål was originally produced by Nordic Language Technology (NST), and contains approximately 785,000 entries. The word list is based on the 100,000 most frequent word forms in NST's Norwegian text corpus.

The lexicon is available as one large csv file. Each entry (line) contains 51 fields, separated by a semicolon. Not all fields are equally relevant for all purposes, but given the format, it should be easy to extract relevant information.

The lexicon contains, among other things, information about the decomposition of compounds and one or more phonetic transcriptions. The phonetic transcription has partly been done manually, but to a large extent it was done automatically using an inflector. Parts of the output of this process were manually checked afterwards. The inflector and other lexical tools that can be used in processing the lexicon can be downloaded as a separate file.

The transcription format is SAMPA (Speech Assessment Methods Phonetic Alphabet). See http://www.phon.ucl.ac.uk/home/sampa/index.html.

A script for converting the SAMPA transcriptions to IPA can be found on GitHub (https://github.com/peresolb/sampa_to_ipa).</cmdp:description>
                  <cmdp:description xml:lang="nb">Dette uttaleleksikonet ble opprinnelig produsert av Nordisk språkteknologi (NST), og inneholder omtrent 785.000 oppslagsord. Ordlisten tar utgangspunkt i de 100.000 mest frekvente ordformene i det norske tekstkorpuset til NST.

Hele leksikonet foreligger som en stor fil i csv-format. Hvert oppslag er på en linje, det er 51 poster tilgjengelig på hver linje, og postene er skilt med semikolon. Ikke alle postene er like relevante for alle formål, men gitt formatet er det lett å hente ut den informasjonen man trenger.

Leksikonet inneholder blant annet informasjon om dekomponeringsledd i sammensetninger, og fonetisk transkripsjon. Denne transkripsjonen er delvis gjort manuelt, men det meste er gjort automatisk ved hjelp av en inflektor. Deler av dette er stikkprøvekontrollert i etterkant. Selve inflektoren, og annet leksikalsk verktøy som kan brukes i behandling av leksikonet, kan lastes ned som en egen fil.

Transkripsjonsformatet er SAMPA (Speech Assessment Methods Phonetic Alphabet). Se http://www.phon.ucl.ac.uk/home/sampa/index.html for nærmere informasjon om dette transkripsjonsformatet.

Et skript som konverterer SAMPA-transkripsjonene i leksikonet til IPA finnes på GitHub (https://github.com/peresolb/sampa_to_ipa).</cmdp:description>
                  <cmdp:url cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-23/</cmdp:url>
                  <cmdp:PID cmd:description="hdl">hdl:21.11146/23</cmdp:PID>
                  <cmdp:identifier>sbr-23</cmdp:identifier>
                </cmdp:identificationInfo>
                <cmdp:distributionInfo>
                  <cmdp:licenceInfo>
                    <cmdp:userCategory>Public</cmdp:userCategory>
                    <cmdp:distributionAccessMedium>downloadable</cmdp:distributionAccessMedium>
                    <cmdp:downloadLocation cmd:description="resource homepage">https://www.nb.no/sprakbanken/ressurskatalog/oai-nb-no-sbr-23/</cmdp:downloadLocation>
                    <cmdp:licence>
                      <cmdp:licenceFamily>Creative Commons (CC)</cmdp:licenceFamily>
                      <cmdp:licenceName>Creative_Commons-ZERO (CC-ZERO)</cmdp:licenceName>
                      <cmdp:licenceURL>https://creativecommons.org/publicdomain/zero/1.0/</cmdp:licenceURL>
                    </cmdp:licence>
                    <cmdp:licensor>
                      <cmdp:actorInfo>
                        <cmdp:actorType>organization</cmdp:actorType>
                        <cmdp:role xml:lang="en">Licensor</cmdp:role>
                        <cmdp:organizationInfo>
                          <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                          <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                          <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                          <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                          <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                        </cmdp:organizationInfo>
                        <cmdp:communicationInfo>
                          <cmdp:email>sprakbanken@nb.no</cmdp:email>
                          <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                          <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                          <cmdp:zipCode>0203</cmdp:zipCode>
                          <cmdp:city>Oslo</cmdp:city>
                          <cmdp:region>Oslo</cmdp:region>
                          <cmdp:country>Norway</cmdp:country>
                        </cmdp:communicationInfo>
                      </cmdp:actorInfo>
                    </cmdp:licensor>
                    <cmdp:distributionRightsHolder>
                      <cmdp:actorInfo>
                        <cmdp:actorType>organization</cmdp:actorType>
                        <cmdp:role xml:lang="en">Distribution Rights Holder</cmdp:role>
                        <cmdp:organizationInfo>
                          <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                          <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                          <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                          <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                          <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                          <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                        </cmdp:organizationInfo>
                        <cmdp:communicationInfo>
                          <cmdp:email>sprakbanken@nb.no</cmdp:email>
                          <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                          <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                          <cmdp:zipCode>0203</cmdp:zipCode>
                          <cmdp:city>Oslo</cmdp:city>
                          <cmdp:region>Oslo</cmdp:region>
                          <cmdp:country>Norway</cmdp:country>
                        </cmdp:communicationInfo>
                      </cmdp:actorInfo>
                    </cmdp:distributionRightsHolder>
                  </cmdp:licenceInfo>
                </cmdp:distributionInfo>
                <cmdp:contact>
                  <cmdp:actorInfo>
                    <cmdp:actorType>organization</cmdp:actorType>
                    <cmdp:role xml:lang="en">Contact</cmdp:role>
                    <cmdp:organizationInfo>
                      <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                      <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                      <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                      <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                      <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                      <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                    </cmdp:organizationInfo>
                    <cmdp:communicationInfo>
                      <cmdp:email>sprakbanken@nb.no</cmdp:email>
                      <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                      <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                      <cmdp:zipCode>0203</cmdp:zipCode>
                      <cmdp:city>Oslo</cmdp:city>
                      <cmdp:region>Oslo</cmdp:region>
                      <cmdp:country>Norway</cmdp:country>
                    </cmdp:communicationInfo>
                  </cmdp:actorInfo>
                </cmdp:contact>
                <cmdp:metadataInfo>
                  <cmdp:metadataCreationDate>2011-11-30</cmdp:metadataCreationDate>
                  <cmdp:metadataLanguageName>English</cmdp:metadataLanguageName>
                  <cmdp:metadataLanguageId>en</cmdp:metadataLanguageId>
                  <cmdp:metadataLastDateUpdated>2023-07-05</cmdp:metadataLastDateUpdated>
                  <cmdp:metadataCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Metadata Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Birkenes</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Magnus Breder</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                      <cmdp:communicationInfo>
                        <cmdp:email>sprakbanken@nb.no</cmdp:email>
                        <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                        <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                        <cmdp:zipCode>0203</cmdp:zipCode>
                        <cmdp:city>Oslo</cmdp:city>
                        <cmdp:region>Oslo</cmdp:region>
                        <cmdp:country>Norway</cmdp:country>
                      </cmdp:communicationInfo>
                    </cmdp:actorInfo>
                    <cmdp:actorInfo>
                      <cmdp:actorType>person</cmdp:actorType>
                      <cmdp:role xml:lang="en">Resource Creator</cmdp:role>
                      <cmdp:personInfo>
                        <cmdp:surname xml:lang="nb">Lindstad</cmdp:surname>
                        <cmdp:givenName xml:lang="nb">Arne Martinus</cmdp:givenName>
                        <cmdp:affiliation>
                          <cmdp:organizationInfo>
                            <cmdp:organizationName xml:lang="en">National Library of Norway</cmdp:organizationName>
                            <cmdp:organizationName xml:lang="nb">Nasjonalbiblioteket</cmdp:organizationName>
                            <cmdp:organizationShortName xml:lang="en">NLN</cmdp:organizationShortName>
                            <cmdp:organizationShortName xml:lang="nb">NB</cmdp:organizationShortName>
                            <cmdp:departmentName xml:lang="en">The Language Bank</cmdp:departmentName>
                            <cmdp:departmentName xml:lang="nb">Språkbanken</cmdp:departmentName>
                          </cmdp:organizationInfo>
                        </cmdp:affiliation>
                      </cmdp:personInfo>
                      <cmdp:communicationInfo>
                        <cmdp:email>sprakbanken@nb.no</cmdp:email>
                        <cmdp:url>https://www.nb.no/sprakbanken/</cmdp:url>
                        <cmdp:address>P.O. Box 2674 Solli</cmdp:address>
                        <cmdp:zipCode>0203</cmdp:zipCode>
                        <cmdp:city>Oslo</cmdp:city>
                        <cmdp:region>Oslo</cmdp:region>
                        <cmdp:country>Norway</cmdp:country>
                      </cmdp:communicationInfo>
                    </cmdp:actorInfo>
                  </cmdp:metadataCreator>
                </cmdp:metadataInfo>
                <cmdp:versionInfo>
                  <cmdp:version>1.0</cmdp:version>
                  <cmdp:lastDateUpdated>2003-02-24</cmdp:lastDateUpdated>
                </cmdp:versionInfo>
                <cmdp:validationInfo>
                  <cmdp:validated>true</cmdp:validated>
                  <cmdp:validationType>content</cmdp:validationType>
                  <cmdp:validationMode>manual</cmdp:validationMode>
                  <cmdp:validationExtent>partial</cmdp:validationExtent>
                  <cmdp:validator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>organization</cmdp:actorType>
                      <cmdp:role xml:lang="en">Resource Validator</cmdp:role>
                      <cmdp:organizationInfo>
                        <cmdp:organizationName xml:lang="en">Nordic Language Technology AS</cmdp:organizationName>
                        <cmdp:organizationName xml:lang="nb">Nordisk språkteknologi AS</cmdp:organizationName>
                        <cmdp:organizationShortName xml:lang="en">NST</cmdp:organizationShortName>
                        <cmdp:organizationShortName xml:lang="nb">NST</cmdp:organizationShortName>
                      </cmdp:organizationInfo>
                    </cmdp:actorInfo>
                  </cmdp:validator>
                </cmdp:validationInfo>
                <cmdp:resourceDocumentationInfo>
                  <cmdp:documentationUnstructured>
                    <cmdp:role>documentation</cmdp:role>
                    <cmdp:documentUnstructured>https://www.nb.no/sbfil/dok/nst_leksdat_no.pdf</cmdp:documentUnstructured>
                  </cmdp:documentationUnstructured>
                </cmdp:resourceDocumentationInfo>
                <cmdp:resourceCreationInfo>
                  <cmdp:creationStartDate>2000-01-03</cmdp:creationStartDate>
                  <cmdp:creationEndDate>2003-02-24</cmdp:creationEndDate>
                  <cmdp:resourceCreator>
                    <cmdp:actorInfo>
                      <cmdp:actorType>organization</cmdp:actorType>
                      <cmdp:role xml:lang="en">Resource Creator</cmdp:role>
                      <cmdp:organizationInfo>
                        <cmdp:organizationName xml:lang="en">Nordic Language Technology AS</cmdp:organizationName>
                        <cmdp:organizationName xml:lang="nb">Nordisk språkteknologi AS</cmdp:organizationName>
                        <cmdp:organizationShortName xml:lang="en">NST</cmdp:organizationShortName>
                        <cmdp:organizationShortName xml:lang="nb">NST</cmdp:organizationShortName>
                      </cmdp:organizationInfo>
                    </cmdp:actorInfo>
                  </cmdp:resourceCreator>
                </cmdp:resourceCreationInfo>
              </cmdp:resourceCommonInfo>
              <cmdp:lexicalConceptualResourceInfoRev1>
                <cmdp:lexicalConceptualResourceType>computationalLexicon</cmdp:lexicalConceptualResourceType>
                <cmdp:lexicalConceptualResourcePartGeneralInfo>
                  <cmdp:lingualityInfo>
                    <cmdp:lingualityType>monolingual</cmdp:lingualityType>
                  </cmdp:lingualityInfo>
                  <cmdp:languageInfo>
                    <cmdp:languageId>nb</cmdp:languageId>
                    <cmdp:languageName>Norwegian Bokmål</cmdp:languageName>
                    <cmdp:sizePerLanguage>
                      <cmdp:sizeInfo>
                        <cmdp:size>784240</cmdp:size>
                        <cmdp:sizeUnit>words</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>784240</cmdp:size>
                        <cmdp:sizeUnit>entries</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>162,8</cmdp:size>
                        <cmdp:sizeUnit>mb</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerLanguage>
                  </cmdp:languageInfo>
                  <cmdp:modalityInfo>
                    <cmdp:modalityType>writtenLanguage</cmdp:modalityType>
                    <cmdp:modalityTypeDetails>Contains a general, non-specific vocabulary. Fullform frequency-based word list with additions from various sources, including named entities. Contains corresponding phonetic transcriptions.</cmdp:modalityTypeDetails>
                    <cmdp:sizePerModality>
                      <cmdp:sizeInfo>
                        <cmdp:size>784240</cmdp:size>
                        <cmdp:sizeUnit>words</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>784240</cmdp:size>
                        <cmdp:sizeUnit>entries</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                      <cmdp:sizeInfo>
                        <cmdp:size>162,8</cmdp:size>
                        <cmdp:sizeUnit>mb</cmdp:sizeUnit>
                      </cmdp:sizeInfo>
                    </cmdp:sizePerModality>
                  </cmdp:modalityInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>784240</cmdp:size>
                    <cmdp:sizeUnit>words</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>784240</cmdp:size>
                    <cmdp:sizeUnit>entries</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                  <cmdp:sizeInfo>
                    <cmdp:size>162,8</cmdp:size>
                    <cmdp:sizeUnit>mb</cmdp:sizeUnit>
                  </cmdp:sizeInfo>
                </cmdp:lexicalConceptualResourcePartGeneralInfo>
                <cmdp:lexicalConceptualResourceEncodingInfo>
                  <cmdp:encodingLevel>phonetics</cmdp:encodingLevel>
                  <cmdp:linguisticInformation>phonetics-Transcription</cmdp:linguisticInformation>
                  <cmdp:conformanceToStandardsBestPractices>other</cmdp:conformanceToStandardsBestPractices>
                  <cmdp:theoreticModel>SAMPA</cmdp:theoreticModel>
                </cmdp:lexicalConceptualResourceEncodingInfo>
                <cmdp:lexicalConceptualResourcePartInfoRev1>
                  <cmdp:mediaType>text</cmdp:mediaType>
                  <cmdp:lexicalConceptualResourceTextInfo>
                    <cmdp:textFormatInfo>
                      <cmdp:mimeType>text/csv</cmdp:mimeType>
                    </cmdp:textFormatInfo>
                    <cmdp:characterEncodingInfo>
                      <cmdp:characterEncoding>UTF-8</cmdp:characterEncoding>
                    </cmdp:characterEncodingInfo>
                  </cmdp:lexicalConceptualResourceTextInfo>
                </cmdp:lexicalConceptualResourcePartInfoRev1>
              </cmdp:lexicalConceptualResourceInfoRev1>
            </cmdp:lexicalProfileRev1>
          </cmd:Components>
        </cmd:CMD>
      </metadata>
    </record>
  </GetRecord>
</OAI-PMH>