{"id":31351,"date":"2025-02-10T10:38:55","date_gmt":"2025-02-10T09:38:55","guid":{"rendered":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/"},"modified":"2025-02-10T10:56:01","modified_gmt":"2025-02-10T09:56:01","slug":"oai-repo-clarino-uib-no-11509-140","status":"publish","type":"language-resource","link":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/","title":{"rendered":"Randomized extraction of the New Norwegian corpus"},"content":{"rendered":"<p><?xml version='1.0' encoding='utf-8'?><br \/>\n<record><\/p>\n<header><identifier>oai:repo.clarino.uib.no:11509\/140<\/identifier><datestamp>2021-01-29T12:21:00Z<\/datestamp><setSpec>hdl_11509_1<\/setSpec><setSpec>hdl_11509_2<\/setSpec><\/header>\n<p><metadata><CMD xmlns=\"http:\/\/www.clarin.eu\/cmd\/\"><br \/>\n    <Header><br \/>\n        <MdCreationDate>2021-01-29<\/MdCreationDate><br \/>\n        <MdSelfLink>http:\/\/hdl.handle.net\/11509\/140@format=cmdi<\/MdSelfLink><br \/>\n        <MdProfile>clarin.eu:cr1:p_1403526079380<\/MdProfile><br \/>\n        <MdCollectionDisplayName>CLARINO Bergen Centre<\/MdCollectionDisplayName><br \/>\n    <\/Header><br \/>\n    <Resources><br \/>\n        <ResourceProxyList><br \/>\n            <ResourceProxy id=\"lp_198\"><br \/>\n                <ResourceType>LandingPage<\/ResourceType><br \/>\n                <ResourceRef>http:\/\/hdl.handle.net\/11509\/140<\/ResourceRef><br \/>\n            <\/ResourceProxy><br \/>\n            <ResourceProxy id=\"uri_1\"><br \/>\n                <ResourceType mimetype=\"text\/html\">Resource<\/ResourceType><br \/>\n                <ResourceRef>http:\/\/spraksamlingene.no\/<\/ResourceRef><br \/>\n            <\/ResourceProxy><br \/>\n            <ResourceProxy id=\"_382\"><br \/>\n                <ResourceType mimetype=\"application\/zip\">Resource<\/ResourceType><br \/>\n                <ResourceRef>https:\/\/repo.clarino.uib.no\/xmlui\/bitstream\/handle\/11509\/140\/nnk-2000-scrambled.zip?sequence=1<\/ResourceRef><br \/>\n            <\/ResourceProxy><br \/>\n        <\/ResourceProxyList><br \/>\n        <JournalFileProxyList \/><br \/>\n        <ResourceRelationList \/><br \/>\n    <\/Resources><br \/>\n    <Components><br \/>\n        <LINDAT_CLARIN><br \/>\n            <bibliographicInfo>\n                <projectUrl>http:\/\/spraksamlingene.no\/<\/projectUrl>\n                <titles><br \/>\n                    <title xml:lang=\"en\">Randomized extraction of the New Norwegian corpus<\/title><br \/>\n                <\/titles><br \/>\n                <authors><br \/>\n                    <author><br \/>\n                        <lastName>Gammeltoft<\/lastName><br \/>\n                        <firstName> Peder<\/firstName><br \/>\n                    <\/author><br \/>\n                <\/authors><br \/>\n                <dates><br \/>\n                    <dateIssued>2021-01-29<\/dateIssued><br \/>\n                <\/dates><br \/>\n                <identifiers><br \/>\n                    <identifier type=\"Handle\">http:\/\/hdl.handle.net\/11509\/140<\/identifier><br \/>\n                <\/identifiers><br \/>\n                <contactPerson><br \/>\n                    <firstName>Peder<\/firstName><br \/>\n                    <lastName>Gammeltoft<\/lastName><br \/>\n                    <email>peder.gammeltoft@uib.no<\/email><br \/>\n                    <affiliation>University of Bergen Library<\/affiliation><br \/>\n                <\/contactPerson>\n                <publishers>\n                    <publisher>University of Bergen Library<\/publisher>\n                <\/publishers>\n            <\/bibliographicInfo><br \/>\n            <dataInfo><br \/>\n                <type>corpus<\/type><br \/>\n                <description>Randomized extraction of the New Norwegian Corpus (Nynorskkorpuset).<\/p>\n<p>Contains sentences in New Norwegian (Nynorsk) from the year 2000 and after. Tab-separated, one word pr. line, lemmatized and morphologically tagged, year and domain information is given. Annotation is done with the Oslo-Bergen tagger. Sentences in the Bokm\u00e5l standard have been removed.<\/p>\n<p>This corpus is intended for use in the development of language technology.<\/p>\n<p>Size: 3,3 million sentences, 57,5 million words.<\/description><br \/>\n                <languages><br \/>\n                    <language><br \/>\n                        <code>nno<\/code><br \/>\n                        <name>Norwegian Nynorsk<\/name><br \/>\n                    <\/language><br \/>\n                <\/languages><br \/>\n                <keywords><br \/>\n                    <keyword>Sentences<\/keyword><br \/>\n                    <keyword>Nynorsk<\/keyword><br \/>\n                <\/keywords>\n                <links>\n                    <link>http:\/\/no2014.uib.no\/korpuset\/conc_enkeltsok.htm<\/link>\n                <\/links>\n                <sizeInfo><br \/>\n                    <size><br \/>\n                        <size>3300000<\/size><br \/>\n                        <unit>sentences<\/unit><br \/>\n                    <\/size><br \/>\n                <\/sizeInfo><br \/>\n            <\/dataInfo>\n            <licenseInfo>\n                <license>\n                    <uri>http:\/\/creativecommons.org\/licenses\/by\/3.0\/<\/uri>\n                <\/license>\n            <\/licenseInfo>\n        <\/LINDAT_CLARIN><br \/>\n    <\/Components><br \/>\n<\/CMD><br \/>\n<\/metadata><\/record><\/p>\n","protected":false},"template":"","categories":[],"tags":[],"language-resource-type":[],"language-resource-origin":[7558],"class_list":["post-31351","language-resource","type-language-resource","status-publish","hentry"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v27.1 (Yoast SEO v27.1.1) - https:\/\/yoast.com\/product\/yoast-seo-premium-wordpress\/ -->\n<title>Randomized extraction of the New Norwegian corpus - Spr\u00e5kbanken<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/\" \/>\n<meta property=\"og:locale\" content=\"nb_NO\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"Randomized extraction of the New Norwegian corpus\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/\" \/>\n<meta property=\"og:site_name\" content=\"Spr\u00e5kbanken\" \/>\n<meta property=\"article:modified_time\" content=\"2025-02-10T09:56:01+00:00\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"Ansl. lesetid\" \/>\n\t<meta name=\"twitter:data1\" content=\"1 minutt\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/\",\"url\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/\",\"name\":\"Randomized extraction of the New Norwegian corpus - Spr\u00e5kbanken\",\"isPartOf\":{\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/#website\"},\"datePublished\":\"2025-02-10T09:38:55+00:00\",\"dateModified\":\"2025-02-10T09:56:01+00:00\",\"breadcrumb\":{\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/#breadcrumb\"},\"inLanguage\":\"nb-NO\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"Home\",\"item\":\"https:\/\/www.nb.no\/sprakbanken\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"Resources from the resource bank\",\"item\":\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/\"},{\"@type\":\"ListItem\",\"position\":3,\"name\":\"Randomized extraction of the New Norwegian corpus\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/#website\",\"url\":\"https:\/\/www.nb.no\/sprakbanken\/\",\"name\":\"Spr\u00e5kbanken\",\"description\":\"\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.nb.no\/sprakbanken\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"nb-NO\"}]}<\/script>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"Randomized extraction of the New Norwegian corpus - Spr\u00e5kbanken","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/","og_locale":"nb_NO","og_type":"article","og_title":"Randomized extraction of the New Norwegian corpus","og_url":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/","og_site_name":"Spr\u00e5kbanken","article_modified_time":"2025-02-10T09:56:01+00:00","twitter_card":"summary_large_image","twitter_misc":{"Ansl. lesetid":"1 minutt"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/","url":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/","name":"Randomized extraction of the New Norwegian corpus - Spr\u00e5kbanken","isPartOf":{"@id":"https:\/\/www.nb.no\/sprakbanken\/#website"},"datePublished":"2025-02-10T09:38:55+00:00","dateModified":"2025-02-10T09:56:01+00:00","breadcrumb":{"@id":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/#breadcrumb"},"inLanguage":"nb-NO","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-repo-clarino-uib-no-11509-140\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Home","item":"https:\/\/www.nb.no\/sprakbanken\/"},{"@type":"ListItem","position":2,"name":"Resources from the resource bank","item":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/"},{"@type":"ListItem","position":3,"name":"Randomized extraction of the New Norwegian corpus"}]},{"@type":"WebSite","@id":"https:\/\/www.nb.no\/sprakbanken\/#website","url":"https:\/\/www.nb.no\/sprakbanken\/","name":"Spr\u00e5kbanken","description":"","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.nb.no\/sprakbanken\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"nb-NO"}]}},"lang":"nb","translations":{"nb":31351,"en":31354},"pll_sync_post":[],"_links":{"self":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource\/31351","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource"}],"about":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/types\/language-resource"}],"wp:attachment":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/media?parent=31351"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/categories?post=31351"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/tags?post=31351"},{"taxonomy":"language-resource-type","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource-type?post=31351"},{"taxonomy":"language-resource-origin","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource-origin?post=31351"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}