{"id":31856,"date":"2025-02-10T10:39:34","date_gmt":"2025-02-10T09:39:34","guid":{"rendered":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/"},"modified":"2025-02-10T10:56:45","modified_gmt":"2025-02-10T09:56:45","slug":"oai-clarino-uib-no-jos1m","status":"publish","type":"language-resource","link":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/","title":{"rendered":"Training Corpus jos1M"},"content":{"rendered":"<p><?xml version='1.0' encoding='utf-8'?><br \/>\n<record><\/p>\n<header><identifier>oai:clarino.uib.no:Jos1M<\/identifier><datestamp>2018-03-06T10:18:36Z<\/datestamp><setSpec \/><\/header>\n<p><metadata><CMD xmlns=\"http:\/\/www.clarin.eu\/cmd\/\"><br \/>\n<Header><br \/>\n<MdCreator>Cheikh Bamba Dione<\/MdCreator><br \/>\n<MdCreationDate>2017-03-28<\/MdCreationDate><br \/>\n<MdSelfLink>hdl:11495\/DE48-E976-8C42-5<\/MdSelfLink><br \/>\n<MdProfile>clarin.eu:cr1:p_1407745711925<\/MdProfile><br \/>\n<MdCollectionDisplayName>Clarino Bergen Centre &#8211; INESS<\/MdCollectionDisplayName><br \/>\n<\/Header><Resources><ResourceProxyList \/><JournalFileProxyList \/><br \/>\n<ResourceRelationList \/><br \/>\n<IsPartOfList \/><\/Resources><br \/>\n<Components><br \/>\n<corpusProfile><br \/>\n    <resourceCommonInfo ComponentId=\"clarin.eu:cr1:c_1396012485126\"><br \/>\n        <resourceType>corpus<\/resourceType><br \/>\n        <identificationInfo ComponentId=\"clarin.eu:cr1:c_1396012485125\"><br \/>\n            <resourceName xml:lang=\"sl\">Training Corpus jos1M<\/resourceName><br \/>\n            <description xml:lang=\"sl\">The jos1M corpus contains 1 million words of sampled paragraphs from the FidaPLUS corpus. It is meant to serve as a training corpus for word-level tagging of Slovene. This silver-standard corpus is annotated for morphosyntactic descriptions (fine grained PoS tags) and lemmas, with about one fourth of the most problematic annotations hand-validated. The corpus is available in source TEI P5 XML and in the simpler and smaller vertical format, used by various concordancers.<\/description><br \/>\n            <resourceShortName>jos1M<\/resourceShortName><br \/>\n            <url>http:\/\/clarino.uib.no\/iness\/landing-page?resource=jos1M&amp;view=short<\/url><br \/>\n            <url>http:\/\/clarino.uib.no\/iness\/landing-page?resource=jos1M<\/url><br \/>\n            <PID>hdl:11495\/DC84-BF60-3823-5<\/PID><br \/>\n        <\/identificationInfo><br \/>\n        <distributionInfo ComponentId=\"clarin.eu:cr1:c_1396012485124\">\n            <licenceInfo ComponentId=\"clarin.eu:cr1:c_1396012485158\">\n                <userCategory>Public<\/userCategory>\n                <licence ComponentId=\"clarin.eu:cr1:c_1447674760330\">\n                    <licenceFamily>Creative Commons (CC)<\/licenceFamily>\n                    <licenceName>Creative_Commons-BY-NC (CC-BY-NC)<\/licenceName>\n                    <licenceURL>http:\/\/creativecommons.org\/licenses\/by-nc\/4.0\/<\/licenceURL>\n                    <conditionsOfUse>BY<\/conditionsOfUse><br \/>\n                    <conditionsOfUse>NC<\/conditionsOfUse>\n                <\/licence>\n            <\/licenceInfo>\n        <\/distributionInfo><br \/>\n        <contact><br \/>\n            <actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><br \/>\n                <actorType>person<\/actorType><br \/>\n                <role>author<\/role>\n                <personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\">\n                    <surname>Krek<\/surname><br \/>\n                    <givenName>Simon<\/givenName><br \/>\n                    <affiliation><br \/>\n                        <organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><br \/>\n                            <organizationName xml:lang=\"en\">\u201cJo\u017eef Stefan\u201d Institute<\/organizationName><br \/>\n                        <\/organizationInfo><br \/>\n                    <\/affiliation>\n                <\/personInfo>\n            <\/actorInfo><br \/>\n        <\/contact><br \/>\n        <metadataInfo ComponentId=\"clarin.eu:cr1:c_1407745711922\"><br \/>\n            <metadataCreationDate>2017-03-28<\/metadataCreationDate><br \/>\n            <metadataLastDateUpdated>2018-03-06<\/metadataLastDateUpdated><br \/>\n            <metadataCreator><br \/>\n                <actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><br \/>\n                    <actorType>person<\/actorType>\n                    <personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\">\n                        <surname xml:lang=\"no\">Dione<\/surname><br \/>\n                        <givenName xml:lang=\"no\">Cheikh Bamba<\/givenName><br \/>\n                        <sex>male<\/sex>\n                        <position>Researcher (Ph.D)<\/position>\n                        <affiliation><br \/>\n                            <organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><br \/>\n                                <organizationName xml:lang=\"en\">University of Bergen<\/organizationName><br \/>\n                                <organizationName xml:lang=\"no\">Universitetet i Bergen<\/organizationName><br \/>\n                                <organizationShortName xml:lang=\"no\">UiB<\/organizationShortName><br \/>\n                                <organizationShortName xml:lang=\"en\">UoB<\/organizationShortName><br \/>\n                                <departmentName xml:lang=\"en\">Department of Linguistic, Literary and Aesthetic Studies<\/departmentName><br \/>\n                            <\/organizationInfo><br \/>\n                        <\/affiliation>\n                    <\/personInfo>\n                    <communicationInfo ComponentId=\"clarin.eu:cr1:c_1352813745460\"><br \/>\n                        <email>clarin@uib.no<\/email><br \/>\n                        <email>iness@uib.no<\/email><br \/>\n                    <\/communicationInfo><br \/>\n                <\/actorInfo><br \/>\n            <\/metadataCreator><br \/>\n        <\/metadataInfo><br \/>\n        <resourceCreationInfo ComponentId=\"clarin.eu:cr1:c_1407745711921\"><br \/>\n            <resourceCreator><br \/>\n                <actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><br \/>\n                    <actorType>person<\/actorType>\n                    <personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\">\n                        <surname>Erjavec, Toma\u017e<\/surname><br \/>\n                        <affiliation><br \/>\n                            <organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><br \/>\n                                <organizationName>Jo\u017eef Stefan Institute<\/organizationName><br \/>\n                            <\/organizationInfo><br \/>\n                        <\/affiliation>\n                    <\/personInfo>\n                <\/actorInfo><br \/>\n                <actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><br \/>\n                    <actorType>person<\/actorType>\n                    <personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\">\n                        <surname>Krek, Simon<\/surname><br \/>\n                        <affiliation><br \/>\n                            <organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><br \/>\n                                <organizationName>Jo\u017eef Stefan Institute<\/organizationName><br \/>\n                            <\/organizationInfo><br \/>\n                        <\/affiliation>\n                    <\/personInfo>\n                <\/actorInfo><br \/>\n            <\/resourceCreator><br \/>\n        <\/resourceCreationInfo><br \/>\n    <\/resourceCommonInfo><br \/>\n    <corpusInfo ComponentId=\"clarin.eu:cr1:c_1407745711878\"><br \/>\n        <corpusType>Written Corpus<\/corpusType><br \/>\n        <corpusPartInfo ComponentId=\"clarin.eu:cr1:c_1407745711885\"><br \/>\n            <mediaType>text<\/mediaType><br \/>\n        <\/corpusPartInfo><br \/>\n        <corpusPartGeneralInfo ComponentId=\"clarin.eu:cr1:c_1407745711882\"><br \/>\n            <annotationInfo ComponentId=\"clarin.eu:cr1:c_1407745711924\"><br \/>\n                <annotationType>morphosyntacticAnnotation-posTagging<\/annotationType><br \/>\n                <annotationType>lemmatization<\/annotationType><br \/>\n            <\/annotationInfo><br \/>\n        <\/corpusPartGeneralInfo><br \/>\n    <\/corpusInfo><br \/>\n<\/corpusProfile><\/Components><\/CMD><\/metadata><\/record><\/p>\n","protected":false},"template":"","categories":[],"tags":[],"language-resource-type":[7569],"language-resource-origin":[7558],"class_list":["post-31856","language-resource","type-language-resource","status-publish","hentry"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v27.1 (Yoast SEO v27.1.1) - https:\/\/yoast.com\/product\/yoast-seo-premium-wordpress\/ -->\n<title>Training Corpus jos1M - Spr\u00e5kbanken<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/\" \/>\n<meta property=\"og:locale\" content=\"nb_NO\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"Training Corpus jos1M\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/\" \/>\n<meta property=\"og:site_name\" content=\"Spr\u00e5kbanken\" \/>\n<meta property=\"article:modified_time\" content=\"2025-02-10T09:56:45+00:00\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"Ansl. lesetid\" \/>\n\t<meta name=\"twitter:data1\" content=\"1 minutt\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/\",\"url\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/\",\"name\":\"Training Corpus jos1M - Spr\u00e5kbanken\",\"isPartOf\":{\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/#website\"},\"datePublished\":\"2025-02-10T09:39:34+00:00\",\"dateModified\":\"2025-02-10T09:56:45+00:00\",\"breadcrumb\":{\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/#breadcrumb\"},\"inLanguage\":\"nb-NO\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"Home\",\"item\":\"https:\/\/www.nb.no\/sprakbanken\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"Resources from the resource bank\",\"item\":\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/\"},{\"@type\":\"ListItem\",\"position\":3,\"name\":\"Training Corpus jos1M\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/#website\",\"url\":\"https:\/\/www.nb.no\/sprakbanken\/\",\"name\":\"Spr\u00e5kbanken\",\"description\":\"\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.nb.no\/sprakbanken\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"nb-NO\"}]}<\/script>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"Training Corpus jos1M - Spr\u00e5kbanken","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/","og_locale":"nb_NO","og_type":"article","og_title":"Training Corpus jos1M","og_url":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/","og_site_name":"Spr\u00e5kbanken","article_modified_time":"2025-02-10T09:56:45+00:00","twitter_card":"summary_large_image","twitter_misc":{"Ansl. lesetid":"1 minutt"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/","url":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/","name":"Training Corpus jos1M - Spr\u00e5kbanken","isPartOf":{"@id":"https:\/\/www.nb.no\/sprakbanken\/#website"},"datePublished":"2025-02-10T09:39:34+00:00","dateModified":"2025-02-10T09:56:45+00:00","breadcrumb":{"@id":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/#breadcrumb"},"inLanguage":"nb-NO","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.nb.no\/sprakbanken\/ressurskatalog\/oai-clarino-uib-no-jos1m\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Home","item":"https:\/\/www.nb.no\/sprakbanken\/"},{"@type":"ListItem","position":2,"name":"Resources from the resource bank","item":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/"},{"@type":"ListItem","position":3,"name":"Training Corpus jos1M"}]},{"@type":"WebSite","@id":"https:\/\/www.nb.no\/sprakbanken\/#website","url":"https:\/\/www.nb.no\/sprakbanken\/","name":"Spr\u00e5kbanken","description":"","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.nb.no\/sprakbanken\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"nb-NO"}]}},"lang":"nb","translations":{"nb":31856,"en":31859},"pll_sync_post":[],"_links":{"self":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource\/31856","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource"}],"about":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/types\/language-resource"}],"wp:attachment":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/media?parent=31856"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/categories?post=31856"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/tags?post=31856"},{"taxonomy":"language-resource-type","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource-type?post=31856"},{"taxonomy":"language-resource-origin","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource-origin?post=31856"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}