{"id":30640,"date":"2025-02-10T10:38:16","date_gmt":"2025-02-10T09:38:16","guid":{"rendered":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank-2\/"},"modified":"2025-02-10T10:55:27","modified_gmt":"2025-02-10T09:55:27","slug":"oai-clarino-uib-no-bul-treebank","status":"publish","type":"language-resource","link":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/","title":{"rendered":"The Morphologically Annotated Part of BulTreeBank"},"content":{"rendered":"<p><?xml version=\"1.0\" encoding=\"utf-8\"?><br \/>\n<record><\/p>\n<header><identifier>oai:clarino.uib.no:bul-treebank<\/identifier><datestamp>2018-03-05T11:30:38Z<\/datestamp><setSpec>INESS<\/setSpec><\/header>\n<p><metadata><CMD xmlns=\"http:\/\/www.clarin.eu\/cmd\/\"><Header><MdCreator>Gunn Inger Lyse Samdal<\/MdCreator><MdCreationDate>2015-05-26<\/MdCreationDate><MdSelfLink>hdl:11495\/D935-7715-CE31-0<\/MdSelfLink><MdProfile>clarin.eu:cr1:p_1407745711925<\/MdProfile><MdCollectionDisplayName>Clarino UiB<\/MdCollectionDisplayName><\/Header><Resources><ResourceProxyList><ResourceProxy id=\"ref-resource\"><ResourceType mimetype=\"\">Resource<\/ResourceType><ResourceRef>hdl:11495\/D93F-C6E9-65D9-2<\/ResourceRef><\/ResourceProxy><ResourceProxy id=\"ref-landingpage\"><ResourceType mimetype=\"\">LandingPage<\/ResourceType><ResourceRef>hdl:11495\/D93F-C6E9-65D9-2<\/ResourceRef><\/ResourceProxy><\/ResourceProxyList><JournalFileProxyList\/><ResourceRelationList\/><IsPartOfList\/><\/Resources><Components><corpusProfile><resourceCommonInfo ComponentId=\"clarin.eu:cr1:c_1396012485126\" ref=\"ref-resource\"><resourceType>corpus<\/resourceType><identificationInfo ComponentId=\"clarin.eu:cr1:c_1396012485125\"><resourceName xml:lang=\"en\">The Morphologically Annotated Part of BulTreeBank<\/resourceName><description xml:lang=\"en\">This distribution represents only the morphological information encoded in BulTreeBank &#8211; HPSG-based Treebank of Bulgarian. It contains about 214000 tokens. It was used for the training of the TreeTagger for Bulgarian.<\/p>\n<p>It contains sentences from Bulgarian Grammar Textbooks, Newspapers, Literature and other sources of texts.<\/p>\n<p>Full documentation (Style Book, Tagset description) of the Treebank can be found on: http:\/\/www.bultreebank.org\/TechRep.html<\/description><resourceShortName xml:lang=\"en\">BulTreeBank-Morph<\/resourceShortName><url description=\"Landing page @ corpuscle\">http:\/\/clarino.uib.no\/korpuskel\/landing-page?resource=bul-treebank&amp;view=short<\/url><url description=\"General info page for BulTreebank\">http:\/\/www.bultreebank.org\/btbmorf\/<\/url><PID>hdl:11495\/D93F-C6E9-65D9-2<\/PID><identifier>bul-treebank<\/identifier><\/identificationInfo><distributionInfo ComponentId=\"clarin.eu:cr1:c_1396012485124\"><licenceInfo ComponentId=\"clarin.eu:cr1:c_1396012485158\"><userCategory>Public<\/userCategory><distributionAccessMedium>downloadable<\/distributionAccessMedium><distributionAccessMedium>accessibleThroughInterface<\/distributionAccessMedium><downloadLocation>http:\/\/www.bultreebank.org\/btbmorf\/<\/downloadLocation><executionLocation description=\"landing page @ Corpuscle\">https:\/\/hdl.handle.net\/11495\/D93F-C6E9-65D9-2<\/executionLocation><licence ComponentId=\"clarin.eu:cr1:c_1447674760330\"><licenceFamily>META-SHARE (MS)<\/licenceFamily><licenceName>META-SHARE NonCommercial NoRedistribution (MS-NC-NoReD)<\/licenceName><licenceURL>http:\/\/www.meta-net.eu\/meta-share\/meta-share-licenses\/META-SHARE%20NonCommercial%20NoRedistribution-v%201.0.pdf<\/licenceURL><conditionsOfUse>BY<\/conditionsOfUse><conditionsOfUse>ID<\/conditionsOfUse><conditionsOfUse>LRT<\/conditionsOfUse><conditionsOfUse>NC<\/conditionsOfUse><conditionsOfUse>NORED<\/conditionsOfUse><\/licence><\/licenceInfo><iprHolder><actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><actorType>person<\/actorType><personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\"><surname xml:lang=\"bg\">Simov<\/surname><givenName xml:lang=\"bg\">Kiril<\/givenName><sex>male<\/sex><position>Associate Professor<\/position><affiliation><organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><organizationName xml:lang=\"en\">Bulgarian Academy of Sciences<\/organizationName><departmentName xml:lang=\"en\">BulTreeBank Group, Linguistic Modelling Laboratory, IICT<\/departmentName><\/organizationInfo><\/affiliation><\/personInfo><communicationInfo ComponentId=\"clarin.eu:cr1:c_1352813745460\"><email>kivs@bultreebank.org<\/email><url>http:\/\/www.bultreebank.org\/btbmorf\/<\/url><\/p>\n<address>Acad. G.Bonchev 25A<\/address>\n<p><zipCode>1113<\/zipCode><city>Sofia<\/city><country>Bulgaria<\/country><telephoneNumber>+359888473413<\/telephoneNumber><\/communicationInfo><\/actorInfo><\/iprHolder><\/distributionInfo><contact><actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><actorType>person<\/actorType><personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\"><surname xml:lang=\"bg\">Simov<\/surname><givenName xml:lang=\"bg\">Kiril<\/givenName><sex>male<\/sex><position>Associate Professor<\/position><affiliation><organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><organizationName xml:lang=\"en\">Bulgarian Academy of Sciences<\/organizationName><departmentName xml:lang=\"en\">BulTreeBank Group, Linguistic Modelling Laboratory, IICT<\/departmentName><\/organizationInfo><\/affiliation><\/personInfo><communicationInfo ComponentId=\"clarin.eu:cr1:c_1352813745460\"><email>kivs@bultreebank.org<\/email><url>http:\/\/www.bultreebank.org\/btbmorf\/<\/url><\/p>\n<address>Acad. G.Bonchev 25A<\/address>\n<p><zipCode>1113<\/zipCode><city>Sofia<\/city><country>Bulgaria<\/country><telephoneNumber>+359888473413<\/telephoneNumber><\/communicationInfo><\/actorInfo><\/contact><metadataInfo ComponentId=\"clarin.eu:cr1:c_1407745711922\"><metadataCreationDate>2015-05-26<\/metadataCreationDate><source>This metadata is based on the metadata originally created in META-SHARE in 2012. The present metadata should be considered as authoritative.<\/source><originalMetadataSchema>META-SHARE<\/originalMetadataSchema><originalMetadataLink>http:\/\/metashare.nb.no\/repository\/browse\/the-morphologically-annotated-part-of-bultreebank\/b3f0ba40395711e2b66e001708556d5a5db5c7f848dc4048b06b47f7835d6956\/<\/originalMetadataLink><metadataLanguageName>English<\/metadataLanguageName><metadataLanguageId>en<\/metadataLanguageId><metadataLastDateUpdated>2018-03-05<\/metadataLastDateUpdated><metadataCreator><actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><actorType>person<\/actorType><personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\"><surname xml:lang=\"no\">Lyse<\/surname><givenName xml:lang=\"no\">Gunn Inger<\/givenName><sex>female<\/sex><position>Researcher (Ph.D)<\/position><affiliation><organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><organizationName xml:lang=\"en\">University of Bergen<\/organizationName><organizationName xml:lang=\"no\">Universitetet i Bergen<\/organizationName><organizationShortName xml:lang=\"no\">UiB<\/organizationShortName><organizationShortName xml:lang=\"en\">UoB<\/organizationShortName><departmentName xml:lang=\"en\">Department of Linguistic, Literary and Aesthetic Studies<\/departmentName><\/organizationInfo><\/affiliation><\/personInfo><communicationInfo ComponentId=\"clarin.eu:cr1:c_1352813745460\"><email>iness@uib.no<\/email><email>clarin@uib.no<\/email><\/communicationInfo><\/actorInfo><actorInfo ComponentId=\"clarin.eu:cr1:c_1396012485194\"><actorType>person<\/actorType><personInfo ComponentId=\"clarin.eu:cr1:c_1396012485192\"><surname xml:lang=\"bg\">Simov<\/surname><givenName xml:lang=\"bg\">Kiril<\/givenName><sex>male<\/sex><position>Associate Professor<\/position><affiliation><organizationInfo ComponentId=\"clarin.eu:cr1:c_1407745711883\"><organizationName xml:lang=\"en\">Bulgarian Academy of Sciences<\/organizationName><departmentName xml:lang=\"en\">BulTreeBank Group, Linguistic Modelling Laboratory, IICT<\/departmentName><\/organizationInfo><\/affiliation><\/personInfo><communicationInfo ComponentId=\"clarin.eu:cr1:c_1352813745460\"><email>kivs@bultreebank.org<\/email><url>http:\/\/www.bultreebank.org\/btbmorf\/<\/url><\/p>\n<address>Acad. G.Bonchev 25A<\/address>\n<p><zipCode>1113<\/zipCode><city>Sofia<\/city><country>Bulgaria<\/country><telephoneNumber>+359888473413<\/telephoneNumber><\/communicationInfo><\/actorInfo><\/metadataCreator><\/metadataInfo><resourceDocumentationInfo ComponentId=\"clarin.eu:cr1:c_1355150532301\"><documentationUnstructured ComponentId=\"clarin.eu:cr1:c_1355150532302\"><role>documentation<\/role><documentUnstructured>http:\/\/www.bultreebank.org\/btbmorf\/<\/documentUnstructured><\/documentationUnstructured><\/resourceDocumentationInfo><\/resourceCommonInfo><corpusInfo ComponentId=\"clarin.eu:cr1:c_1407745711878\" ref=\"ref-resource\"><corpusType>Written Corpus<\/corpusType><corpusPartInfo ComponentId=\"clarin.eu:cr1:c_1407745711885\"><mediaType>text<\/mediaType><\/corpusPartInfo><corpusPartGeneralInfo ComponentId=\"clarin.eu:cr1:c_1407745711882\"><sourceWorkInfo ComponentId=\"clarin.eu:cr1:c_1407745712071\"><workDescription>It contains sentences from Bulgarian Grammar Textbooks, Newspapers, Literature and other sources of texts. For a full text acknowledgement, see:<br \/>\nhttp:\/\/www.bultreebank.org\/TextAcknowledgements.html<\/workDescription><\/sourceWorkInfo><lingualityInfo ComponentId=\"clarin.eu:cr1:c_1355150532313\"><lingualityType>monolingual<\/lingualityType><\/lingualityInfo><languageInfo ComponentId=\"clarin.eu:cr1:c_1428388179423\"><languageId>bg<\/languageId><languageName>Bulgarian<\/languageName><\/languageInfo><sizeInfo ComponentId=\"clarin.eu:cr1:c_1353678848785\"><size>214000<\/size><sizeUnit>tokens<\/sizeUnit><\/sizeInfo><annotationInfo ComponentId=\"clarin.eu:cr1:c_1407745711924\"><annotationType>morphosyntacticAnnotation-posTagging<\/annotationType><tagset>http:\/\/www.bultreebank.org\/TechRep\/BTB-TR03.pdf<\/tagset><theoreticModel>HPSG<\/theoreticModel><annotationMode>mixed<\/annotationMode><annotationModeDetails>The morphological analyzer assigns all possible morphosyntactic analyses to tokens.The process of disambiguation is two-fold: first a set of &#8216;certain&#8217; rules are applied, to ensure full precision. Then the rest of the corpus has been disambiguated manually. (Source: p.2, http:\/\/www.bultreebank.org\/TechRep\/BTB-TR03.pdf)<\/annotationModeDetails><annotationManualUnstructured ComponentId=\"clarin.eu:cr1:c_1355150532325\"><role>annotationManual<\/role><documentUnstructured>Several documents can be found at: http:\/\/www.bultreebank.org\/TechRep.html.<br \/>\nSelected document: Kiril Simov, Petya Osenova and Milena Slavcheva. BTB-TR03: BulTreeBank Morphosyntactic Tagset. BulTreeBank Project Technical Report \u2116 03. 2004<\/documentUnstructured><\/annotationManualUnstructured><\/annotationInfo><\/corpusPartGeneralInfo><\/corpusInfo><\/corpusProfile><\/Components><\/CMD><\/metadata><\/record><\/p>\n","protected":false},"template":"","categories":[],"tags":[],"language-resource-type":[7572],"language-resource-origin":[7565],"class_list":["post-30640","language-resource","type-language-resource","status-publish","hentry"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v27.1 (Yoast SEO v27.1.1) - https:\/\/yoast.com\/product\/yoast-seo-premium-wordpress\/ -->\n<title>The Morphologically Annotated Part of BulTreeBank - Spr\u00e5kbanken<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/\" \/>\n<meta property=\"og:locale\" content=\"nb_NO\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"The Morphologically Annotated Part of BulTreeBank\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/\" \/>\n<meta property=\"og:site_name\" content=\"Spr\u00e5kbanken\" \/>\n<meta property=\"article:modified_time\" content=\"2025-02-10T09:55:27+00:00\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"Ansl. lesetid\" \/>\n\t<meta name=\"twitter:data1\" content=\"2 minutter\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/\",\"url\":\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/\",\"name\":\"The Morphologically Annotated Part of BulTreeBank - Spr\u00e5kbanken\",\"isPartOf\":{\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/#website\"},\"datePublished\":\"2025-02-10T09:38:16+00:00\",\"dateModified\":\"2025-02-10T09:55:27+00:00\",\"breadcrumb\":{\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/#breadcrumb\"},\"inLanguage\":\"nb-NO\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"Home\",\"item\":\"https:\/\/www.nb.no\/sprakbanken\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"Resources from the resource bank\",\"item\":\"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/\"},{\"@type\":\"ListItem\",\"position\":3,\"name\":\"The Morphologically Annotated Part of BulTreeBank\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.nb.no\/sprakbanken\/#website\",\"url\":\"https:\/\/www.nb.no\/sprakbanken\/\",\"name\":\"Spr\u00e5kbanken\",\"description\":\"\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.nb.no\/sprakbanken\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"nb-NO\"}]}<\/script>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"The Morphologically Annotated Part of BulTreeBank - Spr\u00e5kbanken","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/","og_locale":"nb_NO","og_type":"article","og_title":"The Morphologically Annotated Part of BulTreeBank","og_url":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/","og_site_name":"Spr\u00e5kbanken","article_modified_time":"2025-02-10T09:55:27+00:00","twitter_card":"summary_large_image","twitter_misc":{"Ansl. lesetid":"2 minutter"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/","url":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/","name":"The Morphologically Annotated Part of BulTreeBank - Spr\u00e5kbanken","isPartOf":{"@id":"https:\/\/www.nb.no\/sprakbanken\/#website"},"datePublished":"2025-02-10T09:38:16+00:00","dateModified":"2025-02-10T09:55:27+00:00","breadcrumb":{"@id":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/#breadcrumb"},"inLanguage":"nb-NO","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/oai-clarino-uib-no-bul-treebank\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Home","item":"https:\/\/www.nb.no\/sprakbanken\/"},{"@type":"ListItem","position":2,"name":"Resources from the resource bank","item":"https:\/\/www.nb.no\/sprakbanken\/en\/resource-catalogue\/"},{"@type":"ListItem","position":3,"name":"The Morphologically Annotated Part of BulTreeBank"}]},{"@type":"WebSite","@id":"https:\/\/www.nb.no\/sprakbanken\/#website","url":"https:\/\/www.nb.no\/sprakbanken\/","name":"Spr\u00e5kbanken","description":"","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.nb.no\/sprakbanken\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"nb-NO"}]}},"lang":"en","translations":{"nb":30637,"en":30640},"pll_sync_post":[],"_links":{"self":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource\/30640","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource"}],"about":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/types\/language-resource"}],"wp:attachment":[{"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/media?parent=30640"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/categories?post=30640"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/tags?post=30640"},{"taxonomy":"language-resource-type","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource-type?post=30640"},{"taxonomy":"language-resource-origin","embeddable":true,"href":"https:\/\/www.nb.no\/sprakbanken\/wp-json\/wp\/v2\/language-resource-origin?post=30640"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}