<?xml version="1.0"?>
<oembed><version>1.0</version><provider_name>Centre for Language Technology</provider_name><provider_url>https://mtd.setur.fo/en</provider_url><author_name>Admin</author_name><author_url>https://mtd.setur.fo/en/author/admin/</author_url><title>WiLI-2018: Wikipedia Language Identification Database - M&#xE1;lt&#xF8;knidepilin</title><type>rich</type><width>600</width><height>338</height><html>&lt;blockquote class="wp-embedded-content" data-secret="f4v7PmKoGp"&gt;&lt;a href="https://mtd.setur.fo/en/resource/wili-2018-wikipedia-language-identification-database/"&gt;WiLI-2018: Wikipedia Language Identification Database&lt;/a&gt;&lt;/blockquote&gt;&lt;iframe sandbox="allow-scripts" security="restricted" src="https://mtd.setur.fo/en/resource/wili-2018-wikipedia-language-identification-database/embed/#?secret=f4v7PmKoGp" width="600" height="338" title="&#x201C;WiLI-2018: Wikipedia Language Identification Database&#x201D; &#x2014; M&#xE1;lt&#xF8;knidepilin" data-secret="f4v7PmKoGp" frameborder="0" marginwidth="0" marginheight="0" scrolling="no" class="wp-embedded-content"&gt;&lt;/iframe&gt;&lt;script&gt;
/*! This file is auto-generated */
!function(d,l){"use strict";l.querySelector&amp;&amp;d.addEventListener&amp;&amp;"undefined"!=typeof URL&amp;&amp;(d.wp=d.wp||{},d.wp.receiveEmbedMessage||(d.wp.receiveEmbedMessage=function(e){var t=e.data;if((t||t.secret||t.message||t.value)&amp;&amp;!/[^a-zA-Z0-9]/.test(t.secret)){for(var s,r,n,a=l.querySelectorAll('iframe[data-secret="'+t.secret+'"]'),o=l.querySelectorAll('blockquote[data-secret="'+t.secret+'"]'),c=new RegExp("^https?:$","i"),i=0;i&lt;o.length;i++)o[i].style.display="none";for(i=0;i&lt;a.length;i++)s=a[i],e.source===s.contentWindow&amp;&amp;(s.removeAttribute("style"),"height"===t.message?(1e3&lt;(r=parseInt(t.value,10))?r=1e3:~~r&lt;200&amp;&amp;(r=200),s.height=r):"link"===t.message&amp;&amp;(r=new URL(s.getAttribute("src")),n=new URL(t.value),c.test(n.protocol))&amp;&amp;n.host===r.host&amp;&amp;l.activeElement===s&amp;&amp;(d.top.location.href=t.value))}},d.addEventListener("message",d.wp.receiveEmbedMessage,!1),l.addEventListener("DOMContentLoaded",function(){for(var e,t,s=l.querySelectorAll("iframe.wp-embedded-content"),r=0;r&lt;s.length;r++)(t=(e=s[r]).getAttribute("data-secret"))||(t=Math.random().toString(36).substring(2,12),e.src+="#?secret="+t,e.setAttribute("data-secret",t)),e.contentWindow.postMessage({message:"ready",secret:t},"*")},!1)))}(window,document);
//# sourceURL=https://mtd.setur.fo/wp-includes/js/wp-embed.min.js
&lt;/script&gt;</html><thumbnail_url>https://i0.wp.com/mtd.setur.fo/wp-content/uploads/2023/11/wikipedia_logo_icon_169796.png?fit=512%2C512&amp;ssl=1</thumbnail_url><thumbnail_width>512</thumbnail_width><thumbnail_height>512</thumbnail_height><description>This contains 1,000 paragraphs in Faroese (and the same amount in all the other 234 languages). This means that there are 500 paragraphs in the training set and another 500 paragraphs in the test set. You can download the files for all 235 languages below.</description></oembed>
