<?xml version="1.0" encoding="utf-8"?><!DOCTYPE article  PUBLIC '-//OASIS//DTD DocBook XML V4.4//EN'  'http://www.docbook.org/xml/4.4/docbookx.dtd'><article><articleinfo><title>PDB</title><revhistory><revision><revnumber>59</revnumber><date>2022-09-09 07:04:06</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>58</revnumber><date>2020-11-30 13:27:15</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>57</revnumber><date>2020-10-01 08:47:11</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>56</revnumber><date>2020-07-02 17:02:01</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>55</revnumber><date>2020-05-27 16:30:57</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>54</revnumber><date>2020-01-30 12:25:12</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>53</revnumber><date>2020-01-30 12:25:01</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>52</revnumber><date>2020-01-30 12:22:42</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>51</revnumber><date>2020-01-30 12:14:58</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>50</revnumber><date>2019-04-25 12:52:21</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>49</revnumber><date>2019-04-25 12:51:04</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>48</revnumber><date>2019-01-18 11:07:14</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>47</revnumber><date>2019-01-18 11:01:25</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>46</revnumber><date>2019-01-18 
10:03:41</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>45</revnumber><date>2018-10-05 15:07:35</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>44</revnumber><date>2018-10-05 15:07:18</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>43</revnumber><date>2018-10-05 14:57:51</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>42</revnumber><date>2018-10-05 14:54:01</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>41</revnumber><date>2018-10-05 14:50:51</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>40</revnumber><date>2018-10-05 14:50:08</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>39</revnumber><date>2018-10-05 14:48:25</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>38</revnumber><date>2018-10-05 14:47:18</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>37</revnumber><date>2018-10-05 14:46:51</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>36</revnumber><date>2018-10-05 14:46:19</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>35</revnumber><date>2018-10-05 14:43:59</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>34</revnumber><date>2018-10-05 14:38:09</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>33</revnumber><date>2018-10-05 14:37:23</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>32</revnumber><date>2018-10-05 14:36:43</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>31</revnumber><date>2018-10-05 
14:22:07</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>30</revnumber><date>2018-10-05 14:21:40</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>29</revnumber><date>2018-10-05 14:18:38</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>28</revnumber><date>2018-09-10 14:00:32</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>27</revnumber><date>2018-09-10 13:54:51</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>26</revnumber><date>2018-09-10 13:46:31</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>25</revnumber><date>2018-09-10 13:34:57</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>24</revnumber><date>2018-09-10 13:33:22</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>23</revnumber><date>2018-09-10 09:44:24</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>22</revnumber><date>2018-09-10 09:32:43</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>21</revnumber><date>2018-08-25 22:28:44</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>20</revnumber><date>2018-08-25 22:28:14</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>19</revnumber><date>2018-07-23 21:02:34</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>18</revnumber><date>2018-07-23 20:58:36</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>17</revnumber><date>2018-07-23 20:58:17</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>16</revnumber><date>2018-07-18 
19:02:44</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>15</revnumber><date>2018-07-18 18:55:57</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>14</revnumber><date>2018-07-18 18:55:13</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>13</revnumber><date>2018-07-18 18:54:38</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>12</revnumber><date>2018-07-18 18:53:57</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>11</revnumber><date>2018-06-22 13:57:31</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>10</revnumber><date>2018-06-22 13:56:36</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>9</revnumber><date>2018-06-15 09:35:57</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>8</revnumber><date>2018-06-15 09:26:56</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>7</revnumber><date>2018-03-22 11:03:53</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>6</revnumber><date>2018-03-22 11:03:07</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>5</revnumber><date>2018-03-22 11:02:57</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>4</revnumber><date>2017-06-27 09:21:08</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>3</revnumber><date>2017-06-12 20:32:55</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>2</revnumber><date>2017-05-24 17:45:46</date><authorinitials>AlinaWroblewska</authorinitials></revision><revision><revnumber>1</revnumber><date>2017-05-24 
12:22:13</date><authorinitials>AlinaWroblewska</authorinitials></revision></revhistory></articleinfo><section><title>Polish Dependency Bank 2.0 (PDB 2.0)</title><para>PDB 2.0 is an extended version of <emphasis>Składnica zależnościowa</emphasis> (the first Polish dependency treebank). It consists of 22,152 trees and 350,001 tokens (i.e. 15.8 tokens per sentence on average). There are four parts of PDB 2.0: </para><orderedlist numeration="arabic"><listitem><para>NKJP1M-based trees (14K) </para></listitem><listitem><para>Projection-based trees (4K) </para></listitem><listitem><para>CDScorpus-based trees (2K) </para></listitem><listitem><para>OTHER trees (2K) </para></listitem></orderedlist><para>The PDB sentences contain some problematic linguistic phenomena, e.g. ellipsis, comparative constructions, constructions with the bi-functional subordinating conjunction JAKO, directed speech, interpolations and comments, nominative noun phrases used in the vocative function and many others. The Polish dependency relation types are as follows: abbrev_punct, adjunct, adjunct_compar, adjunct_qt, adjunct_rc, aglt, app, aux, comp, comp_ag, comp_fin, comp_inf, cond, conjunct, imp, item, mwe, ne, neg, obj, obj_th, pd, pre_coord, punct, refl, root, subj, vocative. Descriptions of Polish dependency relation types are at <ulink url="http://zil.ipipan.waw.pl/PDB/DepRelTypes"/>. Some dependents are annotated with semantic roles, e.g. Beneficiary/Recipient.  </para><para><emphasis role="strong">Download</emphasis>: The updated version of <ulink url="http://zil.ipipan.waw.pl/PDB/PDB?action=AttachFile&amp;do=get&amp;target=NKJP1M_Skladnica_sem.conll">Składnica zależnościowa</ulink> (the first version of PDB). If you wish to get the entire PDB corpus (22K sentences annotated with the dependency trees), please contact <emphasis>alina</emphasis> &lt;at&gt; <emphasis>ipipan.waw.pl</emphasis> (replace &lt;at&gt; with @). 
</para><section><title>PDB in Universal Dependencies format (PDB-UD)</title><para>PDB-UD is a conversion of PDB into the UD-like format. It is an extended and corrected version of the Polish UD treebank (release 2.1). PDB-UD contains enhanced graphs, i.e. trees with enhanced edges encoding shared dependents of coordinated elements, e.g. <emphasis>Dziewczynka śpiewa i tańczy</emphasis> (The girl sings and dances), and shared governors of coordinated elements, e.g. <emphasis>Dziewczynka i chłopiec śpiewają</emphasis> (A girl and a boy sing). The Polish dependency types are listed <ulink url="https://universaldependencies.org/pl/dep">here</ulink>. </para><para>PDB-UD trees were used in two shared tasks: <ulink url="http://multiword.sourceforge.net/PHITE.php?sitesig=CONF&amp;page=CONF_04_LAW-MWE-CxG_2018___lb__COLING__rb__&amp;subpage=CONF_40_Shared_Task">LAW-MWE-CxG-2018</ulink> and <ulink url="http://poleval.pl">PolEval 2018</ulink>. </para><para><emphasis role="strong">Download:</emphasis> PDB-UD is publicly available on <ulink url="http://git.nlp.ipipan.waw.pl/alina/PDBUD"/>. </para><para><emphasis role="strong">Download</emphasis>: Alternatively, you can download PDB-UD trees from <ulink url="https://github.com/UniversalDependencies/UD_Polish-PDB">UD repository</ulink>. </para></section><section><title>PDB-trained COMBO models</title><para>Natural language preprocessing models estimated on PDB and PDB-UD are available at <ulink url="http://zil.ipipan.waw.pl/PDB/COMBO"/>. </para><section><title>Publications</title></section><section><title>Acknowledgements</title><para>The creation of PDB was supported by grant no POIG.01.01.02-14-013/09 from Innovative Economy Operational Programme co-financed by the European Union (European Regional Development Fund) and by the grant from the Polish Ministry of Science and Higher Education as part of the investment in the CLARIN-PL research infrastructure (2016-2020). 
</para></section><section><title>Licence</title><para>The resources are distributed under the <ulink url="https://creativecommons.org/licenses/by-nc-sa/4.0/">CC BY-NC-SA 4.0</ulink> licence. </para></section><section><title>Contact</title><para>Any questions, comments? Please send them to Alina Wróblewska <code>&lt;alina AT SPAMFREE ipipan DOT waw DOT pl&gt;</code>. </para></section></section></section></article>