From 5779f6c21203e42a048f32128a0f4e567d921a8e Mon Sep 17 00:00:00 2001 From: milanmajchrak <90026355+milanmajchrak@users.noreply.github.com> Date: Mon, 16 Oct 2023 14:04:45 +0200 Subject: [PATCH] ufal/fe-license-static-pages-are-missing (#380) * Added static files and redirection * Html content is loaded from the static file and rendered in the component. * The html file content is showed in the `static/` route with the error page. The translation works. * Created routing for the `licenses` page and changed administrator license table to `licenses/manage-table` path * Show all licenses data. * All licenses are filtered by license label - PUB, ACA, RES * Added loading bar * Added redirect from license selector * Fixed tests. * Refactoring * Fixed lint error - unused import * Added docs and translations. * Removed accidentally added semicolon. * Added simple test if the html file content will be loaded. --- src/app/app-routing-paths.ts | 6 + src/app/app-routing.module.ts | 8 +- .../clarin-all-licenses-page.component.html | 34 + .../clarin-all-licenses-page.component.scss | 22 + ...clarin-all-licenses-page.component.spec.ts | 44 + .../clarin-all-licenses-page.component.ts | 71 ++ .../clarin-license-routing.module.ts | 32 +- .../clarin-licenses/clarin-license.module.ts | 2 + src/app/menu.resolver.ts | 3 +- src/app/shared/html-content.service.ts | 22 + src/app/shared/shared.module.ts | 4 +- .../static-page/static-page-routing-paths.ts | 6 + .../static-page/static-page-routing.module.ts | 19 + .../static-page/static-page.component.html | 3 + .../static-page/static-page.component.scss | 3 + .../static-page/static-page.component.spec.ts | 56 ++ src/app/static-page/static-page.component.ts | 87 ++ src/app/static-page/static-page.module.ts | 17 + .../section-license.component.html | 2 +- src/assets/i18n/cs.json5 | 20 +- src/assets/i18n/en.json5 | 16 +- src/static-files/error.html | 40 + src/static-files/licence-TAUS_QT21.html | 181 ++++ src/static-files/licence-UD-1.1.html | 159 +++ src/static-files/licence-UD-1.2.html | 252 +++++ src/static-files/licence-UD-1.3.html | 338 +++++++ src/static-files/licence-UD-1.4.html | 385 ++++++++ src/static-files/licence-UD-2.0.html | 415 ++++++++ src/static-files/licence-UD-2.1.html | 575 +++++++++++ src/static-files/licence-UD-2.2.html | 680 +++++++++++++ src/static-files/licence-UD-2.3.html | 714 ++++++++++++++ src/static-files/licence-UD-2.4.html | 800 +++++++++++++++ src/static-files/licence-UD-2.5.html | 848 ++++++++++++++++ src/static-files/licence-UDer-0.5.html | 95 ++ src/static-files/licence-UDer-1.0.html | 182 ++++ src/static-files/licence-UDer-1.1.html | 202 ++++ src/static-files/licence-hamledt-2.0.html | 241 +++++ src/static-files/licence-hamledt-3.0.html | 429 ++++++++ src/static-files/licence-hamledt.html | 85 ++ src/static-files/licence-mwe-1.0.html | 185 ++++ src/static-files/licence-mwe-1.1.html | 72 ++ src/static-files/licence-mwe-1.2-raw.html | 138 +++ src/static-files/licence-mwe-1.2.html | 65 ++ src/static-files/licence-mwe-literal.html | 55 ++ src/static-files/licence-pdtsl.html | 70 ++ src/static-files/licence-unisegs-1.0.html | 229 +++++ src/static-files/license-NLPC-WeC.html | 134 +++ src/static-files/license-PAWS.html | 99 ++ src/static-files/license-cnc-data.html | 76 ++ src/static-files/license-cnc.html | 153 +++ src/static-files/license-corefud-0.1.html | 100 ++ src/static-files/license-corefud-0.2.html | 99 ++ src/static-files/license-pcedt2.html | 102 ++ src/static-files/license-pdt2.html | 120 +++ .../license-templateXXXX-versionXX.html | 76 ++ src/static-files/license-ud-1.0.html | 53 + src/static-files/license-ud-2.6.html | 706 +++++++++++++ src/static-files/license-ud-2.7.html | 787 +++++++++++++++ src/static-files/license-ud-2.8.html | 863 ++++++++++++++++ src/static-files/license-ud-2.9.html | 924 ++++++++++++++++++ webpack/webpack.common.ts | 4 + 61 files changed, 12194 insertions(+), 14 deletions(-) create mode 100644 src/app/clarin-licenses/clarin-all-licenses-page/clarin-all-licenses-page.component.html create mode 100644 src/app/clarin-licenses/clarin-all-licenses-page/clarin-all-licenses-page.component.scss create mode 100644 src/app/clarin-licenses/clarin-all-licenses-page/clarin-all-licenses-page.component.spec.ts create mode 100644 src/app/clarin-licenses/clarin-all-licenses-page/clarin-all-licenses-page.component.ts create mode 100644 src/app/shared/html-content.service.ts create mode 100644 src/app/static-page/static-page-routing-paths.ts create mode 100644 src/app/static-page/static-page-routing.module.ts create mode 100644 src/app/static-page/static-page.component.html create mode 100644 src/app/static-page/static-page.component.scss create mode 100644 src/app/static-page/static-page.component.spec.ts create mode 100644 src/app/static-page/static-page.component.ts create mode 100644 src/app/static-page/static-page.module.ts create mode 100644 src/static-files/error.html create mode 100644 src/static-files/licence-TAUS_QT21.html create mode 100644 src/static-files/licence-UD-1.1.html create mode 100644 src/static-files/licence-UD-1.2.html create mode 100644 src/static-files/licence-UD-1.3.html create mode 100644 src/static-files/licence-UD-1.4.html create mode 100644 src/static-files/licence-UD-2.0.html create mode 100644 src/static-files/licence-UD-2.1.html create mode 100644 src/static-files/licence-UD-2.2.html create mode 100644 src/static-files/licence-UD-2.3.html create mode 100644 src/static-files/licence-UD-2.4.html create mode 100644 src/static-files/licence-UD-2.5.html create mode 100644 src/static-files/licence-UDer-0.5.html create mode 100644 src/static-files/licence-UDer-1.0.html create mode 100644 src/static-files/licence-UDer-1.1.html create mode 100644 src/static-files/licence-hamledt-2.0.html create mode 100644 src/static-files/licence-hamledt-3.0.html create mode 100644 src/static-files/licence-hamledt.html create mode 100644 src/static-files/licence-mwe-1.0.html create mode 100644 src/static-files/licence-mwe-1.1.html create mode 100644 src/static-files/licence-mwe-1.2-raw.html create mode 100644 src/static-files/licence-mwe-1.2.html create mode 100644 src/static-files/licence-mwe-literal.html create mode 100644 src/static-files/licence-pdtsl.html create mode 100644 src/static-files/licence-unisegs-1.0.html create mode 100644 src/static-files/license-NLPC-WeC.html create mode 100644 src/static-files/license-PAWS.html create mode 100644 src/static-files/license-cnc-data.html create mode 100644 src/static-files/license-cnc.html create mode 100644 src/static-files/license-corefud-0.1.html create mode 100644 src/static-files/license-corefud-0.2.html create mode 100644 src/static-files/license-pcedt2.html create mode 100644 src/static-files/license-pdt2.html create mode 100644 src/static-files/license-templateXXXX-versionXX.html create mode 100644 src/static-files/license-ud-1.0.html create mode 100644 src/static-files/license-ud-2.6.html create mode 100644 src/static-files/license-ud-2.7.html create mode 100644 src/static-files/license-ud-2.8.html create mode 100644 src/static-files/license-ud-2.9.html diff --git a/src/app/app-routing-paths.ts b/src/app/app-routing-paths.ts index f3e483ecda2..f44650e73e4 100644 --- a/src/app/app-routing-paths.ts +++ b/src/app/app-routing-paths.ts @@ -130,6 +130,12 @@ export function getLicensesModulePath() { return `/${LICENSES_MODULE_PATH}`; } + +export const LICENSES_MANAGE_TABLE_PATH = 'manage-table'; +export function getLicensesManageTablePath() { + return `/${LICENSES_MANAGE_TABLE_PATH}`; +} + export const CONTRACT_PAGE_MODULE_PATH = 'contract'; export function getLicenseContractPagePath() { return `/${CONTRACT_PAGE_MODULE_PATH}`; diff --git a/src/app/app-routing.module.ts b/src/app/app-routing.module.ts index 02419e43149..1ada63820ef 100644 --- a/src/app/app-routing.module.ts +++ b/src/app/app-routing.module.ts @@ -43,6 +43,7 @@ import { ServerCheckGuard } from './core/server-check/server-check.guard'; import { MenuResolver } from './menu.resolver'; import { ThemedPageErrorComponent } from './page-error/themed-page-error.component'; import { HANDLE_TABLE_MODULE_PATH } from './handle-page/handle-page-routing-paths'; +import { STATIC_PAGE_PATH } from './static-page/static-page-routing-paths'; @NgModule({ imports: [ @@ -259,7 +260,6 @@ import { HANDLE_TABLE_MODULE_PATH } from './handle-page/handle-page-routing-path { path: LICENSES_MODULE_PATH, loadChildren: () => import('./clarin-licenses/clarin-license.module').then((m) => m.ClarinLicenseModule), - canActivate: [SiteAdministratorGuard], }, { path: CONTRACT_PAGE_MODULE_PATH, @@ -272,6 +272,10 @@ import { HANDLE_TABLE_MODULE_PATH } from './handle-page/handle-page-routing-path loadChildren: () => import('./handle-page/handle-page.module').then((m) => m.HandlePageModule), canActivate: [SiteAdministratorGuard], }, + { + path: STATIC_PAGE_PATH, + loadChildren: () => import('./static-page/static-page.module').then((m) => m.StaticPageModule), + }, { path: '**', pathMatch: 'full', component: ThemedPageNotFoundComponent } ] } @@ -283,7 +287,7 @@ import { HANDLE_TABLE_MODULE_PATH } from './handle-page/handle-page-routing-path initialNavigation: 'enabledBlocking', preloadingStrategy: NoPreloading, onSameUrlNavigation: 'reload', -}) +}), ], exports: [RouterModule], }) diff --git a/src/app/clarin-licenses/clarin-all-licenses-page/clarin-all-licenses-page.component.html b/src/app/clarin-licenses/clarin-all-licenses-page/clarin-all-licenses-page.component.html new file mode 100644 index 00000000000..2d9c6d26ca4 --- /dev/null +++ b/src/app/clarin-licenses/clarin-all-licenses-page/clarin-all-licenses-page.component.html @@ -0,0 +1,34 @@ +
AGREEMENT ON THE USE OF DATA IN QT21
++
between
++
You, hereinafter referred to as the “QT21 User”, and
+Taus B.V., a limited liability company organized and existing under the laws of the
Netherlands, having its office at Keizersgracht 74, Amsterdam in the Netherlands, registered
with the Dutch Chamber of Commerce under registration number [37147141], hereby duly
represented by Mr. Jaap van der Meer (hereinafter: “TAUS”).
QT21 is a research action receiving funding from the European Union’s Horizon 2020 research and
innovation programme under grant agreement No 645452 between 2015 and 2018. TAUS, being a
project partner in QT21, offers data that will be used in QT21 to support statistical machine transla-
tion.
This Agreement is based on the TAUS ToU and sets forth the additional terms and conditions
applying to the Parties. It addresses the needs defined in section 29.3 of QT21 Grant Agreement, in
particular the ability to
(a) deposit in a research data repository and take measures to make it possible for third parties
to access, mine, exploit, reproduce and disseminate — free of charge for any user — the
WMT Data Set, including associated metadata, needed to validate the results presented in
scientific publications as soon as possible;
(b) provide information — via the repository — about tools and instruments at the disposal of
the beneficiaries and necessary for validating the results (and — where possible — provide the
tools and instruments themselves).
+
1.
+Definitions and rules of construction
+1.1
+The following words and phrases shall have the meanings and definitions set forth below:
+(a) “TAUS ToU” means the TAUS Terms of Use as of January 2016, attached as Annex I to
this Agreement;
(b) "QT21 User" means You, the contracting party. A QT21 User is any legal person or legal
entity who intends to use the WMT Data Set;
+
(c) "Agreement" means this agreement;
+(d) "Parties" means TAUS and QT21 User jointly;
+(e) “WMT Data Set” refers to the data collections that have been prepared for the QT21 Users
and that are originated from the TAUS data repository: benchmark data named
“TAUS_TEST_Datasets_for_QT21_WP3” as defined in the QT21 Data Management Plan.
+
2.
+The subject matter of this Agreement
++
2.1
+All terms and conditions of the TAUS ToU are fully incorporated in this Agreement and fully
apply unless explicitly stipulated otherwise in this Agreement in writing. In case of any
inconsistencies between the TAUS ToU and the terms and conditions as laid down in this
Agreement, the terms and conditions of this Agreement will prevail.
+
3.
+License
+3.1
+Subject to the terms and conditions of this Agreement, TAUS hereby grants to QT21 User
access to the WMT Data Set with the following rights:
i)
+the right to use the target side of the translation units into a commercial product,
provided that QT21 User may not resell the WMT Data Set as if it is its own new
translation;
ii)
+the right to make Derivative Works; and
+iii)
+the right to use or resell such Derivative Works commercially
+and for the following goals:
+i)
+research and benchmarking;
++
ii)
+piloting new solutions; and
++
iii)
+testing of new commercial services.
+3.2
+The license in Clause 3.1 of this Agreement is explicitly limited to the use as set forth in that
Clause and excludes any other use of the WMT Data Set.
+
3.3
+QT21 User shall not be entitled to and agrees that it shall not disclose and/or make available
the WMT Data Set to any Third Party.
3.4
+QT21 User does not need to be a TAUS Member to sign this Agreement.
++
4.
+No Warranty / No Liability / Indemnification
++
4.1
+TAUS makes no representation nor any warranty that the WMT Data Set are correct or fit for
any purpose.
4.2
+Except for liability arising from willful misconduct or gross negligence, TAUS will not be
liable for any damages, loss of business, profits, revenue, anticipated savings, indirect or
punitive damages or for any special, incidental or consequential losses with respect to the
WMT Data Set and/or the Database and Language Data Platform.
4.3
+QT21 User shall indemnify, defend and hold TAUS harmless for any losses, claims, damages,
awards, penalties or injuries incurred, including reasonable attorney’s fees, which arise from
any claim by any third party in relation to this Agreement, including the use of the WMT Data
Set and/or use of the Database and Language Data Platform.
+
5.
+Termination
+5.1
+The QT21 User rights granted in this Agreement are irrevocable, unless QT21 User breaches
any of the conditions of this Agreement, upon which QT21 User must immediately cease
access to, and use of, the WMT Data Set.
5.2
+To ensure the needs defined in section 29.3 of QT21 Grant Agreement, it is agreed that in the
case where TAUS is out of business, or changes ownership, the QT21 User rights set out in
this Agreement shall persist.
+
6.
+Miscellaneous
++
6.1
+This Agreement is meant to be signed online by QT21 User in the course of the download of
the WMT Data Set. Successful completion of the sign-up procedure shall mean the agreement
of TAUS to use the WMT Data Set in accordance with this Agreement.
+
6.2
+This Agreement and its terms and conditions cannot be assigned by a Party, without the other
Party's prior written consent, such consent not to be unreasonably withheld.
6.3
+This Agreement is open to any legal person or legal entity who intends to use the WMT Data
Set.
6.4
+If one clause is deemed invalid it does not harm the validity of the rest of the agreement.
++ + + +
These terms of use ("Terms of Use") apply to the use of the Dynamic Quality
Framework and the Database, as defined below. Please read these Terms of Use
carefully before using the Dynamic Quality Framework and the Database. The User
(as defined in Clause 1.1. (e) of these Terms of Use) accepts and agrees that the use of
the Dynamic Quality Framework and the Database is governed by these Terms of
Use and that it is bound by these Terms of Use.
1. Definitions
+1.1 The following words and phrases shall have the meanings and definitions set
forth below:
(a) “Affiliate” means an entity (i) which is directly or indirectly controlling such Party;
(i ) which is under the same direct or indirect ownership or control as such Party; or (i i)
which is directly or indirectly owned or controlled by such Party. For the purposes of
these Terms of Use, an entity shall be treated as being controlled by another if that
other entity; (i) has fifty percent (50%) or more of the votes in such entity; or (i ) is able
to direct its affairs and/or to control the composition of its board of directors or
equivalent body;
(b) Dynamic Quality Framework ("DQF") means a platform that consists of resources,
a knowledge base, Reports and tools, maintained and updated by TAUS;
(d) "Reports" means graphical reports, key performance indicators and
downloadable reports as well as the underlying data of the USER on which the
Reports are built, as generated by DQF based on the quality evaluations performed
by users of DQF;
(e) "User" is a party or individual that has paid an admission fee and is officially
registered as a user or a member of TAUS;
(f) "Database" means a collection of Data, systematically selected, processed,
maintained and updated by TAUS with its taxonomy of domain and private index
categories;
(g) "Data" means the Language Data as developed by User or licensed to User by a
third party under terms that allows User to provide the Data in the context of this
Agreement and supplied by User to TAUS for further use by itself, its members and
non-members;
(h) "Derivative Work" means a work based upon one or more preexisting works, such
as Data, in which a work may be recast, transformed or adapted. A work consisting of
editorial revisions, annotations, elaborations or other modifications, which as a whole
represent an original work of authorship, is a derivative work. Non-material
modifications to a preexisting work do not constitute a derivative work;
(i) “IP-Free” means Data that are free of Intellectual Property Rights;
+(j) “Intellectual Property Rights” means the copyrights and the sui generis database
rights of the User with respect to the Data, including any licensed copyrights and sui
generis database rights, but excluding any copyrights, sui generis database and
patent rights to the Database;
(k) "Language Data" means all data consisting of a source side of the translation, and
the matching target side, which has the same meaning as the source side in a
different language and associated metadata, indicating the language pair and other
pertinent information about this source/target pairs;
(l) “Language Data Platform” means the repository and the applications that together
comprise the platform to be used by members and users;
(m) "TAUS" means TAUS B.V., a Netherlands company, currently residing at Oosteinde
9, 1483 AB De Rijp, The Netherlands;
(n) "Taus Academic Rider Agreement" means the agreement attached as Annex 1 to
this Terms of Use to be signed by Academic members;
(o) “Terms of Membership” means the document that describes procedures,
obligations and rights of the members;
(p) “Parties” means TAUS and User;
+ +(q) “Proprietary Information” means all information, which is not known to the public
concerning the business of the User and including, but not limited in form to,
samples, recipes, prototypes, technical reports, manufacturing instructions, drawings
and formulae.
2. Grant of License and user rights to the Data and the Database
+2.1 These Terms of Use set inter alia forth the terms and conditions d under which
User shall supply and license Data to TAUS at no costs. User agrees to use
reasonable efforts to supply Data to TAUS on a regular basis. User grants TAUS a
non-exclusive royalty free worldwide license to use, copy, modify and merge the
Data in connection with the Database and the Language Data platform.
2.2 The Parties recognize the importance of quality of the Database. User has
familiarized itself with the Data and makes sure that the Data is of high quality. It is the
responsibility of the User to undo its Data from Proprietary Information. TAUS must
not knowingly use Data that contains Proprietary Information and TAUS must use
reasonable efforts to refer such Data to User.
2.3 Upon discovery, by either party, that the Data contains Proprietary Information or
other information which User is obligated to keep confidential, the discovering party
shall immediately inform the other party of such discovery. TAUS shall cooperate
fully with User in retrieving and removing such information from the Data, and shall
use best efforts to maintain the confidentiality of such information.
2.4 In consideration of the license grant pursuant to Article 2.1, and subject to Articles
2.5 and 2.6, the User obtains access to the Language Data and the Database provided
that the User is a member of TAUS.
2.5 Access to the Database and the Language Data includes the following limitative
rights:i) the right to use the target side of the translation units into a commercial
product, provided that User may not resell the Data as if it is its own new translation;i )
the right to make Derivative Works; andi i) the right to use or resell such Derivative
Works commercially.
2.6 The right to grant access pursuant to Article 2.5 includes the right to grant such
access to an Affiliate of User or a subcontractor, provided that such Affiliate or such
subcontractor i) will also be bound by all terms and conditions provided for in these
Terms of Use and User being responsible for compliance with the terms and Terms
of Use hereof by its Affiliate or subcontractor and i ) subcontractor is a member of
TAUS Data.
2.7 Any other use or more extensive use of the Data beyond the limited scope of
Articles 2.5 and 2.6, including but not limited to the redistribution, repackaging or
relicensing of the translation units (the original language data and the translation of
the original) in any form or subset, is not allowed.
2.8 Charges for access to the Database and the Language Data will be set out in the
Terms of Membership.
3. Right to use DQF
+3.1 TAUS grants User a personal, non-transferable, non-exclusive right to use DQF in
accordance with these Terms of Use.
3.2 The right to access and use DQF is limited to the remote access and/or use of
DQF by means of electronic access via the Internet for purposes of processing,
retrieving and leveraging the Data and the Reports.
3.3 Except as expressly stipulated in these Terms of Use or except as expressly
allowed by mandatory law, the User may not - nor permit any third party to - (a) copy,
make available, sublicense or otherwise commercialize DQF, (b) modify, translate or
otherwise create a derivative work of DQF, (c) disassemble, decompile or reverse
engineer the object code or source code of DQF.
3.4 TAUS may take technical measures to protect DQF. The User may not remove or
circumvent such technical measures.
3.5 TAUS reserves the right to audit - or to have a third party audit - whether User
complies with the granted rights regarding the use of DQF and the Reports.
3.6 The User is responsible for meeting the technical and functional requirements
(provided by TAUS to the User) in order to be able to access and use DQF. The use of
DQF and/or the Reports is for the USER's own account and risk. The use of electronic
communication facilities in order to gain access to DQF is also for the User's own
account and risk. Unless in case of intent or gross negligence, TAUS will in no event
be liable for any damage, loss or costs, including loss of Reports, or any inability of
the User to use DQF as a result of a shortcoming, defect or other malfunction of the
aforesaid electronic communication facilities. Furthermore, the risk of loss or theft of
or damage to the Reports will at all times be borne by the User.
3.7 The User has access to DQF and the Reports for as long as the User has paid an
admission fee. After a User stops paying admission fees TAUS keeps copies of the
User’s Reports for a period of 12 (twelve) months. If the User restarts using DQF within
12 months after having interrupted the usage, all Reports will still be available. If the
User restarts using DQF more than 12 months after having interrupted the usage, the
Reports will no longer be available.
3.8 Usage of the Reports is personal. TAUS ensures that data used to generate
Reports are anonymous.
3.9 TAUS will not automatically renew the User’s subscription. TAUS will notify the
User before the subscription expires. The User will then have to renew the
subscription.
4. User's obligations / Academic Members
+4.1 The USER warrants that it will correctly and properly use DQF, the Reports, the
Database and/or the Data which includes but is not limited to compliance with the
terms of these Terms of Use. The User may in any case not use DQF, the Reports, the
Database and/or the Data for any acts and/or conduct contrary to the law, public
order, public decency or these Terms of Use. Furthermore, the User's acts and/or
conduct must be in accordance with what may in all respects be expected of a
responsible and diligent User.
4.2 Academic Members (as defined in the TAUS Academic Rider Agreement) are also
bound by the terms and conditions as set forth in the TAUS Academic Rider
Agreement. To this end, Academic Members shall execute the TAUS Academic Rider
Agreement and return a signed copy to TAUS.
5. Intellectual property rights
+5.1 All intellectual and ownership rights, including but not limited to any and all
copyrights, sui generis database rights and patent rights in respect of DQF and the
Database exclusively vest in TAUS and its licensors. Furthermore, TAUS exclusively
owns all rights in any ideas, concepts, know-how, documentation, techniques with
respect to DQF, the Database as well as the technology available on the servers of
TAUS, unless the technology is licensed to TAUS. The User indicates upon submitting
the Data whether the User owns the Intellectual Property Rights to the Data, acts on
behalf of the owner of the Intellectual Property Rights (article 8.1) or submits Data that
are free of Intellectual Property Rights and are as such Fair-to-Share. The User does
not grant TAUS, without the prior written consent from the trademark owner, the right
to use any such trademarks.
6. Functioning of Database and DQF / Liability
+6.1 The Database and DQF are provided "as is" without warranty of any kind, express
or implied, including but not limited to warranties of merchantability, fitness for a
particular purpose and non-infringement. In no event shall TAUS vis-à-vis the User be
liable for any claim, damages or other liability, whether in an action of contract, tort or
otherwise, arising from, out, or in connection with the use of DQF, the Reports, the
Database and the Data.
6.2 TAUS shall not be liable for any damage, loss, demand, liability, claim, cost or
expense (including litigation costs and attorney's fees) of whatever kind, caused by or
resulting from the use of the DQF, the Reports, the Database and the Data.
6.3 This Article does not limit TAUS' liability for direct damages caused by gross
negligence or willful intent by TAUS or the board of directors or the executive
management of TAUS provided that User
7. Infringements
+7.1 User shall have the first right, but not the obligation, to bring any action to prevent
or terminate any infringement, misappropriation or other unauthorized use of the
Intellectual Property Rights licensed to TAUS under these Terms of Use. Within
fifteen (15 days) of any notice from TAUS of any such infringement, misappropriation,
or other unauthorized use, User shall notify TAUS whether User will bring any such
action. If any such action is brought by User, User shall have full control over the
prosecution and settlement or compromise of such action and shall assume all the
expenses and be entitled to all proceeds in respect of such action provided that
TAUS shall have the opportunity to review and comment in advance on any material
substantive filings or proceedings in such action. TAUS, at User’s expense, shall fully
cooperate with and assist User in such action and shall be the nominal plaintiff or join
as a co-plaintiff if and to the extent required by applicable law or requested by User.
7.2 If User in its discretion elects not to pursue any action against a Suspected
Infringer, User will notify TAUS whereupon TAUS may notify User of its desire to
pursue such action in its own name. If the possible infringement can reasonably be
expected to have material adverse effect on TAUS if no action is taken with respect
to the possible infringement, User shall permit TAUS, at its sole expense, to proceed
in its own name with the prosecution of any action with respect to stopping the
possible infringement, provided that User shall have the right to participate in such
action, at its own expense, shall have the opportunity to review and comment in
advance on any material substantive filings or proceedings in such action, and shall
approve of any settlement of any such action, which approval will not be
unreasonably withheld or delayed.
7.3 Notwithstanding the above, User shall have the final decision with regard to
bringing or proceeding with such action. If User, in its sole discretion, determines that
such action would not be in the best interest of User, User shall notify TAUS of such
determination, whereupon TAUS shall not bring such action against Suspected
Infringer, or if such action has commenced, to terminate such action.
8. Representations and Warranties of User
+8.1 User hereby represents and warrants that to the best of its knowledge i) in the
fulfillment of its obligations under these Terms of Use, User will not upload any data
which is violating, infringing or misappropriating any intellectual property rights,
proprietary information or any (trade) secrets of any third party and i ) has the right to
grant to TAUS the licenses contemplated in these Terms of Use. If User is not the
owner of the Intellectual Property Rights, the User will provide the name and contact
details of the owner of the Intellectual Property Rights, or the User will explicitly state
that the Data are free from Intellectual Property Rights.
8.2 User hereby further warrants that to the best of its knowledge Data submissions
do not contain any viruses, worms, spyware, or other components or instructions that
are malicious, deceptive or designed to harm or limit the functionality of a computer.
User warrants that procedures have been put in place that reduce the risk of
contamination of the Data with aforesaid shortcoming.
8.3 User makes no representation or warranty of any nature as to the correctness of
the Data.
8.4 User hereby agrees to indemnify TAUS for, to hold TAUS harmless against and to
reimburse TAUS for, any and all damages and/or expenses (including attorney’s
fees) resulting from any breach of one or more of the representations and warranties
set forth in Article 8.1 hereof, provided that TAUS: (a) provides written notice of the
claim and any such threatened claim promptly to User; (b) gives User sole control of
the defense and settlement of the claim; (c) provides to User, at User's expense, all
available information, assistance and authority to defend; and (d) has not compro
-
+mised or settled such proceeding without User's prior written consent.
+9. Miscellaneous
+9.1 TAUS may (i) suspend access to and/or the use of the DQF and the Database, or
(i ) terminate the granted rights to User, with immediate effect upon written notice if
User breaches the terms of these Terms of Use and/or otherwise acts unlawful
against TAUS (including but not limited to infringing TAUS' rights in DQF and the
Database). If the rights granted to User under these Terms of Use terminate, USER
shall immediately cease using DQF and the Database and destroy any and all entry
codes and/or passwords. Upon termination (for whatever reason) TAUS shall have no
duty or obligation to convert the Reports.
9.2 Dutch law shall govern these terms and Terms of Use. All matters arising out of or
relating to these terms and Terms of Use shall be irrevocably submitted to the
exclusive jurisdiction of the courts of Amsterdam, the Netherlands.
9.3 TAUS may amend these Terms of Use unilaterally. Any such amendments will be
duly reported to the User on beforehand. After such notification, any continued use of
DQF and the Database by User will subsequently constitute acceptance of the Terms
of Use (as amended).
9.4 In the event that one or more provisions of these Terms of Use should be
determined by an arbitral tribunal or court having competent jurisdiction to be null
and void or non-binding, the other provisions of these Terms of Use will continue to
be effective. In such case, the parties are obliged to replace the non-binding
provisions with other provisions that are binding, in such a way that the intended
economic result of the new provisions differs as little as possible from the intended
economic result of the original provisions, taking into account the object and the
purpose of these Terms of Use. If a part or parts of the Terms of Use rendered void,
invalid or unenforceable substantially impair the value of the whole Terms of Use to
any Party, such party may cancel and terminate the Terms of Use by giving written
notice to the other party.
9.5 Any term or condition of a purchase order, invoice or other communication
between the Parties which in any way differ from or add to the terms and Terms of
Use of these Terms of Use will not become binding upon the Parties unless made the
subject of an amendment to these Terms of Use. Either Party's failure to object to any
term or condition contained in any purchase order, invoice or other communication
between the Parties shall not be deemed a waiver of the provisions hereof.
9.6 User may stop using the services of TAUS at any time. Termination of the use of
the services under these Terms of Use does not affect Parties’ rights to use Data that
Parties legitimately obtained prior to the termination. Parties’ obligations and
restrictions as set out in these Terms of Use as regards the use of said Data after
termination will remain in effect.
9.7 Insofar as legally possible, Parties agree to exclude the applicability of articles 6:
227b and 6:227c of the Dutch Civil Code, inter alia, the duty to provide specific
information on e-contracting.
10. Non-Assignment
+10.1 These Terms of Use cannot be assigned by a Party, without the other Party’s prior
written consent, such consent not to be unreasonably withheld.
+Universal Dependencies v1.1 (referred to as "UD" in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the "User") are responsible for complying with the license terms applicable to those parts of UD, which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language directory. +
Treebank | +License | +
---|---|
Basque | +CC BY-NC-SA 3.0 | +
Bulgarian | +CC BY-NC-SA 3.0 | +
Croatian | +CC BY-SA 4.0 | +
Czech | +CC BY-NC-SA 3.0 | +
Danish | +GNU GPL Version 2 | +
English | +CC BY-SA 4.0 | +
Finnish | +CC BY-SA 4.0 | +
Finnish_FTB | +LGPLv3+ or CC BY 4.0 (dual license) | +
French | +CC BY-NC-SA 3.0 US | +
German | +CC BY-NC-SA 3.0 US | +
Greek | +CC BY-NC-SA 3.0 | +
Hebrew | +CC BY-NC-SA 4.0 | +
Hungarian | +CC BY-NC-SA 3.0 | +
Indonesian | +CC BY-NC-SA 3.0 US | +
Irish | +CC BY-SA 3.0 | +
Italian | +CC BY-NC-SA 3.0 | +
Persian | +CC BY-SA 4.0 | +
Spanish | +CC BY-NC-SA 3.0 US | +
Swedish | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL Version 2 | http://opensource.org/licenses/GPL-2.0 |
LGPLv3+ or CC BY 4.0 (dual license) |
+http://creativecommons.org/licenses/by/4.0/ +http://www.gnu.org/licenses/lgpl-3.0.html + |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v1.2 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD, which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Ancient_Greek | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic | +CC BY-NC-SA 3.0 | +
Basque | +CC BY-NC-SA 3.0 | +
Bulgarian | +CC BY-SA 4.0 | +
Croatian | +CC BY-SA 4.0 | +
Czech | +CC BY-NC-SA 3.0 | +
Danish | +GNU GPL 2.0 | +
Dutch | +GNU GPL 3.0 | +
English | +CC BY-SA 4.0 | +
Estonian | +CC BY-NC-SA 3.0 | +
Finnish | +CC BY-SA 4.0 | +
Finnish-FTB | +LGPLv3+ or CC BY 4.0 (dual license) | +
French | +CC BY-NC-SA 3.0 US | +
German | +CC BY-NC-SA 3.0 US | +
Gothic | +CC BY-NC-SA 3.0 | +
Greek | +CC BY-NC-SA 3.0 | +
Hebrew | +CC BY-NC-SA 4.0 | +
Hindi | +CC BY-NC-SA 4.0 | +
Hungarian | +CC BY-NC-SA 3.0 | +
Indonesian | +CC BY-NC-SA 3.0 US | +
Irish | +CC BY-SA 3.0 | +
Italian | +CC BY-NC-SA 3.0 | +
Japanese-KTC | +CC BY-SA 4.0 | +
Latin | +CC BY-NC-SA 2.5 | +
Latin-ITT | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Norwegian | +CC BY-NC-SA | +
Old_Church_Slavonic | +CC BY-NC-SA 3.0 | +
Persian | +CC BY-SA 4.0 | +
Polish | +GNU GPL 3.0 | +
Portuguese | +CC BY-NC-SA 3.0 | +
Romanian | +CC BY-SA 4.0 | +
Slovenian | +CC BY-NC-SA 4.0 | +
Spanish | +CC BY-NC-SA 3.0 US | +
Swedish | +CC BY-SA 4.0 | +
Tamil | +CC BY-NC-SA 3.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPLv3+ or CC BY 4.0 (dual license) |
+http://creativecommons.org/licenses/by/4.0/ +http://www.gnu.org/licenses/lgpl-3.0.html + |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v1.3 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD, which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Ancient_Greek | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic | +CC BY-NC-SA 3.0 | +
Basque | +CC BY-NC-SA 3.0 | +
Bulgarian | +CC BY-NC-SA 3.0 | +
Catalan | +GNU GPL 3.0 | +
Chinese | +CC BY-NC-SA 4.0 | +
Croatian | +CC BY-SA 4.0 | +
Czech | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Danish | +GNU GPL 2.0 | +
Dutch | +GNU GPL 3.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
Estonian | +CC BY-NC-SA 4.0 | +
Finnish | +CC BY-SA 4.0 | +
Finnish-FTB | +LGPLv3+ or CC BY 4.0 (dual license) | +
French | +CC BY-NC-SA 3.0 US | +
Galician | +CC BY-NC-SA 3.0 | +
German | +CC BY-NC-SA 3.0 US | +
Gothic | +CC BY-NC-SA 3.0 | +
Greek | +CC BY-NC-SA 3.0 | +
Hebrew | +CC BY-NC-SA 4.0 | +
Hindi | +CC BY-NC-SA 4.0 | +
Hungarian | +CC BY-NC-SA 3.0 | +
Indonesian | +CC BY-NC-SA 3.0 US | +
Irish | +CC BY-SA 3.0 | +
Italian | +CC BY-NC-SA 3.0 | +
Japanese-KTC | +CC BY-SA 4.0 | +
Kazakh | +CC BY-SA 4.0 | +
Latin | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian | +CC BY-NC-SA 4.0 | +
Norwegian | +CC BY-NC-SA | +
Old_Church_Slavonic | +CC BY-NC-SA 3.0 | +
Persian | +CC BY-SA 4.0 | +
Polish | +GNU GPL 3.0 | +
Portuguese | +CC BY-NC-SA 3.0 | +
Portuguese-BR | +CC BY-NC-SA 3.0 US | +
Romanian | +CC BY-SA 4.0 | +
Russian | +CC BY-NC-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Slovenian | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish | +CC BY-NC-SA 3.0 US | +
Spanish-AnCora | +GNU GPL 3.0 | +
Swedish | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Tamil | +CC BY-NC-SA 3.0 | +
Turkish | +CC BY-NC-SA | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPLv3+ or CC BY 4.0 (dual license) |
+http://creativecommons.org/licenses/by/4.0/ +http://www.gnu.org/licenses/lgpl-3.0.html + |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v1.4 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD, which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Ancient_Greek | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic | +CC BY-NC-SA 3.0 | +
Basque | +CC BY-NC-SA 3.0 | +
Bulgarian | +CC BY-NC-SA 3.0 | +
Catalan | +GNU GPL 3.0 | +
Chinese | +CC BY-NC-SA 4.0 | +
Coptic | +CC BY 4.0 | +
Croatian | +CC BY-SA 4.0 | +
Czech | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Danish | +CC BY-SA 4.0 | +
Dutch | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
Estonian | +CC BY-NC-SA 4.0 | +
Finnish | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
French | +CC BY-NC-SA 3.0 US | +
Galician | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPLLR | +
German | +CC BY-NC-SA 3.0 US | +
Gothic | +CC BY-NC-SA 3.0 | +
Greek | +CC BY-NC-SA 3.0 | +
Hebrew | +CC BY-NC-SA 4.0 | +
Hindi | +CC BY-NC-SA 4.0 | +
Hungarian | +CC BY-NC-SA 3.0 | +
Indonesian | +CC BY-NC-SA 3.0 US | +
Irish | +CC BY-SA 3.0 | +
Italian | +CC BY-NC-SA 3.0 | +
Japanese | +CC BY-NC-SA 3.0 US | +
Japanese-KTC | +CC BY-SA 4.0 | +
Kazakh | +CC BY-SA 4.0 | +
Latin | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian | +CC BY-NC-SA 4.0 | +
Norwegian | +CC BY-NC-SA | +
Old_Church_Slavonic | +CC BY-NC-SA 3.0 | +
Persian | +CC BY-SA 4.0 | +
Polish | +GNU GPL 3.0 | +
Portuguese | +CC BY-NC-SA 3.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-BR | +CC BY-NC-SA 3.0 US | +
Romanian | +CC BY-SA 4.0 | +
Russian | +CC BY-NC-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Sanskrit | +CC BY-SA 4.0 | +
Slovak | +CC BY-SA 4.0 | +
Slovenian | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish | +CC BY-NC-SA 3.0 US | +
Spanish-AnCora | +GNU GPL 3.0 | +
Swedish | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish_Sign_Language | +CC BY-SA 4.0 | +
Tamil | +CC BY-NC-SA 3.0 | +
Turkish | +CC BY-NC-SA | +
Ukrainian | +CC BY-NC-SA 4.0 | +
Uyghur | +CC BY-SA 4.0 | +
Vietnamese | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPLLR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v2.0 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Ancient_Greek | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic | +CC BY-NC-SA 3.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Basque | +CC BY-NC-SA 3.0 | +
Belarusian | +CC BY-SA 4.0 | +
Bulgarian | +CC BY-NC-SA 3.0 | +
Catalan | +GNU GPL 3.0 | +
Chinese | +CC BY-NC-SA 4.0 | +
Coptic | +CC BY 4.0 | +
Croatian | +CC BY-SA 4.0 | +
Czech | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Danish | +CC BY-SA 4.0 | +
Dutch | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English | +CC BY-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
Estonian | +CC BY-NC-SA 4.0 | +
Finnish | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
French | +CC BY-NC-SA 3.0 US | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-Sequoia | +LGPLLR | +
Galician | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPLLR | +
German | +CC BY-NC-SA 3.0 US | +
Gothic | +CC BY-NC-SA 3.0 | +
Greek | +CC BY-NC-SA 3.0 | +
Hebrew | +CC BY-NC-SA 4.0 | +
Hindi | +CC BY-NC-SA 4.0 | +
Hungarian | +CC BY-NC-SA 3.0 | +
Indonesian | +CC BY-NC-SA 3.0 US | +
Irish | +CC BY-SA 3.0 | +
Italian | +CC BY-NC-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Japanese | +CC BY-NC-SA 3.0 US | +
Kazakh | +CC BY-SA 4.0 | +
Korean | +CC BY-NC-SA 3.0 US | +
Latin | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian | +CC BY-NC-SA 4.0 | +
Lithuanian | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-NC-SA | +
Norwegian-Nynorsk | +CC BY-NC-SA | +
Old_Church_Slavonic | +CC BY-NC-SA 3.0 | +
Persian | +CC BY-SA 4.0 | +
Polish | +GNU GPL 3.0 | +
Portuguese | +CC BY-SA 4.0 | +
Portuguese-BR | +CC BY-NC-SA 3.0 US | +
Romanian | +CC BY-SA 4.0 | +
Russian | +CC BY-NC-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Sanskrit | +CC BY-SA 4.0 | +
Slovak | +CC BY-SA 4.0 | +
Slovenian | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish | +CC BY-NC-SA 3.0 US | +
Spanish-AnCora | +GNU GPL 3.0 | +
Swedish | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Tamil | +CC BY-NC-SA 3.0 | +
Turkish | +CC BY-NC-SA | +
Ukrainian | +CC BY-NC-SA 4.0 | +
Urdu | +CC BY-NC-SA 4.0 | +
Uyghur | +CC BY-SA 4.0 | +
Vietnamese | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPLLR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v2.1 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Afrikaans | +CC BY-SA 4.0 | +
Ancient_Greek | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic | +CC BY-NC-SA 3.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Basque | +CC BY-NC-SA 3.0 | +
Belarusian | +CC BY-SA 4.0 | +
Bulgarian | +CC BY-NC-SA 3.0 | +
Buryat | +CC BY-SA 4.0 | +
Cantonese | +CC BY-SA 4.0 | +
Catalan | +GNU GPL 3.0 | +
Chinese | +CC BY-NC-SA 4.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 4.0 | +
Coptic | +CC BY 4.0 | +
Croatian | +CC BY-SA 4.0 | +
Czech | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish | +CC BY-SA 4.0 | +
Dutch | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English | +CC BY-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
Estonian | +CC BY-NC-SA 4.0 | +
Finnish | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
French | +CC BY-NC-SA 3.0 US | +
French-FTB | +LGPLLR | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-Sequoia | +LGPLLR | +
Galician | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPLLR | +
German | +CC BY-NC-SA 3.0 US | +
German-PUD | +CC BY-SA 3.0 | +
Gothic | +CC BY-NC-SA 3.0 | +
Greek | +CC BY-NC-SA 3.0 | +
Hebrew | +CC BY-NC-SA 4.0 | +
Hindi | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hungarian | +CC BY-NC-SA 3.0 | +
Indonesian | +CC BY-NC-SA 3.0 US | +
Irish | +CC BY-SA 3.0 | +
Italian | +CC BY-NC-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-PUD | +CC BY-SA 3.0 | +
Japanese | +CC BY-NC-SA 3.0 US | +
Japanese-PUD | +CC BY-SA 3.0 | +
Kazakh | +CC BY-SA 4.0 | +
Korean | +CC BY-NC-SA 3.0 US | +
Kurmanji | +CC BY-SA 4.0 | +
Latin | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian | +CC BY-NC-SA 4.0 | +
Lithuanian | +CC BY-SA 4.0 | +
Marathi | +CC BY-SA 4.0 | +
North Sami | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic | +CC BY-NC-SA 3.0 | +
Persian | +CC BY-SA 4.0 | +
Polish | +GNU GPL 3.0 | +
Portuguese | +CC BY-SA 4.0 | +
Portuguese-BR | +CC BY-NC-SA 3.0 US | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian | +CC BY-SA 4.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Russian | +CC BY-NC-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Sanskrit | +CC BY-SA 4.0 | +
Serbian | +CC BY-SA 4.0 | +
Slovak | +CC BY-SA 4.0 | +
Slovenian | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish | +CC BY-NC-SA 3.0 US | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish Sign Language | +CC BY-SA 4.0 | +
Tamil | +CC BY-NC-SA 3.0 | +
Telugu | +CC BY-SA 4.0 | +
Turkish | +CC BY-NC-SA | +
Turkish-PUD | +CC BY-SA 3.0 | +
Ukrainian | +CC BY-NC-SA 4.0 | +
Upper Sorbian | +CC BY-SA 4.0 | +
Urdu | +CC BY-NC-SA 4.0 | +
Uyghur | +CC BY-SA 4.0 | +
Vietnamese | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPLLR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v2.2 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +GNU GPL 3.0 | +
Chinese-GSD | +CC BY-NC-SA 4.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 4.0 | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
French-GSD | +CC BY-NC-SA 3.0 US | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-Sequoia | +LGPLLR | +
French-Spoken | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPLLR | +
German-GSD | +CC BY-NC-SA 3.0 US | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Indonesian-GSD | +CC BY-NC-SA 3.0 US | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-PUD | +CC BY-SA 3.0 | + +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-NC-SA 3.0 US | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-NC-SA 3.0 US | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian-LVTB | +CC BY-NC-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | + +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-SZ | +GNU GPL 3.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-NC-SA 3.0 US | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-NC-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish-GSD | +CC BY-NC-SA 3.0 US | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | + +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Turkish-IMST | +CC BY-NC-SA | +
Turkish-PUD | +CC BY-SA 3.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPLLR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-ND 3.0 | http + ://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v2.3 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Akkadian-PISANDUB | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Bambara-CRB | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +GNU GPL 3.0 | +
Chinese-GSD | +CC BY-NC-SA 4.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 4.0 | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
Erzya-JR | +CC BY-SA 4.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
French-FTB | +LGPLLR | +
French-GSD | +CC BY-NC-SA 3.0 US | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-Sequoia | +LGPLLR | +
French-Spoken | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPLLR | +
German-GSD | +CC BY-NC-SA 3.0 US | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hindi_English-HIENCS | +CC BY-SA 4.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Indonesian-GSD | +CC BY-NC-SA 3.0 US | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-PUD | +CC BY-SA 3.0 | + +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-NC-SA 3.0 US | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-NC-SA 3.0 US | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian-LVTB | +CC BY-NC-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Maltese-MUDT | +CC BY-SA 4.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | + +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-SZ | +GNU GPL 3.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-NC-SA 3.0 US | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-NC-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish-GSD | +CC BY-NC-SA 3.0 US | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | + +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Turkish-IMST | +CC BY-NC-SA | +
Turkish-PUD | +CC BY-SA 3.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPLLR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-ND 3.0 | http://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Universal Dependencies v2.4 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Akkadian-PISANDUB | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Assyrian-AS | +CC BY-SA 4.0 | +
Bambara-CRB | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +GNU GPL 3.0 | +
Chinese-GSD | +CC BY-NC-SA 4.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 4.0 | +
Classical_Chinese-Kyoto | +PD | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
Erzya-JR | +CC BY-SA 4.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Estonian-EWT | +CC BY-NC-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
French-FQB | +LGPL-LR | +
French-FTB | +LGPL-LR | +
French-GSD | +CC BY-NC-SA 3.0 US | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-Sequoia | +LGPL-LR | +
French-Spoken | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPL-LR | +
German-GSD | +CC BY-NC-SA 3.0 US | +
German-HDT | +CC BY-SA 4.0 | +
German-LIT | +CC BY-NC-SA 4.0 | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hindi_English-HIENCS | +CC BY-SA 4.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Indonesian-GSD | +CC BY-NC-SA 3.0 US | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-PUD | +CC BY-SA 3.0 | +
Italian-VIT | +CC BY--NC-SA 3.0 | +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-NC-SA 3.0 US | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Karelian-KKPP | +CC BY-SA 4.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-NC-SA 3.0 US | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian-LVTB | +CC BY-NC-SA 4.0 | +
Lithuanian-ALKSNIS | +CC BY-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Maltese-MUDT | +CC BY-SA 4.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Mbya_Guarani-Dooley | +CC BY-SA 4.0 | +
Mbya_Guarani-Thomas | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Old_Russian-RNC | +CC BY-SA 4.0 | +
Old_Russian-TOROT | +CC BY-NC-SA 3.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-PDB | +CC BY-NC-SA 4.0 | +
Polish-PUD | +CC BY-SA 4.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-NC-SA 3.0 US | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-NC-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-GSD | +CC BY-NC-SA 3.0 US | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | + +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Turkish-GB | +CC BY-SA 4.0 | +
Turkish-IMST | +CC BY-NC-SA | +
Turkish-PUD | +CC BY-SA 3.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Welsh-CCG | +CC BY-SA 4.0 | +
Wolof-WTB | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-ND 3.0 | http://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
PD | public domain |
+Universal Dependencies v2.5 (referred to as “UD” in the rest of this document) is a collection of linguistic data and tools. +Each of the treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UD which you use. If you do not agree with the license terms, you must stop using UD and destroy all copies of UD data that you have obtained. +
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The additional software tools are provided as-is (without any warranty) and are redistributed under GNU GPL Version 2. +
+The license for every treebank included in the release is specified in the appropriate language/treebank directory. +
Treebank | +License | +
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Akkadian-PISANDUB | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Assyrian-AS | +CC BY-SA 4.0 | +
Bambara-CRB | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Bhojpuri-BHTB | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +GNU GPL 3.0 | +
Chinese-GSD | +CC BY-SA 4.0 | +
Chinese-GSDSimp | +CC BY-SA 4.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 4.0 | +
Classical_Chinese-Kyoto | +PD | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-Pronouns | +CC BY-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
Erzya-JR | +CC BY-SA 4.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Estonian-EWT | +CC BY-NC-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
French-FQB | +LGPL-LR | +
French-FTB | +LGPL-LR | +
French-GSD | +CC BY-SA 4.0 | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-Sequoia | +LGPL-LR | +
French-Spoken | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPL-LR | +
German-GSD | +CC BY-SA 4.0 | +
German-HDT | +CC BY-SA 4.0 | +
German-LIT | +CC BY-NC-SA 4.0 | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hindi_English-HIENCS | +CC BY-SA 4.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Indonesian-GSD | +CC BY-SA 4.0 | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-PUD | +CC BY-SA 3.0 | +
Italian-VIT | +CC BY-NC-SA 3.0 | +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-SA 4.0 | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Karelian-KKPP | +CC BY-SA 4.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Komi_Permyak-UH | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-SA 4.0 | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latvian-LVTB | +CC BY-SA 4.0 | +
Lithuanian-ALKSNIS | +CC BY-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Livvi-KKPP | +CC BY-SA 4.0 | +
Maltese-MUDT | +CC BY-SA 4.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Mbya_Guarani-Dooley | +CC BY-NC-SA 4.0 | +
Mbya_Guarani-Thomas | +CC BY-NC-SA 4.0 | +
Moksha-JR | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Old_Russian-RNC | +CC BY-SA 4.0 | +
Old_Russian-TOROT | +CC BY-NC-SA 3.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-PDB | +CC BY-NC-SA 4.0 | +
Polish-PUD | +CC BY-SA 4.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-SA 4.0 | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Romanian-SiMoNERo | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-SA 4.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Scottish_Gaelic-ARCOSG | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Skolt_Sami-Giellagas | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-GSD | +CC BY-SA 4.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | +
Swiss_German-UZH | +CC BY-SA 4.0 | +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Turkish-GB | +CC BY-SA 4.0 | +
Turkish-IMST | +CC BY-NC-SA | +
Turkish-PUD | +CC BY-SA 3.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Welsh-CCG | +CC BY-SA 4.0 | +
Wolof-WTB | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-ND 3.0 | http://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
PD | public domain |
Universal Derivations v0.5 (referred to as “UDer” in the rest of this document) is a collection of linguistic data. Each of the resource has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UDer which you use. If you do not agree with the license terms, you must stop using UDer and destroy all copies of UDer data that you have obtained.
+You are specifically reminded that some of the treebanks permit only non-commercial usage. +
+The license for every resource included in the release is specified in the appropriate language/resource directory. +
Resource | +License | +
---|---|
cs-DeriNet | +CC BY-NC-SA 3.0 | +
de-DErivBase | +CC BY-SA 3.0 | +
en-WordNet | +CC BY-NC-SA 3.0 | +
es-DeriNetES | +CC BY-NC-SA 3.0 | +
et-EstWordNet | +CC BY-SA 3.0 | +
fa-DeriNetFA | +CC BY-NC-SA 4.0 | +
fi-FinnWordNet | +CC BY 3.0 | +
fr-Demonette | +CC BY-NC-SA 3.0 | +
la-WFL | +CC BY-NC-SA 4.0 | +
pl-PolishWFN | +CC BY-NC-SA 3.0 | +
pt-NomLexPT | +CC BY 4.0 | +
License | +URL | +
---|---|
CC BY-NC-SA 3.0 | https://creativecommons.org/licenses/by-nc-sa/3.0/legalcode |
CC BY-SA 3.0 | https://creativecommons.org/licenses/by-sa/3.0/legalcode |
CC BY-NC-SA 4.0 | https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode |
CC BY 3.0 | https://creativecommons.org/licenses/by/3.0/legalcode |
CC BY 4.0 | https://creativecommons.org/licenses/by/4.0/legalcode |
Universal Derivations v1.0 (referred to as “UDer” in the rest of this document) is a collection of linguistic + data. Each of the resource has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UDer which you use. If you do not agree with the license terms, you must stop using UDer and destroy all copies of UDer data that you have obtained.
+You are specifically reminded that some of the resources permit only non-commercial usage. +
+The license for every resource included in the release is specified in the appropriate language/resource directory. +
Resource | +License | +
---|---|
ca-EtymWordNetCA | +CC BY-SA 3.0 | +
cs-DeriNet | +CC BY-NC-SA 3.0 | +
cs-EtymWordNetCS | +CC BY-SA 3.0 | +
de-DErivBase | +CC BY-SA 3.0 | +
de-GCelex (scripts) | +GPL-3.0 | +
du-DCelex (scripts) | +GPL-3.0 | +
en-CatVar | +OSL-1.1 | +
en-ECelex (scripts) | +GPL-3.0 | +
en-WordNet | +CC BY-NC-SA 3.0 | +
es-DeriNetES | +CC BY-NC-SA 3.0 | +
et-EstWordNet | +CC BY-SA 3.0 | +
fa-DeriNetFA | +CC BY-NC-SA 4.0 | +
fi-FinnWordNet | +CC BY-SA 4.0 | +
fr-Demonette | +CC BY-NC-SA 3.0 | +
gd-EtymWordNetGD | +CC BY-SA 3.0 | +
hr-DerivBaseHR | +CC BY-SA 3.0 | +
it-DerIvaTario | +CC BY-SA 4.0 | +
la-WFL | +CC BY-NC-SA 4.0 | +
pl-EtymWordNetPL | +CC BY-SA 3.0 | +
pl-PolishWFN | +CC BY-NC-SA 3.0 | +
pt-EtymWordNetPT | +CC BY-SA 3.0 | +
pt-NomLexPT | +CC BY-SA 4.0 | +
ru-DerivBaseRU | +Apache-2.0 | +
ru-EtymWordNetRU | +CC BY-SA 3.0 | +
sh-EtymWordNetSH | +CC BY-SA 3.0 | +
sv-EtymWordNetSV | +CC BY-SA 3.0 | +
tr-EtymWordNetTR | +CC BY-SA 3.0 | +
License | +URL | +
---|---|
CC BY-NC-SA 4.0 | +https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode | +
CC BY-NC-SA 3.0 | +https://creativecommons.org/licenses/by-nc-sa/3.0/legalcode | +
CC BY-SA 4.0 | +https://creativecommons.org/licenses/by-sa/4.0/legalcode | +
CC BY-SA 3.0 | +https://creativecommons.org/licenses/by-sa/3.0/legalcode | +
Apache-2.0 | +https://www.apache.org/licenses/LICENSE-2.0.txt | +
GPL-3.0 | +https://www.gnu.org/licenses/gpl-3.0.html | +
OSL-1.1 | +https://fedoraproject.org/wiki/Licensing/OSL1.1 | +
Universal Derivations v1.1 (referred to as “UDer” in the rest of this document) is a collection of linguistic + data. Each of the resource has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UDer which you use. If you do not agree with the license terms, you must stop using UDer and destroy all copies of UDer data that you have obtained.
+You are specifically reminded that some of the resources permit only non-commercial usage. +
+The license for every resource included in the release is specified in the appropriate language/resource directory. +
Resource | +License | +
---|---|
ca-EtymWordNetCA | +CC BY-SA 3.0 | +
cs-DeriNet | +CC BY-NC-SA 3.0 | +
cs-EtymWordNetCS | +CC BY-SA 3.0 | +
de-DErivBase | +CC BY-SA 3.0 | +
de-GCelex (scripts) | +GPL-3.0 | +
du-DCelex (scripts) | +GPL-3.0 | +
en-CatVar | +OSL-1.1 | +
en-ECelex (scripts) | +GPL-3.0 | +
en-WordNet | +CC BY-NC-SA 3.0 | +
es-DeriNetES | +CC BY-NC-SA 3.0 | +
et-EstWordNet | +CC BY-SA 3.0 | +
fa-DeriNetFA | +CC BY-NC-SA 4.0 | +
fi-FinnWordNet | +CC BY-SA 4.0 | +
fr-Demonette | +CC BY-NC-SA 3.0 | +
gd-EtymWordNetGD | +CC BY-SA 3.0 | +
hr-CroDeriV | +CC BY-NC-SA 3.0 | +
hr-DerivBaseHR | +CC BY-SA 3.0 | +
it-DerIvaTario | +CC BY-SA 4.0 | +
la-WFL | +CC BY-NC-SA 4.0 | +
pl-EtymWordNetPL | +CC BY-SA 3.0 | +
pl-PolishWFN | +CC BY-NC-SA 3.0 | +
pt-EtymWordNetPT | +CC BY-SA 3.0 | +
pt-NomLexPT | +CC BY-SA 4.0 | +
ru-DerivBaseRU | +Apache-2.0 | +
ru-DeriNetRU | +CC BY-NC-SA 4.0 | +
ru-EtymWordNetRU | +CC BY-SA 3.0 | +
ru-GoldenCompoundAnalyses | +CC BY-NC 4.0 | +
sh-EtymWordNetSH | +CC BY-SA 3.0 | +
sl-Sloleks | +CC BY-NC-SA 4.0 | +
sv-EtymWordNetSV | +CC BY-SA 3.0 | +
tr-EtymWordNetTR | +CC BY-SA 3.0 | +
License | +URL | +
---|---|
CC BY-NC 4.0 | +https://creativecommons.org/licenses/by-nc/4.0/legalcode | +
CC BY-NC-SA 4.0 | +https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode | +
CC BY-NC-SA 3.0 | +https://creativecommons.org/licenses/by-nc-sa/3.0/legalcode | +
CC BY-SA 4.0 | +https://creativecommons.org/licenses/by-sa/4.0/legalcode | +
CC BY-SA 3.0 | +https://creativecommons.org/licenses/by-sa/3.0/legalcode | +
Apache-2.0 | +https://www.apache.org/licenses/LICENSE-2.0.txt | +
GPL-3.0 | +https://www.gnu.org/licenses/gpl-3.0.html | +
OSL-1.1 | +https://fedoraproject.org/wiki/Licensing/OSL1.1 | +
+HamleDT 2.0 (referred to as "HamleDT" in the rest of this document) is a collection of linguistic textual data in multiple languages. It is based on pre-existing data sets ("original treebanks"). Each of the original treebanks has its own license terms and you (the "User") are responsible for complying with the license terms applicable to those parts of HamleDT, which you use. If you do not agree with the license terms, you must stop using HamleDT and destroy all copies of HamleDT data that you have obtained. +
+You are specifically reminded that some of the original treebanks permit only non-commercial usage. +
+The additional tree transformations and the software performing the transformations is copyright Charles University, Faculty of Mathematics and Physics, Institute of Formal and Applied Linguistics ("we" or the "Provider"). It is provided as-is (without any warranty) and may be freely used, modified and redistributed under the GNU General Public License version 3.0 or the Perl Artistic License version 1.0. +
+The treebanks in HamleDT are organized in two groups: "Free" and "Patch". The Free group consists of treebanks whose license terms permit us redistributing them in full. For treebanks in the Patch group, we provide only our transformed annotation, without the underlying texts, lemmas and part of speech tags. If you legally obtained an original treebank, you can use the corresponding patch to transform the treebank to its HamleDT form. +
Lang. | +Treebank | +Web | +License | +
---|---|---|---|
ar | +Prague Arabic Dependency Treebank | +http://ufal.mff.cuni.cz/padt | +CC BY-NC-SA 3.0 | +
cs | +Prague Dependency Treebank | +http://ufal.mff.cuni.cz/pdt3.0 | +CC BY-NC-SA 3.0 | +
da | +CoNLL 2006 | +http://www.buch-kromann.dk/matthias/treebank/ | +GPL 3 | +
et | +Eesti keele puudepank | +http://vvv.cs.ut.ee/~kaili/Korpus/puud/ | +free download | +
fa | +Persian Dependency Treebank | +http://dadegan.ir/en/perdt | +GPL 3* | +
fi | +Turku Dependency Treebank | +http://bionlp.utu.fi/fintreebank.html | +CC BY-SA 3.0 | +
grc | +Ancient Greek Dependency Treebank | +http://nlp.perseus.tufts.edu/syntax/treebank/ | +CC BY-NC-SA 2.5 | +
la | +Latin Dependency Treebank | +http://nlp.perseus.tufts.edu/syntax/treebank/ | +CC BY-NC-SA 2.5 | +
nl | +CoNLL 2006 (Alpino) | +http://odur.let.rug.nl/~vannoord/trees/ | +GPL | +
pt | +CoNLL 2006 (Floresta Sintá(c)tica) | +http://www.linguateca.pt/Floresta/principal.html | +CC BY-NC-SA 3.0 | +
ro | +Resurse pentru Gramaticile de Dependenta | +http://www.phobos.ro/roric/texts/indexro.html | +free download | +
sv | +CoNLL 2006 (Talbanken05) | +http://stp.lingfil.uu.se/~nivre/research/Talbanken05.html | +research*, cite | +
ta | +Tamil Dependency Treebank | +http://ufal.mff.cuni.cz/~ramasamy/tamiltb/0.1/ | +CC BY-NC-SA 3.0 | +
Lang. | +Treebank | +Web | +
---|---|---|
bg | BulTreeBank / CoNLL 2006 | http://www.bultreebank.org/indexBTB.html | +
bn | Hyderabad Dependency Treebank / ICON 2010 | + |
ca | AnCora-CA | http://clic.ub.edu/corpus/ | +
de | TIGER Corpus / CoNLL 2009 | http://www.ims.uni-stuttgart.de/forschung/ressourcen/korpora/tiger.html | +
el | Greek Dependency Treebank / CoNLL 2007 | + |
en | Penn Treebank / CoNLL 2007 | http://www.cis.upenn.edu/~treebank/ | +
es | AnCora-ES | http://clic.ub.edu/corpus/ | +
eu | Basque Dependency Treebank | + |
hi | Hyderabad Dependency Treebank / COLING 2012 | + |
hu | Szeged Treebank | http://www.inf.u-szeged.hu/projectdirs/hlt/hu/Treebank/treebank2.html | +
it | Italian Syntactic-Semantic Treebank / CoNLL 2007 | http://www.ilc.cnr.it/viewpage.php/sez=ricerca/id=874/vers=ing | +
ja | Tübingen Treebank of Spoken Japanese (Tüba-J/S) | http://www.sfs.uni-tuebingen.de/en/ascl/resources/corpora/tueba-js.html | +
ru | SynTagRus | http://www.ruscorpora.ru/en/search-syntax.html | +
sk | Slovak Treebank | http://korpus.sk/ | +
sl | Slovene Dependency Treebank | http://nl.ijs.si/sdt/ | +
te | Hyderabad Dependency Treebank / ICON 2010 | + |
tr | METU-Sabanci (ODTÜ-Sabancı) Treebank | http://ii.metu.edu.tr/corpus | +
CC BY-NC-SA 3.0 http://creativecommons.org/licenses/by-nc-sa/3.0/
+CC BY-SA 3.0 http://creativecommons.org/licenses/by-sa/3.0/
+CC BY-NC-SA 2.5 http://creativecommons.org/licenses/by-nc-sa/2.5/
+GPL http://www.gnu.org/licenses/gpl.html
+fa: Persian Dependency Treebank: The download page contained the statement "I will use the treebank for research purposes only." The "Readme and Licence.txt" file says "only non-commercially". However, the included license is the standard GPL 3 (without any restrictions).
+sv: Talbanken05: The download page was saying at the time of retrieval: "The treebank comes with no guarantee but is freely available for research and educational purposes as long as proper credit is given for the work done to produce the material (both in Lund and in Växjö)."
+ ++The following research papers should be cited to give proper credit to the creators of the original treebanks and to us, the creators of HamleDT. +
+ +HamleDT 2.0: Rudolf Rosa, Jan Mašek, David Mareček, Martin Popel, Daniel Zeman, Zdeněk Žabokrtský (2014): HamleDT 2.0: Thirty Dependency Treebanks Stanfordized. In Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC 2014), pp. 2334–2341. ELDA, Reykjavík, Iceland.
+ar: Otakar Smrž, Viktor Bielický, Iveta Kouřilová, Jakub Kráčmar, Jan Hajič, Petr Zemánek (2008): Prague Arabic Dependency Treebank: A Word on the Million Words. In Proceedings of the Workshop on Arabic and Local Languages (LREC 2008), pp. 16–23. ELDA, Marrakech, Morocco.
+bg: Kiril Simov, Petya Osenova (2005): Extending the Annotation of BulTreeBank: Phase 2. In The Fourth Workshop on Treebanks and Linguistic Theories (TLT 2005), pp. 173–184. Barcelona, Spain.
+ca, es: Mariona Taulé, Maria Antònia Martí, Marta Recasens (2008): AnCora: Multilevel Annotated Corpora for Catalan and Spanish. In Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC 2008). ELDA, Marrakech, Morocco.
+cs: Eduard Bejček, Eva Hajičová, Jan Hajič, Pavlína Jínová, Václava Kettnerová, Veronika Kolářová, Marie Mikulová, Jiří Mírovský, Anna Nedoluzhko, Jarmila Panevová, Lucie Poláková, Magda Ševčíková, Jan Štěpánek, Šárka Zikánová (2013): Prague Dependency Treebank 3.0. http://hdl.handle.net/11858/00-097C-0000-0023-1AAF-3. Charles University in Prague, ÚFAL, Praha, Czechia.
+da: Matthias T. Kromann, Line Mikkelsen, Stine Kern Lynge (2004): Danish Dependency Treebank. http://code.google.com/p/copenhagen-dependency-treebank/. København, Denmark.
+de: Sabine Brants, Stefanie Dipper, Silvia Hansen, Wolfgang Lezius, George Smith (2002): The TIGER Treebank. In Proceedings of the Workshop on Treebanks and Linguistic Theories. Sozopol, Bulgaria.
+el: Prokopis Prokopidis, Elina Desipri, Maria Koutsombogera, Harris Papageorgiou, Stelios Piperidis (2005): Theoretical and Practical Issues in the Construction of a Greek Dependency Treebank. In Proceedings of the Fourth Workshop on Treebanks and Linguistic Theories (TLT 2005), pp. 149–160. Barcelona, Spain.
+en: Mitchell P. Marcus, Beatrice Santorini, Mary Ann Marcinkiewicz (1993): Building a Large Annotated Corpus of English: The Penn Treebank. In Computational Linguistics 19:2, pp. 313–330.
+et: Eckhard Bick, Heli Uibo, Kaili Müürisep (2004): Arborest – a VISL-Style Treebank Derived from an Estonian Constraint Grammar Corpus. In Proceedings of Treebanks and Linguistic Theories (TLT 2004).
+eu: Itzair Aduriz, María Jesús Aranzabe, Jose Mari Arriola, Aitziber Atutxa, Arantza Díaz de Ilarraza, Aitzpea Garmendia, Maite Oronoz (2003): Construction of a Basque Dependency Treebank. In Proceedings of the Second Workshop on Treebanks and Linguistic Theories (TLT 2003).
+fa: Mohammad Sadegh Rasooli, Amirsaeid Moloodi, Manouchehr Kouhestani, Behrouz Minaei-Bidgoli (2011): A Syntactic Valency Lexicon for Persian Verbs: The First Steps towards Persian Dependency Treebank. In 5th Language and Technology Conference (LTC): Human Language Technologies as a Challenge for Computer Science and Linguistics, pp. 227–231. Poznań, Poland.
+fi: Katri Haverinen, Timo Viljanen, Veronika Laippala, Samuel Kohonen, Filip Ginter, Tapio Salakoski (2010): Treebanking Finnish. In Proceedings of the Ninth International Workshop on Treebanks and Linguistic Theories (TLT9), pp. 79–90.
+grc, la: David Bamman, Gregory Crane (2011): The Ancient Greek and Latin Dependency Treebanks. In Language Technology for Cultural Heritage, pp. 79–98. ISBN 978-3-642-20227-8. Springer, Berlin / Heidelberg, Germany.
+it: Simonetta Montemagni, Francesco Barsotti, Marco Battista, Nicoletta Calzolari, Ornella Corazzari, Alessandro Lenci, Antonio Zampolli, Francesca Fanciulli, Maria Massetani, Remo Raffaelli, Roberto Basili, Maria Teresa Pazienza, Dario Saracino, Fabio Zanzotto, Nadia Mana, Fabio Pianesi, Rodolfo Delmonte (2003): Building the Italian Syntactic-Semantic Treebank. In Anne Abeillé (ed.): Building and Using Parsed Corpora, pp. 189–210. Kluwer, Dordrecht, Netherlands.
+hi, bn, te: Samar Husain, Prashanth Mannem, Bharat Ambati, Phani Gadde (2010): The ICON-2010 Tools Contest on Indian Language Dependency Parsing. In Proceedings of ICON-2010 Tools Contest on Indian Language Dependency Parsing. Kharagpur, India.
+hu: Dóra Csendes, János Csirik, Tibor Gyimóthy, András Kocsor (2005): The Szeged Treebank. In Text, Speech and Dialogue (TSD), pp. 123–131. Springer, Berlin / Heidelberg, Germany.
+ja: Yasuhiro Kawata, Julia Bartels (2000): Stylebook for the Japanese Treebank in Verbmobil, Report 240. Universität Tübingen, Tübingen, Germany.
+nl: Leonoor van der Beek, Gosse Bouma, Jan Daciuk, Tanja Gaustad, Robert Malouf, Gertjan van Noord, Robbert Prins, Begoña Villada (2002): Chapter 5. The Alpino Dependency Treebank. In Algorithms for Linguistic Processing NWO PIONIER Progress Report. Groningen, Netherlands.
+pt: Susana Afonso, Eckhard Bick, Renato Haber, Diana Santos (2002): "Floresta sintá(c)tica": A Treebank for Portuguese. In Proceedings of the Third International Conference on Language Resources and Evaluation (LREC 2002). ELDA, Las Palmas, Spain.
+ro: Mihaela Călăcean (2008): Data-driven Dependency Parsing for Romanian. Uppsala Universitet, Uppsala, Sweden.
+ru: Igor Boguslavsky, Svetlana Grigorieva, Nikolai Grigoriev, Leonid Kreidlin, Nadezhda Frid (2000): Dependency Treebank for Russian: Concept, Tools, Types of Information. In Proceedings of the 18th Conference on Computational Linguistics, vol. 2, pp. 987–991. ACL, Morristown, NJ, USA.
+sk: Mária Šimková, Radovan Garabík (2006): Синтаксическая разметка в Словацком национальном корпусе. In Tруды международной конференции Корпусная лингвистика – 2006, pp. 389–394. ISBN 5-288-04181-4. St. Petersburg University Press, Sankt-Peterburg, Russia.
+sl: Sašo Džeroski, Tomaž Erjavec, Nina Ledinek, Petr Pajas, Zdeněk Žabokrtský, Andreja Žele (2006): Towards a Slovene Dependency Treebank. In Proceedings of the Fifth International Conference on Language Resources and Evaluation (LREC 2006), pp. 1388–1391. ELDA, Genova, Italy.
+sv: Joakim Nivre, Jens Nilsson, Johan Hall (2006): Talbanken05: A Swedish Treebank with Phrase Structure and Dependency Annotation. In Proceedings of the Fifth International Conference on Language Resources and Evaluation (LREC 2006). ELDA, Genova, Italy.
+ta: Loganathan Ramasamy, Zdeněk Žabokrtský (2012): Prague Dependency Style Treebank for Tamil. In Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC 2012). ELDA, İstanbul, Turkey.
+tr: Nart B. Atalay, Kemal Oflazer, Bilge Say (2003): The Annotation Process in the Turkish Treebank. In Proceedings of the 4th International Workshop on Linguistically Interpreted Corpora (LINC). EACL, Budapest, Hungary.
+ ++ HamleDT 3.0 (referred to as “HamleDT” in the rest of this document) is a collection of linguistic textual data in multiple languages. It is based on pre-existing data sets (“original treebanks”). Each of the original treebanks has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of HamleDT, which you use. If you do not agree with the license terms, you must stop using HamleDT and destroy all copies of HamleDT data that you have obtained. +
+ You are specifically reminded that some of the original treebanks permit only non-commercial usage. +
+ The treebanks in HamleDT are organized in two groups: “Free” and “Patch”. The Free group consists of treebanks whose license terms permit us redistributing them in full. For treebanks in the Patch group, we provide only our transformed annotation, without the underlying texts, lemmas and part of speech tags. If you legally obtained an original treebank, you can use the corresponding patch to transform the treebank to its HamleDT form. +
+ The patches containing our tree transformations (as well as any accompanying software) are copyright Charles University, Faculty of Mathematics and Physics, Institute of Formal and Applied Linguistics (“we” or the “Provider”). It is provided as-is (without any warranty) and may be freely used, modified and redistributed under the GNU General Public License version 3.0 or the Perl Artistic License version 1.0. +
Note: the “-ud11” treebanks are taken from the Universal Dependencies release 1.1, see http://universaldependencies.github.io/docs/.
+ +Code | +Treebank | +Web | +License | +
---|---|---|---|
ar | +Prague Arabic Dependency Treebank | +http://ufal.mff.cuni.cz/padt | +CC BY-NC-SA 3.0 | +
bg-ud11 | +BulTreeBank / UD1.1 | +http://www.bultreebank.org/indexBTB.html | +CC BY-NC-SA 3.0 | +
cs | +Prague Dependency Treebank | +http://ufal.mff.cuni.cz/pdt3.0 | +CC BY-NC-SA 3.0 | +
da-ud11 | +Danish Dependency Treebank / UD1.1 | +http://www.buch-kromann.dk/matthias/treebank/ | +GNU GPL 2 | +
de-ud11 | +UD1.1 (from Google) | +http://universaldependencies.github.io/docs/#language-de | +CC BY-NC-SA 3.0 US | +
el-ud11 | +Greek Dependency Treebank / UD1.1 | +http://universaldependencies.github.io/docs/#language-el | +CC BY-NC-SA 3.0 | +
en-ud11 | +English Web Treebank (Stanford) / UD1.1 | +http://nlp.stanford.edu/software/stanford-dependencies.shtml | +CC BY-SA 4.0 | +
es-ud11 | +UD1.1 (from Google) | +http://universaldependencies.github.io/docs/#language-es | +CC BY-NC-SA 3.0 US | +
et | +Eesti keele puudepank | +http://vvv.cs.ut.ee/~kaili/Korpus/puud/ | +free download | +
eu-ud11 | +Basque Dependency Treebank / UD1.1 | +http://universaldependencies.github.io/docs/#language-eu | +CC BY-NC-SA 3.0 | +
fa | +Persian Dependency Treebank | +http://dadegan.ir/en/perdt | +GNU GPL 3* | +
fa-ud11 | +Uppsala Persian Dependency Treebank / UD1.1 | +http://universaldependencies.github.io/docs/#language-fa | +CC BY-SA 4.0 | +
fi-ud11 | +Turku Dependency Treebank / UD1.1 | +http://bionlp.utu.fi/fintreebank.html | +CC BY-SA 4.0 | +
fi-ud11ftb | +FinnTreeBank / UD1.1 | +http://www.ling.helsinki.fi/kieliteknologia/tutkimus/treebank/ | +LGPLv3+ or CC BY 4.0 (dual license) | +
fr-ud11 | +UD1.1 (from Google) | +http://universaldependencies.github.io/docs/#language-fr | +CC BY-NC-SA 3.0 US | +
ga-ud11 | +Irish Dependency Treebank / UD1.1 | +http://universaldependencies.github.io/docs/#language-ga | +CC BY-NC-SA 3.0 | +
grc | +Ancient Greek Dependency Treebank | +http://nlp.perseus.tufts.edu/syntax/treebank/ | +CC BY-NC-SA 2.5 | +
he-ud11 | +Hebrew Dependency Treebank / UD1.1 | +http://www.cs.bgu.ac.il/~yoavg/data/hebdeptb/ | +CC BY-NC-SA 4.0 | +
hr-ud11 | +SETimes.HR / UD1.1 | +http://universaldependencies.github.io/docs/#language-hr | +CC BY-SA 4.0 | +
hu-ud11 | +Szeged Treebank / UD1.1 | +http://www.inf.u-szeged.hu/projectdirs/hlt/hu/Treebank/treebank2.html | +CC BY-NC-SA 3.0 | +
id-ud11 | +UD1.1 (from Google) | +http://universaldependencies.github.io/docs/#language-id | +CC BY-NC-SA 3.0 US | +
it-ud11 | +Italian Stanford Dependency Treebank / UD1.1 | +http://universaldependencies.github.io/docs/#language-it | +CC BY-NC-SA 3.0 | +
la | +Latin Dependency Treebank | +http://nlp.perseus.tufts.edu/syntax/treebank/ | +CC BY-NC-SA 2.5 | +
la-it | +Index Thomisticus Treebank | +http://itreebank.marginalia.it/ | +CC BY-NC-SA 3.0 | +
nl | +CoNLL 2006 (Alpino) | +http://odur.let.rug.nl/~vannoord/trees/ | +GNU GPL | +
pl | +Składnica zależnościowa 0.5 | +http://zil.ipipan.waw.pl/Sk%C5%82adnica | +GNU GPL 3 | +
pt | +CoNLL 2006 (Floresta Sintá(c)tica) | +http://www.linguateca.pt/Floresta/principal.html | +CC BY-NC-SA 3.0 | +
ro | +Resurse pentru Gramaticile de Dependenta | +http://www.phobos.ro/roric/texts/indexro.html | +free download | +
sl | +Slovene Dependency Treebank / CoNLL 2006 | +http://nl.ijs.si/sdt/ | +research, cite | +
sv-ud11 | +Talbanken05 / UD1.1 | +http://stp.lingfil.uu.se/~nivre/research/Talbanken05.html | +CC BY-SA 4.0 | +
ta | +Tamil Dependency Treebank | +http://ufal.mff.cuni.cz/~ramasamy/tamiltb/0.1/ | +CC BY-NC-SA 3.0 | +
Lang. | +Treebank | +Web | +
---|---|---|
bn | +Hyderabad Dependency Treebank / ICON 2010 | ++ |
ca | +AnCora-CA | +http://clic.ub.edu/corpus/ | +
de | +TIGER Corpus / CoNLL 2009 | +http://www.ims.uni-stuttgart.de/forschung/ressourcen/korpora/tiger.html | +
en | +Penn Treebank / CoNLL 2007 | +http://www.cis.upenn.edu/~treebank/ | +
es | +AnCora-ES | +http://clic.ub.edu/corpus/ | +
hi | +Hyderabad Dependency Treebank / COLING 2012 | ++ |
ja | +Tübingen Treebank of Spoken Japanese (Tüba-J/S) | +http://www.sfs.uni-tuebingen.de/en/ascl/resources/corpora/tueba-js.html | +
ru | +SynTagRus | +http://www.ruscorpora.ru/en/search-syntax.html | +
sk | +Slovak Treebank | +http://korpus.sk/ | +
te | +Hyderabad Dependency Treebank / ICON 2010 | ++ |
tr | +METU-Sabanci (ODTÜ-Sabancı) Treebank | +http://ii.metu.edu.tr/corpus | +
CC BY-SA 4.0 http://creativecommons.org/licenses/by-sa/4.0/
+CC BY-NC-SA 4.0 http://creativecommons.org/licenses/by-nc-sa/4.0/
+CC BY-SA 3.0 http://creativecommons.org/licenses/by-sa/3.0/
+CC BY-NC-SA 3.0 http://creativecommons.org/licenses/by-nc-sa/3.0/
+CC BY-NC-SA 2.5 http://creativecommons.org/licenses/by-nc-sa/2.5/
+GNU (L)GPL http://www.gnu.org/licenses/gpl.html
+Perl Artistic L 1.0 http://www.perlfoundation.org/artistic_license_1_0
+fa: Persian Dependency Treebank: The download page contained the statement “I will use the treebank for research purposes only.” The “Readme and Licence.txt” file says “only non-commercially”. However, the included license is the standard GPL 3 (without any restrictions).
+ ++ The following research papers should be cited to give proper credit to the creators of the original treebanks and to us, the creators of HamleDT. +
+ +HamleDT: Daniel Zeman, Ondřej Dušek, David Mareček, Martin Popel, Loganathan Ramasamy, Jan Štěpánek, Zdeněk Žabokrtský, Jan Hajič (2014): HamleDT: Harmonized Multi-Language Dependency Treebank. In: Language Resources and Evaluation, 48(4) pp. 601–637, Springer, Dordrecht, Netherlands, ISSN 1574-020X.
+ +HamleDT 2.0: Rudolf Rosa, Jan Mašek, David Mareček, Martin Popel, Daniel Zeman, Zdeněk Žabokrtský (2014): HamleDT 2.0: Thirty Dependency Treebanks Stanfordized. In Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC 2014), pp. 2334–2341. ELDA, Reykjavík, Iceland.
+ +ar: Otakar Smrž, Viktor Bielický, Iveta Kouřilová, Jakub Kráčmar, Jan Hajič, Petr Zemánek (2008): Prague Arabic Dependency Treebank: A Word on the Million Words. In Proceedings of the Workshop on Arabic and Local Languages (LREC 2008), pp. 16–23. ELDA, Marrakech, Morocco.
+ +bg: Kiril Simov, Petya Osenova (2005): Extending the Annotation of BulTreeBank: Phase 2. In The Fourth Workshop on Treebanks and Linguistic Theories (TLT 2005), pp. 173–184. Barcelona, Spain.
+ +ca, es: Mariona Taulé, Maria Antònia Martí, Marta Recasens (2008): AnCora: Multilevel Annotated Corpora for Catalan and Spanish. In Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC 2008). ELDA, Marrakech, Morocco.
+ +cs: Eduard Bejček, Eva Hajičová, Jan Hajič, Pavlína Jínová, Václava Kettnerová, Veronika Kolářová, Marie Mikulová, Jiří Mírovský, Anna Nedoluzhko, Jarmila Panevová, Lucie Poláková, Magda Ševčíková, Jan Štěpánek, Šárka Zikánová (2013): Prague Dependency Treebank 3.0. http://hdl.handle.net/11858/00-097C-0000-0023-1AAF-3. Charles University in Prague, ÚFAL, Praha, Czechia.
+ +da: Matthias T. Kromann, Line Mikkelsen, Stine Kern Lynge (2004): Danish Dependency Treebank. http://code.google.com/p/copenhagen-dependency-treebank/. København, Denmark.
+ +de: Sabine Brants, Stefanie Dipper, Silvia Hansen, Wolfgang Lezius, George Smith (2002): The TIGER Treebank. In Proceedings of the Workshop on Treebanks and Linguistic Theories. Sozopol, Bulgaria.
+ +de-ud11, es-ud11, fr-ud11, id-ud11: Ryan McDonald, Joakim Nivre, Yvonne Quirmbach-Brundage, Yoav Goldberg, Dipanjan Das, Kuzman Ganchev, Keith Hall, Slav Petrov, Hao Zhang, Oscar Täckström, Claudia Bedini, Núria Bertomeu Castelló, Jungmee Lee (2013): Universal Dependency Annotation for Multilingual Parsing. In Proceedings of ACL. Sofija, Bulgaria.
+ +el: Prokopis Prokopidis, Elina Desipri, Maria Koutsombogera, Harris Papageorgiou, Stelios Piperidis (2005): Theoretical and Practical Issues in the Construction of a Greek Dependency Treebank. In Proceedings of the Fourth Workshop on Treebanks and Linguistic Theories (TLT 2005), pp. 149–160. Barcelona, Spain.
+ +en: Mitchell P. Marcus, Beatrice Santorini, Mary Ann Marcinkiewicz (1993): Building a Large Annotated Corpus of English: The Penn Treebank. In Computational Linguistics 19:2, pp. 313–330.
+ +en-ud11: Natalia Silveira, Timothy Dozat, Marie-Catherine de Marneffe, Samuel R. Bowman, Miriam Connor, John Bauer, Christopher D. Manning (2014): A Gold Standard Dependency Corpus for English. In Proceedings of LREC 2014. Reykjavík, Iceland.
+ +et: Eckhard Bick, Heli Uibo, Kaili Müürisep (2004): Arborest – a VISL-Style Treebank Derived from an Estonian Constraint Grammar Corpus. In Proceedings of Treebanks and Linguistic Theories (TLT 2004).
+ +eu: Itzair Aduriz, María Jesús Aranzabe, Jose Mari Arriola, Aitziber Atutxa, Arantza Díaz de Ilarraza, Aitzpea Garmendia, Maite Oronoz (2003): Construction of a Basque Dependency Treebank. In Proceedings of the Second Workshop on Treebanks and Linguistic Theories (TLT 2003).
+ +fa: Mohammad Sadegh Rasooli, Amirsaeid Moloodi, Manouchehr Kouhestani, Behrouz Minaei-Bidgoli (2011): A Syntactic Valency Lexicon for Persian Verbs: The First Steps towards Persian Dependency Treebank. In 5th Language and Technology Conference (LTC): Human Language Technologies as a Challenge for Computer Science and Linguistics, pp. 227–231. Poznań, Poland.
+ +fa-ud11: Mojgan Seraji (2015): Morphosyntactic Corpora and Tools for Persian (PhD thesis). Studia Linguistica Upsaliensia 16. Uppsala, Sweden.
+ +fi: Katri Haverinen, Timo Viljanen, Veronika Laippala, Samuel Kohonen, Filip Ginter, Tapio Salakoski (2010): Treebanking Finnish. In Proceedings of the Ninth International Workshop on Treebanks and Linguistic Theories (TLT9), pp. 79–90.
+ +fi-ud11ftb: Atro Voutilainen, Tanja Purtonen, Kristiina Muhonen, Krister Lindén (2012): Specifying Treebanks, Outsourcing Parsebanks: FinnTreeBank 3. In Proceedings of LREC 2012. İstanbul, Turkey.
+ +ga: Teresa Lynn, Jennifer Foster, Mark Dras, Lamia Tounsi (2014): Cross-lingual Transfer Parsing for Low-Resourced Languages: An Irish Case Study. In Proceedings of CLTW 2014. Dublin, Ireland.
+ +grc, la: David Bamman, Gregory Crane (2011): The Ancient Greek and Latin Dependency Treebanks. In Language Technology for Cultural Heritage, pp. 79–98. ISBN 978-3-642-20227-8. Springer, Berlin / Heidelberg, Germany.
+ +he: Yoav Goldberg (2011): Automatic Syntactic Processing of Modern Hebrew (PhD thesis). Ben Gurion University, Israel.
+ +hi, bn, te: Samar Husain, Prashanth Mannem, Bharat Ambati, Phani Gadde (2010): The ICON-2010 Tools Contest on Indian Language Dependency Parsing. In Proceedings of ICON-2010 Tools Contest on Indian Language Dependency Parsing. Kharagpur, India.
+ +hr: Željko Agić, Nikola Ljubešić (2014): The SETimes.HR Linguistically Annotated Corpus of Croatian. In Proceedings of LREC 2014, pp. 1724–1727. Reykjavík, Iceland.
+ +hu: Dóra Csendes, János Csirik, Tibor Gyimóthy, András Kocsor (2005): The Szeged Treebank. In Text, Speech and Dialogue (TSD), pp. 123–131. Springer, Berlin / Heidelberg, Germany.
+ +it: Simonetta Montemagni, Francesco Barsotti, Marco Battista, Nicoletta Calzolari, Ornella Corazzari, Alessandro Lenci, Antonio Zampolli, Francesca Fanciulli, Maria Massetani, Remo Raffaelli, Roberto Basili, Maria Teresa Pazienza, Dario Saracino, Fabio Zanzotto, Nadia Mana, Fabio Pianesi, Rodolfo Delmonte (2003): Building the Italian Syntactic-Semantic Treebank. In Anne Abeillé (ed.): Building and Using Parsed Corpora, pp. 189–210. Kluwer, Dordrecht, Netherlands.
+ +it-ud11: Cristina Bosco, Simonetta Montemagni, Maria Simi (2013): Converting Italian Treebanks: Towards an Italian Stanford Dependency Treebank. In Proceedings of the 7th Linguistic Annotation Workshop & Interoperability with Discourse (LAW VII & ID at ACL-2013), pp. 61–69. Sofija, Bulgaria.
+ +ja: Yasuhiro Kawata, Julia Bartels (2000): Stylebook for the Japanese Treebank in Verbmobil, Report 240. Universität Tübingen, Tübingen, Germany.
+ +la-it: Marco Passarotti, Felice Dell’Orletta (2010): Improvements in parsing the index thomisticus treebank. Revision, combination and a feature model for medieval Latin. In Training vol. 2, 61–024.
+ +nl: Leonoor van der Beek, Gosse Bouma, Jan Daciuk, Tanja Gaustad, Robert Malouf, Gertjan van Noord, Robbert Prins, Begoña Villada (2002): Chapter 5. The Alpino Dependency Treebank. In Algorithms for Linguistic Processing NWO PIONIER Progress Report. Groningen, Netherlands.
+ +pl: Alina Wróblewska, Adam Przepiórkowski (2014): Projection-based Annotation of a Polish Dependency Treebank. In Proceedings of the Ninth International Conference on Language Resources and Evaluation, LREC, pp. 2306–2312. Reykjavík, Iceland.
+ +pt: Susana Afonso, Eckhard Bick, Renato Haber, Diana Santos (2002): “Floresta sintá(c)tica”: A Treebank for Portuguese. In Proceedings of the Third International Conference on Language Resources and Evaluation (LREC 2002). ELDA, Las Palmas, Spain.
+ +ro: Mihaela Călăcean (2008): Data-driven Dependency Parsing for Romanian. Uppsala Universitet, Uppsala, Sweden.
+ +ru: Igor Boguslavsky, Svetlana Grigorieva, Nikolai Grigoriev, Leonid Kreidlin, Nadezhda Frid (2000): Dependency Treebank for Russian: Concept, Tools, Types of Information. In Proceedings of the 18th Conference on Computational Linguistics, vol. 2, pp. 987–991. ACL, Morristown, NJ, USA.
+ +sk: Mária Šimková, Radovan Garabík (2006): Синтаксическая разметка в Словацком национальном корпусе. In Tруды международной конференции Корпусная лингвистика – 2006, pp. 389–394. ISBN 5-288-04181-4. St. Petersburg University Press, Sankt-Peterburg, Russia.
+ +sl: Sašo Džeroski, Tomaž Erjavec, Nina Ledinek, Petr Pajas, Zdeněk Žabokrtský, Andreja Žele (2006): Towards a Slovene Dependency Treebank. In Proceedings of the Fifth International Conference on Language Resources and Evaluation (LREC 2006), pp. 1388–1391. ELDA, Genova, Italy.
+ +sv: Joakim Nivre, Jens Nilsson, Johan Hall (2006): Talbanken05: A Swedish Treebank with Phrase Structure and Dependency Annotation. In Proceedings of the Fifth International Conference on Language Resources and Evaluation (LREC 2006). ELDA, Genova, Italy.
+ +ta: Loganathan Ramasamy, Zdeněk Žabokrtský (2012): Prague Dependency Style Treebank for Tamil. In Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC 2012). ELDA, İstanbul, Turkey.
+ +tr: Nart B. Atalay, Kemal Oflazer, Bilge Say (2003): The Annotation Process in the Turkish Treebank. In Proceedings of the 4th International Workshop on Linguistically Interpreted Corpora (LINC). EACL, Budapest, Hungary.
+License Agreement for the HamleDT 1.0
+
+
+between
+
+
+the respective proprietors (see below the descriptions and terms for individual languages)
+
+(the Proprietor)
+
+
+
+and
+
+
+
+the User
+
+
+
+where
+
+I (the User) understand that HamleDT is based on many pre-existing treebanks, each of which has its authors and/or owners and license terms that are not identical for all the treebanks included. I have read the respective license terms, I understand them and I will use the data in accordance with them. I specifically acknowledge that some of the treebanks mentioned above permit only non-commercial usage.
+
+
+
+The additional tree transformations and the software performing the transformations is copyright Charles University, Faculty of Mathematics and Physics, Institute of Formal and Applied Linguistics. It is provided as-is (without any warranty) and may be freely used, modified and redistributed under the GNU General Public License version 3.0 or the Perl Artistic License version 1.0.
+
+
+lang. CoNLL license name web +ar 2007 own, LDC Prague Arabic Dependency Treebank http://ufal.mff.cuni.cz/padt +cs 2007 CC BY-NC-SA 3.0 Prague Dependency Treebank http://ufal.mff.cuni.cz/pdt2.5 +da 2006 GPL 3 Copenhagen Dependency Treebank http://code.google.com/p/copenhagen-dependency-treebank +nl 2006 GPL Alpino Treebank http://odur.let.rug.nl/~vannoord/trees/ +fi CC BY-SA 3.0 Turku Dependency Treebank http://bionlp.utu.fi/fintreebank.html +grc CC BY-NC-SA 2.5 Ancient Greek and Latin Dependency Treebanks http://nlp.perseus.tufts.edu/syntax/treebank/greek.html +la CC BY-NC-SA 2.5 Ancient Greek and Latin Dependency Treebanks http://nlp.perseus.tufts.edu/syntax/treebank/latin.html +fa *GPL 3 Persian Dependency Treebank http://dadegan.ir/en/persiandependencytreebank +pt 2006 CC BY-NC-SA 3.0 Floresta Sintá(c)tica http://www.linguateca.pt/floresta/info_floresta_English.html +ro free download Romanian Dependency Treebank http://www.phobos.ro/roric/texts/xml/ +sv 2006 *research, cite Talbanken05 http://w3.msi.vxu.se/~nivre/research/Talbanken05.html +ta CC BY-NC-SA 3.0 Tamil Dependency Treebank http://ufal.mff.cuni.cz/~ramasamy/tamiltb/0.1/ + +Licenses +CC BY-NC-SA 3.0 http://creativecommons.org/licenses/by-nc-sa/3.0/ +CC BY-SA 3.0 http://creativecommons.org/licenses/by-sa/3.0/ +CC BY-NC-SA 2.5 http://creativecommons.org/licenses/by-nc-sa/2.5/ +GPL http://www.gnu.org/licenses/gpl.html + +ar ============ Prague Arabic Dependency Treebank +http://ufal.mff.cuni.cz/padt/PADT_1.0/docs/PADT_license.html + +fa ============ Persian Dependency Treebank +The download page contains "I will use the treebank for research purposes only." +The "Readme and Licence.txt" contains "only non-commercially". +However, the included license is the standard GPL 3 (without any restrictions). + +sv ============ Talbanken05 +http://w3.msi.vxu.se/~nivre/research/Talbanken05.html: +"The treebank comes with no guarantee but is freely available for research and educational purposes as long as proper credit is given for the work done to produce the material (both in Lund and in Växjö)." + +Cite: +Joakim Nivre, Jens Nilsson and Johan Hall (2006) +Talbanken05: A Swedish Treebank with Phrase Structure and Dependency Annotation. +In Proceedings of the fifth international conference on Language Resources and Evaluation (LREC2006), May 24-26, 2006, Genoa, Italy. +http://w3.msi.vxu.se/~nivre/papers/talbanken05.pdf ++ + +
+PARSEME Shared Task VMWE Data (edition 1.0) is a collection of linguistic data and tools. +Each of the corpora has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts which you use. If you do not agree with the license terms, you must stop using the corpora and destroy all copies of the data that you have obtained. +
+The license for every corpus included in the release is specified in the appropriate language directory. The licenses for VMWE annotations (.parsemetsv) files +and morphological/syntactic data (.conllu) can be different, which is also indicated in the below table. All scripts in the bin/ folder in each of the language directories are licensed under CC-BY 4.0. +
Corpus | +Language code | +License for the VMWE annotations (.parsemetsv) | +License for the morphological/syntactic data (.conllu) | +
---|---|---|---|
Bulgarian | +BG | +CC BY 4.0 | +n/a | +
Czech | +CS | +CC BY-NC-SA 3.0 | +CC BY-NC-SA 3.0 | +
Greek | +EL | +CC BY-NC-SA 4.0 | +CC BY-NC-SA 4.0 | +
Farsi | +FA | +CC BY-NC-SA 4.0 (special license for the MULTEX-East corpus, see README.md file for Farsi) | +CC BY-NC-SA 4.0 (special license for the MULTEX-East corpus, see README.md file for Farsi) | +
French | +FR | +CC BY 4.0 | +CC BY-NC-SA 4.0 (UD corpus); LGPL-LR (Sequoia corpus) | +
German | +DE | +CC-BY 4.0 | +CC BY-NC-SA 3.0 US | +
Hebrew | +HE | +CC-BY-NC-SA 4.0 | +n/a | +
Hungarian | +HU | +CC BY 4.0 | +GNU GPL 3.0 | +
Italian | +IT | +CC BY-NC-SA 4.0 | +CC BY-NC-SA 4.0 | +
Lithuanian | +LT | +CC BY-NC-SA 4.0 | +n/a | +
Maltese | +MT | +CC BY 4.0 | +CC BY 4.0 | +
Polish | +PL | +CC-BY 4.0 | +GNU GPL 3.0 | +
Brazilian Portuguese | +PT | +CC BY-NC-SA 4.0 | +CC BY-NC-SA 4.0 | +
Romanian | +RO | +CC BY 4.0 | +CC BY 4.0 | +
Slovenian | +SL | +CC BY-NC-SA 4.0 | +CC BY-NC-SA 4.0 | +
Spanish | +ES | +CC BY 4.0 | +CC BY 4.0 (IXA corpus); GNU GPL 3.0 (Ancora corpus) | +
Swedish | +SV | +CC BY 4.0 | +CC BY-NC-SA 4.0 | +
Turkish | +TR | +CC BY-NC-SA 4.0 | +CC BY-NC-SA 4.0 | +
License | +URL | +
---|---|
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://infolingu.univ-mlv.fr/DonneesLinguistiques/Lexiques-Grammaires/lgpllr.html |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+PARSEME Shared Task VMWE Data (edition 1.1) is a collection of linguistic data and tools. +Each of the corpora has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts which you use. If you do not agree with the license terms, you must stop using the corpora and destroy all copies of the data that you have obtained. +
The license for every corpus included in the release is specified in the appropriate language directory. The licenses for VMWE annotations (column 11) and morphological/syntactic data (columns 1-10) can be different, which is also indicated in the table below. All files in the bin/ and trial/ folders are licensed under CC BY 4.0.
Language | +Language code | +VMWEs annotations (column 11) | +Morphological/syntactic data (columns 1-10) | +
---|---|---|---|
Bulgarian | BG | CC BY 4.0 | CC BY 4.0 |
German | DE | CC BY 4.0 | CC BY-NC-SA 3.0 US |
Greek | EL | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
English | EN | CC BY 4.0 | CC BY-SA 4.0 (UD Original corpus and UD LinES + corpus); CC BY-SA 3.0 (UD PUD corpus) |
Spanish | ES | CC BY 4.0 | CC BY 4.0 (IXA corpus); GNU GPL 3.0 (Ancora corpus); CC BY-NC-SA 3.0 US (UD corpus) |
Basque | EU | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Farsi | FA | CC BY-NC-SA 4.0 (special license for the MULTEX-East corpus, see README.md file for Farsi) | CC BY-NC-SA 4.0 (special license for the MULTEX-East corpus, see README.md file for Farsi) |
French | FR | CC BY 4.0 | CC BY-NC-SA 4.0 (UD corpus); LGPL-LR (Sequoia corpus) |
Hebrew | HE | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Hindi | HI | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Croatian | HR | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Hungarian | HU | CC BY 4.0 | GNU GPL 3.0 |
Italian | IT | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Lithuanian | LT | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Polish | PL | CC BY 4.0 | CC BY-SA 4.0 (columns 1-6 of sentences 120-2-*, 310-* and 330-*); GNU GPL 3.0 (columns 1-6 of remainder sentences); CC BY-SA 4.0 (columns 7-9 of all sentences) |
Portuguese | PT | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Romanian | RO | CC BY 4.0 | CC BY 4.0 |
Slovene | SL | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Turkish | TR | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
License | +URL | +
---|---|
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://infolingu.univ-mlv.fr/DonneesLinguistiques/Lexiques-Grammaires/lgpllr.html |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+PARSEME Shared Task Raw Corpus Data (edition 1.2) is a collection of linguistic data. +Each of the corpora has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts which you use. If you do not agree with the license terms, you must stop using the corpora and destroy all copies of the data that you have obtained. +
The license for every corpus included in the release is specified in the appropriate language directory.
Language | +Language code | +Licences | + +
---|---|---|
German | +DE | +CC BY-NC-SA 4.0 | + +
Greek | +EL | +CC-BY-NC-SA 4.0 (CoNLL 2017 part) CC-BY (Leipzig corpus collection part) |
+
+
Basque | +EU | +CC-BY-NC-SA 4.0 | + + +
French | +FR | +CC-BY-NC-SA 4.0 | + +
Hebrew | +HE | +CC-BY-NC-SA 4.0 | + +
Hindi | +HI | +CC-BY-NC-SA 4.0 | + +
Irish | +GA | +CC-BY 4.0 (Citizen's Information part) CC0 (ParaCrawl part) CC-BY 2.0 (Tatoeba part) + CC-BY-SA 3.0 (Vicipéid) Public Domain* (EU bookshop part) |
+
+
Italian | +IT | +CC-BY-NC-SA 4.0 | + +
Polish | +PL | +CC-BY-NC-SA 4.0 | + +
Portuguese | +PT | +CC-BY-NC-SA 4.0 | + +
Romanian | +RO | +CC-BY-NC-SA 4.0 | + +
Swedish | +SV | +CC-BY-NC-SA 4.0 | + +
Turkish | +TR | +CC-BY-NC-SA 4.0 | + +
Chinese | +ZH | +CC-BY-NC-SA 4.0 | + +
License | +URL | +
---|---|
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
CC BY 4.0 | https://creativecommons.org/licenses/by/4.0/ |
CC0 | https://creativecommons.org/share-your-work/public-domain/cc0/ |
CC BY 2.0 | https://creativecommons.org/licenses/by/2.0/ |
CC BY-SA 3.0 | https://creativecommons.org/licenses/by-sa/3.0/ |
Public Domain* | The source is public administration data from EU; see publications office of the european union copyright. The particular set of documents was gathered from EUbookshop (see J. Tiedemann, 2012, Parallel Data, Tools and Interfaces in OPUS. In Proceedings of the 8th International Conference on Language Resources and Evaluation (LREC 2012)). |
+PARSEME Shared Task VMWE Data (edition 1.2) is a collection of linguistic data and tools. +Each of the corpora has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts which you use. If you do not agree with the license terms, you must stop using the corpora and destroy all copies of the data that you have obtained. +
The license for every corpus included in the release is specified in the appropriate language directory. The licenses for VMWE annotations (column 11) and morphological/syntactic data (columns 1-10) can be different, which is also indicated in the table below. All files in the bin/ and trial/ folders are licensed under CC BY 4.0.
Language | +Language code | +VMWEs annotations (column 11) | +Morphological/syntactic data (columns 1-10) | +
---|---|---|---|
German | DE | CC BY 4.0 | CC BY-NC-SA 3.0 US |
Greek | EL | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Basque | EU | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
French | FR | CC BY 4.0 | CC BY-NC-SA 4.0 (UD corpus); LGPL-LR (Sequoia corpus) |
Hebrew | HE | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Hindi | HI | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Irish | GA | CC BY-SA 3.0 | CC BY 4.0 |
Italian | IT | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Polish | PL | CC BY 4.0 | CC BY-SA 4.0 (columns 1-6 of sentences 120-2-*, 310-* and 330-*); GNU GPL 3.0 (columns 1-6 of remainder sentences); CC BY-SA 4.0 (columns 7-9 of all sentences) |
Portuguese | PT | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Romanian | RO | CC BY 4.0 | CC BY 4.0 |
Swedish | SV | CC BY 4.0 | CC BY-SA 4.0 |
Turkish | TR | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Chinese | ZH | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
License | +URL | +
---|---|
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://infolingu.univ-mlv.fr/DonneesLinguistiques/Lexiques-Grammaires/lgpllr.html |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
The Multilingual corpus of literal occurrences of multiword expressions is a collection of linguistic data in 5
+ languages. Each of the corpora has its own license terms and you (the “User”) are responsible for complying with
+ the license terms applicable to those parts which you use. If you do not agree with the license terms, you must
+ stop using the corpora and destroy all copies of the data that you have obtained.
+ The license for every corpus included in the release is specified in the appropriate language directory.
Language | +Language code | +POS-tags (column 2) | +Other data (columns 1 and 3-9) | +
---|---|---|---|
Basque | EU | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
German | DE | CC BY-NC-SA 3.0 US | CC BY 4.0 |
Greek | EL | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
Polish | PL | CC BY-SA 4.0 and GNU GPL 3.0 | CC BY 4.0 |
Portuguese | PT | CC BY-NC-SA 4.0 | CC BY-NC-SA 4.0 |
License | +URL | +
---|---|
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
CC BY-NC-SA 3.0 US | http://creativecommons.org/licenses/by-nc-sa/3.0/us/ |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
+Research-Usage License Agreement for the PDTSL + +between + +Institute of Formal and Applied Linguistics +Faculty of Mathematics and Physics +Charles University +Malostranské náměstí 25 +CZ-11800 Praha +Czech Republic +E-mail: hajic@ufal.mff.cuni.cz +http://ufal.mff.cuni.cz/ +(the Proprietor) + +and + +the User + +whereas + +A. The Prague Dependency Treebank of Spoken Language (PDTSL) is a collection of data developed at and by the Proprietor under the following support: projects MSM0021620838, ME838 and LC536 of Ministry of Education, Youth and Sports of the Czech Republic, GA405/06/0589 of the Grant Agency of the Czech Republic and EU Grant FP6-IST-5-34434-IP. + +B. The Proprietor is the copyright holder of PDTSL and is entitled to grant a license to the User. + +C. The User is an academic, educational, research or other organization, or an individual wishing to make use of PDTSL for research and/or education purposes. + +It is hereby agreed as follows: + +1. This agreement is made on the date of submission and effective immediately. + +2. The User is granted a non-exclusive license to use, modify, enlarge or enrich PDTSL to extract information directly or indirectly in any form and volume, provided that PDTSL itself or any derivative work is used only by the User her/himself or his/her immediate collaborators, employees, managers and/or her/his students from the same Institution for research purposes only, and provided she/he is continuously observing all the terms and conditions contained in this Agreement. If any part of PDTSL contains its own license or an additional restriction, the more restrictive version and/or amendment of the license shall be in effect, unless specifically stated otherwise in such a part. In particular, all the documentation which is provided in either RTF, PDF or PostScript format should be considered a personal copy of the respective Author's reprint and handled as such. + +3. The User shall not use PDTSL itself or any derivative work (including but not limited to statistics obtained by using it or any derivative work thereof) based on it (however small the contribution of PDTSL to such derivative work is) in whatever form for commercial purposes of any kind, nor for a deployment in any routinely used application, regardless whether it is of commercial nature or not. + +4. The User shall include the following notice in all publications or publicly available materials, regardless of their form (printed, electronic, or other), describing work which uses PDTSL: " The Prague Dependency Treebank of Spoken Language - PDTSL has been developed by the Institute of Formal and Applied Linguistics, http://ufal.mff.cuni.cz/." In the case of printed materials, such as papers, journal articles, etc., one publication most suitable for reference with regard to User's work should be included from the list in the PDTSL documentation; in the case of electronic publications on the Internet, the reference to the aforementioned web page should be included as a web link. + +Due to Proprietor's obligations with regard to the text copyright holders, text examples and citations from PDTSL or any derivative work (regardless whether they include any annotations or not) are limited to 200 words per publication or series of publications on the same topic (whether printed, electronic, or in any other form). + +5. The User agrees not to re-distribute or otherwise make publicly available PDTSL, or any derivative work based on it as described in paragraph 3, to a third party without a prior written permission of the Proprietor, with the exception of examples and citations as described in paragraph 4. + +6. The User undertakes to adopt any security measures needed to protect the Proprietors' copyright in PDTSL and undertakes to take all reasonable steps to ensure that no unauthorized use is made of PDTSL and of any copies, derivative works or extracts thereof. + +7. Any usage of PDTSL which does not conform to the specification set forth in the 3rd paragraph of this Agreement (such as, e.g., commercial usage of PDTSL) is subject of separate negotiations and a written contract between the User and the Proprietor and/or other parties. The Proprietor is in general not obliged to enter and/or conclude such negotiations. + +8. PDTSL is provided as is. Therefore the Proprietor does not warrant the usefulness of PDTSL for any purpose, regardless of formulations which can be found at some places in the accompanying documentation stating the intended purpose and use of PDTSL. + +9. If the User reports to the Proprietor any discovered errors, inconsistencies or suggested corrections or improvements to PDTSL, the Proprietor undertake: (a) to maintain these comments in confidence and to use them only for the purposes of improving, modifying and/or maintaining PDTSL, (b) not to disclose the comments except in confidence to those of their employees or directors who need to know the same for the aforesaid purpose. + +10. Should the Users by themselves or anyone acting on their behalf fail to comply with any of the conditions in this agreement (save with the written consent of the Proprietor) this agreement shall terminate immediately and PDTSL, its copies and derivative works based on it shall be destroyed at the User's site and at all sites under his control. Such termination shall be without prejudice to any claim which the Proprietor may have either for monies due and/or damages and/or otherwise. + +11. Failure by the Proprietor to exercise or enforce any rights in this agreement shall not be deemed to be a waiver of any such right nor operate so as to bar the exercise or enforcement thereof at any time or times thereafter. + +12. This agreement terminates if (a) the User destroys all copies of PDTSL or any derivative work thereof, (b) the User or its Institution ceases to exist, unless all its obligations are transferred to a new entity, which is then considered to be bound by this Agreement. The User or its successor shall inform the Proprietor about any such transfer or succession; failure to do so will terminate this Agreement after one month after such transfer or succession. (c) the Proprietor ceases to exist without a legal successor. + +13. The Proprietor shall keep the information about the User provided when submitting this Agreement in confidentiality and will not disclose it to other parties, except in a summary form such that individual users will not be identified, unless they specifically agree to such a disclosure in writing. + +14. This agreement is governed by the laws of the Czech Republic and all disputes concerning this agreement will be resolved by its jurisdiction. ++ +
Universal Segmentations 1.0 (referred to as “UniSegments” in the rest of this document) is a collection of linguistic data. Each of the resource has its own license terms and you (the “User”) are responsible for complying with the license terms applicable to those parts of UniSegments which you use. If you do not agree with the license terms, you must stop using UniSegments and destroy all copies of UniSegments data that you have obtained.
+You are specifically reminded that some of the resources permit only non-commercial usage. +
+The license for every resource included in the release is specified in the appropriate language/resource directory. +
Resource | +License | +
---|---|
ben-KCIS | +CC BY-NC 4.0 | +
cat-MorphyNet | +CC BY-SA 3.0 | +
ces-DeriNet | +CC BY-NC-SA 3.0 | +
ces-MorphyNet | +CC BY-SA 3.0 | +
deu-DerivBaseDE | +CC BY-SA 3.0 | +
deu-MorphyNet | +CC BY-SA 3.0 | +
eng-MorphoLex | +CC BY-NC-SA 4.0 | +
eng-MorphyNet | +CC BY-SA 3.0 | +
fas-PersianMorphSegLex | +CC BY-NC-SA 4.0 | +
fin-MorphyNet | +CC BY-SA 3.0 | +
fra-Demonette | +CC BY-NC-SA 3.0 | +
fra-Echantinom | +CC BY 4.0 | +
fra-MorphoLex | +CC BY-NC-SA 4.0 | +
fra-MorphyNet | +CC BY-SA 3.0 | +
hbs-MorphyNet | +CC BY-SA 3.0 | +
hin-KCIS | +CC BY-NC 4.0 | +
hrv-CroDeriV | +CC BY-SA 3.0 | +
hun-MorphyNet | +CC BY-SA 3.0 | +
hye-Uniparser | +MIT | +
ita-DerIvaTario | +CC BY-SA 4.0 | +
ita-MorphyNet | +CC BY-SA 3.0 | +
kan-KCIS | +CC BY-NC 4.0 | +
kpv-Uniparser | +MIT | +
lat-WordFormationLatin | +CC BY-NC-SA 4.0 | +
mal-KCIS | +CC BY-NC 4.0 | +
mar-KCIS | +CC BY-NC 4.0 | +
mdf-Uniparser | +MIT | +
mhr-Uniparser | +MIT | +
mon-MorphyNet | +CC BY-SA 3.0 | +
myv-Uniparser | +MIT | +
pol-MorphyNet | +CC BY-SA 3.0 | +
por-MorphyNet | +CC BY-SA 3.0 | +
rus-DerivBaseRU | +Apache-2.0 | +
rus-MorphyNet | +CC BY-SA 3.0 | +
spa-MorphyNet | +CC BY-SA 3.0 | +
swe-MorphyNet | +CC BY-SA 3.0 | +
tgk-Uniparser | +MIT | +
udm-Uniparser | +MIT | +
License | +URL | +
---|---|
Apache-2.0 | +https://www.apache.org/licenses/LICENSE-2.0.txt | +
CC BY-NC-SA 4.0 | +https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode | +
CC BY 4.0 | +https://creativecommons.org/licenses/by/4.0/legalcode | +
CC BY-NC-SA 3.0 | +https://creativecommons.org/licenses/by-nc-sa/3.0/legalcode | +
CC BY-SA 3.0 | +https://creativecommons.org/licenses/by-sa/3.0/legalcode | +
CC BY-SA 4.0 | +https://creativecommons.org/licenses/by-sa/4.0/legalcode | +
CC BY-NC 4.0 | +https://creativecommons.org/licenses/by-nc/4.0/legalcode | +
MIT | +https://opensource.org/licenses/MIT | +
to use the NLP Centre data set.
(further as “Agreement”)
The Collection has been obtained by crawling the Internet. + Due to the size of the Collection it has not been practicable to obtain permission from + copyright owners to provide the Collection for the uses permitted under this + Agreement (“Permitted Uses”).
I understand that all the documents in the Collection are documents which have been at some time made publicly available on the + Internet and which have been collected using a process which respects the commonly accepted + methods (such as robots.txt) for indicating that the documents should not be so collected.
Owners of copyright in individual documents may choose to request deletion of these documents from the Collection.
The limitation on permitted use contained in the following section is intended to reduce the risk of any action being brought by + copyright owners, but if this happens I agree to bear all associated liability.
The Collection may only be used for research and development of natural-language processing, information-retrieval or document-understanding systems.
Summaries, analyses and interpretations of the linguistic properties of the Collection may be derived and published, + provided it is not possible to reconstruct the Collection from these summaries.
Small excerpts of the Collection may be displayed to others or published in a scientific or technical context, + solely for the purpose of describing the research and development carried out and related issues.
All efforts must be made not to infringe the rights of any third party including, but not limited to, + the authors and publishers of any excerpts used in accordance with clause 3 above in this “Permitted Uses” section.
I must make sure that I only display the Collection to or share the Collection with persons who also signed this Agreement with NLP Centre.
I undertake to delete within thirty days of receiving notice all copies of any nominated document + that is part of the Collection whenever requested to do so by either:
NLP Centre; or
the owner of copyright for the particular document.
The Collection is provided "as is", without warranty of any kind, express or implied, including but not limited to the warranties of merchantability, + fitness for a particular purpose and noninfringement. In no event shall the NLP Centre be liable for any claim, damages or + other liability, whether in an action of contract, tort or otherwise, arising in any way of the use of the Collection.
Either NLP Centre or me may terminate this Agreement at any time by notifying the other party in writing. + On termination of the Agreement I shall destroy all copies of the Collection.
This Agreement is governed by the laws of the Czech Republic.
PAWS is a parallel, multilingual corpus. The English Part is based on Penn Treebank 3 and therefore to use + PAWS, you need a license for Treebank 3.
+ +The dependency annotation of the English data, as well as all the Czech data + is licensed under the terms of CC-BY-NC-SA 3.0. +
+By accepting this license and downloading the data you declare you have a valid + license for Treebank 3. +
+This agreement is made on the date when signed by both parties and effective immediately.
The User is granted a royalty-free, non-exclusive license to use, modify, enlarge or enrich the CNCD to extract information directly or indirectly in any form and volume, provided that the CNCD itself or any derivative work is used only by the User themselves or their immediate collaborators, employees, managers and/or their students from the same Institution for research purposes only, and provided they are continuously observing all the terms and conditions contained in this Agreement.
The User shall not use the CNCD itself or any derivative work (including but not limited to statistics obtained by using it or any derivative work thereof) based on it (however small the contribution of CNCD to such derivative work is) in whatever form for commercial purposes of any kind.
In all publications or publicly available materials, regardless of their form (printed, electronic, or other), describing work which uses the CNCD, the User shall include a notice mentioning the fact that CNCD is based on the Particular Corpus, developed at the Institute of the Czech National Corpus and available from http://korpus.cz/. In the case of electronic publications on the Internet, the reference to the aforementioned web page should be included as a web link. In the case of printed materials, such as papers, journal articles etc., a given publication should be cited in the list of references. The citing information is located at the bottom of the web page describing the Particular Corpus that is linked from http://wiki.korpus.cz/doku.php/en:cnk:uvod
The User agrees not to re-distribute or otherwise make publicly available the CNCD, or any derivative work based on it as described in paragraph 3, to a third party without a prior written permission of the Proprietor.
The User undertakes to adopt any security measures needed to protect the Proprietor's copyright in CNCD and undertakes to take all reasonable steps to ensure that no unauthorized use is made of CNCD and of any copies, derivative works or extracts thereof.
Any usage of CNCD which does not conform to the specification set forth in this Agreement is subject to separate negotiations and a written contract between the User and the Proprietor and/or other parties. The Proprietor is in general not obliged to enter and/or conclude such negotiations.
The CNCD is provided as is. Therefore the Proprietor does not warrant the usefulness of CNCD for any purpose.
Should the User by themselves or anyone acting on their behalf fail to comply with any of the conditions in this agreement, this agreement shall terminate immediately and CNCD, its copies and derivative works based on it shall be destroyed at the User's site and at all sites under their control. Such termination shall be without prejudice to any claim which the Proprietor may have either for monies due and/or damages and/or otherwise.
This agreement terminates if (a) the User destroys all copies of CNCD or any derivative work thereof, (b) the User or their Institution ceases to exist, unless all their obligations are transferred to a new entity, which is then considered to be bound by this Agreement. The User or their successor shall inform the Proprietor about any such transfer or succession; failure to do so will terminate this Agreement after one month after such transfer or succession. (c) the Proprietor ceases to exist without a legal successor.
This agreement is governed by the laws of the Czech Republic and all disputes concerning this agreement will be resolved by its jurisdiction.
This + agreement is made on the date when signed by both parties and + effective immediately.
The + User is granted a royalty-free, non-exclusive license to use, + modify, enlarge or enrich the SCD to extract information directly + or indirectly in any form and volume, provided that the SCD itself + or any derivative work is used only by the User themselves or their + immediate collaborators, employees, managers and/or their students + from the same Institution for research purposes only, and provided + they are continuously observing all the terms and conditions + contained in this Agreement.
The + User shall not use the SCD itself or any derivative work (including + but not limited to statistics obtained by using it or any + derivative work thereof) based on it (however small the + contribution of SCD to such derivative work is) in whatever form + for commercial purposes of any kind.
In + all publications or publicly available materials, regardless of + their form (printed, electronic, or other), describing work which + uses the SCD, the User shall include a notice mentioning the fact + that SCD are based on the respective SYN-series corpus, + developed at the Institute of the Czech National Corpus and + available from http://korpus.cz/. In the case of electronic + publications on the Internet, the reference to the aforementioned + web page should be included as a web link. In the case of printed + materials, such as papers, journal articles etc., one publication + should be included from the list given for the respective corpus on + http://korpus.cz/.
Due + to Proprietor's obligations with regard to the text copyright + holders, text examples and citations from SCD or any derivative + work are limited to 100 words per example/citation and, at the same + time, 1000 words per publication or series of publications on the + same topic (regardless whether printed, electronic, or in any other + form).
The + User agrees not to re-distribute or otherwise make publicly + available the SCD, or any derivative work based on it as described + in paragraph 3, to a third party without a prior written permission + of the Proprietor.
The + User undertakes to adopt any security measures needed to protect + the Proprietor's copyright in SCD and undertakes to take all + reasonable steps to ensure that no unauthorized use is made of SCD + and of any copies, derivative works or extracts thereof.
Any + usage of SCD which does not conform to the specification set forth + in this Agreement is subject to separate negotiations and a written + contract between the User and the Proprietor and/or other parties. + The Proprietor is in general not obliged to enter and/or conclude + such negotiations.
The + SCD is provided as is. Therefore the Proprietor does not warrant + the usefulness of SCD for any purpose.
Should + the User by themselves or anyone acting on their behalf fail to + comply with any of the conditions in this agreement, this agreement + shall terminate immediately and SCD, its copies and derivative + works based on it shall be destroyed at the User's site and at all + sites under their control. Such termination shall be without + prejudice to any claim which the Proprietor may have either for + monies due and/or damages and/or otherwise.
This + agreement terminates if (a) the User destroys all copies of SCD or + any derivative work thereof, (b) the User or their Institution + ceases to exist, unless all their obligations are transferred to a + new entity, which is then considered to be bound by this Agreement. + The User or their successor shall inform the Proprietor about any + such transfer or succession; failure to do so will terminate this + Agreement after one month after such transfer or succession. (c) + the Proprietor ceases to exist without a legal successor.
This + agreement is governed by the laws of the Czech Republic and all + disputes concerning this agreement will be resolved by its + jurisdiction.
CorefUD v0.1 (referred to as “CorefUD” in the rest of this document) + is a collection of linguistic data. Each of the corpora has its own license terms + and you (the “User”) are responsible for complying with the license terms + applicable to those parts of CorefUD which you use. If you do not agree with the license terms, + you must stop using CorefUD and destroy all copies of CorefUD data that you have obtained.
+You are specifically reminded that some of the corpora + permit only non-commercial usage.
+The license for every corpus included in the release is specified in the appropriate + corpus directory.
+Corpus | License |
---|---|
CorefUD_Catalan-AnCora | +GNU GPL 3.0 | +
CorefUD_Czech-PCEDT | +CC BY-NC-SA 3.0 | +
CorefUD_Czech-PDT | +CC BY-NC-SA 4.0 | +
CorefUD_English-GUM | +CC BY-NC-SA 4.0 | +
CorefUD_English-ParCorFull | +CC BY-NC 4.0 | +
CorefUD_French-Democrat | +CC BY-SA 4.0 | +
CorefUD_German-ParCorFull | +CC BY-NC 4.0 | +
CorefUD_German-PotsdamCC | +CC BY-NC-SA 4.0 | +
CorefUD_Hungarian-SzegedKoref | +CC BY 4.0 | +
CorefUD_Lithuanian-LCC | +CLARIN-LT End User License | +
CorefUD_Polish-PCC | +CC BY 3.0 | +
CorefUD_Russian-RuCor | +CC BY-SA 4.0 | +
CorefUD_Spanish-AnCora | +GNU GPL 3.0 | +
License | URL |
---|---|
CC BY 3.0 | http://creativecommons.org/licenses/by/3.0/ |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-NC 4.0 | http://creativecommons.org/licenses/by-nc/4.0/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CLARIN-LT End User License | https://clarin.vdu.lt/licenses/eula/PUB_CLARIN-LT_End-User-Licence-Agreement_EN-LT.htm |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
CorefUD v0.2 (referred to as “CorefUD” in the rest of this document) + is a collection of linguistic data. Each of the corpora has its own license terms + and you (the “User”) are responsible for complying with the license terms + applicable to those parts of CorefUD which you use. If you do not agree with the license terms, + you must stop using CorefUD and destroy all copies of CorefUD data that you have obtained.
+You are specifically reminded that some of the corpora + permit only non-commercial usage.
+The license for every corpus included in the release is specified in the appropriate + corpus directory.
+Corpus | License |
---|---|
CorefUD_Catalan-AnCora | +CC BY 4.0 | +
CorefUD_Czech-PCEDT | +CC BY-NC-SA 3.0 | +
CorefUD_Czech-PDT | +CC BY-NC-SA 4.0 | +
CorefUD_English-GUM | +CC BY-NC-SA 4.0 | +
CorefUD_English-ParCorFull | +CC BY-NC 4.0 | +
CorefUD_French-Democrat | +CC BY-SA 4.0 | +
CorefUD_German-ParCorFull | +CC BY-NC 4.0 | +
CorefUD_German-PotsdamCC | +CC BY-NC-SA 4.0 | +
CorefUD_Hungarian-SzegedKoref | +CC BY 4.0 | +
CorefUD_Lithuanian-LCC | +CLARIN-LT End User License | +
CorefUD_Polish-PCC | +CC BY 3.0 | +
CorefUD_Russian-RuCor | +CC BY-SA 4.0 | +
CorefUD_Spanish-AnCora | +CC BY 4.0 | +
License | URL |
---|---|
CC BY 3.0 | http://creativecommons.org/licenses/by/3.0/ |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-NC 4.0 | http://creativecommons.org/licenses/by-nc/4.0/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CLARIN-LT End User License | https://clarin.vdu.lt/licenses/eula/PUB_CLARIN-LT_End-User-Licence-Agreement_EN-LT.htm |
Prague Czech English Dependency Treebank 2.0 (PCEDT) is a parallel, + bilingual corpus. The English Part is based on Penn Treebank 3 and + therefore to use PCEDT, you need a license for Treebank 3. +
+ +The dependency annotation of the English data, as well as all the Czech data + is licensed under the terms of CC-BY-NC-SA 3.0. +
+By accepting this license and downloading the data you declare you have a valid + license for Treebank 3. +
+The Prague Dependency Treebank version 2.0 (PDT 2.0) is a collection of textual data and documentation containing linguistic annotations and software tools for their processing as described in the documentation, developed at and by the Proprietor under the following support: Ministry of Education of the Czech Republic projects No. VS96151, LN00A063, 1P05ME752, MSM0021620838, and LC536, Grant Agency of the Czech Republic grants Nos. 405/96/0198, 405/96/K214 and 405/03/0913, research funds of the Faculty of Mathematics and Physics, Charles University, Czech Republic, Grant Agency of the Academy of Sciences of the Czech Republic No. 1ET101120503 and 1ET101120413, Grant Agency of the Charles University No. 489/04, 350/05, 352/05 and 375/05 and the U.S. NSF Grant #IIS9732388.
+The Proprietor is the copyright holder of PDT 2.0 and is entitled to grant a license to the User.
+The User is an academic, educational or research institution, or other organization, or an individual wishing to make use of PDT 2.0 for research and/or education purposes.
+This agreement is made on the date of submission and effective immediately.
+The User is granted a non-exclusive license to use, modify, enlarge or enrich PDT 2.0 to extract information directly or indirectly in any form and volume, provided that PDT 2.0 itself or any derivative work is used only by the User her/himself or his/her immediate collaborators, employees, managers and/or her/his students from the same Institution for research purposes only, and provided she/he is continuously observing all the terms and conditions contained in this Agreement. If any part of PDT 2.0 contains its own license or an additional restriction, the more restrictive version and/or amendment of the license shall be in effect, unless specifically stated otherwise in such a part. In particular, all the documentation which is provided in either RTF, PDF or PostScript format should be considered a personal copy of the respective Author's reprint and handled as such.
+The User shall not use PDT 2.0 itself or any derivative work (including but not limited to statistics obtained by using it or any derivative work thereof) based on it (however small the contribution of PDT 2.0 to such derivative work is) in whatever form for commercial purposes of any kind, nor for a deployment in any routinely used application, regardless whether it is of commercial nature or not.
+The User shall include the following notice in all publications or publicly available materials, regardless of their form (printed, electronic, or other), describing work which uses PDT 2.0: "The Prague Dependency Treebank, version 2.0 has been developed by the Institute of Formal and Applied Linguistics, http://ufal.mff.cuni.cz/
." In the case of printed materials, such as papers, journal articles, etc., one publication most suitable for reference with regard to User's work should be included from the list in the PDT 2.0 documentation; in the case of electronic publications on the Internet, the reference to the aforementioned web page should be included as a web link. Due to Proprietor's obligations with regard to the text copyright holders, text examples and citations from PDT 2.0 or any derivative work (regardless whether they include any annotations or not) are limited to 200 words per publication or series of publications on the same topic (whether printed, electronic, or in any other form).
The User agrees not to re-distribute or otherwise make publicly available PDT 2.0, or any derivative work based on it as described in paragraph 3, to a third party without a prior written permission of the Proprietor, with the exception of examples and citations as described in paragraph 4.
+The User undertakes to adopt any security measures needed to protect the Proprietors' copyright in PDT 2.0 and undertakes to take all reasonable steps to ensure that no unauthorized use is made of PDT 2.0 and of any copies, derivative works or extracts thereof.
+Any usage of PDT 2.0 which does not conform to the specification set forth in the 3rd paragraph of this Agreement (such as, e.g., commercial usage of PDT 2.0) is subject of separate negotiations and a written contract between the User and the Proprietor and/or other parties. The Proprietor is in general not obliged to enter and/or conclude such negotiations.
+PDT 2.0 is provided as is. Therefore the Proprietor does not warrant the usefulness of PDT 2.0 for any purpose, regardless of formulations which can be found at some places in the accompanying documentation stating the intended purpose and use of PDT 2.0.
+If the User reports to the Proprietor any discovered errors, inconsistencies or suggested corrections or improvements to PDT 2.0, the Proprietor undertake: (a) to maintain these comments in confidence and to use them only for the purposes of improving, modifying and/or maintaining PDT 2.0, (b) not to disclose the comments except in confidence to those of their employees or directors who need to know the same for the aforesaid purpose.
+Should the Users by themselves or anyone acting on their behalf fail to comply with any of the conditions in this agreement (save with the written consent of the Proprietor) this agreement shall terminate immediately and PDT 2.0, its copies and derivative works based on it shall be destroyed at the User's site and at all sites under his control. Such termination shall be without prejudice to any claim which the Proprietor may have either for monies due and/or damages and/or otherwise.
+Failure by the Proprietor to exercise or enforce any rights in this agreement shall not be deemed to be a waiver of any such right nor operate so as to bar the exercise or enforcement thereof at any time or times thereafter.
+This agreement terminates if (a) the User destroys all copies of PDT 2.0 or any derivative work thereof, (b) the User or its Institution ceases to exist, unless all its obligations are transferred to a new entity, which is then considered to be bound by this Agreement. The User or its successor shall inform the Proprietor about any such transfer or succession; failure to do so will terminate this Agreement after one month after such transfer or succession. (c) the Proprietor ceases to exist without a legal successor.
+The Proprietor shall keep the information about the User provided when submitting this Agreement in confidentiality and will not disclose it to other parties, except in a summary form such that individual users will not be identified, unless they specifically agree to such a disclosure in writing.
+This agreement is governed by the laws of the Czech Republic and all disputes concerning this agreement will be resolved by its jurisdiction.
+XXXX XXXX
XXXX XXXX
XXXX XXXX
XXXX XXXX
XXXX XXXX
XXXX XXXX
XXXX XXXX
XXXX XXXX
+tools: +GNU General Public License, version 2, cf. file tools/LICENSE in tools.zip + +docs: +Apache license 2.0, cf. file docs/LICENSE in docs.zip + +Czech treebank: +Creative Commons BY-NC-SA 3.0, cf. file cs/LICENSE in universal-dependencies-1.0.tgz + +English treebank: +Creative Commons Attribution-ShareAlike 4.0 International license, cf. file en/LICENSE in universal-dependencies-1.0.tgz + +Finnish treebank: +Creative Commons Attribution-ShareAlike 4.0 International license, cf. file fi/LICENSE in universal-dependencies-1.0.tgz + +French treebank: +Creative Commons BY-NC-SA 3.0, cf. file fr/LICENSE in universal-dependencies-1.0.tgz + +German treebank: +Creative Commons BY-NC-SA 3.0, cf. file de/LICENSE in universal-dependencies-1.0.tgz + +Hungarian treebank: +Creative Commons BY-NC-SA 3.0, cf. file hu/LICENSE in universal-dependencies-1.0.tgz + +Irish treebank: +CC BY-SA 3.0, cf. file ga/LICENSE in universal-dependencies-1.0.tgz + +Italian treebank: +Creative Commons Attribution-ShareAlike 3.0 Unported, cf. file it/LICENSE in universal-dependencies-1.0.tgz + +Spanish treebank: +Creative Commons BY-NC-SA 3.0, cf. file es/LICENSE in universal-dependencies-1.0.tgz + +Swedish treebank: +CC BY-SA 3.0, cf. file sv/LICENSE in universal-dependencies-1.0.tgz ++ +
Universal Dependencies v2.6 (referred to as “UD” in the rest of this document) + is a collection of linguistic data and tools. Each of the treebanks has its own license terms + and you (the “User”) are responsible for complying with the license terms + applicable to those parts of UD which you use. If you do not agree with the license terms, + you must stop using UD and destroy all copies of UD data that you have obtained.
+You are specifically reminded that some of the treebanks + permit only non-commercial usage.
+The additional software tools are provided as-is (without any warranty) and are redistributed + under GNU GPL Version 2.
+The license for every treebank included in the release is specified in the appropriate + treebank directory.
+Treebank | License |
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Akkadian-PISANDUB | +CC BY-SA 4.0 | +
Albanian-TSA | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Assyrian-AS | +CC BY-SA 4.0 | +
Bambara-CRB | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Bhojpuri-BHTB | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +GNU GPL 3.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-GSD | +CC BY-SA 4.0 | +
Chinese-GSDSimp | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 3.0 | +
Classical_Chinese-Kyoto | +PD | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-GUMReddit | +CC BY 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-Pronouns | +CC BY-SA 4.0 | +
Erzya-JR | +CC BY-SA 4.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Estonian-EWT | +CC BY-NC-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
French-FQB | +LGPL-LR | +
French-FTB | +LGPL-LR | +
French-GSD | +CC BY-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-Sequoia | +LGPL-LR | +
French-Spoken | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPL-LR | +
German-GSD | +CC BY-SA 4.0 | +
German-HDT | +CC BY-SA 4.0 | +
German-LIT | +CC BY-NC-SA 4.0 | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hindi_English-HIENCS | +CC BY-SA 4.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Icelandic-PUD | +CC BY-SA 4.0 | +
Indonesian-GSD | +CC BY-SA 4.0 | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-PUD | +CC BY-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-TWITTIRO | +CC BY-SA 4.0 | +
Italian-VIT | +CC BY-NC-SA 3.0 | +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-SA 4.0 | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Karelian-KKPP | +CC BY-SA 4.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Komi_Permyak-UH | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-SA 4.0 | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-LLCT | +CC BY-SA 4.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latvian-LVTB | +CC BY-SA 4.0 | +
Lithuanian-ALKSNIS | +CC BY-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Livvi-KKPP | +CC BY-SA 4.0 | +
Maltese-MUDT | +CC BY-SA 4.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Mbya_Guarani-Dooley | +CC BY-NC-SA 4.0 | +
Mbya_Guarani-Thomas | +CC BY-NC-SA 4.0 | +
Moksha-JR | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Old_Russian-RNC | +CC BY-SA 4.0 | +
Old_Russian-TOROT | +CC BY-NC-SA 3.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-PDB | +CC BY-NC-SA 4.0 | +
Polish-PUD | +CC BY-SA 4.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-SA 4.0 | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-SiMoNERo | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Sanskrit-Vedic | +CC BY-SA 4.0 | +
Scottish_Gaelic-ARCOSG | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Skolt_Sami-Giellagas | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-GSD | +CC BY-SA 4.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | +
Swiss_German-UZH | +CC BY-SA 4.0 | +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tagalog-Ugnayan | +CC BY-NC-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Turkish-GB | +CC BY-SA 4.0 | +
Turkish-IMST | +CC BY-NC-SA 4.0 | +
Turkish-PUD | +CC BY-SA 3.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Welsh-CCG | +CC BY-SA 4.0 | +
Wolof-WTB | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
License | URL |
---|---|
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-NC-ND 3.0 | http://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
PD | public domain |
Universal Dependencies v2.7 (referred to as “UD” in the rest of this document) + is a collection of linguistic data and tools. Each of the treebanks has its own license terms + and you (the “User”) are responsible for complying with the license terms + applicable to those parts of UD which you use. If you do not agree with the license terms, + you must stop using UD and destroy all copies of UD data that you have obtained.
+You are specifically reminded that some of the treebanks + permit only non-commercial usage.
+The additional software tools are provided as-is (without any warranty) and are redistributed + under GNU GPL Version 2.
+The license for every treebank included in the release is specified in the appropriate + treebank directory.
+Treebank | License |
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Akkadian-PISANDUB | +CC BY-SA 4.0 | +
Akkadian-RIAO | +CC BY-SA 3.0 | +
Akuntsu-TuDeT | +CC BY-SA 4.0 | +
Albanian-TSA | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Apurina-UFPA | +CC BY-SA 4.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Assyrian-AS | +CC BY-SA 4.0 | +
Bambara-CRB | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Bhojpuri-BHTB | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +GNU GPL 3.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-GSD | +CC BY-SA 4.0 | +
Chinese-GSDSimp | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 3.0 | +
Chukchi-HSE | +CC BY-SA 4.0 | +
Classical_Chinese-Kyoto | +PD | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-GUMReddit | +CC BY 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-Pronouns | +CC BY-SA 4.0 | +
Erzya-JR | +CC BY-SA 4.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Estonian-EWT | +CC BY-NC-SA 4.0 | +
Faroese-FarPaHC | +CC BY-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-OOD | +CC BY-SA 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
French-FQB | +LGPL-LR | +
French-FTB | +LGPL-LR | +
French-GSD | +CC BY-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-Sequoia | +LGPL-LR | +
French-Spoken | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPL-LR | +
German-GSD | +CC BY-SA 4.0 | +
German-HDT | +CC BY-SA 4.0 | +
German-LIT | +CC BY-NC-SA 4.0 | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hindi_English-HIENCS | +CC BY-SA 4.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Icelandic-IcePaHC | +CC BY-SA 4.0 | +
Icelandic-PUD | +CC BY-SA 4.0 | +
Indonesian-CSUI | +CC BY-SA 4.0 | +
Indonesian-GSD | +CC BY-SA 4.0 | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-PUD | +CC BY-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-TWITTIRO | +CC BY-SA 4.0 | +
Italian-VIT | +CC BY-NC-SA 3.0 | +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-SA 4.0 | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Karelian-KKPP | +CC BY-SA 4.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Khunsari-AHA | +CC BY-SA 4.0 | +
Komi_Permyak-UH | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-SA 4.0 | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-LLCT | +CC BY-SA 4.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latvian-LVTB | +CC BY-SA 4.0 | +
Lithuanian-ALKSNIS | +CC BY-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Livvi-KKPP | +CC BY-SA 4.0 | +
Maltese-MUDT | +CC BY-SA 4.0 | +
Manx-Cadhan | +GNU GPL 3.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Mbya_Guarani-Dooley | +CC BY-NC-SA 4.0 | +
Mbya_Guarani-Thomas | +CC BY-NC-SA 4.0 | +
Moksha-JR | +CC BY-SA 4.0 | +
Munduruku-TuDeT | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
Nayini-AHA | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Old_Russian-RNC | +CC BY-SA 4.0 | +
Old_Russian-TOROT | +CC BY-NC-SA 3.0 | +
Old_Turkish-Tonqq | +CC0 1.0 | +
Persian-PerDT | +CC BY-SA 4.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-PDB | +CC BY-NC-SA 4.0 | +
Polish-PUD | +CC BY-SA 4.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-SA 4.0 | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-SiMoNERo | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Sanskrit-Vedic | +CC BY-SA 4.0 | +
Scottish_Gaelic-ARCOSG | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Skolt_Sami-Giellagas | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Soi-AHA | +CC BY-SA 4.0 | +
South_Levantine_Arabic-MADAR | +CC BY-SA 4.0 | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-GSD | +CC BY-SA 4.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | +
Swiss_German-UZH | +CC BY-SA 4.0 | +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tagalog-Ugnayan | +CC BY-NC-SA 4.0 | +
Tamil-MWTT | +CC BY-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Tupinamba-TuDeT | +CC BY-SA 4.0 | +
Turkish-BOUN | +CC BY-SA 4.0 | +
Turkish-GB | +CC BY-SA 4.0 | +
Turkish-IMST | +CC BY-NC-SA 4.0 | +
Turkish-PUD | +CC BY-SA 3.0 | +
Turkish_German-SAGT | +CC BY-NC-SA 4.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Welsh-CCG | +CC BY-SA 4.0 | +
Wolof-WTB | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
License | URL |
---|---|
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-NC-ND 3.0 | http://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC0 1.0 | http://creativecommons.org/publicdomain/zero/1.0/ |
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
PD | public domain |
Universal Dependencies v2.8 (referred to as “UD” in the rest of this document) + is a collection of linguistic data and tools. Each of the treebanks has its own license terms + and you (the “User”) are responsible for complying with the license terms + applicable to those parts of UD which you use. If you do not agree with the license terms, + you must stop using UD and destroy all copies of UD data that you have obtained.
+You are specifically reminded that some of the treebanks + permit only non-commercial usage.
+The additional software tools are provided as-is (without any warranty) and are redistributed + under GNU GPL Version 2.
+The license for every treebank included in the release is specified in the appropriate + treebank directory.
+Treebank | License |
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Akkadian-PISANDUB | +CC BY-SA 4.0 | +
Akkadian-RIAO | +CC BY-SA 3.0 | +
Akuntsu-TuDeT | +CC BY-SA 4.0 | +
Albanian-TSA | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Apurina-UFPA | +CC BY-SA 4.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Assyrian-AS | +CC BY-SA 4.0 | +
Bambara-CRB | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Beja-NSC | +CC BY-SA 4.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Bhojpuri-BHTB | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +GNU GPL 3.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-GSD | +CC BY-SA 4.0 | +
Chinese-GSDSimp | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 3.0 | +
Chukchi-HSE | +CC BY-SA 4.0 | +
Classical_Chinese-Kyoto | +PD | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-GUMReddit | +CC BY 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-Pronouns | +CC BY-SA 4.0 | +
Erzya-JR | +CC BY-SA 4.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Estonian-EWT | +CC BY-NC-SA 4.0 | +
Faroese-FarPaHC | +CC BY-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-OOD | +CC BY-SA 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
French-FQB | +LGPL-LR | +
French-FTB | +LGPL-LR | +
French-GSD | +CC BY-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-Sequoia | +LGPL-LR | +
French-Spoken | +CC BY-SA 4.0 | +
Frisian_Dutch-Fame | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPL-LR | +
German-GSD | +CC BY-SA 4.0 | +
German-HDT | +CC BY-SA 4.0 | +
German-LIT | +CC BY-NC-SA 4.0 | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Guajajara-TuDeT | +CC BY-SA 4.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hindi_English-HIENCS | +CC BY-SA 4.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Icelandic-IcePaHC | +CC BY-SA 4.0 | +
Icelandic-Modern | +CC BY-SA 4.0 | +
Icelandic-PUD | +CC BY-SA 4.0 | +
Indonesian-CSUI | +CC BY-SA 4.0 | +
Indonesian-GSD | +CC BY-SA 4.0 | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Irish-TwittIrish | +CC BY-SA 4.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-PUD | +CC BY-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-TWITTIRO | +CC BY-SA 4.0 | +
Italian-VIT | +CC BY-NC-SA 3.0 | +
Italian-Valico | +CC BY-SA 4.0 | +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-SA 4.0 | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Kaapor-TuDeT | +CC BY-SA 4.0 | +
Kangri-KDTB | +CC BY-SA 4.0 | +
Karelian-KKPP | +CC BY-SA 4.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Khunsari-AHA | +CC BY-SA 4.0 | +
Kiche-IU | +CC BY-SA 4.0 | +
Komi_Permyak-UH | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-SA 4.0 | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-LLCT | +CC BY-SA 4.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latin-UDante | +CC BY-NC-SA 3.0 | +
Latvian-LVTB | +CC BY-SA 4.0 | +
Lithuanian-ALKSNIS | +CC BY-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Livvi-KKPP | +CC BY-SA 4.0 | +
Low_Saxon-LSDC | +CC BY-SA 4.0 | +
Makurap-TuDeT | +CC BY-SA 4.0 | +
Maltese-MUDT | +CC BY-SA 4.0 | +
Manx-Cadhan | +GNU GPL 3.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Mbya_Guarani-Dooley | +CC BY-NC-SA 4.0 | +
Mbya_Guarani-Thomas | +CC BY-NC-SA 4.0 | +
Moksha-JR | +CC BY-SA 4.0 | +
Munduruku-TuDeT | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
Nayini-AHA | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | +
Old_East_Slavic-RNC | +CC BY-SA 4.0 | +
Old_East_Slavic-TOROT | +CC BY-NC-SA 3.0 | +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Old_Turkish-Tonqq | +CC0 1.0 | +
Persian-PerDT | +CC BY-SA 4.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-PDB | +CC BY-NC-SA 4.0 | +
Polish-PUD | +CC BY-SA 4.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-SA 4.0 | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-ArT | +CC BY-SA 4.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-SiMoNERo | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Sanskrit-Vedic | +CC BY-SA 4.0 | +
Scottish_Gaelic-ARCOSG | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Skolt_Sami-Giellagas | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Soi-AHA | +CC BY-SA 4.0 | +
South_Levantine_Arabic-MADAR | +CC BY-SA 4.0 | +
Spanish-AnCora | +GNU GPL 3.0 | +
Spanish-GSD | +CC BY-SA 4.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | +
Swiss_German-UZH | +CC BY-SA 4.0 | +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tagalog-Ugnayan | +CC BY-NC-SA 4.0 | +
Tamil-MWTT | +CC BY-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Tupinamba-TuDeT | +CC BY-SA 4.0 | +
Turkish-BOUN | +CC BY-SA 4.0 | +
Turkish-FrameNet | +CC BY-SA 4.0 | +
Turkish-GB | +CC BY-SA 4.0 | +
Turkish-IMST | +CC BY-NC-SA 4.0 | +
Turkish-Kenet | +CC BY-SA 4.0 | +
Turkish-PUD | +CC BY-SA 3.0 | +
Turkish-Penn | +CC BY-SA 4.0 | +
Turkish-Tourism | +CC BY-SA 4.0 | +
Turkish_German-SAGT | +CC BY-NC-SA 4.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Welsh-CCG | +CC BY-SA 4.0 | +
Western_Armenian-ArmTDP | +CC BY-SA 4.0 | +
Wolof-WTB | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
Yupik-SLI | +CC BY-SA 4.0 | +
License | URL |
---|---|
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-NC-ND 3.0 | http://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC0 1.0 | http://creativecommons.org/publicdomain/zero/1.0/ |
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
PD | public domain |
Universal Dependencies v2.9 (referred to as “UD” in the rest of this document) + is a collection of linguistic data and tools. Each of the treebanks has its own license terms + and you (the “User”) are responsible for complying with the license terms + applicable to those parts of UD which you use. If you do not agree with the license terms, + you must stop using UD and destroy all copies of UD data that you have obtained.
+You are specifically reminded that some of the treebanks + permit only non-commercial usage.
+The additional software tools are provided as-is (without any warranty) and are redistributed + under GNU GPL Version 2.
+The license for every treebank included in the release is specified in the appropriate + treebank directory.
+Treebank | License |
---|---|
Afrikaans-AfriBooms | +CC BY-SA 4.0 | +
Akkadian-PISANDUB | +CC BY-SA 4.0 | +
Akkadian-RIAO | +CC BY-SA 3.0 | +
Akuntsu-TuDeT | +CC BY-SA 4.0 | +
Albanian-TSA | +CC BY-SA 4.0 | +
Amharic-ATT | +CC BY-SA 4.0 | +
Ancient_Greek-PROIEL | +CC BY-NC-SA 3.0 | +
Ancient_Greek-Perseus | +CC BY-NC-SA 2.5 | +
Apurina-UFPA | +CC BY-SA 4.0 | +
Arabic-NYUAD | +CC BY-SA 4.0 | +
Arabic-PADT | +CC BY-NC-SA 3.0 | +
Arabic-PUD | +CC BY-SA 3.0 | +
Armenian-ArmTDP | +CC BY-SA 4.0 | +
Armenian-BSUT | +CC BY-SA 4.0 | +
Assyrian-AS | +CC BY-SA 4.0 | +
Bambara-CRB | +CC BY-SA 4.0 | +
Basque-BDT | +CC BY-NC-SA 3.0 | +
Beja-NSC | +CC BY-SA 4.0 | +
Belarusian-HSE | +CC BY-SA 4.0 | +
Bengali-BRU | +CC BY-SA 4.0 | +
Bhojpuri-BHTB | +CC BY-SA 4.0 | +
Breton-KEB | +CC BY-SA 4.0 | +
Bulgarian-BTB | +CC BY-NC-SA 3.0 | +
Buryat-BDT | +CC BY-SA 4.0 | +
Cantonese-HK | +CC BY-SA 4.0 | +
Catalan-AnCora | +CC BY 4.0 | +
Chinese-CFL | +CC BY-SA 4.0 | +
Chinese-GSD | +CC BY-SA 4.0 | +
Chinese-GSDSimp | +CC BY-SA 4.0 | +
Chinese-HK | +CC BY-SA 4.0 | +
Chinese-PUD | +CC BY-SA 3.0 | +
Chukchi-HSE | +CC BY-SA 4.0 | +
Classical_Chinese-Kyoto | +PD | +
Coptic-Scriptorium | +CC BY 4.0 | +
Croatian-SET | +CC BY-SA 4.0 | +
Czech-CAC | +CC BY-SA 4.0 | +
Czech-CLTT | +CC BY-SA 4.0 | +
Czech-FicTree | +CC BY-NC-SA 4.0 | +
Czech-PDT | +CC BY-NC-SA 3.0 | +
Czech-PUD | +CC BY-SA 4.0 | +
Danish-DDT | +CC BY-SA 4.0 | +
Dutch-Alpino | +CC BY-SA 4.0 | +
Dutch-LassySmall | +CC BY-SA 4.0 | +
English-Atis | +CC BY-SA 4.0 | +
English-ESL | +CC BY-SA 4.0 | +
English-EWT | +CC BY-SA 4.0 | +
English-GUM | +CC BY-NC-SA 4.0 | +
English-GUMReddit | +CC BY 4.0 | +
English-LinES | +CC BY-NC-SA 4.0 | +
English-PUD | +CC BY-SA 3.0 | +
English-ParTUT | +CC BY-NC-SA 4.0 | +
English-Pronouns | +CC BY-SA 4.0 | +
Erzya-JR | +CC BY-SA 4.0 | +
Estonian-EDT | +CC BY-NC-SA 4.0 | +
Estonian-EWT | +CC BY-NC-SA 4.0 | +
Faroese-FarPaHC | +CC BY-SA 4.0 | +
Faroese-OFT | +CC BY-SA 4.0 | +
Finnish-FTB | +CC BY 4.0 | +
Finnish-OOD | +CC BY-SA 4.0 | +
Finnish-PUD | +CC BY-SA 4.0 | +
Finnish-TDT | +CC BY-SA 4.0 | +
French-FQB | +LGPL-LR | +
French-FTB | +LGPL-LR | +
French-GSD | +CC BY-SA 4.0 | +
French-PUD | +CC BY-SA 3.0 | +
French-ParTUT | +CC BY-NC-SA 4.0 | +
French-ParisStories | +CC BY-SA 4.0 | +
French-Rhapsodie | +CC BY-SA 4.0 | +
French-Sequoia | +LGPL-LR | +
Frisian_Dutch-Fame | +CC BY-SA 4.0 | +
Galician-CTG | +CC BY-NC-SA 3.0 | +
Galician-TreeGal | +LGPL-LR | +
German-GSD | +CC BY-SA 4.0 | +
German-HDT | +CC BY-SA 4.0 | +
German-LIT | +CC BY-NC-SA 4.0 | +
German-PUD | +CC BY-SA 3.0 | +
Gothic-PROIEL | +CC BY-NC-SA 3.0 | +
Greek-GDT | +CC BY-NC-SA 3.0 | +
Guajajara-TuDeT | +CC BY-SA 4.0 | +
Hebrew-HTB | +CC BY-NC-SA 4.0 | +
Hindi-HDTB | +CC BY-NC-SA 4.0 | +
Hindi-PUD | +CC BY-SA 3.0 | +
Hindi_English-HIENCS | +CC BY-SA 4.0 | +
Hungarian-Szeged | +CC BY-NC-SA 3.0 | +
Icelandic-IcePaHC | +CC BY-SA 4.0 | +
Icelandic-Modern | +CC BY-SA 4.0 | +
Icelandic-PUD | +CC BY-SA 4.0 | +
Indonesian-CSUI | +CC BY-SA 4.0 | +
Indonesian-GSD | +CC BY-SA 4.0 | +
Indonesian-PUD | +CC BY-SA 3.0 | +
Irish-IDT | +CC BY-SA 3.0 | +
Irish-TwittIrish | +CC BY-SA 4.0 | +
Italian-ISDT | +CC BY-NC-SA 3.0 | +
Italian-PUD | +CC BY-SA 3.0 | +
Italian-ParTUT | +CC BY-NC-SA 4.0 | +
Italian-PoSTWITA | +CC BY-NC-SA 4.0 | +
Italian-TWITTIRO | +CC BY-SA 4.0 | +
Italian-VIT | +CC BY-NC-SA 3.0 | +
Italian-Valico | +CC BY-SA 4.0 | +
Japanese-BCCWJ | +CC BY-NC-SA 4.0 | +
Japanese-BCCWJLUW | +CC BY-NC-SA 4.0 | +
Japanese-GSD | +CC BY-SA 4.0 | +
Japanese-GSDLUW | +CC BY-SA 4.0 | +
Japanese-Modern | +CC BY-NC-ND 3.0 | +
Japanese-PUD | +CC BY-SA 3.0 | +
Japanese-PUDLUW | +CC BY-SA 3.0 | +
Javanese-CSUI | +CC BY-SA 4.0 | +
Kaapor-TuDeT | +CC BY-SA 4.0 | +
Kangri-KDTB | +CC BY-SA 4.0 | +
Karelian-KKPP | +CC BY-SA 4.0 | +
Karo-TuDeT | +CC BY-SA 4.0 | +
Kazakh-KTB | +CC BY-SA 4.0 | +
Khunsari-AHA | +CC BY-SA 4.0 | +
Kiche-IU | +CC BY-SA 4.0 | +
Komi_Permyak-UH | +CC BY-SA 4.0 | +
Komi_Zyrian-IKDP | +CC BY-SA 4.0 | +
Komi_Zyrian-Lattice | +CC BY-SA 4.0 | +
Korean-GSD | +CC BY-SA 4.0 | +
Korean-Kaist | +CC BY-SA 4.0 | +
Korean-PUD | +CC BY-SA 3.0 | +
Kurmanji-MG | +CC BY-SA 4.0 | +
Latin-ITTB | +CC BY-NC-SA 3.0 | +
Latin-LLCT | +CC BY-SA 4.0 | +
Latin-PROIEL | +CC BY-NC-SA 3.0 | +
Latin-Perseus | +CC BY-NC-SA 2.5 | +
Latin-UDante | +CC BY-NC-SA 3.0 | +
Latvian-LVTB | +CC BY-SA 4.0 | +
Ligurian-GLT | +C-UDA 1.0 | +
Lithuanian-ALKSNIS | +CC BY-SA 4.0 | +
Lithuanian-HSE | +CC BY-SA 4.0 | +
Livvi-KKPP | +CC BY-SA 4.0 | +
Low_Saxon-LSDC | +CC BY-SA 4.0 | +
Makurap-TuDeT | +CC BY-SA 4.0 | +
Maltese-MUDT | +CC BY-SA 4.0 | +
Manx-Cadhan | +GNU GPL 3.0 | +
Marathi-UFAL | +CC BY-SA 4.0 | +
Mbya_Guarani-Dooley | +CC BY-NC-SA 4.0 | +
Mbya_Guarani-Thomas | +CC BY-NC-SA 4.0 | +
Moksha-JR | +CC BY-SA 4.0 | +
Munduruku-TuDeT | +CC BY-SA 4.0 | +
Naija-NSC | +CC BY-SA 4.0 | +
Nayini-AHA | +CC BY-SA 4.0 | +
Neapolitan-RB | +CC BY-SA 4.0 | +
North_Sami-Giella | +CC BY-SA 4.0 | +
Norwegian-Bokmaal | +CC BY-SA 4.0 | +
Norwegian-Nynorsk | +CC BY-SA 4.0 | +
Norwegian-NynorskLIA | +CC BY-SA 4.0 | +
Old_Church_Slavonic-PROIEL | +CC BY-NC-SA 3.0 | +
Old_East_Slavic-RNC | +CC BY-SA 4.0 | +
Old_East_Slavic-TOROT | +CC BY-NC-SA 3.0 | +
Old_French-SRCMF | +CC BY-NC-SA 3.0 | +
Old_Turkish-Tonqq | +CC0 1.0 | +
Persian-PerDT | +CC BY-SA 4.0 | +
Persian-Seraji | +CC BY-SA 4.0 | +
Polish-LFG | +GNU GPL 3.0 | +
Polish-PDB | +CC BY-NC-SA 4.0 | +
Polish-PUD | +CC BY-SA 4.0 | +
Portuguese-Bosque | +CC BY-SA 4.0 | +
Portuguese-GSD | +CC BY-SA 4.0 | +
Portuguese-PUD | +CC BY-SA 3.0 | +
Romanian-ArT | +CC BY-SA 4.0 | +
Romanian-Nonstandard | +CC BY-SA 4.0 | +
Romanian-RRT | +CC BY-SA 4.0 | +
Romanian-SiMoNERo | +CC BY-SA 4.0 | +
Russian-GSD | +CC BY-SA 4.0 | +
Russian-PUD | +CC BY-SA 3.0 | +
Russian-SynTagRus | +CC BY-NC-SA 4.0 | +
Russian-Taiga | +CC BY-SA 4.0 | +
Sanskrit-UFAL | +CC BY-SA 4.0 | +
Sanskrit-Vedic | +CC BY-SA 4.0 | +
Scottish_Gaelic-ARCOSG | +CC BY-SA 4.0 | +
Serbian-SET | +CC BY-SA 4.0 | +
Skolt_Sami-Giellagas | +CC BY-SA 4.0 | +
Slovak-SNK | +CC BY-SA 4.0 | +
Slovenian-SSJ | +CC BY-NC-SA 4.0 | +
Slovenian-SST | +CC BY-NC-SA 4.0 | +
Soi-AHA | +CC BY-SA 4.0 | +
South_Levantine_Arabic-MADAR | +CC BY-SA 4.0 | +
Spanish-AnCora | +CC BY 4.0 | +
Spanish-GSD | +CC BY-SA 4.0 | +
Spanish-PUD | +CC BY-SA 3.0 | +
Swedish-LinES | +CC BY-NC-SA 4.0 | +
Swedish-PUD | +CC BY-SA 4.0 | +
Swedish-Talbanken | +CC BY-SA 4.0 | +
Swedish_Sign_Language-SSLC | +CC BY-SA 4.0 | +
Swiss_German-UZH | +CC BY-SA 4.0 | +
Tagalog-TRG | +CC BY-SA 4.0 | +
Tagalog-Ugnayan | +CC BY-NC-SA 4.0 | +
Tamil-MWTT | +CC BY-SA 4.0 | +
Tamil-TTB | +CC BY-NC-SA 3.0 | +
Tatar-NMCTT | +CC BY-SA 4.0 | +
Telugu-MTG | +CC BY-SA 4.0 | +
Thai-PUD | +CC BY-SA 3.0 | +
Tupinamba-TuDeT | +CC BY-SA 4.0 | +
Turkish-Atis | +CC BY-SA 4.0 | +
Turkish-BOUN | +CC BY-SA 4.0 | +
Turkish-FrameNet | +CC BY-SA 4.0 | +
Turkish-GB | +CC BY-SA 4.0 | +
Turkish-IMST | +CC BY-NC-SA 4.0 | +
Turkish-Kenet | +CC BY-SA 4.0 | +
Turkish-PUD | +CC BY-SA 3.0 | +
Turkish-Penn | +CC BY-SA 4.0 | +
Turkish-Tourism | +CC BY-SA 4.0 | +
Turkish_German-SAGT | +CC BY-NC-SA 4.0 | +
Ukrainian-IU | +CC BY-NC-SA 4.0 | +
Upper_Sorbian-UFAL | +CC BY-SA 4.0 | +
Urdu-UDTB | +CC BY-NC-SA 4.0 | +
Uyghur-UDT | +CC BY-SA 4.0 | +
Vietnamese-VTB | +CC BY-SA 4.0 | +
Warlpiri-UFAL | +CC BY-SA 4.0 | +
Welsh-CCG | +CC BY-SA 4.0 | +
Western_Armenian-ArmTDP | +CC BY-SA 4.0 | +
Wolof-WTB | +CC BY-SA 4.0 | +
Xibe-XDT | +CC BY-NC-SA 3.0 | +
Yakut-YKTDT | +CC BY-SA 4.0 | +
Yoruba-YTB | +CC BY-SA 4.0 | +
Yupik-SLI | +CC BY-SA 4.0 | +
License | URL |
---|---|
C-UDA 1.0 | https://cdla.dev/computational-use-of-data-agreement-v1-0/ |
CC BY 4.0 | http://creativecommons.org/licenses/by/4.0/ |
CC BY-NC-ND 3.0 | http://creativecommons.org/licenses/by-nc-nd/3.0/ |
CC BY-NC-SA 2.5 | http://creativecommons.org/licenses/by-nc-sa/2.5/ |
CC BY-NC-SA 3.0 | http://creativecommons.org/licenses/by-nc-sa/3.0/ |
CC BY-NC-SA 4.0 | http://creativecommons.org/licenses/by-nc-sa/4.0/ |
CC BY-SA 3.0 | http://creativecommons.org/licenses/by-sa/3.0/ |
CC BY-SA 4.0 | http://creativecommons.org/licenses/by-sa/4.0/ |
CC0 1.0 | http://creativecommons.org/publicdomain/zero/1.0/ |
GNU GPL 2.0 | http://opensource.org/licenses/GPL-2.0 |
GNU GPL 3.0 | http://opensource.org/licenses/GPL-3.0 |
LGPL-LR | http://www.ida.liu.se/~sarst/bitse/lgpllr.html |
PD | public domain |