summary refs log tree commit diff
path: root/corpus/arwiki
diff options
context:
space:
mode:
author Lars-Dominik Braun <lars@6xq.net> 2020-05-10 10:48:38 +0200
committer Lars-Dominik Braun <lars@6xq.net> 2020-05-10 10:49:23 +0200
commit 244197b5f8b1f4d73d4ab9ac838334860b55662c (patch)
tree ce2d8cd63289f3457f227adea6fbcb0896e8dc26 /corpus/arwiki
parent 58a062d4f93b2ba362a94522d1a9b8e7c7f13469 (diff)
download lulua-244197b5f8b1f4d73d4ab9ac838334860b55662c.tar.gz
lulua-244197b5f8b1f4d73d4ab9ac838334860b55662c.tar.bz2
lulua-244197b5f8b1f4d73d4ab9ac838334860b55662c.zip
report: Add translated source table, asymmetry definition
Also fix the layout break point.
Diffstat (limited to 'corpus/arwiki')
-rw-r--r-- corpus/arwiki/metadata.yaml 10
1 files changed, 8 insertions, 2 deletions
diff --git a/corpus/arwiki/metadata.yaml b/corpus/arwiki/metadata.yaml
index 2a1ff72..b033919 100644
--- a/corpus/arwiki/metadata.yaml
+++ b/corpus/arwiki/metadata.yaml
@@ -1,8 +1,14 @@
source:
- name: Arabic Wikipedia
+ name:
+ en: Arabic Wikipedia
+ ar: ويكيبيديا العربية
url: https://ar.wikipedia.org/
extractor:
name: wikiextractor
url: https://github.com/attardi/wikiextractor/tree/3162bb6c3c9ebd2d15be507aa11d6fa818a454ac
date: 2019-07-01
-count: [857386, articles]
+count:
+ num: 857386
+ kind:
+ en: articles
+ ar: مقالة