summary refs log tree commit diff
path: root/corpus/bbcarabic
diff options
context:
space:
mode:
author Lars-Dominik Braun <lars@6xq.net> 2020-05-10 10:48:38 +0200
committer Lars-Dominik Braun <lars@6xq.net> 2020-05-10 10:49:23 +0200
commit 244197b5f8b1f4d73d4ab9ac838334860b55662c (patch)
tree ce2d8cd63289f3457f227adea6fbcb0896e8dc26 /corpus/bbcarabic
parent 58a062d4f93b2ba362a94522d1a9b8e7c7f13469 (diff)
download lulua-244197b5f8b1f4d73d4ab9ac838334860b55662c.tar.gz
lulua-244197b5f8b1f4d73d4ab9ac838334860b55662c.tar.bz2
lulua-244197b5f8b1f4d73d4ab9ac838334860b55662c.zip
report: Add translated source table, asymmetry definition
Also fix the layout break point.
Diffstat (limited to 'corpus/bbcarabic')
-rw-r--r-- corpus/bbcarabic/metadata.yaml 10
1 files changed, 8 insertions, 2 deletions
diff --git a/corpus/bbcarabic/metadata.yaml b/corpus/bbcarabic/metadata.yaml
index d1c06a5..085b80f 100644
--- a/corpus/bbcarabic/metadata.yaml
+++ b/corpus/bbcarabic/metadata.yaml
@@ -1,7 +1,13 @@
source:
- name: BBC Arabic
+ name:
+ en: BBC Arabic
+ ar: بي بي سي العربية
url: http://www.bbc.com/arabic
extractor:
name: Custom scripts
date: 2019-07
-count: [149901, articles]
+count:
+ num: 149901
+ kind:
+ en: articles
+ ar: مقالة