The Data Lake seems to have no data for many (most?) wikis.
-- Row count per wiki in the "2017-04" snapshot of wmf.mediawiki_history,
-- limited to a sample of nine wikis and to rows whose event_timestamp
-- compares >= "201701".
-- The count column is deliberately left unaliased, so it is reported under
-- the engine-generated name.
select
    wiki_db,
    count(*)
from wmf.mediawiki_history
where snapshot = "2017-04"
    and wiki_db in (
        "arwiki", "cswiki", "commonswiki",
        "dawiki", "enwiki", "enwiktionary",
        "kowiki", "itwiki", "zhwiki"
    )
    and event_timestamp >= "201701"
group by
    wiki_db;
wiki_db _c1
commonswiki 18474976
enwiki 22939154
dawiki 248147
3 rows selected (60.582 seconds)

This applies to older snapshots and older data too:
-- Row count per wiki in the "2017-02" snapshot of wmf.mediawiki_history,
-- limited to a sample of nine wikis and to rows whose event_timestamp
-- compares >= "201601".
-- The count column is deliberately left unaliased, so it is reported under
-- the engine-generated name.
select
    wiki_db,
    count(*)
from wmf.mediawiki_history
where snapshot = "2017-02"
    and wiki_db in (
        "arwiki", "cswiki", "commonswiki",
        "dawiki", "enwiki", "enwiktionary",
        "kowiki", "itwiki", "zhwiki"
    )
    and event_timestamp >= "201601"
group by
    wiki_db;
wiki_db _c1
enwiki 79402391
commonswiki 64383940
dawiki 632861
3 rows selected (84.672 seconds)

However, the pre-Labs snapshots seem to be fine.
-- Row count per wiki in the "2016-12_private" snapshot of
-- wmf.mediawiki_history, limited to a sample of nine wikis and to rows whose
-- event_timestamp compares >= "201601".
-- The count column is deliberately left unaliased, so it is reported under
-- the engine-generated name.
select
    wiki_db,
    count(*)
from wmf.mediawiki_history
where snapshot = "2016-12_private"
    and wiki_db in (
        "arwiki", "cswiki", "commonswiki",
        "dawiki", "enwiki", "enwiktionary",
        "kowiki", "itwiki", "zhwiki"
    )
    and event_timestamp >= "201601"
group by
    wiki_db;
wiki_db _c1
enwiktionary 7029529
dawiki 514631
commonswiki 54721834
zhwiki 4568247
cswiki 1466825
itwiki 8224350
arwiki 4918431
enwiki 67648716
kowiki 2847875
9 rows selected (95.034 seconds)