SQL
x
-- Resultset 1: summary
SELECT is_biographical, COUNT(*) AS number_of_articles, AVG(number_of_categories), STDDEV(number_of_categories), MIN(number_of_categories), MAX(number_of_categories)
FROM
(
SELECT (EXISTS (SELECT 1
FROM categorylinks isbio
WHERE isbio.cl_to LIKE '%birth%'
AND isbio.cl_from=artpage.page_id)) AS is_biographical,
(SELECT COUNT(*)
FROM categorylinks countcats
JOIN page catpage
ON catpage.page_namespace=14 AND catpage.page_title=countcats.cl_to
LEFT JOIN page_props
ON pp_page=catpage.page_id AND pp_propname='hiddencat'
WHERE countcats.cl_from=artpage.page_id
AND pp_propname IS NULL) AS number_of_categories,
artpage.page_len,
artpage.page_title AS article
FROM page artpage
WHERE artpage.page_id IN (SELECT page_id
FROM page
WHERE page_namespace=0
AND page_is_redirect=0
AND page_random BETWEEN 0.5 AND 0.51)
GROUP BY is_biographical,
artpage.page_len,
article
) sq
GROUP BY is_biographical;
-- Resultset 2: data - same as the large subquery above
SELECT (EXISTS (SELECT 1
FROM categorylinks isbio
WHERE isbio.cl_to LIKE '%birth%'
AND isbio.cl_from=artpage.page_id)) AS is_biographical,
(SELECT COUNT(*)
FROM categorylinks countcats
JOIN page catpage
ON catpage.page_namespace=14 AND catpage.page_title=countcats.cl_to
LEFT JOIN page_props
ON pp_page=catpage.page_id AND pp_propname='hiddencat'
WHERE countcats.cl_from=artpage.page_id
AND pp_propname IS NULL) AS number_of_categories,
artpage.page_len,
artpage.page_title AS article
FROM page artpage
WHERE artpage.page_id IN (SELECT page_id
FROM page
WHERE page_namespace=0
AND page_is_redirect=0
AND page_random BETWEEN 0.5 AND 0.51)
GROUP BY is_biographical,
artpage.page_len,
article;
By running queries you agree to the Cloud Services Terms of Use and you irrevocably agree to release your SQL under CC0 License.
All SQL code is licensed under CC0 License.