Toggle navigation
Home
New Query
Recent Queries
Discuss
Database tables
Database names
MediaWiki
Wikibase
Replicas browser and optimizer
Login
History
Fork
Fork of
Bad links from wikis to c, m, mw, species: disambigs
by
Achim55
This query is marked as a draft
This query has been published
by
Achim55
.
Toggle Highlighting
SQL
USE dewiki_p; #USE dewikisource_p; #USE dewikivoyage_p; #USE dewiktionary_p; #USE enwiki_p; #USE eswiki_p; #USE frwiki_p; #USE itwiki_p; #USE nlwiki_p; #USE svwiki_p; #USE specieswiki_p; SET @w = LEFT (DATABASE(), LENGTH(DATABASE()) - 2); SET @l = (SELECT lang FROM meta_p.wiki WHERE dbname = @w); SET @lenm = LENGTH('https://meta.wikimedia.org/wiki/'); SET @lenmw = LENGTH('https://www.mediawiki.org/wiki/'); SET @lenspec = LENGTH('https://species.wikimedia.org/wiki/'); #white list SET @pm = '^$'; SET @pmw = '^$'; SET @pspec = '^$'; #dummies IF (@w = 'dewiki') THEN SET @pspec = '^Wikispecies$'; ELSEIF (@w = 'enwiki') THEN SET @pm = '(?:^Copy_to_|^Copy_section_to_Wikisource$|^Main_Page$|^Outline_of_Wikipedia$|^Wikipedia_statistics$)'; SET @pmw = '(?:^Main_Page$|^Outline_of_Wikipedia$)'; SET @pspec = '(^C\._elegans_.disambiguation.$|^Main_Page$|^Outline_of_Wikipedia$)'; ELSEIF (@w = 'itwiki') THEN SET @pspec = '^Utenti_'; END IF; SELECT now() AS timestamp; ##### Meta ##### #empty links, no target given (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[m:', REPLACE (iwl_title, '_', ' '), ']]') AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_title NOT REGEXP @pm WHERE iwl_prefix IN ('m', 'meta', 'metawikipedia') AND iwl_title REGEXP '^ *$' ) UNION #broken interwiki links (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[m:', REPLACE (iwl_title, '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = iwl_title), '?cat?', '')) AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @pm WHERE iwl_prefix IN ('m', 'meta', 'metawikipedia') AND iwl_title NOT LIKE '%:%' #temp AND NOT EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_title = iwl_title AND cp.page_namespace = 0) ) UNION #broken external links (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[m:', REPLACE ((SUBSTRING(REPLACE (el_to, CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenm + 1, @lenm))), '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = (SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenm + 1, @lenm)))), '?cat?', '')) AS wikipage FROM externallinks INNER JOIN page wp ON wp.page_id = el_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @pm WHERE ((el_to LIKE 'https://meta.wikimedia.org/wiki/%') OR (el_to LIKE 'http://meta.wikimedia.org/wiki/%')) AND el_to NOT LIKE '%//meta.wikimedia.org/wiki/%:%' #temp AND el_to NOT LIKE '%#%' #temp AND el_to NOT LIKE '%\%%' #temp AND NOT EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_namespace = 0 AND cp.page_title = SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenm + 1, @lenm)) ) ) UNION ##### MediaWiki ##### #empty links, no target given (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[mw:', REPLACE (iwl_title, '_', ' '), ']]') AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_title NOT REGEXP @pmw WHERE iwl_prefix IN ('mw', 'mediawiki', 'mediawikiwiki') AND iwl_title REGEXP '^ *$' ) UNION #broken interwiki links (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[mw:', REPLACE (iwl_title, '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = iwl_title), '?cat?', '')) AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @pmw WHERE iwl_prefix IN ('mw', 'mediawiki', 'mediawikiwiki') AND iwl_title NOT LIKE '%:%' #temp AND NOT EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_title = iwl_title AND cp.page_namespace = 0) ) UNION #broken external links (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[mw:', REPLACE ((SUBSTRING(REPLACE (el_to, CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenmw + 1, @lenmw))), '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = (SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenmw + 1, @lenmw)))), '?cat?', '')) AS wikipage FROM externallinks INNER JOIN page wp ON wp.page_id = el_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @pmw WHERE ((el_to LIKE 'https://www.mediawiki.org/wiki/%') OR (el_to LIKE 'http://www.mediawiki.org/wiki/%')) AND el_to NOT LIKE '%//www.mediawiki.org/wiki/%:%' #temp AND el_to NOT LIKE '%#%' #temp AND el_to NOT LIKE '%\%%' #temp AND NOT EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_namespace = 0 AND cp.page_title = SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenmw + 1, @lenmw)) ) ) UNION #empty links, no target given (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[species:', REPLACE (iwl_title, '_', ' '), ']]') AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_title NOT REGEXP @pspec WHERE iwl_prefix IN ('species', 'wikispecies') AND iwl_title REGEXP '^ *$' ) UNION #broken interwiki links (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[species:', REPLACE (iwl_title, '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = iwl_title), '?cat?', '')) AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @pspec WHERE iwl_prefix IN ('species', 'wikispecies') AND iwl_title NOT LIKE '%:%' #temp AND NOT EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_title = iwl_title AND cp.page_namespace = 0) ) UNION #broken external links (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[species:', REPLACE ((SUBSTRING(REPLACE (el_to, CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenspec + 1, @lenspec))), '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = (SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenspec + 1, @lenspec)))), '?cat?', '')) AS wikipage FROM externallinks INNER JOIN page wp ON wp.page_id = el_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @pspec WHERE ((el_to LIKE 'https://species.wikimedia.org/wiki/%') OR (el_to LIKE 'http://species.wikimedia.org/wiki/%')) AND el_to NOT LIKE '%//species.wikimedia.org/wiki/%:%' #temp AND el_to NOT LIKE '%#%' #temp AND el_to NOT LIKE '%\%%' #temp AND NOT EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_namespace = 0 AND cp.page_title = SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenspec + 1, @lenspec)) ) ) ORDER BY wikipage LIMIT 1000;
By running queries you agree to the
Cloud Services Terms of Use
and you irrevocably agree to release your SQL under
CC0 License
.
Submit Query
Stop Query
All SQL code is licensed under
CC0 License
.
Checking query status...