Toggle navigation
Home
New Query
Recent Queries
Discuss
Database tables
Database names
MediaWiki
Wikibase
Replicas browser and optimizer
Login
History
Fork
Fork of
Bad links from wikis to c, m, mw, species: disambigs
by
Achim55
This query is marked as a draft
This query has been published
by
Achim55
.
Toggle Highlighting
SQL
USE dewiki_p; #USE dewikisource_p; #USE dewikivoyage_p; #USE dewiktionary_p; #USE enwiki_p; #USE eswiki_p; #USE frwiki_p; #USE itwiki_p; #USE nlwiki_p; SET @w = LEFT (DATABASE(), LENGTH(DATABASE()) - 2); SET @l = (SELECT lang FROM meta_p.wiki WHERE dbname = @w); SET @lenm = LENGTH('https://meta.wikimedia.org/wiki/'); SET @lenmw = LENGTH('https://www.mediawiki.org/wiki/'); SET @lenspec = LENGTH('https://species.wikimedia.org/wiki/'); SET @p = '^$'; #dummy IF (@w = 'dewiki') THEN SET @p = '^Wikispecies$'; ELSEIF (@w = 'enwiki') THEN SET @p = '(?:^Copy_to_|^Copy_section_to_Wikisource$|^Main_Page$|^Outline_of_Wikipedia$|^Wikipedia_statistics$)'; #ELSEIF (@w = 'frwiki') THEN # SET @p = '^[0-9]{4}'; #ELSEIF (@w = 'nlwiki') THEN # SET @p = 'Wikipedia:Commonscat_'; END IF; SELECT now() AS timestamp; #empty links, no target given (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:m:', REPLACE (iwl_title, '_', ' '), ']]') AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_title NOT REGEXP @p WHERE iwl_prefix IN ('m', 'meta', 'metawikipedia') AND iwl_title REGEXP '^ *$' ) UNION (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:mw:', REPLACE (iwl_title, '_', ' '), ']]') AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_title NOT REGEXP @p WHERE iwl_prefix IN ('mw', 'mediawiki', 'mediawikiwiki') AND iwl_title REGEXP '^ *$' ) UNION (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:species:', REPLACE (iwl_title, '_', ' '), ']]') AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_title NOT REGEXP @p WHERE iwl_prefix IN ('species', 'wikispecies') AND iwl_title REGEXP '^ *$' ) UNION #broken interwikilinks (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:m:', REPLACE (iwl_title, '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = iwl_title), '?cat?', '')) AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @p WHERE iwl_prefix IN ('m', 'meta', 'metawikipedia') AND iwl_title NOT LIKE '%:%' #temp AND NOT EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_title = iwl_title AND cp.page_namespace = 0) ) UNION (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:mw:', REPLACE (iwl_title, '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = iwl_title), '?cat?', '')) AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @p WHERE iwl_prefix IN ('mw', 'mediawiki', 'mediawikiwiki') AND iwl_title NOT LIKE '%:%' #temp AND NOT EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_title = iwl_title AND cp.page_namespace = 0) ) UNION (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:species:', REPLACE (iwl_title, '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = iwl_title), '?cat?', '')) AS wikipage FROM iwlinks INNER JOIN page wp ON wp.page_id = iwl_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @p WHERE iwl_prefix IN ('species', 'wikispecies') AND iwl_title NOT LIKE '%:%' #temp AND NOT EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_title = iwl_title AND cp.page_namespace = 0) ) UNION #broken external interwiki links (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:m:', REPLACE ((SUBSTRING(REPLACE (el_to, CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenm + 1, @lenm))), '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = (SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenm + 1, @lenm)))), '?cat?', '')) AS wikipage FROM externallinks INNER JOIN page wp ON wp.page_id = el_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @p WHERE ((el_to LIKE 'https://meta.wikimedia.org/wiki/%') OR (el_to LIKE 'http://meta.wikimedia.org/wiki/%')) AND el_to NOT LIKE '%//meta.wikimedia.org/wiki/%:%' #temp AND el_to NOT LIKE '%#%' #temp AND el_to NOT LIKE '%\%%' #temp AND NOT EXISTS (SELECT 1 FROM metawiki_p.page cp WHERE cp.page_namespace = 0 AND cp.page_title = SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenm + 1, @lenm)) ) ) UNION (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:mw:', REPLACE ((SUBSTRING(REPLACE (el_to, CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenmw + 1, @lenmw))), '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = (SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenmw + 1, @lenmw)))), '?cat?', '')) AS wikipage FROM externallinks INNER JOIN page wp ON wp.page_id = el_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @p WHERE ((el_to LIKE 'https://www.mediawiki.org/wiki/%') OR (el_to LIKE 'http://www.mediawiki.org/wiki/%')) AND el_to NOT LIKE '%//www.mediawiki.org/wiki/%:%' #temp AND el_to NOT LIKE '%#%' #temp AND el_to NOT LIKE '%\%%' #temp AND NOT EXISTS (SELECT 1 FROM mediawikiwiki_p.page cp WHERE cp.page_namespace = 0 AND cp.page_title = SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenmw + 1, @lenmw)) ) ) UNION (SELECT CONCAT('# [[', IF (wp.page_namespace = 14, ':{{ns:14}}:', ''), REPLACE (wp.page_title, '_', ' '), ']] ', '→ [[:species:', REPLACE ((SUBSTRING(REPLACE (el_to, CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenspec + 1, @lenspec))), '_', ' '), ']]', IF (EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_namespace = 14 AND cp.page_title = (SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenspec + 1, @lenspec)))), '?cat?', '')) AS wikipage FROM externallinks INNER JOIN page wp ON wp.page_id = el_from AND wp.page_namespace IN (0, 14) AND wp.page_is_redirect = 0 AND wp.page_title NOT REGEXP @p WHERE ((el_to LIKE 'https://species.wikimedia.org/wiki/%') OR (el_to LIKE 'http://species.wikimedia.org/wiki/%')) AND el_to NOT LIKE '%//species.wikimedia.org/wiki/%:%' #temp AND el_to NOT LIKE '%#%' #temp AND el_to NOT LIKE '%\%%' #temp AND NOT EXISTS (SELECT 1 FROM specieswiki_p.page cp WHERE cp.page_namespace = 0 AND cp.page_title = SUBSTRING(REPLACE (REPLACE (el_to, '#mw-subcategories', ''), CONCAT('?uselang=', @l), ''), IF ((LEFT (el_to, 5) = 'https'), @lenspec + 1, @lenspec)) ) ) ORDER BY wikipage LIMIT 1000;
By running queries you agree to the
Cloud Services Terms of Use
and you irrevocably agree to release your SQL under
CC0 License
.
Submit Query
Stop Query
All SQL code is licensed under
CC0 License
.
Checking query status...