Fork of
enwiki domains with disallowed characters
by ⵓ
This query is marked as a draft
This query has been published
by ShakespeareFan00.
SQL
x
-- Report namespace-0 pages whose external links carry a suspicious
-- el_to_domain_index value: one that contains any of the punctuation
-- characters in the class below, or one that contains two consecutive dots.
-- Only values beginning with 'http' are considered.
--
-- Both checks are evaluated in a single pass over externallinks, so a link
-- that trips both checks is listed once instead of once per check.
WITH suspicious_links AS (
    SELECT
        page.page_title,
        externallinks.el_to_domain_index
    FROM externallinks
    INNER JOIN page
        ON page.page_id = externallinks.el_from
    WHERE page.page_namespace = 0
        AND externallinks.el_to_domain_index LIKE 'http%'
        AND (
            -- REGEXP is an unanchored search, so the bare character class is
            -- sufficient; wrapping it in '.*( ... )+.*' adds nothing.
            -- Inside [...] none of these characters need a backslash; the
            -- single quote is written as '' so the literal stays valid.
            externallinks.el_to_domain_index
                REGEXP '[%&~@#;+="''£<>()$]' COLLATE 'utf8mb3_general_ci'
            -- Two dots in a row.
            OR externallinks.el_to_domain_index LIKE '%..%'
        )
)
SELECT
    suspicious_links.page_title AS output,
    suspicious_links.el_to_domain_index
FROM suspicious_links
-- Longest values first; the extra keys make the order of ties repeatable.
ORDER BY
    LENGTH(suspicious_links.el_to_domain_index) DESC,
    suspicious_links.el_to_domain_index,
    suspicious_links.page_title
;
-- NOTE(review): the list below looks like a scratch set of further candidate
-- characters -- confirm before adding any of them to the class above.
/* &~‘@*(),!?_#$€£^;+=<> */
By running queries you agree to the Cloud Services Terms of Use and you irrevocably agree to release your SQL under CC0 License.
All SQL code is licensed under CC0 License.