Modul:UrlCheck: Unterschied zwischen den Versionen
K (%) |
K (+: in pattern) |
||
Zeile 70: | Zeile 70: | ||
-- path check | -- path check | ||
if aPath ~= '' and | if aPath ~= '' and | ||
not mw.ustring.match( aPath, '^[-A-Za-z0-9¡-ÿ_.,~%%+&;#*?!=()@/]*$' ) then | not mw.ustring.match( aPath, '^[-A-Za-z0-9¡-ÿ_.,~%%+&:;#*?!=()@/]*$' ) then | ||
return 23 | return 23 | ||
end | end |
Version vom 29. März 2020, 07:27 Uhr
Die Dokumentation für dieses Modul kann unter Modul:UrlCheck/doc erstellt werden
-- documentation local UrlCheck = { suite = 'vCard', serial = '2020-03-28', item = 40849609 } -- module import local ui = mw.loadData( 'Module:UrlCheck/i18n') -- module variable local uc = {} function uc.ip4( address ) local parts = { address:match( '(%d+)%.(%d+)%.(%d+)%.(%d+)' ) }, value if #parts == 4 then for _, value in pairs( parts ) do if tonumber( value ) < 0 or tonumber( value ) > 255 then return false end end return true -- ok end return false end function uc.isUrl( url ) -- return codes 0 through 2 reserved if not url or type( url ) ~= 'string' then return 3 end local s = mw.text.trim( url ), count if s == '' then return 3 elseif #s > 2048 then -- limitation because of search engines or IE return 4 elseif s:find( '%s' ) or s:find( '%c' ) or s:match( '^%.' ) then return 5 end -- https://max:muster@www.example.com:8080/index.html?p1=A&p2=B#ressource -- protocol s, count = s:gsub( '^https?://', '' ) if count == 0 then s, count = s:gsub( '^//', '' ) end if count == 0 then -- missing or wrong protocol return 6 end local user = '', at local password = '' local host = '' local port = '' local aPath = '' local topLevel = '' -- split path from host at = s:find( '/' ) if at then aPath = s:sub( at + 1, #s ) s = s:sub( 1, at - 1 ) if not s then return 7 end end -- path check if aPath ~= '' and not mw.ustring.match( aPath, '^[-A-Za-z0-9¡-ÿ_.,~%%+&:;#*?!=()@/]*$' ) then return 23 end if s:find( '%.%.' ) or s:find( '%.@' ) or s:find( '@[%.%-]' ) or s:find( '%-%.' ) or s:find( '%.%-' ) or s:find( '%./' ) or s:find( '/%.' ) then return 8 end -- user and password _, count = s:gsub( '@', '@' ) if count > 1 then return 9 elseif count == 1 then at = s:find( '@' ) user = s:sub( 1, at - 1 ) host = s:sub( at + 1, #s ) if not user or not s then return 10 end _,count = user:gsub( ':', ':' ) if count > 1 then return 11 elseif count == 1 then at = user:find( ':' ) password = user:sub( at + 1, #user ) user = user:sub( 1, at - 1 ) if not user or not password then return 12 elseif #user > 64 then return 13 end end else host = s end if host == '' then return 14 end -- host and port _, count = host:gsub( ':', ':' ) if count > 1 then return 15 elseif count == 1 then at = host:find( ':' ) port = host:sub( at + 1, #host ) host = host:sub( 1, at - 1 ) if not host or not port then return 16 elseif not port:match( '^[1-9]%d*$' ) or tonumber( port ) > 65535 then return 17 end end -- handle host part if #host > 253 then return 18 end -- getting top-level domain at = host:match( '^.*()%.' ) -- find last dot if not at then return 19 end topLevel = host:sub( at + 1, #host ) if not topLevel then return 20 end -- future: check of top-level domain if uc.ip4( host ) then -- is ip4 address return 2 elseif not mw.ustring.match( host, '^[%w%.%-]+%.%a%a+$' ) then return 22 elseif not host:match( '^[%w%.%-]+%.%a%a+$' ) then return 1 -- matches domain only in UTF 8 mode end return 0 end function uc.checkUrl( frame ) local args = frame.args args.url = args.url or '' args.show = args.show or '' local result = uc.isUrl( args.url ) if args.show:lower() == 'msg' then if ui[ result ] then return ui[ result ] else return ui.unknown end end return result end return uc