-- Մոդուլ:URL

-- Վիքիպեդիայից՝ ազատ հանրագիտարանից

--
-- This module implements {{URL}}
--
-- See unit tests at [[Module:URL/testcases]]

-- Table holding the functions this module exposes; it is returned at the end of the file.
local p = {}
 
--- Parse a string with mw.uri.new without letting a parse error propagate.
-- @param s text handed to mw.uri.new
-- @return whatever mw.uri.new produced, or nothing when mw.uri.new raised an error
local function safeUri(s)
	local ok, parsed = pcall(mw.uri.new, s)
	if not ok then
		-- The error raised by mw.uri.new is deliberately discarded; callers only test for nil.
		return
	end
	return parsed
end

--- Look for an argument whose "name=value" text, joined back together, parses as a URL with a host.
-- Every argument except positional 2 and "msg" is tried, in the order pairs() yields them.
-- @param args argument table to scan
-- @return the rejoined (and scheme-normalised) URL string, or nothing if no argument qualifies
local function extractUrl(args)
	for key, value in pairs(args) do
		local reserved = (key == 2) or (key == "msg")
		if not reserved then
			-- Rejoin name and value, then rewrite "http:" / "http:/" (any letter case, optional "s")
			-- into the canonical lower-case "http://" / "https://" prefix.
			local candidate = mw.ustring.gsub(key .. "=" .. value, '^[Hh][Tt][Tt][Pp]([Ss]?):(/?)([^/])', 'http%1://%3')
			local parsed = safeUri(candidate)
			if parsed and parsed.host then
				return candidate
			end
		end
	end
end

--- Format a URL as an external link wrapped in <span class="url">.
-- @param url  the address to link to (may be nil or blank)
-- @param text optional display text (may be nil or blank)
-- @param msg  when it is "false" or starts with n/N, the usage hint for a blank call is suppressed
-- @return nil when url and text are both blank and the hint is suppressed; the expanded
--         {{tlx|URL|...}} hint when both are blank otherwise; text alone when only url is blank;
--         in every other case the span-wrapped "[url text]" link wikitext
function p._url(url, text, msg)
	url = mw.text.trim(url or '')
	text = mw.text.trim(text or '')

	-- boolean: true if msg is "false" or starts with n or N
	local firstChar = (msg or ''):sub(1,1):lower()
	local nomsg = firstChar == "n" or msg == 'false'

	if url == '' then
		if text ~= '' then
			return text
		end
		if nomsg then
			return nil
		end
		return mw.getCurrentFrame():expandTemplate{ title = 'tlx', args = { 'URL', "''example.com''", "''optional display text''" } }
	end

	-- Encode any raw whitespace: MediaWiki would otherwise treat a space as the end of the URL.
	url = mw.ustring.gsub(url, '%s', function(ws) return mw.uri.encode(ws, 'PATH') end)

	-- Drop an empty trailing fragment id or query string, which would make mw.uri.new throw.
	url = mw.ustring.gsub(url, '#$', '')
	url = mw.ustring.gsub(url, '%?$', '')

	-- Repair an HTTP[S] URL that is missing the double slash.
	url = mw.ustring.gsub(url, '^[Hh][Tt][Tt][Pp]([Ss]?):(/?)([^/])', 'http%1://%3')

	local uri = safeUri(url)

	-- URLs without a protocol (www.example.com/foo, www.example.com:8080/foo) get "http://"
	-- prepended; protocol-relative ones (//www.example.com/foo) are left alone.
	local lacksScheme = uri and (not uri.protocol or not uri.host)
	if lacksScheme and url:sub(1, 2) ~= '//' then
		url = 'http://' .. url
		uri = safeUri(url)
	end

	if text == '' then
		if not uri then
			-- URL is badly-formed, so just display whatever was passed in
			text = url
		else
			-- A bare "/" path is blanked before relativePath is read below.
			if uri.path == '/' then uri.path = '' end

			local port = uri.port and (':' .. uri.port) or ''
			text = mw.ustring.lower(uri.host or '') .. port .. (uri.relativePath or '')

			-- Add <wbr> before runs of / . # _
			-- "/" MUST be handled first, because "<wbr/>" itself contains a "/".
			-- A pattern for "-" runs ("(%-+)") is intentionally left out (disabled for now).
			for _, run in ipairs({ "(/+)", "(%.+)", "(%#+)", "(_+)" }) do
				text = mw.ustring.gsub(text, run, "<wbr/>%1")
			end
		end
	end

	return mw.ustring.format('<span class="url">[%s %s]</span>', url, text)
end

--[[
Entry point invoked from Template:URL.
Positional argument 1 (the URL), positional argument 2 (the display text) and "msg"
are read from the invoking frame first and from its parent frame second. When neither
frame has a positional argument 1, extractUrl is tried on each argument table in turn.
The collected values are passed to p._url.
--]]
function p.url(frame)
	local own = frame.args
	local inherited = frame:getParent().args

	local url = own[1] or inherited[1]
	if not url then
		url = extractUrl(own) or extractUrl(inherited) or ''
	end

	local text = own[2] or inherited[2] or ''
	local msg = own.msg or inherited.msg or ''
	return p._url(url, text, msg)
end

--[[
Entry point invoked from the forked Template:URL2.
Unlike p.url, "msg" defaults to 'no', so no usage hint is produced by default.
Before formatting, HTML tags and square brackets are removed from the URL and
everything from the first space (literal or written as %20) onwards is cut off.
--]]
function p.url2(frame)
	local own = frame.args
	local inherited = frame:getParent().args

	local text = own[2] or inherited[2] or ''
	-- default to no message
	local msg = own.msg or inherited.msg or 'no'
	local url = own[1] or inherited[1] or extractUrl(own) or extractUrl(inherited) or ''

	-- A URL coming from a Wikidata call might have a pen icon appended;
	-- split it off here and re-attach it to the final result.
	local head, penicon = mw.ustring.match( url, "(.*)(&nbsp;<span class='penicon.*)" )
	if penicon then
		url = head
	end

	-- strip out html tags, then [ and ]
	url = (url or '')
	url = url:gsub("<[^>]*>", "")
	url = url:gsub("[%[%]]", "")

	-- turn %20 back into a space, then truncate at the first space
	url = url:gsub("%%20", " ")
	url = url:gsub(" .*", "")

	local link = p._url(url, text, msg) or ""
	return link .. (penicon or "")
end

--- Report whether a string begins with a given prefix, comparing by mw.ustring positions.
-- Declared local so the helper does not leak into the global environment.
-- @param source    the string to inspect
-- @param substring the prefix to look for
-- @return true when source begins with substring, false otherwise
local function startsWith( source, substring )
	local prefixLength = mw.ustring.len( substring )
	if prefixLength > mw.ustring.len( source ) then
		-- A prefix longer than the string itself can never match.
		return false
	end
	return mw.ustring.sub( source, 1, prefixLength ) == substring
end

--- Turn a URL (optionally carrying its own title) into bracketed external-link wikitext.
-- Declared local so the helper does not leak into the global environment.
--
-- The input may be wrapped in square brackets and may contain "url title" separated by a
-- space. When no title is available the link label is derived from the URL: the host,
-- lower-cased and without a leading "www.", followed by "/path" when there is a path.
--
-- @param source the URL text, possibly "[url title]"
-- @param title  optional link label; nil or "" means "no title supplied"
-- @return the "[url label]" wikitext, or the untouched input followed by a category link
--         when the input looks too complex to be split reliably
local function formatUrlImpl( source, title )
	-- Treat an empty title the same as a missing one, so it can never yield "[url ]".
	if title == "" then
		title = nil
	end

	local host, path
	-- Keep the caller's original arguments for the fallback path below.
	local arg1, arg2 = source, title

	-- Strip surrounding square brackets and spaces.
	source = mw.text.trim( source, "%[%] " )

	-- Anything after the first space is a title embedded in the source.
	local titleDelimeterPosition = mw.ustring.find( source, " ", 1 )
	if titleDelimeterPosition then
		if not title then
			title = mw.ustring.sub( source, titleDelimeterPosition + 1 )
		end
		source = mw.ustring.sub( source, 1, titleDelimeterPosition - 1 )
	end

	-- Work out where the host part begins, adding "http://" when there is no scheme at all.
	local hostStartPosition
	local schemeDelimeterPosition = mw.ustring.find( source, "://", 1, true )
	if schemeDelimeterPosition then
		hostStartPosition = schemeDelimeterPosition + 3
	elseif mw.ustring.find( source, "^//", 1 ) then
		-- protocol-relative URL
		hostStartPosition = 3
	else
		source = "http://" .. source
		hostStartPosition = 8 -- first character after "http://"
	end

	if title then
		local bracketPosition = mw.ustring.find( arg1, "[", 1, true )
		if titleDelimeterPosition and bracketPosition and bracketPosition > titleDelimeterPosition + 1 then
			-- The space that was found lies before the opening bracket (e.g. "a [b  c]"),
			-- so the split above is meaningless: give up and return the first argument as is,
			-- followed by a category link.
			if arg2 == nil then
				-- No explicit title and a very complex first argument: this may be perfectly
				-- normal, the module was probably handed an already fully formatted link.
				return arg1 .. '[[Կատեգորիա:Վիքիպեդիա:Հոդվածներ Module:URL-ի բարդ մուտքով]]'
			else
				-- An explicit title was given but the link could not be parsed, so the title
				-- cannot be substituted correctly: this is an error.
				return arg1 .. '[[Կատեգորիա:Վիքիպեդիա:Հոդվածներ Module:URL-ի սխալ աշխատանքով]]'
			end
		end
		return '[' .. source .. ' ' .. title .. ']'
	end

	-- No title: split the URL into host and path to build a label.
	local hostDelimeterPosition = mw.ustring.find( source, "/", hostStartPosition, true )
	if hostDelimeterPosition then
		host = mw.ustring.sub( source, hostStartPosition, hostDelimeterPosition - 1 )
		-- A slash that is the very last character means there is no path.
		if hostDelimeterPosition ~= mw.ustring.len( source ) then
			path = mw.ustring.sub( source, hostDelimeterPosition + 1 )
		end
	else
		host = mw.ustring.sub( source, hostStartPosition )
	end

	-- post-split format options
	if startsWith( host, 'www.' ) then
		host = mw.ustring.sub( host, 5 )
	end
	host = mw.language.new( 'en' ):lc( host )

	if path and path ~= '' and path ~= '/' then
		return '[' .. source .. ' ' .. host .. '/' .. path .. ']'
	else
		return '[' .. source .. ' ' .. host .. ']'
	end
end

--- Template-facing wrapper around formatUrlImpl.
-- Reads the URL from frame.args[1] and the title from frame.args[2], trims both,
-- and passes a blank title on as nil.
-- @param frame the invoking frame
-- @return nil when the URL is blank, otherwise the result of formatUrlImpl
function p.formatUrl( frame )
	local url = mw.text.trim( frame.args[1] or '' )
	if url == '' then
		return nil
	end

	local title = mw.text.trim( frame.args[2] or '' )
	if title == '' then
		title = nil
	end

	return formatUrlImpl( url, title )
end

--- Format a single URL value, taking the link label from options['text'] when it is set.
-- @param context not used by this function
-- @param options table whose 'text' entry, if non-empty, becomes the link title
-- @param url     the URL string; it is trimmed before use
-- @return nil when the trimmed URL is blank, otherwise the result of formatUrlImpl
function p.formatUrlSingle( context, options, url )
	url = mw.text.trim( url )
	if url == '' then
		return nil
	end

	local label = options['text']
	if not label or label == '' then
		label = nil
	end

	return formatUrlImpl( url, label )
end

-- Hand the table of exported functions back to whoever loaded this module.
return p