-- Jump to content
--
-- Module:PopulationFromWikidata
--
-- Permanently protected module
-- From Wikipedia, the free encyclopedia
-- This is an old revision of this page, as edited by Pppery (talk | contribs) at 15:48, 1 July 2022 (Avoid Lua error at Hammond Island (Queensland). Neither this edit nor my requested template-protection mean I endorse the usage of this module). The present address (URL) is a permanent link to this revision, which may differ significantly from the current revision.

---------------- Defining variables--------------------
local Pop_P = "P1082" 	-- population property
local Applies_P = "P518"	-- applies to part property
local Pointin_P = "P585" -- point in time property
local DetMeth_P = "P459"	-- determination method property
local RefURL_P = "P854"		-- reference URL
local RefTitle_P = "P1476"	-- reference title
local RefPubIn_P = "P1433"	--reference published in property	
local DatePub_P = "P577"	-- date of publication property
local Publisher_P = "P123"	-- publisher property
local Retrieved_P = "P813"	-- retrieved property
local CensusAU_I = "Q5058971"	-- Australian census item
local Instof_P = "P31"			-- instance of property

local SAL_I = "Q33112019" 	-- state suburb item (includes SSC and SAL)
--local GCCSA_I = "Q112762887"			-- Greater Capital City Statistical Area item
local LGA_I = "Q33127844"			-- Local Government Area item
local UCL_I = "Q33127891"		-- Urban Centre or Locality
--local SA2_I = "Q33128776"		-- SA2
local ILOC_I = "Q112729549"		-- Indigenous Location


local item = nil

--------------- Function GetRefsForClaim to check, collate and format all the reference components----------------------

function GetRefsForClaim(claim, defaulttitle)								
	local refs = ""
	for b,x in pairs(claim.references) do																	-- Loop through all references in a claim and pull out the components
		local refurl = ""																					-- initialise an empty URL, check if there is one then populate with the actual value (if not it stays as an empty string)
		if claim.references[b].snaks[RefURL_P] ~= nil then
			refurl = claim.references[b].snaks[RefURL_P][1].datavalue.value	
		end
		
		local reftitle = defaulttitle																		-- Initialise the default title as the Wikidata item title. This is the fallback title if one isn't provided in the references
		if claim.references[b].snaks[RefTitle_P] ~= nil then
			reftitle = claim.references[b].snaks[RefTitle_P][1].datavalue.value.text
		end
		
		local detmet = mw.wikibase.getEntity(claim.qualifiers[DetMeth_P][1].datavalue.value.id)					-- Get the dertermination method item
		
		local pubinlabel = ""																					--Initalising an empty published in label. This is the last option for this value.
		if claim.references[b].snaks[RefPubIn_P] ~= nil then													--Checking if the published in part of reference exists (it should for all references)
			local pubin = mw.wikibase.getEntity(claim.references[b].snaks[RefPubIn_P][1].datavalue.value.id)	--If it does then grab the published item and the label of that item
			pubinlabel = pubin.labels.en.value
		end
								
		local refwork = pubinlabel																				-- This value is used for non-census references, or as a fall-back value for census references with missing parts
		local pubdate = ""																						-- This is the fallback option if published date is missing (no date)
		if claim.references[b].snaks[DatePub_P] ~= nil then														-- This is the second option for the published date (given with references - this is used for non-census references)
			pubdate = mw.language.getContentLanguage():formatDate('j F Y', claim.references[b].snaks[DatePub_P][1].datavalue.value.time)
		end
		
		if detmet.claims[Instof_P] ~=nil and detmet.claims[Instof_P][1].mainsnak.datavalue.value.id == CensusAU_I then		-- Checking for census references (which will have different refwork and published date sources)
			refwork = detmet.labels.en.value.." "..pubinlabel																-- Concatenating to get work - determination method + published in (this overwrites the refwork value for census references)
			if detmet.claims[DatePub_P] ~=nil then
				pubdate = mw.language.getContentLanguage():formatDate('j F Y', detmet.claims[DatePub_P][1].mainsnak.datavalue.value.time) -- Overwrite the published date value if the determination method item has a date published (for census references)
			end
		end
		
		local refpublisher = ""																								-- The publisher is empty if missing
		if detmet.claims[Publisher_P] ~= nil then
			local publisheritem = mw.wikibase.getEntity(detmet.claims[Publisher_P][1].mainsnak.datavalue.value.id)			-- Get the determination method item and the publisher item ID
			refpublisher = publisheritem.labels.en.value																	-- Get the label of the publisher item
		end
		
		local refaccessdate = ""																							-- The retrieved date fallback is empty
		if claim.references[b].snaks[Retrieved_P] ~= nil then
			refaccessdate = mw.language.getContentLanguage():formatDate('j F Y', claim.references[b].snaks[Retrieved_P][1].datavalue.value.time) -- Populate the retrieved date if it's there
		end
		
		local appliespart = mw.wikibase.getEntity(claim.qualifiers[Applies_P][1].datavalue.value.id).labels.en.value					-- The ABS geography type for the particular claim (to use in reference name)
		local pointintime = mw.language.getContentLanguage():formatDate('Y', claim.qualifiers[Pointin_P][1].datavalue.value.time)		-- Getting the point in time as a YYYY (to use in the reference name)
		
		local citewebargs = {																								--Putting all the cite_web arguments into a list (for a single reference)
			url = refurl,
			title = reftitle.." ("..appliespart..")" ,
			date = pubdate,
			work = refwork,
			author = "[["..refpublisher.."]]",																				-- Changed the publisher to author for now to match existing population references
			accessdate = refaccessdate
		}
		
		local wdeditpencil = mw.getCurrentFrame():expandTemplate{title = 'EditAtWikidata', args = {qid = item.id, pid = claim.id, nbsp = 1}}		--Call the Edit At Wikidata template (to add the edit pencil to end of references)
		
		local reference = mw.getCurrentFrame():expandTemplate{ title = 'cite web', args = citewebargs }						--expand template to feed arguments to cite_web

		refs = refs..mw.getCurrentFrame():extensionTag{ name = 'ref', content = reference..wdeditpencil, { name = refwork.."_"..pointintime.."_"..appliespart.."_"..reftitle } }	--Add the reference from this iteration to the list of references for this particular claim
--			 
	end	
	return refs																												-- List of references to be given to reflist
end	

---------------- This ListForInfobox function is being used to grab the correct population value ---------------

local p = {} 

function p.ListForInfobox( frame )					  
	local luaplacetype = ""															--initialise the local place type
	local articleplacetype = frame.args.type										-- bring in the place type entered into Infobox Australian place template
	if articleplacetype == "town" or articleplacetype == "Town" then				-- Check which place type and match to the equivalent ABS geographic area "city", "suburb", "town", "lga", "region"
		luaplacetype = UCL_I
	elseif articleplacetype == "suburb" or articleplacetype == "suburb" then
		luaplacetype = SAL_I
	elseif articleplacetype == "city" or articleplacetype == "City" then
		luaplacetype = UCL_I
	elseif articleplacetype == "lga" or articleplacetype == "LGA" then
		luaplacetype = LGA_I
	elseif articleplacetype == "region" or articleplacetype == "Region" then	-- for now saying region == LGA_I... but unclear what is most apprpriate ABS geography type.... can revise
		luaplacetype = LGA_I
	end	
	
	if frame.args.wikidata ~= nil and frame.args.wikidata ~= "" then			-- checking if there's a linked Wikidata item for the article
		item = mw.wikibase.getEntity(frame.args.wikidata)						-- this is the default item specified by the wikidata parameter in the template
	else 
		item = mw.wikibase.getEntity() 											-- If there's a Wikidata item connected to the article it will find it here.
	end
	

--	mw.logObject(item)
	
 --------------- CHECK: If item.claims[Pop_P] is nil. If it is return an empty string ----------------------
	if item == nil or item.claims[Pop_P] == nil then
		return	""										
	end
	
	
------------ PART 1: Find claims with (1) point in time is not nil, (2) applies to part is not nil, (3) determination method is not nil and (4) References table is not empty-------------

	local validpopclaims = {}													--initialise the blank claim table for storing all population claims that satisfy the four conditions 
	z=0																			-- initialise the table row count
	for j, s in pairs(item.claims[Pop_P]) do
		if	s.qualifiers ~= nil and 
		    s.qualifiers[Pointin_P]~= nil and
			s.qualifiers[Applies_P] ~= nil and 
			s.qualifiers[DetMeth_P] ~= nil and 
			s.references ~= nil then
	
			z=z+1																
			validpopclaims[z]=s													-- give the claim a new key in the table
		end
	end	

--------------- CHECK: If count of validpopclaims is less than one (eg 0) then return a html message. This checks we have something from which to get a population value and basic reference.--------------
	if #validpopclaims <1 then
		return ""
	end
	
--------------- PART 2: Compare claim 'applies to part' values against template place type-------------------------
 		local templategeog = {}												--initialise the blank claim table for if the template type matches to Wikidata claim applies to part
		local othergeog = {}												--initialise the blank claim table for when the template type doesn't match Wikidata claims applies to part
		c=0
		d=0
		for i, q in pairs(validpopclaims) do
			if q.qualifiers[Applies_P][1].datavalue.value.id == luaplacetype then		--filter for claims where applies to part = Infobox template type
				c=c+1																	-- give the claim a new key in the table											
				templategeog[c]=q														-- claims with Infobox template type geography
			else
				d=d+1
				othergeog[d]=q															-- claims with geography other than specified in the Infobox template type.
			end
		end	

----------PART 3: Get claims with the maximum 'Point in time' values ------------------
----------PART 3A: Find the max date of claims with template geography-----------------

	local maxclaimspertemplategeog = nil												--initialise the blank claim corresponding to the max date
	for k, v in pairs(templategeog) do													--loop through all the claims with geography type = Infobox template type
		local tclaimdate = v.qualifiers[Pointin_P][1].datavalue.value.time
		if  maxclaimspertemplategeog == nil
			or (maxclaimspertemplategeog ~= nil
				and tclaimdate >= maxclaimspertemplategeog.qualifiers[Pointin_P][1].datavalue.value.time)
			then								 
				maxclaimspertemplategeog=v
		end
	end


----------PART 3B: Find the max date of claims with non-Infobox template geography-----------------

	local maxclaimsperothergeog = {}

	for l, m in pairs(othergeog) do														--loop through all the claims with geography type = non Infobox place type
		local oclaimdate = m.qualifiers[Pointin_P][1].datavalue.value.time
		local claimgeog = m.qualifiers[Applies_P][1].datavalue.value.id
		if  maxclaimsperothergeog[claimgeog] == nil										-- using the applies to part value as the table key
			or (maxclaimsperothergeog[claimgeog] ~= nil
				and oclaimdate >= maxclaimsperothergeog[claimgeog].qualifiers[Pointin_P][1].datavalue.value.time)  -- checking the max date for a particular geography value
			then								 
				maxclaimsperothergeog[claimgeog]=m										-- overwrites with a geography-max date claim pair whenever the point in time is bigger than the last iteration.
		end
	end

	

------------------------------Return to template--------------------------------	    
    local div = mw.html.create( 'div' )																				-- formulate giving the value back to the Infobox Australian place template
    if maxclaimspertemplategeog ~=nil then																			-- Situation 1: Getting population for max date claim where applies to part matches the Infobox place type
    	local appliespartitem = mw.wikibase.getEntity(maxclaimspertemplategeog.qualifiers[Applies_P][1].datavalue.value.id)
		local templategeogrefs = GetRefsForClaim(maxclaimspertemplategeog, item.labels.en.value)					-- Getting the references for max date claim where Wikidata applies to part matches the Infobox place type
		div:wikitext(mw.language.getContentLanguage():formatNum(tonumber(maxclaimspertemplategeog.mainsnak.datavalue.value.amount)).." ("..appliespartitem.labels.en.value.." "..mw.language.getContentLanguage():formatDate('Y', maxclaimspertemplategeog.qualifiers[Pointin_P][1].datavalue.value.time)..")"..templategeogrefs)  --Return the population value, applies to part, point in time, reference 
   
    elseif articleplacetype == "town" or articleplacetype == "Town" then											-- Situation 2: Getting population for max date claims where Infobox place type = town. If no UCL populations (earlier default) then get ILOC and SAL populations.
    	if maxclaimsperothergeog[ILOC_I]~=nil then
    		local appliespartILOC = mw.wikibase.getEntity(maxclaimsperothergeog[ILOC_I].qualifiers[Applies_P][1].datavalue.value.id)
			local ILOCrefs = GetRefsForClaim(maxclaimsperothergeog[ILOC_I], item.labels.en.value)					-- Getting the references for max date claim where applies to part = ILOC
			div:wikitext("\n* "..mw.language.getContentLanguage():formatNum(tonumber(maxclaimsperothergeog[ILOC_I].mainsnak.datavalue.value.amount)).." ("..appliespartILOC.labels.en.value.." "..mw.language.getContentLanguage():formatDate('Y', maxclaimsperothergeog[ILOC_I].qualifiers[Pointin_P][1].datavalue.value.time)..")"..ILOCrefs) --Return the population value, applies to part, point in time, reference 
    	end
		if maxclaimsperothergeog[SAL_I]~=nil then
    		local appliespartSAL = mw.wikibase.getEntity(maxclaimsperothergeog[SAL_I].qualifiers[Applies_P][1].datavalue.value.id)
			local SALrefs = GetRefsForClaim(maxclaimsperothergeog[SAL_I], item.labels.en.value)						-- Getting the references for max date claim where applies to part = SAL
			div:wikitext("\n* "..mw.language.getContentLanguage():formatNum(tonumber(maxclaimsperothergeog[SAL_I].mainsnak.datavalue.value.amount)).." ("..appliespartSAL.labels.en.value.." "..mw.language.getContentLanguage():formatDate('Y', maxclaimsperothergeog[SAL_I].qualifiers[Pointin_P][1].datavalue.value.time)..")"..SALrefs)		--Return the population value, applies to part, point in time, reference
		end
	else
		for a, w in pairs(maxclaimsperothergeog) do																	-- Situation 3: Getting population for max date claims where applies to part doesn't = Infobox place type, and Infobox place type doesn't = town.
			local appliespartitem = mw.wikibase.getEntity(maxclaimsperothergeog[a].qualifiers[Applies_P][1].datavalue.value.id)
			local othergeogrefs = GetRefsForClaim(w, item.labels.en.value)
			div:wikitext("\n* "..mw.language.getContentLanguage():formatNum(tonumber(maxclaimsperothergeog[a].mainsnak.datavalue.value.amount)).." ("..appliespartitem.labels.en.value.." "..mw.language.getContentLanguage():formatDate('Y', maxclaimsperothergeog[a].qualifiers[Pointin_P][1].datavalue.value.time)..")"..othergeogrefs)  	--Return the list of population value, applies to part, point in time, reference
		end 
    end
	return tostring( div ) .. '[[Category:Australian place articles using Wikidata population values]]'
end

-- Export the module table; ListForInfobox is its only public entry point.
return p