-- Module:Sandbox/Jts1882/CladeN

-- NOTE: this module contains functions for generating the table structure of the clade tree in two ways:
--
-- (1) the original method was generated by a number of function calls from the template using
--       function p.openTable(frame) - creates wikitext code to open the HTML table
--       function p.node(frame)      - deals with the first node (|1, |label1) and creates wikitext for the top row of the table
--       function p.nodeN(frame)     - deals with the sister nodes (|2-17), adding a row each time it is called
--       function p.closeTable       - closes the HTML table
--
-- (2) the revised method is called by the template with one instruction; it has three functions:
--       p.main(frame)                                - opens and closes the table and loops through the children of the node;
--                                                      main is invoked once and controls the rest, calling ...
--       p.addTaxon(childNumber, nodeLeaf, nodeLabel) - the nuts and bolts; code dealing with each child node
--       p.addLabel(childNumber, nodeLabel)           - adds the label text

-- Module table: every p.* function defined below is attached to it, and it is returned at the end of the file.
local p = {}

--============================== main function (for Method 2) ===========================
--[[ Main function, which generates the table structure of the tree.

Usage: called from Template: User:Jts1882/sandbox/templates/CladeN
]]

--[[ Main entry point (Method 2): builds the complete wikitext table for one clade node.

Read from the invoking frame:
    frame.args.style                 - CSS placed in the table's style attribute
Read from the parent (template) frame:
    |caption=, |captionstyle=        - optional table caption
    |color=, |thickness=, |state=    - defaults for the whole bracket (black, 1, solid)
    |N=, |labelN=, |newickN=         - child N, for N = 1 .. maxChildren
    |sublabelN=                      - text placed below the branch of child N
    |footer=, |footerstyle=          - optional row spanning two columns at the bottom

Every slot up to maxChildren is checked, so a gap in the numbering does not stop
the scan (consistent with clade/cladex).

Returns the wikitext of the table as a string.
]]
function p.main(frame)
    local maxChildren = 20 -- currently 17 in the clade/cladex templates

    -- Look the template arguments up once; getParent() returns nil when there is
    -- no calling template, in which case every parameter is treated as absent.
    local parent = mw.getCurrentFrame():getParent()
    local args = parent and parent.args or {}

    -- NOTE: an earlier (disabled) preprocessing pass counted nodes, leaves and nested
    -- clades by scanning the transcluded children; none of its counters were read by
    -- the active code, so they are not computed here.

    local testing = false
    --testing = true                 -- COMMENT OUT TO GET MODULE RUNNING WITHOUT THE TEST
    if testing then
        return p.test(1)
    end

    local out = {} -- wikitext fragments, joined once at the end

    -- open table (the style attribute is omitted entirely when no style was given)
    local tableStyle = frame.args.style or ""
    local tableStyleString = ""
    if tableStyle ~= "" then
        tableStyleString = ' style="' .. tableStyle .. '" '
    end
    out[#out + 1] = '{|cellspacing=0 cellpadding=0 ' .. tableStyleString

    -- add caption
    local captionName = args['caption'] or ""
    if captionName ~= "" then
        local captionStyle = args['captionstyle'] or ""
        out[#out + 1] = '\n|+style="' .. captionStyle .. '"|' .. captionName
    end

    -- Global node parameters (unnumbered, i.e. color, thickness, state) apply to the whole
    -- bracket but can be overridden per branch (numbered, e.g. color2, thickness2, state2).
    -- They are deliberately assigned as globals because p.addTaxon reads them by name.
    nodeColor = args['color'] or "black"
    nodeThickness = tonumber(args['thickness']) or 1
    nodeState = args['state'] or "solid"

    -- Child elements: p.addTaxon adds two rows per child. The first cell of each row holds
    -- the label / sublabel, the second cell spans both rows and holds the leaf name or a
    -- nested clade structure.
    local lastNode = 0
    for childNumber = 1, maxChildren do
        local key = tostring(childNumber)
        local nodeLeaf = args[key] or ""                  -- data from |N=
        local nodeLabel = args['label' .. key] or ""      -- data from |labelN=
        local newickString = args['newick' .. key] or ""  -- data from |newickN=

        if newickString ~= "" then
            -- a Newick string takes precedence over |N=; without |labelN= the label is
            -- the part of the Newick string outside the parentheses
            if nodeLabel == "" then
                nodeLabel = p.getNewickOuterterm(newickString)
            end
            out[#out + 1] = '\n' .. p.addTaxon(childNumber, p.newick(0, newickString), nodeLabel)
            lastNode = childNumber
        elseif nodeLeaf ~= "" then
            -- the node contains a leaf name or a clade structure
            out[#out + 1] = '\n' .. p.addTaxon(childNumber, nodeLeaf, nodeLabel)
            lastNode = childNumber
        end
    end

    -- Finish the last row: p.addTaxon starts the row but leaves its first cell open because
    -- the left border depends on whether another child follows. The last child sits below
    -- the bracket, so its sublabel cell gets no left border.
    local subLabel = args['sublabel' .. tostring(lastNode)] or ""
    out[#out + 1] = '\n' .. '|style="border:0;vertical-align:top;text-align:center;"|'
        .. p.addLabel(lastNode - 1, subLabel)

    -- Footer description: an additional row spanning two columns at the bottom of the table.
    local footerText = args['footer'] or ""
    if footerText ~= "" then
        local footerStyle = args['footerstyle'] or ""
        out[#out + 1] = '\n|-style="' .. footerStyle .. '"\n|colspan="2"| ' .. footerText .. ' ||'
    end

    -- close table
    out[#out + 1] = '\n|}'
    return table.concat(out)
end

--[[ Adds the wikitext for one child element of the node (two table rows).

The first cell of each row holds the label (top row) or sublabel (second row); the
bottom border of the label cell forms the horizontal branch. The second cell spans
both rows and holds the leaf name or a nested clade structure.

The middle children (|2, |3 ...) use a left border to create the vertical line of the
bracket. The first child has no left border on its top-row cell, and the last child has
none on its second-row cell. Because the number of the last child is not known here, the
second-row cell of child N is emitted at the start of the call for child N+1 (with a left
border) or by p.main after its loop (without one).

Parameters:
    childNumber - number N of the child; selects the numbered template parameters
    nodeLeaf    - leaf text or nested table wikitext placed in the spanning cell
    nodeLabel   - label shown above the branch
Returns the wikitext for this child as a string.
]]
function p.addTaxon(childNumber, nodeLeaf, nodeLabel)
    local parent = mw.getCurrentFrame():getParent()
    local args = parent and parent.args or {} -- no calling template: all parameters absent
    local suffix = tostring(childNumber)

    -- Bracket-wide settings are published as globals by p.main; fall back to p.main's
    -- defaults so that a direct call does not fail on nil values.
    local bracketColor = nodeColor or "black"
    local bracketThickness = nodeThickness or 1
    local bracketState = nodeState or "solid"

    -- Branch formatting (|colorN, |thicknessN, |stateN, |styleN) defaults to the bracket's.
    local branchThickness = tonumber(args['thickness' .. suffix]) or bracketThickness
    local branchColor = args['color' .. suffix] or bracketColor
    local branchStyle = args['style' .. suffix] or ""
    local branchState = args['state' .. suffix] or bracketState
    if branchState == 'double' and branchThickness < 2 then
        branchThickness = 3 -- need thick line for double
    end

    -- the left border takes node parameters, the bottom border takes branch parameters
    local bottomBorder = tostring(branchThickness) .. 'px ' .. branchState .. ' ' .. branchColor
    local leftBorder = tostring(bracketThickness) .. 'px ' .. bracketState .. ' ' .. bracketColor

    -- Right-hand bar or bracket: each parameter carries a colour, "0" means absent.
    local barRight = args['bar' .. suffix] or "0"
    local barBottom = args['barend' .. suffix] or "0"
    local barTop = args['barbegin' .. suffix] or "0"
    local barLabel = args['barlabel' .. suffix] or ""
    local groupLabel = args['grouplabel' .. suffix] or ""
    -- NOTE(review): |labelstyleN= used to be read here but was never applied to the output;
    -- presumably the markup that used it was lost - confirm before restoring.

    -- Replace colours with border specifications. The right bar is needed for all three
    -- options, so |barbeginN and |barendN also set it (the last one given wins).
    if barRight ~= "0" then barRight = "2px solid " .. barRight end
    if barTop ~= "0" then barRight = "2px solid " .. barTop end
    if barBottom ~= "0" then barRight = "2px solid " .. barBottom end
    if barTop ~= "0" then barTop = "2px solid " .. barTop end
    if barBottom ~= "0" then barBottom = "2px solid " .. barBottom end

    local out = {}
    local styleString

    -- Complete the previous child's second row (for 2-17). It is done here rather than at
    -- the end of the previous call because only now is it known that the bracket continues,
    -- so the cell gets a left border.
    if childNumber ~= 1 then
        local subLabel = args['sublabel' .. tostring(childNumber - 1)] or ""
        styleString = ' style="border:0;border-left:' .. leftBorder .. ';vertical-align:top;text-align:center;"'
        out[#out + 1] = '|' .. styleString .. '|' .. p.addLabel(childNumber - 1, subLabel)
    end

    -- new row
    out[#out + 1] = '\n|-'

    -- cell with label
    if childNumber == 1 then
        -- the width gives minimum spacing when all labels are empty (was 1.5em)
        styleString = ' style="width:1em;border:0;padding:0 0.2em;border-bottom:' .. bottomBorder
            .. ';vertical-align:bottom;text-align:center;' .. branchStyle .. '"'
    else -- for 2-17
        styleString = ' style="border:0;padding:0 0.2em;border-left:' .. leftBorder
            .. ';border-bottom:' .. bottomBorder
            .. ';vertical-align:bottom;text-align:center;' .. branchStyle .. '"'
    end
    out[#out + 1] = '\n|' .. styleString .. '|' .. p.addLabel(childNumber, nodeLabel)

    -- cell with leaf (which may be a table with transcluded content)
    if barRight ~= "0" then
        styleString = 'style="border:0;padding:0;border-right:' .. barRight
            .. ';border-bottom:' .. barBottom .. ';border-top:' .. barTop .. ';' .. branchStyle .. '"'
    else
        styleString = 'style="border:0;padding:0;' .. branchStyle .. '"'
    end
    out[#out + 1] = '||rowspan=2 ' .. styleString .. '|'
    out[#out + 1] = '\n' .. nodeLeaf

    -- right-hand bar / bracket and group label
    -- NOTE(review): the separator strings below are single spaces in this copy of the
    -- module; they may originally have carried markup - confirm.
    if barRight ~= "0" then
        out[#out + 1] = ' ' -- add space between leaf text and bar
        if barLabel ~= "" then
            out[#out + 1] = barLabel .. ' '
        end
    end
    if groupLabel ~= "" then
        out[#out + 1] = groupLabel .. ' '
    end

    -- Start the second row (needed because of rowspan=2). Its cell is added on the next
    -- call to addTaxon (with left border) or after the main loop (without left border).
    local branchStyleString = ''
    if branchStyle ~= '' then -- avoid empty style elements
        branchStyleString = 'style="' .. branchStyle .. '" '
    end
    out[#out + 1] = '\n|-' .. branchStyleString

    return table.concat(out)
end

--[[ Returns the text for a label or sublabel cell.

Parameters:
    childNumber - number of the child the label belongs to (accepted for symmetry
                  with p.addTaxon; not used by the current implementation)
    nodeLabel   - label text; nil is treated as an empty label
Returns:
    ' ' when the label is empty or is an unexpanded template parameter
    (text starting with three opening braces); the label padded with a space on each
    side when it appears to contain a styling element; otherwise the label with its
    spaces replaced by non-breaking spaces so that it cannot wrap.
]]
function p.addLabel(childNumber, nodeLabel)
    nodeLabel = nodeLabel or ""

    -- An unsubstituted parameter arrives literally as {{{labelN}}}. Three characters
    -- must be compared: a two-character prefix can never equal "{{{".
    if nodeLabel == "" or string.sub(nodeLabel, 1, 3) == "{{{" then
        -- NOTE(review): a single space in this copy of the module; may originally have
        -- been markup - confirm.
        return ' '
    end

    -- Spaces can cause wrapping, which breaks the tree structure. Replacing them with
    -- non-breaking spaces is cheap for template expansion size, but would corrupt labels
    -- that carry a styling element (e.g. <span style= ..., <span title= ...), so those
    -- are passed through unchanged. Plain (non-pattern) searches are used.
    local hasStylingElement = string.find(nodeLabel, "span ", 1, true) ~= nil
        or string.find(nodeLabel, " style", 1, true) ~= nil
    if hasStylingElement then
        return ' ' .. nodeLabel .. ' '
    end

    -- parentheses drop gsub's second return value (the replacement count)
    return (string.gsub(nodeLabel, " ", "&nbsp;"))
end

--=================== Newick string handling function =============================

-- Returns the part of a Newick string that lies outside its parenthesised groups,
-- e.g. "(A,B)Root" gives "Root". Only the string is returned (gsub's replacement
-- count is dropped).
function p.getNewickOuterterm(newickString)
    return (string.gsub(newickString, "%b()", "")) -- delete parenthetic term
end

--[[ Converts a Newick string into the wikitext of a nested clade table.

Parameters:
    count        - nesting depth of the caller (p.main passes 0); only passed on to
                   recursive calls
    newickString - Newick string such as "(A,(B,C)D)E"
Returns the table wikitext. A string without a parenthesised group has no children and
is returned unchanged, so that the caller can use it as a plain leaf.

Each child row is produced by p.addTaxon, which reads the numbered formatting
parameters of the calling template for the child's position.
]]
function p.newick(count, newickString)
    -- find location of outer parenthesised term
    local open, close = string.find(newickString, '%(.*%)')
    if not open then
        return newickString
    end

    count = count + 1
    local out = { '{| cellspacing=0 cellpadding=0 border=0 ' } -- start table

    local innerTerm = string.sub(newickString, open + 1, close - 1) -- content in parentheses

    -- Commas inside nested groups must survive the split on commas, so they are
    -- temporarily replaced by a control character that cannot occur in a taxon name
    -- (spaces after those commas are stripped at the same time).
    local placeholder = "\1"
    local protected = string.gsub(innerTerm, "%b()", function(group)
        return (string.gsub(group, ",%s*", placeholder))
    end)

    for i, term in ipairs(strsplit(protected, ",")) do
        local restoredString = string.gsub(term, placeholder .. "%s*", ",") -- back to commas
        if string.find(restoredString, '%(.*%)') then
            -- nested group: recurse, labelling the branch with the term outside the parentheses
            local outerTerm = string.gsub(restoredString, "%b()", "")
            out[#out + 1] = '\n' .. p.addTaxon(i, p.newick(count, restoredString), outerTerm)
        else
            out[#out + 1] = '\n' .. p.addTaxon(i, restoredString, "")
        end
    end

    -- close table (the cell completes the row left open by the last p.addTaxon call)
    out[#out + 1] = '\n' .. '| style="border: 0; padding: 0; vertical-align: top;" | \n|}'
    return table.concat(out)
end

-- Emulates a standard split-string function: returns the non-empty pieces of inputstr
-- separated by any character of sep (default: whitespace). sep is inserted into a
-- pattern character class, so pattern-magic characters in it are not escaped.
-- Kept as a global function because p.newickParseLevel calls it by its global name.
function strsplit(inputstr, sep)
    if sep == nil then
        sep = "%s"
    end
    local t = {}
    for str in string.gmatch(inputstr, "([^" .. sep .. "]+)") do
        t[#t + 1] = str
    end
    return t
end

-- Bits from Peter Coxhead's module --   https://en.wikipedia.org/w/index.php?title=Module:Autotaxobox&action=edit

--[[ Experimental helper adapted from Module:Autotaxobox.

Usage: {{#invoke:Module:Sandbox/Jts1882/CladeN|nLevels|TAXON}}

Starting from the page named by the first argument, repeatedly expands the current
page as a template with |machine code=parent and moves to the result. Returns the
level number at which an empty parent was found, or the taxon reached when the level
limit (2) is hit first.
]]
function p.nLevels(frame)
    local taxon = frame.args[1]
    local limit = 2
    local level = 1
    while level < limit do
        --local parent = frame:expandTemplate{ title = 'Template:Taxonomy/' .. taxon, args = {['machine code'] = 'parent' } }
        local parent = frame:expandTemplate{ title = taxon, args = { ['machine code'] = 'parent' } }
        if parent == '' then
            return level -- chain ended before the limit
        end
        taxon = parent
        level = level + 1
    end
    return taxon -- limit reached while still searching
end

--[[ Experimental helper adapted from Module:Autotaxobox.

Usage: {{#invoke:Module:Sandbox/Jts1882/CladeN|listAll|TAXON}}

Follows the chain of parents from the taxon given as first argument by expanding
Template:Taxonomy/<taxon> with |machine code=parent until an empty result is returned
or 100 levels have been visited. Returns the visited taxa joined by ', ', followed by
'...' when the limit cut the search short, and the number of levels in parentheses.
]]
function p.listAll(frame)
    local taxon = frame.args[1]
    local limit = 100
    local names = { taxon }
    local levels = 1
    local cutShort = true -- stays true only if the limit ends the loop

    while levels < limit do
        local parent = frame:expandTemplate{
            title = 'Template:Taxonomy/' .. taxon,
            args = { ['machine code'] = 'parent' },
        }
        if parent == '' then
            cutShort = false
            break
        end
        taxon = parent
        names[#names + 1] = taxon
        levels = levels + 1
    end

    local listing = table.concat(names, ', ')
    if cutShort then
        listing = listing .. '...'
    end
    return listing .. ' (' .. levels .. ')'
end

-- =================== experimental Newick to clade parser function =============================

--[[ Function to convert Newick strings to clade format.

Usage: {{#invoke:Module:Sandbox/Jts1882/CladeN|newickConverter|newickstring={{{NEWICK_STRING}}} }}

Read from the invoking frame:
    newickstring - the Newick string; returned unchanged when it is the unsubstituted
                   parameter text, and an empty result is returned when it is missing
                   or empty
Read from the parent (template) frame:
    |option=tree - return only the generated clade template call; any other value
                   returns the Newick string followed by the generated call
]]
function p.newickConverter(frame)
    local newickString = frame.args['newickstring']
    if newickString == nil or newickString == '' then
        return '' -- nothing to convert (previously failed inside the parser)
    end
    if newickString == '{{{newickstring}}}' then
        return newickString
    end

    -- convert the Newick string to the clade structure
    local levelNumber = 1 -- depth of iteration
    local childNumber = 1 -- number of sister elements on node (always one for root)
    local cladeString = '{{clade'
        .. p.newickParseLevel(newickString, levelNumber, childNumber)
        .. '\r}}'

    local parent = mw.getCurrentFrame():getParent()
    local option = parent and parent.args['option'] or ''

    if option == 'tree' then
        -- show the transcluded clade diagram
        return cladeString
    end

    -- show the Newick string, then the converted clade structure
    -- NOTE(review): the surrounding strings are single spaces in this copy of the module;
    -- they may originally have been markup - confirm.
    local resultString = ' ' .. newickString .. ' '
    resultString = resultString .. ' ' .. cladeString .. ' '
    --resultString = frame:expandTemplate{ title = 'clade', frame:preprocess(cladeString) }
    return resultString
end

--[[ Parses one level of a Newick string into clade template parameters.

A Newick term has the form (child,child,...)label:
    1. the right hand term is the label of the node:  |labelN=labelname
    2. the left hand term in parentheses has comma delimited child nodes, each of which can be
          i.  a taxon name, which just needs:  |N=leafname
          ii. a Newick string, which needs further processing through reiteration

Parameters:
    newickString - the Newick term to parse
    levelNumber  - nesting depth, used only for indentation (see p.getIndent)
    childNumber  - position N of this term among its sisters
Returns the generated parameter text. A term without parentheses is emitted as a
plain leaf (|N=term).
]]
function p.newickParseLevel(newickString, levelNumber, childNumber)
    local indent = p.getIndent(levelNumber)

    -- find location of outer parenthesised term
    local open, close = string.find(newickString, '%(.*%)')
    if not open then
        return indent .. '|' .. childNumber .. '=' .. newickString
    end

    local innerTerm = string.sub(newickString, open + 1, close - 1) -- content in parentheses
    local outerTerm = string.gsub(newickString, "%b()", "")        -- delete parenthetic term

    local out = {
        indent .. '|label' .. childNumber .. '=' .. outerTerm,
        indent .. '|' .. childNumber .. '=' .. '{{clade',
    }

    levelNumber = levelNumber + 1
    indent = p.getIndent(levelNumber)

    -- protect commas in inner parentheses from the split by temporarily replacing them
    -- (spaces after those commas are stripped at the same time)
    local protected = string.gsub(innerTerm, "%b()", function(group)
        return (string.gsub(group, ",%s*", "XXX"))
    end)

    for i, term in ipairs(strsplit(protected, ",")) do
        local restoredString = string.gsub(term, "XXX", ",") -- convert back to commas
        if string.find(restoredString, '%(.*%)') then
            out[#out + 1] = p.newickParseLevel(restoredString, levelNumber, i)
        else
            out[#out + 1] = indent .. '|' .. i .. '=' .. restoredString
        end
    end

    out[#out + 1] = indent .. '}}'
    return table.concat(out)
end

--[[ Returns the line prefix used when writing out generated clade parameters.

The prefix is a carriage return, then one space per unit of the calling template's
|indent= parameter (an extra indent to make aligning compound trees easier), then two
spaces for every level above the first.

Parameters:
    levelNumber - nesting depth; 1 adds no level indentation
A missing or non-numeric |indent= counts as 0.
]]
function p.getIndent(levelNumber)
    local parent = mw.getCurrentFrame():getParent()
    local args = parent and parent.args or {}

    -- tonumber() yields nil for non-numeric text, which previously made the
    -- comparison with 0 raise an error
    local extraIndent = tonumber(args['indent']) or 0

    -- math.ceil reproduces the iteration count of the former countdown loops
    local extraSpaces = math.max(0, math.ceil(extraIndent))
    local levelSteps = math.max(0, math.ceil(levelNumber - 1))

    return "\r" .. string.rep(" ", extraSpaces) .. string.rep("  ", levelSteps)
end

-- Currently an empty stub: accepts a Newick string, does nothing and returns no value.
p.newickstuff = function(newickString)
end

--

--[[ Debugging aid used by p.main when its `testing` switch is enabled.

Scans |1= .. |17= of the calling template and returns a string that starts with
"NEWCLADE:" and lists every non-empty child as <N>LEAF:<content> (preceded by
XXX<content> when the content starts with two opening braces), followed by counts of
the "NEWCLADE" and "LEAF" markers found in that string. The clade count is also
written to the Scribunto debug log.

Parameters:
    dummy - ignored
]]
function p.test(dummy)
    local parent = mw.getCurrentFrame():getParent()
    local args = parent and parent.args or {}

    local dataString = "NEWCLADE:"
    for childNumber = 1, 17 do
        local nodeLeaf = args[tostring(childNumber)] or "" -- get data from |N=
        if nodeLeaf ~= "" then
            dataString = dataString .. tostring(childNumber)
            if string.sub(nodeLeaf, 1, 2) == "{{" then
                dataString = dataString .. 'XXX' .. nodeLeaf
            end
            dataString = dataString .. 'LEAF:' .. nodeLeaf
        end
    end

    -- gsub's second return value is the number of (non-overlapping) matches
    local numClades = select(2, string.gsub(dataString, "NEWCLADE", ""))
    dataString = dataString .. ' (numClades=' .. numClades .. ')'
    local numBranches = select(2, string.gsub(dataString, "LEAF", ""))
    -- the clade count is reported twice, as in the original output
    dataString = dataString .. ' (numClades=' .. numClades .. ')'
    dataString = dataString .. ' (numBranches=' .. numBranches .. ')'

    mw.log(numClades) -- mw.log is a plain function; calling it with ':' would also log the mw table
    return dataString
end

--[[ Debugging aid: expands a template with an empty |style= and returns the result.

Parameters:
    target - title of the template to expand; anything that is not a string (for
             example the frame passed by #invoke) selects the default sandbox template
]]
function p.test2(target)
    if type(target) ~= "string" then
        target = "User:Jts1882/sandbox/templates/Template:Passeroidea"
    end
    return mw.getCurrentFrame():expandTemplate{ title = target, args = { ['style'] = '' } }
end

-- this must be at end: the module's value is the table p holding the p.* functions defined above

return p