Module:Chem2

From Azupedia
Jump to navigation Jump to search

This module implements {{chem2}}. Please see its documentation for details.


local getArgs = require('Module:Arguments').getArgs
local p = {} -- module's table


-- Elements with wiki links.
-- am[symbol] is a wikilink to the element's English-language article whose
-- visible text is the symbol itself, e.g. am.H == "[[:en:Hydrogen|H]]".
local am = {}
do
   -- symbol -> article title; the link text is generated from the key so the
   -- two can never disagree.
   local element_articles = {
      -- period 1
      H = "Hydrogen", He = "Helium",
      -- period 2
      Li = "Lithium", Be = "Beryllium", B = "Boron", C = "Carbon",
      N = "Nitrogen", O = "Oxygen", F = "Fluorine", Ne = "Neon",
      -- period 3
      Na = "Sodium", Mg = "Magnesium", Al = "Aluminium", Si = "Silicon",
      P = "Phosphorus", S = "Sulfur", Cl = "Chlorine", Ar = "Argon",
      -- period 4
      K = "Potassium", Ca = "Calcium", Sc = "Scandium", Ti = "Titanium",
      V = "Vanadium", Cr = "Chromium", Mn = "Manganese", Fe = "Iron",
      Co = "Cobalt", Ni = "Nickel", Cu = "Copper", Zn = "Zinc",
      Ga = "Gallium", Ge = "Germanium", As = "Arsenic", Se = "Selenium",
      Br = "Bromine", Kr = "Krypton",
      -- period 5
      Rb = "Rubidium", Sr = "Strontium", Y = "Yttrium", Zr = "Zirconium",
      Nb = "Niobium", Mo = "Molybdenum", Tc = "Technetium", Ru = "Ruthenium",
      Rh = "Rhodium", Pd = "Palladium", Ag = "Silver", Cd = "Cadmium",
      In = "Indium", Sn = "Tin", Sb = "Antimony", Te = "Tellurium",
      I = "Iodine", Xe = "Xenon",
      -- period 6
      Cs = "Caesium", Ba = "Barium", La = "Lanthanum", Ce = "Cerium",
      Pr = "Praseodymium", Nd = "Neodymium", Pm = "Promethium", Sm = "Samarium",
      Eu = "Europium", Gd = "Gadolinium", Tb = "Terbium", Dy = "Dysprosium",
      Ho = "Holmium", Er = "Erbium", Tm = "Thulium", Yb = "Ytterbium",
      Lu = "Lutetium", Hf = "Hafnium", Ta = "Tantalum", W = "Tungsten",
      Re = "Rhenium", Os = "Osmium", Ir = "Iridium", Pt = "Platinum",
      Au = "Gold", Hg = "Mercury (element)", Tl = "Thallium", Pb = "Lead",
      Bi = "Bismuth", Po = "Polonium", At = "Astatine", Rn = "Radon",
      -- period 7
      Fr = "Francium", Ra = "Radium", Ac = "Actinium", Th = "Thorium",
      Pa = "Protactinium", U = "Uranium", Np = "Neptunium", Pu = "Plutonium",
      Am = "Americium", Cm = "Curium", Bk = "Berkelium", Cf = "Californium",
      Es = "Einsteinium", Fm = "Fermium", Md = "Mendelevium", No = "Nobelium",
      Lr = "Lawrencium", Rf = "Rutherfordium", Db = "Dubnium", Sg = "Seaborgium",
      Bh = "Bohrium", Hs = "Hassium", Mt = "Meitnerium", Ds = "Darmstadtium",
      Rg = "Roentgenium",
      Cn = "Copernicium",  -- official symbol
      Cp = "Copernicium",  -- symbol this table used before; kept so existing formulas still link
      Nh = "Nihonium", Fl = "Flerovium", Mc = "Moscovium", Lv = "Livermorium",
      Ts = "Tennessine", Og = "Oganesson",
   }

   for symbol, article in pairs(element_articles) do
      am[symbol] = "[[:en:" .. article .. "|" .. symbol .. "]]"
   end
end

-- Token types handed out by the tokenizer, listed in numeric order.
local T_ELEM        = 0   -- element-like symbol: one capital followed by lowercase letters
local T_NUM         = 1   -- number (digits and dots), rendered as a subscript
local T_OPEN        = 2   -- opening bracket: ( { [
local T_CLOSE       = 3   -- closing bracket: ) } ]
local T_PM_CHARGE   = 4   -- a lone + or -
local T_WATER       = 6   -- crystal water: *xH2O, x being an optional number
local T_CHARGE      = 8   -- bracketed charge: (x+), (x-), (+), (-)
local T_CRYSTAL     = 9   -- * followed by an optional number
local T_SUF_CHARGE  = 10  -- suffix and charge, e.g. 2+ from H2+
local T_SUF_CHARGE2 = 12  -- suffix and (charge), e.g. 2(2+) from He2(2+)
local T_SPECIAL     = 14  -- backslash escape \x, e.g. \d for a double bond (=)
local T_SPECIAL2    = 16  -- backslash escape with a numeric argument, \y{x}
local T_ARROW_R     = 17  -- the two characters ->
local T_ARROW_EQ    = 18  -- the three characters <->
local T_UNDERSCORE  = 19  -- _{ ... }
local T_CARET       = 20  -- ^{ ... }
local T_NOCHANGE    = 30  -- anything else (e.g. ☃), passed through untouched

-- Stacked superscript/subscript span, modelled on template:su.
--   up   : text for the upper line
--   down : text for the lower line; pass "" to get a superscript-only span
-- Returns the HTML for an inline-block <span>.
function su(up, down)
  -- The two variants differ only in vertical alignment and in whether
  -- anything follows the line break.
  local valign, content
  if down ~= "" then
    valign = "-0.4em"
    content = up .. "<br />" .. down
  else
    valign = "0.8em"
    content = up .. "<br />"
  end

  return "<span style=\"display:inline-block; margin-bottom:-0.3em; vertical-align:"
    .. valign
    .. "; line-height:1.2em; font-size:70%; text-align:left;\">"
    .. content
    .. "</span>"
end

-- Returns the HTML entity for a middle dot.
function DotIt()
  local middle_dot = '&middot;'
  return middle_dot
end


-- Tokenizer for the formula string 'f'.
-- Returns an iterator function; every call yields (type, text) for the next
-- token, where type is one of the T_* constants of this file and text is the
-- matched substring. The iterator yields nil once 'f' is exhausted, so it can
-- be used directly in a generic for loop.
function item(f)
   -- Ordered rule list: at each position the FIRST pattern that matches wins,
   -- so more specific patterns must stay ahead of more general ones.
   local rules = {
      { '^%s+[%d.]+',        T_NOCHANGE },    -- coefficient (needs whitespace first)
      { '^%s[+]',            T_NOCHANGE },    -- + between species (H2O + H2O)
      { '^%&%#[%w%d]+%;',    T_NOCHANGE },    -- character reference &#...;
      { '^%<%-%>',           T_ARROW_EQ },    -- <->
      { '^%-%>',             T_ARROW_R },     -- ->
      { '^%u%l*',            T_ELEM },        -- symbols like Aaaaa
      { '^%d+[+-]',          T_SUF_CHARGE },  -- x+, x-
      { '^%d+%(%d*[+-]%)',   T_SUF_CHARGE2 }, -- x(y+), x(y-), x(+), x(-)
      { '^%(%d*[+-]%)',      T_CHARGE },      -- (x+), (x-), (+), (-)
      { '^[%d.]+',           T_NUM },         -- number
      -- Lua patterns have no alternation: a '|' inside [...] is a literal
      -- pipe, so the bracket classes list only the brackets themselves.
      { '^[({%[]',           T_OPEN },        -- ( { [
      { '^[)}%]]',           T_CLOSE },       -- ) } ]
      { '^[+-]',             T_PM_CHARGE },   -- + or -
      { '^%*[%d.]*H2O',      T_WATER },       -- crystal water
      { '^%*[%d.]*',         T_CRYSTAL },     -- crystal
      { '^[\\].{%d+}',       T_SPECIAL2 },    -- \y{x}
      { '^[\\].',            T_SPECIAL },     -- \x
      { '^_{[^}]*}',         T_UNDERSCORE },  -- _{...}
      -- '%^' is the pattern escape for a literal caret; the string escape
      -- '\^' is rejected by the Lua 5.2+ compiler.
      { '^%^{[^}]*}',        T_CARET },       -- ^{...}
      { '^.',                T_NOCHANGE },    -- the rest - one byte at a time
   }

   local pos = 1          -- index of the next unread byte of f
   local at_start = true  -- true only for the very first call
   local len = f:len()

   return function ()
      local is_first = at_start
      at_start = false

      -- A formula may open with a bare coefficient (no leading whitespace).
      if is_first and f:match('^[0-9]', pos) then
         local x = f:match('^[%d.]+', pos)
         pos = pos + x:len()
         return T_NOCHANGE, x
      end

      if pos > len then
         return nil, nil  -- end of input: terminates the generic for loop
      end

      for _, rule in ipairs(rules) do
         local x = f:match(rule[1], pos)
         if x then
            pos = pos + x:len()
            return rule[2], x
         end
      end

      -- Not expected to happen: the final '^.' rule matches any byte.
      error("Invalid character in formula!!!!!!! : " .. f)
   end
end

-- Replacement text for the single-character escapes \x (T_SPECIAL tokens).
-- Characters that are not listed produce no output.
local SPECIAL_SYMBOLS = {
   s = "−",          -- single bond
   d = "=",          -- double bond
   t = "≡",          -- triple bond
   q = "≣",          -- quadruple bond
   h = "η",          -- η, hapticity
   ["*"] = "*",      -- a normal *
   ["-"] = "-",      -- -
   ["\\"] = "\\",    -- \
   ["'"] = "&#39;",  -- html-code for '
}

-- Replaces every ASCII hyphen in 's' with a minus sign (−).
local function to_minus(s)
   return (string.gsub(s, "-", "−"))  -- parentheses drop gsub's match count
end

-- Renders a chemical formula as wikitext/HTML.
--   args[1]   : the formula source text (defaults to '')
--   args.link : optional page title; when non-empty the whole formula is
--               wrapped in [[link|...]]
--   args.auto : when non-empty, the first occurrence of every element symbol
--               found in 'am' is replaced by its wikilink
-- Returns the formula wrapped in <span class="chemf nowrap">.
function p._chem(args)
   local f = args[1] or ''

   f = string.gsub(f, "–", "-")  -- en dash -> hyphen
   f = string.gsub(f, "−", "-")  -- minus sign -> hyphen

   local link = args['link'] or ""
   local auto = args['auto'] or ""

   -- Symbols already linked during THIS call. Keeping the set local leaves
   -- the shared 'am' table untouched, so one call cannot affect the next.
   local linked = {}

   -- Output fragments; joined once at the end.
   local out = {}
   local function emit(s) out[#out + 1] = s end

   if link ~= '' then emit("[[" .. link .. "|") end   -- wikilink start [[link|

   for t, x in item(f) do
      if t == T_ELEM then
         if auto ~= '' and am[x] and not linked[x] then
            emit(am[x])
            linked[x] = true
         else
            emit(x)
         end

      elseif t == T_NUM then
         emit(su("", x))

      elseif t == T_OPEN or t == T_CLOSE then   -- ( { [ and ) } ]
         emit(x)

      elseif t == T_PM_CHARGE then
         emit(su(to_minus(x), ""))

      elseif t == T_SUF_CHARGE then             -- x is e.g. "2+"
         local count, sign = string.match(x, "^(%d+)([+-])$")
         emit(su(to_minus(sign), count))

      elseif t == T_SUF_CHARGE2 then            -- x is e.g. "2(2+)"
         local count, charge = string.match(x, "^(%d+)%((%d*[+-])%)$")
         emit(su(to_minus(charge), count))

      elseif t == T_CHARGE then                 -- x is e.g. "(2+)" or "(-)"
         local magnitude, sign = string.match(x, "^%((%d*)([+-])%)$")
         emit("<sup>" .. magnitude .. to_minus(sign) .. "</sup>")

      elseif t == T_CRYSTAL then                -- x is "*" plus an optional number
         emit(DotIt() .. string.sub(x, 2))

      elseif t == T_SPECIAL then                -- \x
         local symbol = SPECIAL_SYMBOLS[string.sub(x, 2, 2)]
         if symbol then emit(symbol) end

      elseif t == T_SPECIAL2 then               -- \y{x}
         local parameter = string.sub(x, 2, 2)  -- y from \y{x}
         local number = string.match(x, '%d+')
         if parameter == "h" then               -- hapticity
            if auto == '' then
               emit("η<sup>" .. number .. "</sup>-")
            else
               emit("[[Hapticity|η<sup>" .. number .. "</sup>]]-")
            end
         elseif parameter == "m" then           -- mu ([[bridging ligand]])
            emit("μ<sup>" .. number .. "</sup>-")
         end

      elseif t == T_WATER then                  -- x is "*", optional number, "H2O"
         -- The capture is "" when no number was given, which covers both the
         -- counted and the uncounted form without a separate branch.
         local count = string.match(x, "^%*([%d.]*)H2O$")
         emit(DotIt() .. count .. "H<sub>2</sub>O")

      elseif t == T_UNDERSCORE then             -- x contains _{string}
         emit(su("", string.sub(x, 3, -2)))

      elseif t == T_CARET then                  -- x contains ^{string}
         emit(su(string.sub(x, 3, -2), ""))

      elseif t == T_ARROW_R then
         emit(" → ")

      elseif t == T_ARROW_EQ then
         emit(" ⇌ ")

      elseif t == T_NOCHANGE then
         -- Everything the tokenizer did not classify, e.g. wikilinks and pipes.
         emit(x)

      else
         error('unreachable - ???')  -- in fact, unreachable
      end
   end

   if link ~= '' then emit("]]") end   -- wikilink closing ]]

   return '<span class="chemf nowrap">' .. table.concat(out) .. '</span>'
end

-- Entry point taking a frame: extracts the arguments with getArgs
-- (from Module:Arguments) and hands them to p._chem.
function p.chem(frame)
	return p._chem(getArgs(frame))
end

-- Hand the module table (p.chem and p._chem) back to whoever loads this module.
return p