Lunarpedia talk:Autostub2
Database
James Rogers is working on improving the data set. -- Strangelv 10:51, 2 February 2007 (PST)
Source Code
Revision as of Test 2, which successfully generated an XML file for import. Please note that the <PRE> tag does not stop the wiki from converting the ampersand entities in the code into the literal symbols they stand for; the importer will choke on the resulting output if the code is run exactly as displayed here. -- Strangelv 10:51, 2 February 2007 (PST)
#%#%#%#%#%#%#%#%#%#%#%#%#%#%#%#
#                             #
#  Element Autostub Generator #
#                             #
#  Public Domain              #
#                             #
#%#%#%#%#%#%#%#%#%#%#%#%#%#%#%#
"""Generate MediaWiki import XML containing stub articles for elements.

The element data comes from a tab separated file.  Each row becomes a
``{{Test Element ...}}`` template call followed by a short introduction.

The article text is spliced directly into the ``<text>`` element of the
export file, so every piece of HTML-like markup emitted into an article must
already be entity-escaped.  The escapes are assembled at run time from the
entity *names* rather than written as literals, so the source survives being
displayed on a wiki page that decodes ampersand entities.
"""

# Highest atomic number the generator will link to.
MAX_ATOMIC_NUMBER = 118

# Element table, indexed by atomic number.  get_element() looks rows up by
# atomic number, so the file is expected to put hydrogen at row 1 (row 0
# presumably being a header -- confirm against the data file).
# Filled in by main(); while it is empty every neighbour link renders as N/A.
DB = []

# Characters that must not appear raw inside XML text, and their entity names.
_XML_ENTITY_NAMES = {"<": "lt", ">": "gt", "&": "amp", '"': "quot"}


class InputError(ValueError):
    """Raised when a database field does not have the expected form."""


def _xml_escape(textish):
    """Return textish with <, >, & and " replaced by named XML entities."""
    return "".join(
        ("&" + _XML_ENTITY_NAMES[ch] + ";") if ch in _XML_ENTITY_NAMES else ch
        for ch in textish
    )


# Pre-escaped markup fragments used inside article text.
_BR = _xml_escape("<BR/>")
_FONT_LTBLAU_OPEN = _xml_escape('<FONT color="#7F7FFF">')
_FONT_CLOSE = _xml_escape("</FONT>")
_NOT_AVAILABLE = _xml_escape(
    '<SMALL><FONT color="#7F7F7F">N/A</FONT></SMALL>')


def DePluralize(wordish):
    """Return the singular form of a plural series name.

    Surrounding whitespace is ignored.  "es" is only removed when the
    remaining stem ends in a sibilant ("Noble gases" -> "Noble gas");
    otherwise a single trailing "s" is removed ("Lanthanides" ->
    "Lanthanide", "Halogens" -> "Halogen").

    Raises InputError if the word does not end in "s".
    """
    wordish = wordish.strip()
    if wordish.endswith("es") and wordish[:-2].endswith(
            ("s", "x", "z", "ch", "sh")):
        return wordish[:-2]
    if wordish.endswith("s"):
        return wordish[:-1]
    raise InputError("No plural???")


def XMLproof(textish):
    """Escape textish for embedding in the XML article text.

    <, >, & and " become the named entities lt, gt, amp and quot, and ":"
    becomes "%3A".
    """
    # The entity text contains no colon, so the order of the two steps
    # does not matter.
    return _xml_escape(textish).replace(":", "%3A")


def ShellBRK(shell):
    """Insert a line break wherever the leading character of a chunk changes.

    shell is a space separated electron configuration such as
    "1s2 2s2 2p6 3s2": chunks that start with the same character stay on
    one line, and an escaped BR tag is placed before each new group.  Every
    chunk is followed by a space.  A string without spaces is returned
    unchanged.
    """
    shells = shell.split(" ")
    if len(shells) == 1:
        return shell
    outp = ""
    last = None
    for q in shells:
        if not q:
            # A doubled space yields an empty chunk; it has no first character.
            continue
        if last is not None and q[0] != last:
            outp += _BR
        outp += q + " "
        last = q[0]
    return outp


def TmpBRK(stringish):
    """Return stringish with every space replaced by an escaped BR tag."""
    return _BR.join(stringish.split(" "))


def linebrk(listish):
    """Return a new list with a newline appended to every string."""
    return [q + "\n" for q in listish]


def tidypipes(table):
    """Pad every string to the length of the longest and append " |".

    table:   input list of strings
    returns: new list of strings, all of equal length
    """
    maxlen = max([len(q) for q in table] + [0])
    return [q.ljust(maxlen) + " |" for q in table]


def LtBlau(textish):
    """Wrap textish in an escaped light blue FONT tag."""
    return _FONT_LTBLAU_OPEN + textish + _FONT_CLOSE


def replacer(stringie, old, new):
    """Return stringie with each character equal to old replaced by new."""
    return "".join(new if q == old else q for q in stringie)


def refbreak(ref):
    """Return ref with an escaped BR tag inserted after every semicolon."""
    return replacer(ref, ";", ";" + _BR)


def get_element(number, shift, db=None):
    """Return a wiki link showing the symbol of element number+shift.

    number: atomic number, as an int or a numeric string
    shift:  offset added to number (-1 previous, 0 same, 1 next)
    db:     element table indexed by atomic number; defaults to the
            module-level DB

    Returns the escaped "N/A" marker when number is not numeric or when the
    resulting atomic number is outside 1..MAX_ATOMIC_NUMBER or beyond the
    end of the table.
    """
    if db is None:
        db = DB
    try:
        number = int(number)
    except (TypeError, ValueError):
        return _NOT_AVAILABLE
    target = number + int(shift)
    if target < 1 or target > MAX_ATOMIC_NUMBER or target >= len(db):
        return _NOT_AVAILABLE
    return "[[Mediawiki:Sandbox|" + LtBlau(str(db[target][1])) + "]]"


def dostub(thisentry):
    """Create a stub article from one database row.

    thisentry is a list of strings laid out as follows:

        00 Atomic number      01 Symbol             02 Name
        03 Availability       04 Importance         05 Group
        06 Period             07 Series             08 Normal Phase
        09 Mass               10 Density            11 Melt Point
        12 Boil Point         13 Above Prev         14 Above
        15 Above Next         16 Prev               17 Next
        18 Below Prev         19 Below              20 Below Next
        21 Atomic Radius (pm)             22 Bohr Atomic Radius (pm)
        23 Covalent Radius (pm)           24 Van der Waals Radius (pm)
        25 Ionic Radius (pm)
        26 1st Ion Potential (energy required to remove one electron,
           forming a cation, measured in eV)
        27 Electron Shell Configuration   28 Electrons per Shell
        29 Electronegativity              30 Electron Affinity
        31 Oxidation States               32 Magnetism
        33 Crystal Structure

    Returns the article as a list of newline-terminated strings.
    Raises InputError if the series name is not a plural.
    """
    name = thisentry[2]      # name of element      (Iron)
    symbol = thisentry[1]    # element symbol       (Fe)
    number = thisentry[0]    # atomic number        (26)
    mass = thisentry[9]      # atomic mass          (55.845)
    gprev = thisentry[14]    # up one in the group  (none)
    gnext = thisentry[19]    # down one             (Ruthenium)
    imp = thisentry[4]       # importance           (important)
    avail = thisentry[3]     # availability         (ubiquitous)
    group = thisentry[5]     # group number         (8)
    phase = thisentry[8]     # normal phase
    density = thisentry[10]  # density
    melt = thisentry[11]     # melt point
    boil = thisentry[12]     # boil point
    period = thisentry[6]    # period
    series = thisentry[7]    # series
    arad = thisentry[21]     # atomic radius
    brad = thisentry[22]     # Bohr atomic radius
    crad = thisentry[23]     # covalent radius
    vrad = thisentry[24]     # Van der Waals radius
    irad = thisentry[25]     # ionic radius
    fionp = thisentry[26]    # first ion potential
    elesh = thisentry[27]    # electron shell configuration
    epersh = thisentry[28]   # electrons per shell
    eneg = thisentry[29]     # electronegativity
    eaff = thisentry[30]     # electron affinity
    oxid = thisentry[31]     # oxidation states
    mag = thisentry[32]      # magnetism
    cry = thisentry[33]      # crystalline structure

    # A mass in square brackets marks an element without natural isotopes;
    # it is kept verbatim instead of being normalised through float().
    bracketed_mass = mass.startswith("[")
    if bracketed_mass:
        shown_mass = mass
    else:
        shown_mass = str(float(mass))

    # Template call, one parameter per line.
    to_out = [
        "{{Test Element ",
        "name=" + name,
        "symbol=" + symbol,
        "available=" + avail,
        "need=" + imp,
        "number=" + number,
        "mass=" + shown_mass,
        "group=" + group,
        "period=" + period,
        "phase=" + phase,
        "series=" + series,
        "density=" + density,
        "melts=" + TmpBRK(melt),
        "boils=" + TmpBRK(boil),
        "prior=" + get_element(number, -1),
        "next=" + get_element(number, 1),
        "above=" + get_element(gprev, 0),
        "aprior=" + get_element(gprev, -1),
        "anext=" + get_element(gprev, 1),
        "below=" + get_element(gnext, 0),
        "bprior=" + get_element(gnext, -1),
        "bnext=" + get_element(gnext, 1),
        "radius=" + arad,
        "bohr=" + brad,
        "covalent=" + crad,
        "vdwr=" + vrad,
        "irad=" + irad,
        "ipot=" + fionp,
        "econfig=" + XMLproof(elesh),
        "eshell=" + epersh,
        "enega=" + eneg,
        "eaffin=" + eaff,
        "oxstat=" + oxid,
        "magn=" + mag,
        "cryst=" + cry,
    ]
    # Tidily install pipes for the table.
    to_out = tidypipes(to_out)
    to_out += ["}}"]
    to_out += ["{{Script Test}}"]

    # Introductory sentences.
    if group != "19":
        to_out += ["'''" + name + "''' is a " + DePluralize(series)
                   + " in group " + group + "."]
    else:
        to_out += ["'''" + name + "''' is a " + DePluralize(series)
                   + " metal."]
    if cry:
        to_out += ["It has a " + cry + " crystalline structure."]
    if bracketed_mass:
        # The bracketed value is the mass number of the longest-lived
        # isotope, not an atomic number.
        to_out += ["It does not have any isotopes considered to be natural. "
                   "Its longest-lived known isotope has a mass number of "
                   + mass[1:-1]]

    to_out += [_xml_escape("<BR/><BR/>") + "\n\n"]
    to_out += ["", "", ""]
    to_out += ["{" + "{Test Autostub}" + "}"]
    # Real category links are not generated yet (the intended call was
    # docategories(typecat)); a hand-written category box stands in for them.
    to_out += [_xml_escape(
        '<DIV ID="catlinks"><P CLASS="catlinks">'
        '[[Special:Categories&article=Lunarpedia%3AAutostub2_test7a'
        '|Categories]]: [[:Category:Stubs|Stubs]] | '
        '[[:Category:Elements|Elements]]')]
    to_out += [_xml_escape(
        "</P></DIV><!-- fake category box -- see commented out text above "
        "for actual script output -->")]
    to_out += [_xml_escape(
        "<!-- Generated by a late alpha version of Autostub2 -->")]
    return linebrk(to_out)


def StartXML():
    """Return the opening of the MediaWiki export file as a nested list."""
    out = [['<mediawiki xmlns="http://www.mediawiki.org/xml/export-0.3/" '
            'xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" '
            'xsi:schemaLocation="http://www.mediawiki.org/xml/export-0.3/ '
            'http://www.mediawiki.org/xml/export-0.3.xsd" '
            'version="0.3" xml:lang="en">\n']]
    out += [' <siteinfo>\n']
    out += [' <sitename>Lunarpedia</sitename>\n']
    out += [' </siteinfo>\n']
    return out


def EndXML():
    """Return the closing tag of the MediaWiki export file as a nested list."""
    return [['</mediawiki>\n']]


def ArtXML(title, contrib, date, text):
    """Return the XML markup for one article.

    title   -- title of article
    contrib -- name of script (ie Autostub2)
    date    -- revision timestamp
    text    -- the article, as a list of strings that are already
               entity-escaped (they are inserted verbatim)
    """
    out = [[' <page>\n']]
    out += [' <title>' + title + '</title>\n']
    out += [' <revision>\n']
    out += [' <timestamp>' + date + '</timestamp>']
    out += [' <contributor>\n']
    out += [' <username>' + contrib + '</username>\n']
    out += [' </contributor>\n']
    out += [' <text xml:space="preserve">']
    out += text
    out += ['</text>\n']
    out += [' </revision>\n']
    out += [' </page>\n']
    return out


# TSV sorter
# Public Domain
def TSVinput(filename):
    """Parse a tab separated file into a list of rows.

    Each row is a list of field strings.  The line terminator is removed so
    that it does not end up inside the last field.
    """
    with open(filename) as tsv:
        return [line.rstrip("\r\n").split("\t") for line in tsv]


def Stringify(listish):
    """Concatenate an arbitrarily nested list of strings into one string.

    Raises TypeError for any item that is neither a string nor a list.
    """
    pieces = []
    for q in listish:
        if isinstance(q, str):
            pieces.append(q)
        elif isinstance(q, list):
            pieces.append(Stringify(q))
        else:
            raise TypeError(
                "non-string non-list!!! %r (%s)" % (q, type(q)))
    return "".join(pieces)


def main(db_path="/home/Luna/Elements_H206.csv",
         out_path="/home/Luna/autostub2test7.xml"):
    """Load the element database and write three test articles as XML."""
    global DB
    DB = TSVinput(db_path)

    stamp = "2007-02-09T12:00:00Z"
    gotit = StartXML()
    gotit += ArtXML("Lunarpedia:Autostub2 test 7a", "Autostub2", stamp,
                    dostub(DB[1]))
    gotit += ArtXML("Lunarpedia:Autostub2 test 7b", "Autostub2", stamp,
                    dostub(DB[72]))
    gotit += ArtXML("Lunarpedia:Autostub2 test 7c", "Autostub2", stamp,
                    dostub(DB[118]))
    gotit += EndXML()

    with open(out_path, 'w') as do_xml:
        do_xml.write(Stringify(gotit))


if __name__ == "__main__":
    main()