import os, re, urllib
## -----------------------------------------------------------------
## Purpose: make a nice publication page with an ADS database link
## Author: Aymeric Spiga 19/05/2012
## -----------------------------------------------------------------
## NB: uses BIBTEX2HTML https://www.lri.fr/~filliatr/bibtex2html/doc/manual.html
## ... and of course NASA ADS http://adsabs.harvard.edu/
## -----------------------------------------------------------------
def makepage(authorref,
bibstyle = "-s custom -nokeys",
listyear = [0],
customcond = None,
embedded = False,
linkads = None,
title = None,
retrieve = True,
addpdf = None,
addlink = None):
htmlcontent = ""
### HEADER
if embedded:
htmlfile = open('header.html','r')
htmlcontent = htmlfile.read()
htmlfile.close()
#else:
if title is None:
htmlcontent = htmlcontent + "
"+authorref+"'s publications
"
elif title == "":
pass
else:
htmlcontent = htmlcontent + title
### if linkads is None, we set it to "link.authorref"
if linkads is None:
linkads = 'link.'+authorref
### GET INFO FROM ADS
if retrieve:
print "retrieving info from ADS"
linkfile = open(linkads,'r')
url = linkfile.read()
linkfile.close()
html = urllib.urlopen(url).read()
bibfile = open(linkads+'.bib','w')
print >> bibfile,html
bibfile.close()
### if only one year and no customcond, make it useful. ask for years >= this value
if len(listyear) == 1 and customcond is None:
customcond = "-c 'year>=%s'" % (listyear[0])
listyear[0] = 99
### ADD LINK WITH YEARS IN HEADER
if customcond is None or len(listyear) > 1:
htmlcontent += "Year: "
for year in listyear:
htmlcontent += ""+str(year)+". "
if addlink is not None: htmlcontent += "
"+addlink
### YEAR LOOP
for year in listyear:
author = authorref+str(year)
print author
# 0. define condition
# if not user-defined, make it simply year in each listyear instance
# if user-defined, then customcond will be the condition (possibly several)
if customcond is None and len(listyear) > 1: cond = "-c 'year=%s'" % (year)
elif len(listyear) > 1: cond = customcond + " -c 'year=%s'" % (year)
else: cond = customcond
# 1. select items ARTICLE in the big bib file
# put those in a dedicated author.bib file
arg = \
cond,\
'"ARTICLE"',\
author+'.txt',\
author+'.bib',\
linkads+'.bib'
cmd = "bib2bib --quiet %s -c '$type=%s' -oc %s -ob %s %s" % (arg)
os.system(cmd)
# modify the bib file to insert pdf links
# the trick is to use the line adsurl and expect pdf to have the same name as ADS reference
# ... then besides this, it is necessary to link pdfs or rename those
# ... the online repository is indicated by addpdf
if retrieve:
if addpdf is not None:
bibcontent = ''
for line in open(linkads+'.bib'):
bibcontent += line
if 'adsurl' in line:
line = line.replace('adsurl','localpdf')
line = line.replace('http://cdsads.u-strasbg.fr/abs/',addpdf)
line = line.replace('},','.pdf},')
line = line.replace('%','_')
bibcontent += line
bibfile2 = open('temp','w')
print >> bibfile2,bibcontent
bibfile2.close()
os.system('mv temp '+linkads+'.bib')
# 2. make the html page from the author.bib file
if customcond is None or len(listyear) > 1:
header = '' % (year)
header += "%.0f .
" % (year)
if embedded: header += '
'
else:
header = ''
header = '"'+header+'"'
arg = \
bibstyle,\
header,\
author+'.bib'
cmd = "bibtex2html -q \
--both \
-m ads.tex \
%s \
-nf adsurl 'ADS link' \
-nf localpdf 'PDF version' \
-r -d --revkeys \
-nofooter --nodoc \
--header %s -nokeywords \
%s" % (arg)
os.system(cmd)
# 3. load page content and delete intermediate HTML file
htmlfile = open(author+'.html','r')
htmlcontent = htmlcontent + htmlfile.read()
htmlfile.close()
os.system("rm -rf "+author+'.html')
## make a few corrections
## bibcontent = open(author+'.bib','r').read()
## bibcontent.replace('\grl','Yeah')
find = re.compile(r'bib')
htmlcontent = find.sub('Bibtex entry',htmlcontent)
find = re.compile(r'Bibtex entry.html')
htmlcontent = find.sub('bib.html',htmlcontent)
find = re.compile(r'DOI')
htmlcontent = find.sub('Journal website',htmlcontent)
#find = re.compile(r'.pdf')
#htmlcontent = find.sub('PDF version',htmlcontent)
find = re.compile(r'')
htmlcontent = find.sub('',htmlcontent)
find = re.compile(r'')
htmlcontent = find.sub(' | ',htmlcontent)
htmlcontent += '''
Generated with
BibTeX2HTML
and NASA ADS
and a bit of Python '''
if embedded:
htmlfile = open('footer.html','r')
htmlcontent += htmlfile.read()
htmlfile.close()
htmlmain = open(authorref+'.html','w')
print >> htmlmain, htmlcontent
htmlmain.close()
|