CGI script output

s urls = [] pmids = [] #People who cited this paper years = [] #Year of the paper for elm in ps: if elm.attrib == {'class': 'title'}: url_string = elm.find('{http://www.w3.org/1999/xhtml}a').get('href') urls.append("http://www.ncbi.nlm.nih.gov" + url_string ) pmids.append(url_string[url_string.rfind('/')+1:]) if elm.attrib == {'class': 'details'}: for txt in elm.itertext(): if txt[2:6].isdigit(): years.append(txt[2:6]) new_ids = [] new_years = [] cache.append ( pmid_in ) if len(pmids) > 0: #if we found something new for pmid in pmids: if pmid not in cache: super_new, super_year = whocitedme(pmid, cache) if super_new is not None: new_ids.append( super_new ) new_years.append( super_year ) return new_ids + pmids, new_years + years else: return None, None def search_pubmed(term): params= { 'db': 'pubmed', 'tool': 'test', 'email':'test@test.com', 'term': term, 'usehistory':'y', 'retmax':20 } url = 'http://eutils.ncbi.nlm.nih.gov/entrez/eutils/esearch.fcgi?' + urllib.urlencode(params) tree = ET.fromstring(urllib.urlopen(url).read()) params['query_key'] = tree.find("./QueryKey").text params['WebEnv'] = tree.find("./WebEnv").text params['retmode'] = 'xml' url = 'http://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?' + urllib.urlencode(params) data = urllib.urlopen(url).read() return data def xml_to_papers(data): tree = ET.fromstring(data) articles = tree.findall("./PubmedArticle/MedlineCitation") papers = [] for article in articles: paper = dict() paper["journal_name"] = article.find("./Article/Journal/ISOAbbreviation").text paper["title"] = article.find("./Article/ArticleTitle").text paper["authors"] = digest_authors(article.findall("./Article/AuthorList/Author")) paper["issue"] = digest_issue(article.find("./Article/Journal/JournalIssue")) paper["year"] = digest_year(article) paper["page_num"] = checkXML(article, "./Article/Pagination/MedlinePgn") paper["pmid"] = article.find("./PMID").text paper["doi"] = checkXML(article, "./Article/ELocationID") papers.append(paper) return papers def citelist_to_hist(deepyearlist): flatlist = list(flatten(deepyearlist)) output = [0 for x in range(120)] # output[0] = num papers in 1900, [1] = 1901 etc... for year in flatlist: output[int(year)-1900] += 1 return output def sum_hist(hist_list): output = [0 for x in range(len(hist_list))] # output[n] = sum(hist_list[0]...hist_list[n]) output[0] = hist_list[0] for index in range(1, len(hist_list)): output[index] = output[index-1] + hist_list[index] return output def first_non_zero(lst): for index in range(len(lst)): if lst[index] > 0: return index def last_non_zero(lst): for index in range(len(lst)-1, 0, -1): if lst[index] > 0: return index def offset_hist(size_by_year, last_year_index): #reduce it is so the first year with a citation is element zero output = [] index = first_non_zero(size_by_year) for ind in range(index, last_year_index+1): output.append(size_by_year[ind]) return output print "Content-Type: text/html" print print "" url = os.environ["REQUEST_URI"] prased_url = urlparse.urlparse(url) params = urlparse.parse_qs(prased_url.query) pmid = False if len(params["pmid"][0]) == 8 and str(params["pmid"][0]).isdigit(): pmid = str(params["pmid"][0]) #Else PMID IS ILLEGALLY FORMATTED if not (pmid==False): searched_paper_xml = search_pubmed(pmid) paper = xml_to_papers(searched_paper_xml) paper = paper[0] cache = [] print "

" deepest = last_non_zero(family_tree) famly_str = "" for depth in range(0, deepest+1): if depth == deepest-1: linkage = " and " elif depth == deepest: linkage = "." else: linkage = ", " if depth == 0: famly_str += str(family_tree[0]) + " children" + linkage elif depth == 1: famly_str += str(family_tree[1]) + " grandchildren" + linkage elif depth == 2: famly_str += str(family_tree[2]) + " great-grandchildren" + linkage elif depth == 3: famly_str += str(family_tree[3]) + " great-great (or more) grandchildren" print "Your paper has a family tree with a total of " + str(sum(family_tree)) + " papers in it." print "
" print "Your family tree is made up of " + famly_str + "." offset_str = str(math.exp(offset)) slope_str = str(slope) unbiased_str = str(math.exp(offset)/slope) print "According to the citation tree, your paper's original citability was", offset_str[0:4], "and your field citability was", slope_str[0:4] + ". This means your paper had a non-biased impact of", unbiased_str[0:4] print "