{ "translatorID": "9499c586-d672-42d6-9ec4-ee9594dcc571", "label": "The Hindu (old)", "creator": "Prashant Iyengar and Michael Berkowitz", "target": "^https?://(www\\.)?hindu\\.com", "minVersion": "1.0.0b4.r5", "maxVersion": "", "priority": 100, "inRepository": true, "translatorType": 4, "browserSupport": "gcsibv", "lastUpdated": "2014-04-04 09:55:32" }

/**
 * Classifies the current page for the translator.
 *
 * Returns "multiple" when the document contains at least one node matching
 * the XPath below (doWeb uses the same expression to collect the links it
 * offers for selection); every other page is reported as "newspaperArticle".
 *
 * @param {Document} doc - Page DOM; must provide evaluate().
 * @param {string} url - Page URL. Not read by this function.
 * @returns {string} "multiple" or "newspaperArticle".
 */
function detectWeb(doc, url) {
	// iterateNext() yields the first matching node, or null when nothing matches.
	if (doc.evaluate('//h2[@class="r"]/a[@class="l"]', doc, null, XPathResult.ANY_TYPE, null).iterateNext()) {
		return "multiple";
	} else {
		return "newspaperArticle";
	}
}

/**
 * Copies one NAME/CONTENT attribute pair found in `str` onto `item`.
 *
 * Only the first NAME="..." CONTENT="..." pair in `str` is examined (the
 * pattern has no g flag). The match is case-sensitive and requires NAME to
 * come before CONTENT, separated by whitespace. Recognised NAME values and
 * the property each one fills:
 *
 *   PAGEHEAD   -> item.section
 *   ZONE       -> item.place
 *   EXPORTTIME -> item.date
 *   PAGENUMBER -> item.pages
 *
 * Only the first whitespace-delimited token of CONTENT is stored; if CONTENT
 * starts with whitespace that token is the empty string. When `str` does not
 * match, or NAME is none of the four values above, `item` is left untouched.
 *
 * @param {string} str - Text to search. Presumably the source of a single
 *     META tag from the article HTML; the call site is not visible in this
 *     part of the file. TODO confirm.
 * @param {Object} item - Object that receives the section/place/date/pages
 *     property.
 * @returns {undefined}
 */
function regexMeta(str, item) {
	// [\w\W] matches any character, newlines included; *? keeps each capture
	// as short as possible so it stops at the next double quote.
	var re = /NAME\=\"([\w\W]*?)\"\s+CONTENT\=\"([\w\W]*?)\"/;
	var stuff = str.match(re);
	if (stuff) {
		// stuff[1] is the NAME value, stuff[2] the CONTENT value.
		if (stuff[1] == "PAGEHEAD") {
			item.section = stuff[2].split(/\s+/)[0];
		}
		if (stuff[1] == "ZONE") {
			item.place = stuff[2].split(/\s+/)[0];
		}
		if (stuff[1] == "EXPORTTIME") {
			item.date = stuff[2].split(/\s+/)[0];
		}
		if (stuff[1] == "PAGENUMBER") {
			item.pages = stuff[2].split(/\s+/)[0];
		}
	}
}

function doWeb(doc, url) { var arts = new Array(); if (detectWeb(doc, url) == "multiple") { var xpath = '//h2[@class="r"]/a[@class="l"]'; var links = doc.evaluate(xpath, doc, null, XPathResult.ANY_TYPE, null); var link; var items = new Object(); while (link = links.iterateNext()) { items[link.href] = link.textContent; } items = Zotero.selectItems(items); for (var i in items) { arts.push(i); } } else { arts = [url]; } for each (var art in arts) { Zotero.debug(art); Zotero.Utilities.HTTP.doGet(art, function(text) { var newItem = new Zotero.Item("newspaperArticle"); newItem.publicationTitle = "The Hindu"; newItem.url = art; //title var t = /\[\w\W]*\:([\w\W]*?)<\/TITLE/; newItem.title = Zotero.Utilities.unescapeHTML(Zotero.Utilities.capitalizeTitle(text.match(t)[1])); var auth = /\([\w\W]*?)\/; if (text.match(auth)) { //newItem.author=Zotero.Utilities.cleanAuthor(text.match(auth)[1]); cleanauth=Zotero.Utilities.cleanTags(text.match(auth)[1]); newItem.creators.push(Zotero.Utilities.cleanAuthor(cleanauth, 
"author")); } newItem.publicationTitle="The Hindu"; newItem.attachments = [{"title":"The Hindu Snapshot", mimeType:"text/html", url:art}]; //hooray for real meta tags! var meta = //g; var metaTags = text.match(meta); for (var i = 0 ; i