parent
9a35ac52a3
commit
97bf3de7a8
@ -1,68 +1,88 @@
|
|||||||
|
/* Copyright (C) 2014 Alinson Xavier
|
||||||
|
*
|
||||||
|
* This file is part of Scholarium.
|
||||||
|
*
|
||||||
|
* Scholarium is free software: you can redistribute it and/or modify it under
|
||||||
|
* the terms of the GNU General Public License as published by the Free
|
||||||
|
* Software Foundation, either version 3 of the License, or (at your option)
|
||||||
|
* any later version.
|
||||||
|
*
|
||||||
|
* This software is distributed in the hope that it will be useful, but WITHOUT
|
||||||
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
||||||
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||||
|
* more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License along with
|
||||||
|
* this software. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*/
|
||||||
|
|
||||||
/**
 * Scraper for Scopus search-result pages.
 *
 * Uses the globals `document` and jQuery (`$`), plus a `$.md5` function that
 * is expected to be provided elsewhere in the hosting page.
 */
function ScopusParser()
{
}

/**
 * Loads a results page in a hidden iframe and extracts one record per result
 * item.
 *
 * Every record carries `url`, `title`, `citations_url`, `n_citations` and
 * `_id`. The fields `year`, `authors` and `source` are only set when the
 * corresponding label is present in the result item.
 *
 * @param {string} url - Address of the results page to load.
 * @param {function(Array<Object>)} callback - Called once with the records.
 */
ScopusParser.prototype._parse_results_page = function(url, callback)
{
    var RESULTS_PER_PAGE = 200;
    var resize_attempted = false;

    var iframe = document.createElement("iframe");
    $(iframe).hide();
    document.body.appendChild(iframe);
    iframe.src = url;

    // .on("load") replaces the .load() event shorthand, which was deprecated
    // in jQuery 1.8 and removed in 3.0.
    $(iframe).on("load", function()
    {
        var articles = [];
        var ibody = $(iframe).contents()[0];

        // Ask for the largest page size before scraping.
        // NOTE(review): presumably the page's own change handler reloads the
        // iframe, which fires this handler again -- confirm.
        // The request is made at most once and is skipped when the control is
        // missing; otherwise a page without the control (or without a 200
        // option) would never reach the callback nor release the iframe.
        var select_pages = $(ibody.getElementsByName("resultsPerPage").item(0));
        if(!resize_attempted && select_pages.length > 0 &&
                parseInt(select_pages.val(), 10) !== RESULTS_PER_PAGE)
        {
            resize_attempted = true;
            select_pages.val(RESULTS_PER_PAGE);
            select_pages.change();
            return;
        }

        $(ibody).find(".resultItemLists li").each(function(index, li)
        {
            var article = {};

            $(li).find(".docTitle a").each(function(index, tag)
            {
                article.url = tag.href;
                article.title = $(tag).text();
            });

            $(li).find("a[href*='citedby']").each(function(index, tag)
            {
                article.citations_url = tag.href;
                article.n_citations = parseInt($(tag).text(), 10);
            });

            // Each hidden label names the field held by its next sibling.
            $(li).find('.hidden-label').each(function(index, tag)
            {
                var label = $(tag).text();
                var value = $.trim($(tag).next().text());

                if(label.indexOf("Year") === 0)
                    article.year = parseInt(value, 10);

                if(label.indexOf("Authors") === 0)
                    article.authors = value;

                if(label.indexOf("Source") === 0)
                    article.source = value;
            });

            // No "cited by" link was found for this item.
            if(!('n_citations' in article))
            {
                article.citations_url = undefined;
                article.n_citations = 0;
            }

            // The id is derived from title + authors; keep the exact
            // concatenation so previously computed ids stay comparable.
            article._id = $.md5(article.title + article.authors);
            articles.push(article);
        });

        callback(articles);
        document.body.removeChild(iframe);
    });
};

/**
 * Parses the results page at `url` and hands the extracted records to
 * `callback`. Does nothing when `url` is missing or empty.
 *
 * @param {string} url - Address of the results page.
 * @param {function(Array<Object>)} callback - Receives the extracted records.
 */
ScopusParser.prototype.parse = function(url, callback)
{
    if(!url) return;
    this._parse_results_page(url, callback);
};
|
||||||
|
@ -1,72 +1,91 @@
|
|||||||
|
/* Copyright (C) 2014 Alinson Xavier
|
||||||
|
*
|
||||||
|
* This file is part of Scholarium.
|
||||||
|
*
|
||||||
|
* Scholarium is free software: you can redistribute it and/or modify it under
|
||||||
|
* the terms of the GNU General Public License as published by the Free
|
||||||
|
* Software Foundation, either version 3 of the License, or (at your option)
|
||||||
|
* any later version.
|
||||||
|
*
|
||||||
|
* This software is distributed in the hope that it will be useful, but WITHOUT
|
||||||
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
||||||
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||||
|
* more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License along with
|
||||||
|
* this software. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*/
|
||||||
|
|
||||||
/**
 * Scraper for Web of Science search-result pages.
 *
 * Uses the globals `document` and jQuery (`$`), plus a `$.md5` function that
 * is expected to be provided elsewhere in the hosting page.
 */
function WebOfScienceParser()
{
}

/**
 * Loads a results page in a hidden iframe and extracts one record per result
 * entry.
 *
 * Every record carries `url`, `title`, `citations_url`, `n_citations` and
 * `_id`. The fields `authors`, `source` and `year` are only set when a
 * "By:" label is present in the entry.
 *
 * @param {string} url - Address of the results page to load.
 * @param {function(Array<Object>)} callback - Called once with the records.
 */
WebOfScienceParser.prototype._parse_results_page = function(url, callback)
{
    var RESULTS_PER_PAGE = 50;
    var resize_attempted = false;

    console.log("parsing");
    var iframe = document.createElement("iframe");
    $(iframe).hide();
    document.body.appendChild(iframe);
    iframe.src = url;

    // .on("load") replaces the .load() event shorthand, which was deprecated
    // in jQuery 1.8 and removed in 3.0.
    $(iframe).on("load", function()
    {
        var articles = [];
        var ibody = $(iframe).contents()[0];

        // Ask for the largest page size before scraping.
        // NOTE(review): presumably the page's own change handler reloads the
        // iframe, which fires this handler again -- confirm.
        // The request is made at most once and is skipped when the control is
        // missing; otherwise a page without the control (or without a 50
        // option) would never reach the callback nor release the iframe.
        var select_pages = $(ibody.getElementsByName("pageSize").item(0));
        if(!resize_attempted && select_pages.length > 0 &&
                parseInt(select_pages.val(), 10) !== RESULTS_PER_PAGE)
        {
            resize_attempted = true;
            select_pages.val(RESULTS_PER_PAGE);
            select_pages.change();
            return;
        }

        $(ibody).find(".search-results-content").each(function(index, li)
        {
            var article = {};

            $(li).find("a[href^='/full_record']").each(function(index, tag)
            {
                article.url = tag.href;
                article.title = $.trim($(tag).text());
            });

            // The citation link is looked up in the element that follows the
            // result entry, not inside the entry itself.
            $(li).next().find("a[href^='/CitingArticles']").each(function(index, tag)
            {
                article.citations_url = tag.href;
                article.n_citations = parseInt($(tag).text(), 10);
            });

            $(li).find('span.label').each(function(index, tag)
            {
                if($(tag).text().indexOf("By:") === 0)
                {
                    var line = $(tag).parent();
                    article.authors = $.trim(line.text()).replace(/^By: /, "");

                    // The element after the author line holds the source
                    // description; its last four characters are read as the
                    // publication year.
                    var source_year = $.trim(line.next().text());
                    article.source = source_year.replace(/Published.*/, "")
                        .replace(/\s\s+/g, ", ").replace(/, $/, "");
                    article.year = parseInt(source_year.slice(-4), 10);
                }
            });

            // No citing-articles link was found for this entry.
            if(!('n_citations' in article))
            {
                article.citations_url = undefined;
                article.n_citations = 0;
            }

            // The id is derived from title + authors; keep the exact
            // concatenation so previously computed ids stay comparable.
            article._id = $.md5(article.title + article.authors);
            articles.push(article);
        });

        callback(articles);
        document.body.removeChild(iframe);
    });
};

/**
 * Parses the results page at `url` and hands the extracted records to
 * `callback`. Does nothing when `url` is missing or empty.
 *
 * @param {string} url - Address of the results page.
 * @param {function(Array<Object>)} callback - Receives the extracted records.
 */
WebOfScienceParser.prototype.parse = function(url, callback)
{
    if(!url) return;
    this._parse_results_page(url, callback);
};
|
||||||
|
Reference in new issue