Reorganizing.

This commit is contained in:
2014-10-02 07:02:09 -04:00
parent 60d2747327
commit 47987d8db1
19 changed files with 9 additions and 32487 deletions

View File

@@ -0,0 +1,33 @@
/* Copyright (C) 2014 Alinson Xavier
*
* This file is part of Scholarium.
*
* Scholarium is free software: you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation, either version 3 of the License, or (at your option)
* any later version.
*
* This software is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
* more details.
*
* You should have received a copy of the GNU General Public License along with
* this software. If not, see <http://www.gnu.org/licenses/>.
*/
/**
 * Front-end parser that forwards a results-page URL to the parser written
 * for the bibliographic site the URL points at.
 *
 * Holds one ScopusParser and one WebOfScienceParser instance.
 */
function GenericParser()
{
    this.scopus_parser = new ScopusParser();
    this.web_of_science_parser = new WebOfScienceParser();
}

/**
 * Hands `url` to each site-specific parser whose host name occurs in it.
 *
 * A missing or empty URL is ignored instead of raising a TypeError on
 * `url.indexOf`; this mirrors the `if(!url) return;` guard of the
 * site-specific parse() methods. A URL that matches no known host is ignored
 * as well. In both cases `callback` is never invoked.
 *
 * The two host checks are independent: a URL containing both host names is
 * forwarded to both parsers.
 *
 * @param {string} url - Address of the results page to parse.
 * @param {function} callback - Passed unchanged to the selected parser.
 */
GenericParser.prototype.parse = function(url, callback)
{
    if(!url) return;

    if(url.indexOf("scopus.com") >= 0)
        this.scopus_parser.parse(url, callback);
    if(url.indexOf("webofknowledge.com") >= 0)
        this.web_of_science_parser.parse(url, callback);
};

View File

@@ -0,0 +1,88 @@
/* Copyright (C) 2014 Alinson Xavier
*
* This file is part of Scholarium.
*
* Scholarium is free software: you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation, either version 3 of the License, or (at your option)
* any later version.
*
* This software is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
* more details.
*
* You should have received a copy of the GNU General Public License along with
* this software. If not, see <http://www.gnu.org/licenses/>.
*/
/**
 * Scrapes article records from a Scopus results page.
 */
function ScopusParser()
{
}

/**
 * Loads `url` in a hidden iframe and extracts one record per
 * ".resultItemLists li" element of the loaded document.
 *
 * Every record has the fields url, title, citations_url, n_citations, year,
 * authors, source and _id ($.md5 of title + authors). A field whose markup is
 * not found stays undefined, except n_citations, which falls back to 0.
 *
 * The iframe is removed from the document once `callback` has run, even when
 * `callback` throws (the exception still propagates).
 *
 * @param {string} url - Address of the results page.
 * @param {function(Array)} callback - Receives the array of records.
 */
ScopusParser.prototype._parse_results_page = function(url, callback)
{
    var iframe = document.createElement("iframe");
    $(iframe).hide();
    document.body.appendChild(iframe);

    // .on("load") replaces the deprecated .load(fn) event shorthand; it is
    // registered before navigation starts so the handler is always in place.
    $(iframe).on("load", function()
    {
        var articles = [];
        var ibody = $(iframe).contents()[0];
        var select_pages = $(ibody.getElementsByName("resultsPerPage").item(0));

        // Loose comparison on purpose: val() yields a string (or undefined
        // when the select is absent).
        if(select_pages.val() != 200)
        {
            // Ask for 200 results per page and wait for the next load event.
            // NOTE(review): presumably the page reloads itself on "change";
            // if it does not, or the select is missing, the callback is never
            // invoked and the iframe stays attached - confirm this is intended.
            select_pages.val(200);
            select_pages.change();
            return;
        }

        $(ibody).find(".resultItemLists li").each(function(index, li)
        {
            var article = {};

            $(li).find(".docTitle a").each(function(index, tag)
            {
                article.url = tag.href;
                article.title = $(tag).text();
            });

            $(li).find("a[href*='citedby']").each(function(index, tag)
            {
                article.citations_url = tag.href;
                article.n_citations = parseInt($(tag).text(), 10);
            });

            // Each hidden label names the field held by its next sibling.
            $(li).find('.hidden-label').each(function(index, tag)
            {
                var label = $(tag).text();
                if(label.indexOf("Year") == 0)
                    article.year = parseInt($.trim($(tag).next().text()), 10);
                if(label.indexOf("Authors") == 0)
                    article.authors = $.trim($(tag).next().text());
                if(label.indexOf("Source") == 0)
                    article.source = $.trim($(tag).next().text());
            });

            // No "cited by" link was found for this item.
            if(!('n_citations' in article)) {
                article.citations_url = undefined;
                article.n_citations = 0;
            }

            article._id = $.md5(article.title + article.authors);
            articles.push(article);
        });

        // Always detach the iframe, even if the callback throws.
        try
        {
            callback(articles);
        }
        finally
        {
            document.body.removeChild(iframe);
        }
    });

    iframe.src = url;
};

/**
 * Parses the Scopus results page at `url`; does nothing when `url` is falsy.
 *
 * @param {string} url - Address of the results page.
 * @param {function(Array)} callback - Receives the array of records.
 */
ScopusParser.prototype.parse = function(url, callback)
{
    if(!url) return;
    this._parse_results_page(url, callback);
};

View File

@@ -0,0 +1,91 @@
/* Copyright (C) 2014 Alinson Xavier
*
* This file is part of Scholarium.
*
* Scholarium is free software: you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation, either version 3 of the License, or (at your option)
* any later version.
*
* This software is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
* more details.
*
* You should have received a copy of the GNU General Public License along with
* this software. If not, see <http://www.gnu.org/licenses/>.
*/
/**
 * Scrapes article records from a Web of Science results page.
 */
function WebOfScienceParser()
{
}

/**
 * Loads `url` in a hidden iframe and extracts one record per
 * ".search-results-content" element of the loaded document.
 *
 * Every record has the fields url, title, citations_url, n_citations, year,
 * authors, source and _id ($.md5 of title + authors). A field whose markup is
 * not found stays undefined, except n_citations, which falls back to 0.
 *
 * The iframe is removed from the document once `callback` has run, even when
 * `callback` throws (the exception still propagates).
 *
 * @param {string} url - Address of the results page.
 * @param {function(Array)} callback - Receives the array of records.
 */
WebOfScienceParser.prototype._parse_results_page = function(url, callback)
{
    console.log("parsing");
    var iframe = document.createElement("iframe");
    $(iframe).hide();
    document.body.appendChild(iframe);

    // .on("load") replaces the deprecated .load(fn) event shorthand; it is
    // registered before navigation starts so the handler is always in place.
    $(iframe).on("load", function()
    {
        var articles = [];
        var ibody = $(iframe).contents()[0];
        var select_pages = $(ibody.getElementsByName("pageSize").item(0));

        // Loose comparison on purpose: val() yields a string (or undefined
        // when the select is absent).
        if(select_pages.val() != 50)
        {
            // Ask for 50 results per page and wait for the next load event.
            // NOTE(review): presumably the page reloads itself on "change";
            // if it does not, or the select is missing, the callback is never
            // invoked and the iframe stays attached - confirm this is intended.
            select_pages.val(50);
            select_pages.change();
            return;
        }

        $(ibody).find(".search-results-content").each(function(index, li)
        {
            var article = {};

            $(li).find("a[href^='/full_record']").each(function(index, tag)
            {
                article.url = tag.href;
                article.title = $.trim($(tag).text());
            });

            // The citation link is looked up in the element following the
            // result block, not inside it.
            $(li).next().find("a[href^='/CitingArticles']").each(function(index, tag)
            {
                article.citations_url = tag.href;
                article.n_citations = parseInt($(tag).text(), 10);
            });

            $(li).find('span.label').each(function(index, tag)
            {
                if($(tag).text().indexOf("By:") == 0)
                {
                    // Authors: the label's parent text without the "By: " prefix.
                    article.authors = $.trim($(tag).parent().text()).replace(/^By: /,"");

                    // The element after the authors line holds source details
                    // followed by "Published..."; the year is read from its
                    // last four characters.
                    var source_year = $.trim($(tag).parent().next().text());
                    article.source = source_year.replace(/Published.*/, "")
                        .replace(/\s\s+/g, ", ").replace(/, $/, "");
                    // slice(-4) instead of the legacy substr(length-4), which
                    // misbehaves on strings shorter than four characters.
                    article.year = parseInt(source_year.slice(-4), 10);
                }
            });

            // No citing-articles link was found for this item.
            if(!('n_citations' in article))
            {
                article.citations_url = undefined;
                article.n_citations = 0;
            }

            article._id = $.md5(article.title + article.authors);
            articles.push(article);
        });

        // Always detach the iframe, even if the callback throws.
        try
        {
            callback(articles);
        }
        finally
        {
            document.body.removeChild(iframe);
        }
    });

    iframe.src = url;
};

/**
 * Parses the Web of Science results page at `url`; does nothing when `url`
 * is falsy.
 *
 * @param {string} url - Address of the results page.
 * @param {function(Array)} callback - Receives the array of records.
 */
WebOfScienceParser.prototype.parse = function(url, callback)
{
    if(!url) return;
    this._parse_results_page(url, callback);
};