From e37c14357a44fed6ffd208dacc0d0241fa22ef4c Mon Sep 17 00:00:00 2001 From: Alexander Clifford Date: Fri, 19 May 2023 13:47:41 -0700 Subject: [PATCH] Removes JXON use for native DOMParser for Pubmed abstract parsing --- javascript/web/ReferenceDetails.js | 80 ++++++++++++++---------------- package-lock.json | 8 --- package.json | 1 - 3 files changed, 37 insertions(+), 52 deletions(-) diff --git a/javascript/web/ReferenceDetails.js b/javascript/web/ReferenceDetails.js index 0e20649c3..10ff014cd 100644 --- a/javascript/web/ReferenceDetails.js +++ b/javascript/web/ReferenceDetails.js @@ -34,11 +34,6 @@ var golr_response = require('bbop-response-golr'); // And a basic response. var rest_response = require('bbop-rest-response').base; -// // XML. -// var xpath = require('xpath'); -// var dom = require('xmldom').DOMParser; -var jxon = require('jxon'); - // Aliases. var dlimit = defs.download_limit; @@ -273,51 +268,41 @@ function ReferenceDetailsInit(){ // Run. ncbi_engine.register('success', function(resp, man){ - var xml = resp.raw(); - //console.log(xml); - - var jx = null; - if( typeof xml === 'string' ){ - jx = jxon.stringToJs(xml); - }else{ - jx = jxon.xmlToJs(xml); - } - console.log(jx); + // Previous check for string vs json unneeded due to request parameters always being XML. + var xml = xmlParser.parseFromString(resp.raw(), 'text/xml'); + console.log(xml); + var BASE_ARTICLE_PATH = 'PubmedArticleSet PubmedArticle'; + var FULL_ARTICLE_PATH = BASE_ARTICLE_PATH + ' MedlineCitation Article'; // Our operating object. - if( ! jx.PubmedArticleSet.PubmedArticle ){ + if( ! xml.querySelector(BASE_ARTICLE_PATH) ){ UnableToMakeContact('No such PubMed ID.'); - }else if( ! jx.PubmedArticleSet.PubmedArticle.MedlineCitation.Article ){ + }else if( ! xml.querySelector(FULL_ARTICLE_PATH) ){ UnableToMakeContact('No such Article.'); }else{ - var op = jx.PubmedArticleSet.PubmedArticle.MedlineCitation.Article; + var op = xml.querySelector(FULL_ARTICLE_PATH); // Title. - var title = 'n/a'; - if( op.ArticleTitle ){ - title = op.ArticleTitle; - } + var title = getXmlContent(op, 'ArticleTitle', 'n/a'); // Date. var date = 'n/a'; - if( op.ArticleDate ){ - var year = op.ArticleDate.Year || '???'; - var month = op.ArticleDate.Month || '???'; - var day = op.ArticleDate.Day || '???'; + if( op.querySelector('AritcleDate') ){ + var missingValue = '???'; + var year = getXmlContent(op, 'ArticleDate.Year', missingValue); + var month = getXmlContent(op, 'ArticleDate.Month', missingValue); + var day = getXmlContent(op, 'ArticleDate.Day', missingValue); date = [year, month, day].join('-'); } // Authors. var authors = 'n/a'; - if( op.AuthorList && op.AuthorList.Author ){ + if( op.querySelector('AuthorList Author') ){ var acache = []; - us.each(op.AuthorList.Author, function(auth){ - var name = ''; - if( auth.ForeName ){ name += auth.ForeName; } - //if( auth.Initials ){ name+=' '+auth.Initials+'.'; } - if( auth.LastName ){ name +=' '+auth.LastName; } - acache.push(name); + us.each(op.querySelectorAll('AuthorList Author'), function(auth){ + var name = [getXmlContent(auth, 'ForeName', ''), getXmlContent(auth, 'LastName', '')].join(' ').trim(); + acache.push(name); }); if( ! us.isEmpty(acache) ){ authors = acache.join(', '); @@ -326,19 +311,17 @@ function ReferenceDetailsInit(){ // Abstract; list or string. var abstract = 'n/a'; - if( op.Abstract && op.Abstract.AbstractText ){ - if( us.isArray(op.Abstract.AbstractText) ){ - + var abstractXml = op.querySelectorAll('Abstract AbstractText'); + if( abstractXml.length > 1 ){ var abscache = []; - us.each(op.Abstract.AbstractText, function(abs){ - if( abs._ ){ abscache.push(abs._); } + us.each(asbtractXml, function(abs){ + if( abs.textContent ){ abscache.push(abs.textContent); } }); if( ! us.isEmpty(abscache) ){ - abstract = abscache.join('
'); + abstract = abscache.join('
'); } - }else if( us.isString(op.Abstract.AbstractText) ){ - abstract = op.Abstract.AbstractText; - } + }else if( abstractXml.length === 1 ){ + abstract = abstractXml[0].textContent; } // Render. @@ -422,7 +405,6 @@ function ReferenceDetailsInit(){ 'db': 'pubmed', 'id': id_part }; - var meth = 'GET'; ncbi_engine.start(url + path, pay, 'GET'); }catch (e) { @@ -555,3 +537,15 @@ function _shrink_wrap(elt_id){ } } } + +// Not certain what minimal browser support here is so avoided default parameter values (Chrome 49, Firefox 15, IE 11, Opera 36, Safari 9). +function getXmlContent(xml, path, default_value){ + var content = xml.querySelector(path); + if( content ){ + return content.textContent; + }else if(default_value === undefined){ + return null; + }else{ + return default_value; + } +} \ No newline at end of file diff --git a/package-lock.json b/package-lock.json index 6839455fc..dc31eb09f 100644 --- a/package-lock.json +++ b/package-lock.json @@ -8222,14 +8222,6 @@ "integrity": "sha512-qpcRocdkUmf+UTNBYx5w6dexX5J31AKK1OmPwH630a83DdVVUIngk55RSAiIGpQyoH0dlr872VHfPjnQnK1qDQ==", "dev": true }, - "jxon": { - "version": "2.0.0-beta.5", - "resolved": "https://registry.npmjs.org/jxon/-/jxon-2.0.0-beta.5.tgz", - "integrity": "sha1-O2qUEE+YAe5oL9BWZF/1Rz2bND4=", - "requires": { - "xmldom": "^0.1.21" - } - }, "kdbush": { "version": "1.0.1", "resolved": "https://registry.npmjs.org/kdbush/-/kdbush-1.0.1.tgz", diff --git a/package.json b/package.json index 7cab68e48..d9f8d70a3 100644 --- a/package.json +++ b/package.json @@ -44,7 +44,6 @@ "express": "4.16.3", "golr-conf": "0.0.3", "jquery": "3.3.1", - "jxon": "2.0.0-beta.5", "markdown": "0.5.0", "marked": "0.3.19", "minerva-requests": "0.0.15",