-
Notifications
You must be signed in to change notification settings - Fork 20
/
MARC21XML.js
442 lines (376 loc) · 18.3 KB
/
MARC21XML.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
{
"translatorID": "ce0ab080-7d72-4fa3-ab4b-4bd8950f3379",
"label": "MARC21XML",
"creator": "Philipp Zumstein",
"target": "xml",
"minVersion": "3.0",
"maxVersion": "",
"priority": 100,
"displayOptions": {
"exportNotes": false,
"Zusammenfassung": true
},
"inRepository": true,
"translatorType": 2,
"browserSupport": "g",
"lastUpdated": "2019-11-05 18:45:00"
}
// DISCLAIMER:
// There are different cataloguing rules, specification of MARC dialects,
// various usage over time and places. This export translator will follow
// the current MARC21 bibliographic format which is described online:
// http://www.loc.gov/marc/bibliographic/
// MODS to MARC21 mapping:
// http://www.loc.gov/standards/mods/v3/mods2marc-mapping.html
// source for MARC21 XML examples (replace idn number):
// https://portal.dnb.de/opac.htm?method=requestMarcXml&idn=999678876
// Some more useful links:
// https://github.com/zotero/translators/blob/master/MARC.js
// https://github.com/zotero/translators/issues/762
// https://forums.zotero.org/discussion/38956/export-of-zotero-citation-to-marc-format-for-import-into-koha-lms
var recordLength;
var countFields = {"controlfield" : 0, "datafield" : 0, "subfield" : 0 };
var ns = "http://www.loc.gov/MARC21/slim";
var xmlDocument;
var typeMap = {
//default value "a" for every written text is taken (e.g. for book, article, report, webpage,...), everything else should be declared here
"artwork" : "k",
"audioRecording" : "j",
"computerProgram" : "m",
"film" : "g",
"manuscript" : "t",
"map" : "e",//"f" is normally less likely
"podcast" : "i",
"presentation" : "a",//slides -> a, speech -> i
"radioBroadcast" : "i",
"tvBroadcast" : "g",
"videoRecording" : "g"
};
var secondTypeMap = {//based on 008/24-27
"patent" : "j",
"statute" : "l",
"thesis" : "m",
"case" : "v"
};
String.prototype.replaceAt=function(index, character) {
return this.substr(0, index) + character + this.substr(index+character.length);
};
function fillZerosLeft(text, size) {
if (!text) text = '';
if (typeof text == 'number') text=text.toString();
missingCharacters = size-text.length;
if (missingCharacters>0) {
text = Array(missingCharacters+1).join('0') + text;
}
return text;
}
// @property can either a string which will be attachad as a textNode
// or just the Boolean "true" which will then just create the nodes
// without any content
function mapProperty(parentElement, elementName, attributes, property) {
if (!property) return null;
//var xmlDocument = parentElement.ownerDocument,
newElement = xmlDocument.createElementNS(ns, elementName);
if(attributes) {
for(var i in attributes) {
newElement.setAttribute(i, attributes[i]);
}
}
if (property && (typeof property == "string" || typeof property == "number") ) {
newElement.appendChild(xmlDocument.createTextNode(property));
recordLength += property.toString().length;
}
countFields[elementName]++;//for calculating the record length
parentElement.appendChild(newElement);
return newElement;
}
function doExport() {
Zotero.setCharacterSet("utf-8");
var parser = new DOMParser();
xmlDocument = parser.parseFromString('<collection xmlns="http://www.loc.gov/MARC21/slim" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.loc.gov/MARC21/slim http://www.loc.gov/standards/marcxml/schema/MARC21slim.xsd" />', 'application/xml');
var item, i;
while ((item = Zotero.nextItem())) {
Z.debug(item);
var exportNotes = Zotero.getOption("exportNotes");
//these two variables are important for several places
var typeOfRecord = "a";
if (typeMap[item.itemType]) typeOfRecord = typeMap[item.itemType];
var bibliographicLevel = "m";//default
if (item.itemType == "bookSection" || item.itemType == "conferencePaper" || item.itemType == "dictionaryEntry" || item.itemType == "encyclopediaArticle" || item.itemType == "journalArticle" || item.itemType == "magazineArticle" || item.itemType == "newspaperArticle") {
bibliographicLevel = "a";
}
//initial value
recordLength = 26;// 24 length of the leader + 1 record terminator + 1 field terminator after the leader and directory
var recordNode = mapProperty(xmlDocument.documentElement, "record", {"type" : "Bibliographic"} , true);
var currentFieldNode;
//BEGIN of the export
//leader will be added later, but before this node
var firstChild = mapProperty(recordNode, "controlfield", {"tag" : "001"}, item.itemID );
var cleanedDateModified = item.dateModified.replace(/\D/g , '');//format must be YYYYMMDDHHMMSS
mapProperty(recordNode, "controlfield", {"tag" : "005"}, cleanedDateModified + '.0' );
var dateFirst = ZU.strToDate(item.dateAdded);
var dateFirstString = dateFirst.year.substr(2,2) + fillZerosLeft(dateFirst.month,2) + fillZerosLeft(dateFirst.day,2);
var date;
var datePublicationString;
if (item.date) {
date = ZU.strToDate(item.date);
if (date.year) {
if (date.month) {
if (date.day) {
datePublicationString = 'e'+ date.year + fillZerosLeft(date.month,2) + fillZerosLeft(date.day,2);
} else {
datePublicationString = 'e'+date.year + fillZerosLeft(date.month,2)+'uu';
}
} else {
datePublicationString = 's'+date.year+' ';
}
} else {//date without year, possible?
datePublicationString = 'n ';
}
} else {//unknown date
datePublicationString = 'n ';
}
//position 18-34 where | is indicating that we don't have this information
var details = '|||||||||||||||||';
if (secondTypeMap[item.itemType]) details = details.replaceAt(24-18, secondTypeMap[item.itemType]);
if (item.itemType == "computerProgram") details = details.replaceAt(26-18, 'b');
if (item.itemType == "conferencePaper") details = details.replaceAt(29-18, '1');
if (item.itemType == "letter") details = details.replaceAt(33-18, 'i');
mapProperty(recordNode, "controlfield", {"tag" : "008"}, dateFirstString + datePublicationString + '|||'+ details +'||||u' );
if (item.ISBN) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "020", "ind1" : " ", "ind2" : " " } , true);
var cleanedISBN = item.ISBN.replace(/[a-zA-Z,\.;:\-_]/g, '');//can there be more than one isbn in the item.ISBN field?
if (cleanedISBN != item.ISBN) {
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , cleanedISBN );
mapProperty(currentFieldNode, "subfield", {"code" : "9"} , item.ISBN );
} else {
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.ISBN );
}
}
if (item.ISSN && bibliographicLevel == "m") {//see also field 773 for e.g. articles
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "022", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.ISSN );
}
if (item.DOI) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "024", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.DOI );
mapProperty(currentFieldNode, "subfield", {"code" : "2"} , "doi" );
}
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "040", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "c"} , 'Zotero' );//not strictly a Marc organization code, but we should mention the Zotero as the 'cataloguing tool' somewhere and here is a good place and is implicitely referred because of the 'u' in 008/37
if (item.language) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "041", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.language );
}
if (item.callNumber) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "090", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.callNumber );
}
//100 vs 700 and 110 vs 710
//--> practical decision: move everything to the 7xx fields
//because we cannot decide about "Main Entry" fields
//especially in regards with the different cataloguing rules
if (item.shortTitle) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "210", "ind1" : "0", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.shortTitle );
}
if (item.title) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "245", "ind1" : "1", "ind2" : "0" } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.title );
if (bibliographicLevel == "m") {
mapProperty(currentFieldNode, "subfield", {"code" : "n"} , item.volume );
}
var responsibleAgents = [];
for (let creator of item.creators) {
responsibleAgents.push([creator.firstName, creator.lastName].join(" "));
}
if (responsibleAgents.length > 0) {
mapProperty(currentFieldNode, "subfield", {"code" : "c"} , responsibleAgents.join(", "));
}
}
if (item.edition) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "250", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.edition );
}
if (item.scale) {//for cartographic maps
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "255", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.scale );
}
if (item.version || item.system || item.programmingLanguage || item.company) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "256", "ind1" : " ", "ind2" : " " } , true );//is there a better place for this information?
var computerFileArray = [];
if (item.version) computerFileArray.push(item.version);
if (item.system) computerFileArray.push(item.system);
if (item.programmingLanguage) computerFileArray.push(item.programmingLanguage);
if (item.company) computerFileArray.push(item.company);
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , computerFileArray.join(", ") );
}
if (item.publisher || item.place || date) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "260", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.place );
mapProperty(currentFieldNode, "subfield", {"code" : "b"} , item.publisher );
if (date && date.year) {//date was defined in the beginning
mapProperty(currentFieldNode, "subfield", {"code" : "c"} , date.year );
}
}
if (item.numPages || item.numberOfVolumes || item.runningTime) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "300", "ind1" : " ", "ind2" : " " } , true );
var extensionArray = [];
if (item.numberOfVolumes) {
if ( item.numPages.match(/[a-zA-Z]/) ) {
extensionArray.push( item.numberOfVolumes );
} else {
extensionArray.push( item.numberOfVolumes + " v." );
}
}
if (item.numPages) {
if ( item.numPages.match(/[a-zA-Z]/) ) {
extensionArray.push( item.numPages );
} else {
extensionArray.push( item.numPages + " p." );
}
}
if (item.runningTime) {
extensionArray.push( item.runningTime );
}
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , extensionArray.join(" : ") );
}
if (item.medium || item.artworkSize) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "340", "ind1" : " ", "ind2" : " " }, true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.medium );
mapProperty(currentFieldNode, "subfield", {"code" : "b"} , item.artworkSize );
}
if (item.seriesTitle || item.seriesNumber) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "490", "ind1" : "0", "ind2" : " " }, true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.seriesTitle );
mapProperty(currentFieldNode, "subfield", {"code" : "v"} , item.seriesNumber );
}
if (item.notes.length>0 && exportNotes) {
var noteArray = [];
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "500", "ind1" : " ", "ind2" : " " } , true );
for (i=0; i<item.notes.length; i++) {
noteArray.push(item.notes[i].note);
}
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , noteArray.join("; ") );
}
if (item.extra) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "500", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.extra );
}
if (item.thesisType || item.university) {//thesis
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "502", "ind1" : " ", "ind2" : " " } , true );
var thesisArray = [];
if (item.university) {
thesisArray.push(item.university);
}
if (item.thesisType) {
thesisArray.push(item.thesisType);
}
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , thesisArray.join(", ") );
}
if (item.type && item.itemType =="report") {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "513", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.type );
}
if (item.abstractNote && Zotero.getOption("Zusammenfassung")) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "520", "ind1" : " ", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.abstractNote );
}
if (item.tags.length>0) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "573", "ind1" : " ", "ind2" : " " } , true );
for (i=0; i<item.tags.length; i++) {
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.tags[i].tag );
}
}
for (i=0; i<item.creators.length; i++) {
var creator = item.creators[i];
if (!creator.fieldMode) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "700", "ind1" : "1", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , creator.lastName + ', ' + creator.firstName);
} else {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "710", "ind1" : "2", "ind2" : " " } , true);
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , creator.lastName );
}
if (creator.creatorType != "author") {
mapProperty(currentFieldNode, "subfield", {"code" : "e"} , creator.creatorType );
}
}
//note 711 is repeatable but the subfield not. Thus, we create two different if statements.
if (item.conferenceName) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "711", "ind1" : "2", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.conferenceName );
}
if (item.meetingName) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "711", "ind1" : "2", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "a"} , item.meetingName );
}
if (bibliographicLevel == "a") {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "773", "ind1" : "0", "ind2" : " " } , true );
var subfieldCode;
if (item.itemType == "conferencePaper") {
subfieldCode = "m2am";
}
if (item.itemType == "bookSection" || item.itemType == "dictionaryEntry" || item.itemType == "encyclopediaArticle") {
subfieldCode = "nnam";
}
if (item.itemType == "journalArticle" || item.itemType == "magazineArticle" || item.itemType == "newspaperArticle") {
subfieldCode = "nnas";
}
mapProperty(currentFieldNode, "subfield", {"code" : "7"} , subfieldCode );
mapProperty(currentFieldNode, "subfield", {"code" : "t"} , item.publicationTitle );
var descriptionArray = [];
var siciDescription = ""; //https://en.wikipedia.org/wiki/Serial_Item_and_Contribution_Identifier
if (item.volume) {
descriptionArray.push(item.volume);
siciDescription += item.volume;
}
if (item.issue) {
descriptionArray.push(item.issue);
siciDescription += ":" + item.issue;
}
if (item.pages) {
descriptionArray.push(item.pages);
siciDescription += "<" + parseInt(item.pages);
}
mapProperty(currentFieldNode, "subfield", {"code" : "g"} , descriptionArray.join(', ') );
mapProperty(currentFieldNode, "subfield", {"code" : "p"} , item.journalAbbreviation );
mapProperty(currentFieldNode, "subfield", {"code" : "q"} , siciDescription );
mapProperty(currentFieldNode, "subfield", {"code" : "x"} , item.ISSN );
//maybe move some other fields if journalArticle?
}
if (item.url) {
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "856", "ind1" : "4", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "u"} , item.url );
}
for (i=0; i<item.attachments.length; i++) {
var link = item.attachments[i];
currentFieldNode = mapProperty(recordNode, "datafield", {"tag" : "856", "ind1" : "4", "ind2" : " " } , true );
mapProperty(currentFieldNode, "subfield", {"code" : "u"} , link.url );
mapProperty(currentFieldNode, "subfield", {"code" : "q"} , link.mimeType );
}
//finally, we will calculate the leader and add it as first child
recordLength += countFields.controlfield*13+countFields.datafield*15+countFields.subfield*2;
//controlfields: 12 characters in the directory + 1 field terminator
//datafields: 12 characters in the directory + 2 indicators + 1 field terminator
//subfields: 1 subfield code + 1 subfield terminator
//base address of data starts after the leader and the directory
var baseAdressData = 24+countFields.controlfield*12+countFields.datafield*12+1;
var leaderContent = fillZerosLeft(recordLength,5) + "n" + typeOfRecord + bibliographicLevel +" a22" + fillZerosLeft(baseAdressData,5) +"zu 4500";
var newElement = xmlDocument.createElementNS(ns, "leader");
newElement.appendChild(xmlDocument.createTextNode(leaderContent));
recordNode.insertBefore(newElement, firstChild);
}
Zotero.write('<?xml version="1.0"?>'+"\n");
var serializer = new XMLSerializer();
var xmlDoc = serializer.serializeToString(xmlDocument);
// simple pretty print XML for MARC XML data
var pretty = xmlDoc.replace(/<record/g, "\n<record")
.replace(/<leader/g, "\n\t<leader")
.replace(/<controlfield/g, "\n\t<controlfield")
.replace(/<datafield/g, "\n\t<datafield")
.replace(/<\/datafield/g, "\n\t</datafield")
.replace(/<subfield/g, "\n\t\t<subfield")
.replace(/<\/record/g, "\n</record")
.replace("</collection", "\n</collection");
Zotero.write(pretty);
}