21.3. HOW TO: Extract additional metadata from the web page of a digitised work

The viewers you use to examine digitised resources in Trove embed some metadata that isn’t available through the Trove API. This includes a JSON-ified version of the item’s MARC record (presumably copied from the NLA catalogue), as well as structural information used by the viewer itself, such as a list of pages in a digitised book.

This metadata can be useful in a number of different contexts. For example, you can extract the number of pages in a digitised book, then use this number to automatically download the full text or a PDF. The GLAM Workbench includes an example where geospatial coordinates are extracted from the MARC data to add to a harvest of digitised maps.

import json
import re

import requests
from IPython.display import JSON

# URL of the digitised work whose viewer page will be searched for embedded metadata
work_id = "https://nla.gov.au/nla.obj-362059651/"

# Get the HTML page.
# The timeout (in seconds) stops the request from hanging forever if the
# server never responds; requests has no timeout by default.
response = requests.get(work_id, timeout=60)

# Search for the JSON string using regex.
# The capture group grabs the object literal passed to JSON.stringify()
# in the page's `var work = ...` statement.
work_match = re.search(
    r"var work = JSON\.parse\(JSON\.stringify\((\{.*\})", response.text
)

if work_match:
    work_data = work_match.group(1)
else:
    # Just in case it's not there... fall back to an empty JSON object so
    # that `data` is still a dict below.
    work_data = "{}"
    print("No data found!")

# Load the JSON data
data = json.loads(work_data)

# Display the parsed metadata as the cell's output
data
{'id': '36205965',
 'collection': 'nla.aus',
 'type': 'work',
 'form': 'Book',
 'subType': 'book',
 'bibLevel': 'Item',
 'bibId': '653766',
 'holdingNumber': 'JAFp BIO 92',
 'pid': 'nla.obj-362059651',
 'title': "Lord Robert Cecil's gold fields diary",
 'accessConditions': 'Unrestricted',
 'copyrightPolicy': 'Out of Copyright',
 'recordSource': 'NLACat',
 'digitalStatus': 'Captured',
 'startDate': '01 January 1945',
 'creator': 'Salisbury, Robert Cecil, marquess of, 1830-1903. 338373 9112d83c-f87f-5a34-a022-bea98d9ee823',
 'extent': '32 p., [20] p. of plates : ill. ; 18 cm.',
 'publisherName': 'Melbourne University Press',
 'allowSearchEngineIndexing': 'false',
 'findingAidAvailable': 'No',
 'isOriginalCopyAvaliable': 'false',
 'ocrMetsCopyAvaliable': 'true',
 'partnerNucs': [],
 'parentProjectIds': [],
 'projectIds': [],
 'marcData': {'record': [{'leader': {'type': 'Bibliographic',
     'content': '01205cam a2200289 a 4500'},
    'datafield': [{'ind2': ' ',
      'ind1': 1,
      'subfield': [{'code': 'a', 'content': 2617933},
       {'code': 'z', 'content': 9324621}],
      'tag': '019'},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 9, 'content': '(AuCNLDY)577939'},
      'tag': '035'},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': 653766},
      'tag': '035'},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': [{'code': 'a', 'content': 'NNCU:A'},
       {'code': 'b', 'content': 'eng'},
       {'code': 'c', 'content': 'NNCU:A'},
       {'code': 'd', 'content': 'AUC:LSM'}],
      'tag': '040'},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': 'anuc'},
      'tag': '042'},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': 'u-at-vi'},
      'tag': '043'},
     {'ind2': 4,
      'ind1': 0,
      'subfield': [{'code': 'a', 'content': '994.5/03'},
       {'code': 2, 'content': 19}],
      'tag': '082'},
     {'ind2': ' ',
      'ind1': 1,
      'subfield': [{'code': 'a', 'content': 'Salisbury, Robert Cecil,'},
       {'code': 'c', 'content': 'marquess of,'},
       {'code': 'd', 'content': '1830-1903.'},
       {'code': 0, 'content': 338373},
       {'code': 9, 'content': '9112d83c-f87f-5a34-a022-bea98d9ee823'}],
      'tag': 100},
     {'ind2': 0,
      'ind1': 1,
      'subfield': [{'code': 'a',
        'content': "Lord Robert Cecil's gold fields diary /"},
       {'code': 'c',
        'content': 'with introduction and notes by Sir Ernest Scott.'}],
      'tag': 245},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': '2nd ed.'},
      'tag': 250},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': [{'code': 'a', 'content': 'Carlton, Vic. :'},
       {'code': 'b', 'content': 'Melbourne University Press,'},
       {'code': 'c', 'content': 1945}],
      'tag': 260},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': [{'code': 'a', 'content': '32 p., [20] p. of plates :'},
       {'code': 'b', 'content': 'ill. ;'},
       {'code': 'c', 'content': '18 cm.'}],
      'tag': 300},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': [{'code': 'a', 'content': 'Also available online'},
       {'code': 'u', 'content': 'http://nla.gov.au/nla.obj-362059651'}],
      'tag': 530},
     {'ind2': 0,
      'ind1': 1,
      'subfield': [{'code': 'a', 'content': 'Salisbury, Robert Cecil,'},
       {'code': 'c', 'content': 'marquess of,'},
       {'code': 'd', 'content': '1830-1903.'}],
      'tag': 600},
     {'ind2': 0,
      'ind1': ' ',
      'subfield': [{'code': 'a', 'content': 'Gold mines and mining'},
       {'code': 'z', 'content': 'Victoria.'}],
      'tag': 650},
     {'ind2': 0,
      'ind1': ' ',
      'subfield': [{'code': 'a', 'content': 'Victoria'},
       {'code': 'x', 'content': 'Description and travel.'}],
      'tag': 651},
     {'ind2': ' ',
      'ind1': 1,
      'subfield': [{'code': 'a', 'content': 'Scott, Ernest,'},
       {'code': 'd', 'content': '1868-1939.'}],
      'tag': 700},
     {'ind2': 1,
      'ind1': 4,
      'subfield': [{'code': 'z',
        'content': 'National Library of Australia digitised item. JAFp BIO 92 copy'},
       {'code': 'u', 'content': 'http://nla.gov.au/nla.obj-362059651'},
       {'code': 'x', 'content': 'fulltext'}],
      'tag': 856},
     {'ind2': 'f',
      'ind1': 'f',
      'subfield': [{'code': 'i',
        'content': '2c2be5dd-982b-5020-ac7c-f8820fc3ae34'},
       {'code': 's', 'content': 'b08c2134-2fff-5812-bdd3-a55d68f73fa1'}],
      'tag': 999}],
    'controlfield': [{'tag': '001', 'content': 653766},
     {'tag': '005', 'content': 20230828121255.5},
     {'tag': '008', 'content': '830518s1945    vraa          000 0aeng d'}]},
   {'leader': {'type': 'Holdings', 'content': '00000nam a2200000 a 4500'},
    'datafield': [{'ind2': ' ',
      'ind1': 8,
      'subfield': [{'code': 'b', 'content': 'AUSP'},
       {'code': 'h', 'content': 'Np 994.5 SAL'}],
      'tag': 852},
     {'ind2': 0,
      'ind1': ' ',
      'subfield': {'code': 'z', 'content': 'N pbk'},
      'tag': 866},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': 'NLA'},
      'tag': 954}],
    'controlfield': [{'tag': '001', 'content': 2912182},
     {'tag': '004', 'content': 653766}]},
   {'leader': {'type': 'Holdings', 'content': '00000nam a2200000 a 4500'},
    'datafield': [{'ind2': ' ',
      'ind1': 8,
      'subfield': [{'code': 'b', 'content': 'PET'},
       {'code': 'h', 'content': 'JAFp BIO 92'}],
      'tag': 852},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': 'NLA'},
      'tag': 954}],
    'controlfield': [{'tag': '001', 'content': 2912183},
     {'tag': '004', 'content': 653766}]},
   {'leader': {'type': 'Holdings', 'content': '00000nam a2200000 a 4500'},
    'datafield': [{'ind2': ' ',
      'ind1': 8,
      'subfield': [{'code': 'b', 'content': 'PET'},
       {'code': 'h', 'content': 'JAFp GEN SAL'}],
      'tag': 852},
     {'ind2': 0,
      'ind1': ' ',
      'subfield': {'code': 'z', 'content': 'FC copy'},
      'tag': 866},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': 'NLA'},
      'tag': 954}],
    'controlfield': [{'tag': '001', 'content': 2912184},
     {'tag': '004', 'content': 653766}]},
   {'leader': {'type': 'Holdings', 'content': '00000nam a2200000 a 4500'},
    'datafield': [{'ind2': ' ',
      'ind1': 8,
      'subfield': [{'code': 'b', 'content': 'AUSLP'},
       {'code': 'h', 'content': 'NLp 994.5 SAL'}],
      'tag': 852},
     {'ind2': 0,
      'ind1': ' ',
      'subfield': {'code': 'z', 'content': 'NL pbk'},
      'tag': 866},
     {'ind2': ' ',
      'ind1': ' ',
      'subfield': {'code': 'a', 'content': 'NLA'},
      'tag': 954}],
    'controlfield': [{'tag': '001', 'content': 4042315},
     {'tag': '004', 'content': 653766}]}]},
 'children': {'page': [{'id': '36205990',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362059904',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551350,
      'filename': None,
      'filesize': 357765,
      'technicalmetadata': {'width': 1926, 'height': 2840}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 16436560}]},
   {'id': '36206003',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060036',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551354,
      'filename': None,
      'filesize': 325233,
      'technicalmetadata': {'width': 1743, 'height': 2808}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14709600}]},
   {'id': '36206017',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060175',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551358,
      'filename': None,
      'filesize': 332757,
      'technicalmetadata': {'width': 1766, 'height': 2822}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14976176}]},
   {'id': '36206030',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060307',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551362,
      'filename': None,
      'filesize': 290972,
      'technicalmetadata': {'width': 1642, 'height': 2649}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13074028}]},
   {'id': '36206043',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060433',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551366,
      'filename': None,
      'filesize': 316353,
      'technicalmetadata': {'width': 1694, 'height': 2798}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14244196}]},
   {'id': '36206056',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060563',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551370,
      'filename': None,
      'filesize': 308812,
      'technicalmetadata': {'width': 1678, 'height': 2739}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13813536}]},
   {'id': '36206069',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060694',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551374,
      'filename': None,
      'filesize': 315081,
      'technicalmetadata': {'width': 1688, 'height': 2792}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14165840}]},
   {'id': '36206082',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060828',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551378,
      'filename': None,
      'filesize': 314714,
      'technicalmetadata': {'width': 1690, 'height': 2782}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14129776}]},
   {'id': '36206095',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362060959',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551382,
      'filename': None,
      'filesize': 315411,
      'technicalmetadata': {'width': 1700, 'height': 2792}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14266964}]},
   {'id': '36206108',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061083',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551386,
      'filename': None,
      'filesize': 310531,
      'technicalmetadata': {'width': 1674, 'height': 2783}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14004236}]},
   {'id': '36206121',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061212',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551390,
      'filename': None,
      'filesize': 316813,
      'technicalmetadata': {'width': 1706, 'height': 2804}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14378908}]},
   {'id': '36206134',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061349',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551394,
      'filename': None,
      'filesize': 309855,
      'technicalmetadata': {'width': 1670, 'height': 2796}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14036000}]},
   {'id': '36206147',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061476',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551398,
      'filename': None,
      'filesize': 321690,
      'technicalmetadata': {'width': 1706, 'height': 2822}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14469512}]},
   {'id': '36206160',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061603',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551402,
      'filename': None,
      'filesize': 302721,
      'technicalmetadata': {'width': 1645, 'height': 2750}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13599008}]},
   {'id': '36206173',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061731',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551406,
      'filename': None,
      'filesize': 302730,
      'technicalmetadata': {'width': 1661, 'height': 2743}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13696764}]},
   {'id': '36206186',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061862',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551410,
      'filename': None,
      'filesize': 309234,
      'technicalmetadata': {'width': 1669, 'height': 2783}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13962668}]},
   {'id': '36206199',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362061995',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551414,
      'filename': None,
      'filesize': 318131,
      'technicalmetadata': {'width': 1694, 'height': 2822}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14369336}]},
   {'id': '36206212',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362062124',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551418,
      'filename': None,
      'filesize': 307502,
      'technicalmetadata': {'width': 1665, 'height': 2787}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13949196}]},
   {'id': '36206225',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362062250',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551422,
      'filename': None,
      'filesize': 310439,
      'technicalmetadata': {'width': 1664, 'height': 2822}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14114880}]},
   {'id': '36206238',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362062384',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551426,
      'filename': None,
      'filesize': 301196,
      'technicalmetadata': {'width': 1648, 'height': 2763}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13687828}]},
   {'id': '36206251',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362062514',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551430,
      'filename': None,
      'filesize': 309281,
      'technicalmetadata': {'width': 1666, 'height': 2775}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13897256}]},
   {'id': '36206264',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362062649',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551434,
      'filename': None,
      'filesize': 305751,
      'technicalmetadata': {'width': 1630, 'height': 2806}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13748248}]},
   {'id': '36206277',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362062779',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551438,
      'filename': None,
      'filesize': 308294,
      'technicalmetadata': {'width': 1640, 'height': 2796}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13783776}]},
   {'id': '36206290',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362062905',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551442,
      'filename': None,
      'filesize': 305747,
      'technicalmetadata': {'width': 1612, 'height': 2830}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13713280}]},
   {'id': '36206303',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063031',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551446,
      'filename': None,
      'filesize': 306590,
      'technicalmetadata': {'width': 1640, 'height': 2797}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13788724}]},
   {'id': '36206316',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063165',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551450,
      'filename': None,
      'filesize': 299724,
      'technicalmetadata': {'width': 1625, 'height': 2789}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13623720}]},
   {'id': '36206329',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063296',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551454,
      'filename': None,
      'filesize': 295007,
      'technicalmetadata': {'width': 1595, 'height': 2737}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13124464}]},
   {'id': '36206342',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063426',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551458,
      'filename': None,
      'filesize': 297779,
      'technicalmetadata': {'width': 1588, 'height': 2812}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13423928}]},
   {'id': '36206355',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063555',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551462,
      'filename': None,
      'filesize': 296505,
      'technicalmetadata': {'width': 1609, 'height': 2771}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13402596}]},
   {'id': '36206368',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063681',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551466,
      'filename': None,
      'filesize': 295690,
      'technicalmetadata': {'width': 1601, 'height': 2749}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13230876}]},
   {'id': '36206381',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063813',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551470,
      'filename': None,
      'filesize': 295336,
      'technicalmetadata': {'width': 1602, 'height': 2732}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13157308}]},
   {'id': '36206394',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362063942',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551474,
      'filename': None,
      'filesize': 297440,
      'technicalmetadata': {'width': 1594, 'height': 2794}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13388024}]},
   {'id': '36206407',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064075',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551478,
      'filename': None,
      'filesize': 289403,
      'technicalmetadata': {'width': 1569, 'height': 2764}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13037244}]},
   {'id': '36206420',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064205',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551482,
      'filename': None,
      'filesize': 294963,
      'technicalmetadata': {'width': 1593, 'height': 2786}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13341424}]},
   {'id': '36206433',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064331',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551486,
      'filename': None,
      'filesize': 300005,
      'technicalmetadata': {'width': 1599, 'height': 2784}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13381884}]},
   {'id': '36206446',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064462',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551490,
      'filename': None,
      'filesize': 295397,
      'technicalmetadata': {'width': 1599, 'height': 2778}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13353752}]},
   {'id': '36206459',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064599',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551494,
      'filename': None,
      'filesize': 293873,
      'technicalmetadata': {'width': 1584, 'height': 2754}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13114076}]},
   {'id': '36206472',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064729',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551498,
      'filename': None,
      'filesize': 289866,
      'technicalmetadata': {'width': 1554, 'height': 2783}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13001488}]},
   {'id': '36206485',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064858',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551502,
      'filename': None,
      'filesize': 300002,
      'technicalmetadata': {'width': 1639, 'height': 2761}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13603936}]},
   {'id': '36206498',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362064987',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551506,
      'filename': None,
      'filesize': 317983,
      'technicalmetadata': {'width': 1738, 'height': 2754}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14387576}]},
   {'id': '36206511',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362065113',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551510,
      'filename': None,
      'filesize': 322407,
      'technicalmetadata': {'width': 1728, 'height': 2786}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14470684}]},
   {'id': '36206524',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362065244',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551514,
      'filename': None,
      'filesize': 333367,
      'technicalmetadata': {'width': 1762, 'height': 2830}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14987704}]},
   {'id': '36206537',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362065373',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551518,
      'filename': None,
      'filesize': 330449,
      'technicalmetadata': {'width': 1754, 'height': 2822}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14877328}]},
   {'id': '36206550',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362065503',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551522,
      'filename': None,
      'filesize': 324108,
      'technicalmetadata': {'width': 1752, 'height': 2786}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14669868}]},
   {'id': '36206563',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362065633',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551526,
      'filename': None,
      'filesize': 315480,
      'technicalmetadata': {'width': 1716, 'height': 2762}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14246788}]},
   {'id': '36206576',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362065767',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551530,
      'filename': None,
      'filesize': 324317,
      'technicalmetadata': {'width': 1750, 'height': 2788}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14665132}]},
   {'id': '36206589',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362065894',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551534,
      'filename': None,
      'filesize': 326781,
      'technicalmetadata': {'width': 1742, 'height': 2822}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14775888}]},
   {'id': '36206602',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066023',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551538,
      'filename': None,
      'filesize': 333360,
      'technicalmetadata': {'width': 1780, 'height': 2830}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 15140296}]},
   {'id': '36206615',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066153',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551542,
      'filename': None,
      'filesize': 314707,
      'technicalmetadata': {'width': 1706, 'height': 2755}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14128324}]},
   {'id': '36206628',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066287',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551546,
      'filename': None,
      'filesize': 324455,
      'technicalmetadata': {'width': 1758, 'height': 2790}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14742720}]},
   {'id': '36206641',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066417',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551550,
      'filename': None,
      'filesize': 321925,
      'technicalmetadata': {'width': 1732, 'height': 2808}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14618624}]},
   {'id': '36206654',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066547',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551554,
      'filename': None,
      'filesize': 329478,
      'technicalmetadata': {'width': 1779, 'height': 2795}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14945160}]},
   {'id': '36206667',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066673',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551558,
      'filename': None,
      'filesize': 308578,
      'technicalmetadata': {'width': 1682, 'height': 2747}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 13889596}]},
   {'id': '36206680',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066807',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551562,
      'filename': None,
      'filesize': 323456,
      'technicalmetadata': {'width': 1750, 'height': 2763}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14533588}]},
   {'id': '36206693',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362066935',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551566,
      'filename': None,
      'filesize': 324834,
      'technicalmetadata': {'width': 1718, 'height': 2822}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 14569580}]},
   {'id': '36205977',
    'subType': 'page',
    'title': "Lord Robert Cecil's gold fields diary",
    'bibId': '653766',
    'pid': 'nla.obj-362059771',
    'form': 'Book',
    'accessConditions': 'Unrestricted',
    'copyrightPolicy': 'Out of Copyright',
    'bibLevel': 'Part',
    'digitalStatus': 'Captured',
    'holdingNumber': 'JAFp BIO 92',
    'copies': [{'copyrole': 'access',
      'blobId': 11551346,
      'filename': None,
      'filesize': 361053,
      'technicalmetadata': {'width': 1938, 'height': 2801}},
     {'copyrole': 'm', 'access': 'false', 'filesize': 16310064}]}],
  'article': [],
  'chapter': [{'id': '36207811',
    'subType': 'chapter',
    'subUnitNo': '1',
    'pid': 'nla.obj-362078119',
    'bibLevel': 'Section',
    'existson': [{'id': '36205990', 'page': 'nla.obj-362059904'},
     {'id': '36206003', 'page': 'nla.obj-362060036'},
     {'id': '36206017', 'page': 'nla.obj-362060175'},
     {'id': '36206030', 'page': 'nla.obj-362060307'},
     {'id': '36206043', 'page': 'nla.obj-362060433'},
     {'id': '36206056', 'page': 'nla.obj-362060563'},
     {'id': '36206069', 'page': 'nla.obj-362060694'}]},
   {'id': '36207820',
    'subType': 'chapter',
    'subUnitNo': '2',
    'pid': 'nla.obj-362078203',
    'bibLevel': 'Section',
    'existson': [{'id': '36206095', 'page': 'nla.obj-362060959'},
     {'id': '36206082', 'page': 'nla.obj-362060828'},
     {'id': '36206108', 'page': 'nla.obj-362061083'},
     {'id': '36206121', 'page': 'nla.obj-362061212'},
     {'id': '36206134', 'page': 'nla.obj-362061349'},
     {'id': '36206147', 'page': 'nla.obj-362061476'},
     {'id': '36206160', 'page': 'nla.obj-362061603'},
     {'id': '36206173', 'page': 'nla.obj-362061731'},
     {'id': '36206186', 'page': 'nla.obj-362061862'},
     {'id': '36206199', 'page': 'nla.obj-362061995'},
     {'id': '36206212', 'page': 'nla.obj-362062124'},
     {'id': '36206225', 'page': 'nla.obj-362062250'},
     {'id': '36206238', 'page': 'nla.obj-362062384'},
     {'id': '36206251', 'page': 'nla.obj-362062514'},
     {'id': '36206264', 'page': 'nla.obj-362062649'},
     {'id': '36206277', 'page': 'nla.obj-362062779'},
     {'id': '36206290', 'page': 'nla.obj-362062905'},
     {'id': '36206303', 'page': 'nla.obj-362063031'},
     {'id': '36206316', 'page': 'nla.obj-362063165'},
     {'id': '36206329', 'page': 'nla.obj-362063296'},
     {'id': '36206342', 'page': 'nla.obj-362063426'},
     {'id': '36206355', 'page': 'nla.obj-362063555'},
     {'id': '36206368', 'page': 'nla.obj-362063681'},
     {'id': '36206381', 'page': 'nla.obj-362063813'},
     {'id': '36206394', 'page': 'nla.obj-362063942'},
     {'id': '36206407', 'page': 'nla.obj-362064075'},
     {'id': '36206420', 'page': 'nla.obj-362064205'},
     {'id': '36206433', 'page': 'nla.obj-362064331'},
     {'id': '36206446', 'page': 'nla.obj-362064462'},
     {'id': '36206459', 'page': 'nla.obj-362064599'},
     {'id': '36206472', 'page': 'nla.obj-362064729'},
     {'id': '36206485', 'page': 'nla.obj-362064858'},
     {'id': '36206498', 'page': 'nla.obj-362064987'},
     {'id': '36206511', 'page': 'nla.obj-362065113'},
     {'id': '36206524', 'page': 'nla.obj-362065244'},
     {'id': '36206537', 'page': 'nla.obj-362065373'},
     {'id': '36206550', 'page': 'nla.obj-362065503'},
     {'id': '36206563', 'page': 'nla.obj-362065633'},
     {'id': '36206576', 'page': 'nla.obj-362065767'},
     {'id': '36206589', 'page': 'nla.obj-362065894'},
     {'id': '36206602', 'page': 'nla.obj-362066023'},
     {'id': '36206615', 'page': 'nla.obj-362066153'},
     {'id': '36206628', 'page': 'nla.obj-362066287'},
     {'id': '36206641', 'page': 'nla.obj-362066417'},
     {'id': '36206654', 'page': 'nla.obj-362066547'},
     {'id': '36206667', 'page': 'nla.obj-362066673'},
     {'id': '36206680', 'page': 'nla.obj-362066807'},
     {'id': '36206693', 'page': 'nla.obj-362066935'},
     {'id': '36205977', 'page': 'nla.obj-362059771'}]}],
  'book': [],
  'volume': [],
  'other': []},
 'topLevelCollection': 'nla.obj-362059651'}

Get information about pages#

Depending on the format, the children field can contain information about pages, chapters, and articles contained within the digitised work. Books and periodical issues should include page data. To find the number of pages, you just need to get the length of the page list.

# How many pages are there?
len(data["children"]["page"])
56

If you want to get the identifiers for each individual page, just loop through the list of pages saving the pid value.

page_ids = [p["pid"] for p in data["children"]["page"]]
page_ids[:5]
['nla.obj-362059904',
 'nla.obj-362060036',
 'nla.obj-362060175',
 'nla.obj-362060307',
 'nla.obj-362060433']

These page identifiers can be used to download images of the pages.

Get MARC catalogue data#

The MARC data is contained in the marcData field. This field can contain multiple records – the main metadata is contained in the Bibliographic record. To retrieve a value you need to know the MARC tag and subfield for the field you’re interested in. You can then loop through the datafield list until you find the tag and subfield, and extract the value from the content field.

The functions below will extract the value of a given MARC tag and subfield from the embedded metadata.

def find_field_content(record, tag, subfield):
    """
    Loop through a MARC record looking for tag/subfield.
    If found, return the subfield value.

    Parameters:
        record: a dict with a "datafield" list; each entry has a "tag"
            and a "subfield" that is either a list of dicts or a single
            dict, each with "code" and "content" keys.
        tag: the MARC tag to look for. Strings and integers are both
            accepted ("245" and 245 are equivalent).
        subfield: the subfield code to look for, eg "a".

    Returns:
        The "content" of the first matching subfield, or None if the
        tag/subfield is not present or the record can't be read.
    """
    # Tags are compared as strings, so normalise the requested tag once.
    # Without this an integer tag such as 245 would never match.
    tag = str(tag)
    try:
        fields = iter(record["datafield"])
    except (KeyError, TypeError):
        # No datafield list at all -- nothing to search.
        return None
    for field in fields:
        try:
            if str(field["tag"]) != tag:
                continue
            subfields = field["subfield"]
            # A field with only one subfield holds a dict rather than a list.
            if not isinstance(subfields, list):
                subfields = [subfields]
            for sfield in subfields:
                if sfield["code"] == subfield:
                    return sfield["content"]
        except (KeyError, TypeError):
            # Skip a malformed field, but keep looking in case a later
            # field with the same tag is usable.
            continue
    return None


def get_marc_field(work_data, tag, subfield):
    """
    Find the Bibliographic record in the MARC data and find the value
    of a given tag and subfield.

    Parameters:
        work_data: the metadata dict extracted from the work's web page.
        tag: the MARC tag to look for, eg "245".
        subfield: the subfield code to look for, eg "a".

    Returns:
        The subfield value from the first Bibliographic record, or None
        if there is no MARC data, no Bibliographic record, or no
        matching tag/subfield.
    """
    # Always return None when there's nothing to search, rather than
    # falling through to an unassigned variable.
    if "marcData" not in work_data or not work_data["marcData"]:
        return None
    for record in work_data["marcData"]["record"]:
        # Only the first Bibliographic record is searched.
        if record["leader"]["type"] == "Bibliographic":
            return find_field_content(record, tag, subfield)
    return None

For example, the main title of a work is in MARC tag 245, subfield a.

get_marc_field(data, "245", "a")
"Lord Robert Cecil's gold fields diary /"

The subfield c contains a ‘statement of responsibility’.

# Pass the tag as a string, as in the title example above.
get_marc_field(data, "245", "c")